{ "best_metric": 0.12089719269034979, "best_model_checkpoint": "./wav2vec2-base-german-cv9/checkpoint-177850", "epoch": 49.999859451862264, "global_step": 177850, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.01, "learning_rate": 1.6305875737981447e-07, "loss": 12.2032, "step": 30 }, { "epoch": 0.02, "learning_rate": 3.3174023053134664e-07, "loss": 12.7588, "step": 60 }, { "epoch": 0.03, "learning_rate": 5.004217036828789e-07, "loss": 11.4436, "step": 90 }, { "epoch": 0.03, "learning_rate": 6.691031768344111e-07, "loss": 12.2914, "step": 120 }, { "epoch": 0.04, "learning_rate": 8.377846499859433e-07, "loss": 11.2155, "step": 150 }, { "epoch": 0.05, "learning_rate": 1.0064661231374754e-06, "loss": 10.696, "step": 180 }, { "epoch": 0.06, "learning_rate": 1.1751475962890077e-06, "loss": 10.2185, "step": 210 }, { "epoch": 0.07, "learning_rate": 1.3438290694405398e-06, "loss": 7.9571, "step": 240 }, { "epoch": 0.08, "learning_rate": 1.512510542592072e-06, "loss": 6.4243, "step": 270 }, { "epoch": 0.08, "learning_rate": 1.6811920157436041e-06, "loss": 4.8724, "step": 300 }, { "epoch": 0.09, "learning_rate": 1.8498734888951364e-06, "loss": 3.9775, "step": 330 }, { "epoch": 0.1, "learning_rate": 2.0185549620466685e-06, "loss": 3.7284, "step": 360 }, { "epoch": 0.11, "learning_rate": 2.1872364351982008e-06, "loss": 3.5572, "step": 390 }, { "epoch": 0.12, "learning_rate": 2.355917908349733e-06, "loss": 3.4845, "step": 420 }, { "epoch": 0.13, "learning_rate": 2.5245993815012653e-06, "loss": 3.5107, "step": 450 }, { "epoch": 0.13, "learning_rate": 2.6932808546527976e-06, "loss": 3.3341, "step": 480 }, { "epoch": 0.14, "learning_rate": 2.8619623278043295e-06, "loss": 3.3489, "step": 510 }, { "epoch": 0.15, "learning_rate": 3.0306438009558618e-06, "loss": 3.2479, "step": 540 }, { "epoch": 0.16, "learning_rate": 3.199325274107394e-06, "loss": 3.2032, "step": 570 }, { "epoch": 0.17, "learning_rate": 3.3680067472589263e-06, "loss": 3.1983, "step": 600 }, { "epoch": 0.18, "learning_rate": 3.5366882204104586e-06, "loss": 3.1298, "step": 630 }, { "epoch": 0.19, "learning_rate": 3.7053696935619905e-06, "loss": 3.1466, "step": 660 }, { "epoch": 0.19, "learning_rate": 3.874051166713523e-06, "loss": 3.1242, "step": 690 }, { "epoch": 0.2, "learning_rate": 4.042732639865055e-06, "loss": 3.11, "step": 720 }, { "epoch": 0.21, "learning_rate": 4.211414113016587e-06, "loss": 3.0988, "step": 750 }, { "epoch": 0.22, "learning_rate": 4.38009558616812e-06, "loss": 3.0706, "step": 780 }, { "epoch": 0.23, "learning_rate": 4.548777059319652e-06, "loss": 3.0548, "step": 810 }, { "epoch": 0.24, "learning_rate": 4.717458532471184e-06, "loss": 3.024, "step": 840 }, { "epoch": 0.24, "learning_rate": 4.8861400056227165e-06, "loss": 3.0499, "step": 870 }, { "epoch": 0.25, "learning_rate": 5.054821478774248e-06, "loss": 3.0314, "step": 900 }, { "epoch": 0.26, "learning_rate": 5.22350295192578e-06, "loss": 3.0053, "step": 930 }, { "epoch": 0.27, "learning_rate": 5.3921844250773125e-06, "loss": 3.0105, "step": 960 }, { "epoch": 0.28, "learning_rate": 5.560865898228845e-06, "loss": 2.9906, "step": 990 }, { "epoch": 0.29, "learning_rate": 5.729547371380377e-06, "loss": 2.9944, "step": 1020 }, { "epoch": 0.3, "learning_rate": 5.898228844531909e-06, "loss": 2.9826, "step": 1050 }, { "epoch": 0.3, "learning_rate": 6.066910317683442e-06, "loss": 2.9734, "step": 1080 }, { "epoch": 0.31, "learning_rate": 6.235591790834974e-06, "loss": 2.9778, "step": 1110 }, { "epoch": 0.32, "learning_rate": 6.404273263986506e-06, "loss": 2.9687, "step": 1140 }, { "epoch": 0.33, "learning_rate": 6.572954737138038e-06, "loss": 2.9713, "step": 1170 }, { "epoch": 0.34, "learning_rate": 6.74163621028957e-06, "loss": 2.974, "step": 1200 }, { "epoch": 0.35, "learning_rate": 6.910317683441102e-06, "loss": 2.9678, "step": 1230 }, { "epoch": 0.35, "learning_rate": 7.0789991565926345e-06, "loss": 2.9642, "step": 1260 }, { "epoch": 0.36, "learning_rate": 7.247680629744166e-06, "loss": 2.9497, "step": 1290 }, { "epoch": 0.37, "learning_rate": 7.416362102895699e-06, "loss": 2.9682, "step": 1320 }, { "epoch": 0.38, "learning_rate": 7.5850435760472305e-06, "loss": 2.9605, "step": 1350 }, { "epoch": 0.39, "learning_rate": 7.753725049198764e-06, "loss": 2.9447, "step": 1380 }, { "epoch": 0.4, "learning_rate": 7.922406522350296e-06, "loss": 2.9573, "step": 1410 }, { "epoch": 0.4, "learning_rate": 8.091087995501828e-06, "loss": 2.9415, "step": 1440 }, { "epoch": 0.41, "learning_rate": 8.25976946865336e-06, "loss": 2.9516, "step": 1470 }, { "epoch": 0.42, "learning_rate": 8.428450941804893e-06, "loss": 2.95, "step": 1500 }, { "epoch": 0.43, "learning_rate": 8.597132414956425e-06, "loss": 2.9408, "step": 1530 }, { "epoch": 0.44, "learning_rate": 8.765813888107957e-06, "loss": 2.9465, "step": 1560 }, { "epoch": 0.45, "learning_rate": 8.934495361259488e-06, "loss": 2.9343, "step": 1590 }, { "epoch": 0.46, "learning_rate": 9.103176834411022e-06, "loss": 2.9493, "step": 1620 }, { "epoch": 0.46, "learning_rate": 9.271858307562552e-06, "loss": 2.9469, "step": 1650 }, { "epoch": 0.47, "learning_rate": 9.440539780714085e-06, "loss": 2.9335, "step": 1680 }, { "epoch": 0.48, "learning_rate": 9.609221253865617e-06, "loss": 2.9465, "step": 1710 }, { "epoch": 0.49, "learning_rate": 9.77790272701715e-06, "loss": 2.9322, "step": 1740 }, { "epoch": 0.5, "learning_rate": 9.946584200168682e-06, "loss": 2.9458, "step": 1770 }, { "epoch": 0.51, "learning_rate": 1.0115265673320214e-05, "loss": 2.9356, "step": 1800 }, { "epoch": 0.51, "learning_rate": 1.0283947146471746e-05, "loss": 2.9323, "step": 1830 }, { "epoch": 0.52, "learning_rate": 1.0452628619623278e-05, "loss": 2.9469, "step": 1860 }, { "epoch": 0.53, "learning_rate": 1.062131009277481e-05, "loss": 2.9314, "step": 1890 }, { "epoch": 0.54, "learning_rate": 1.0789991565926343e-05, "loss": 2.938, "step": 1920 }, { "epoch": 0.55, "learning_rate": 1.0958673039077875e-05, "loss": 2.9337, "step": 1950 }, { "epoch": 0.56, "learning_rate": 1.1127354512229408e-05, "loss": 2.9256, "step": 1980 }, { "epoch": 0.57, "learning_rate": 1.129603598538094e-05, "loss": 2.932, "step": 2010 }, { "epoch": 0.57, "learning_rate": 1.1464717458532472e-05, "loss": 2.9211, "step": 2040 }, { "epoch": 0.58, "learning_rate": 1.1633398931684004e-05, "loss": 2.9309, "step": 2070 }, { "epoch": 0.59, "learning_rate": 1.1802080404835537e-05, "loss": 2.9275, "step": 2100 }, { "epoch": 0.6, "learning_rate": 1.1970761877987069e-05, "loss": 2.9213, "step": 2130 }, { "epoch": 0.61, "learning_rate": 1.2139443351138601e-05, "loss": 2.9525, "step": 2160 }, { "epoch": 0.62, "learning_rate": 1.2308124824290134e-05, "loss": 2.9197, "step": 2190 }, { "epoch": 0.62, "learning_rate": 1.2476806297441664e-05, "loss": 2.9257, "step": 2220 }, { "epoch": 0.63, "learning_rate": 1.2645487770593198e-05, "loss": 2.9156, "step": 2250 }, { "epoch": 0.64, "learning_rate": 1.2814169243744729e-05, "loss": 2.9045, "step": 2280 }, { "epoch": 0.65, "learning_rate": 1.2982850716896261e-05, "loss": 2.858, "step": 2310 }, { "epoch": 0.66, "learning_rate": 1.3151532190047793e-05, "loss": 2.7263, "step": 2340 }, { "epoch": 0.67, "learning_rate": 1.3320213663199327e-05, "loss": 2.6023, "step": 2370 }, { "epoch": 0.67, "learning_rate": 1.3488895136350856e-05, "loss": 2.412, "step": 2400 }, { "epoch": 0.68, "learning_rate": 1.365757660950239e-05, "loss": 2.2819, "step": 2430 }, { "epoch": 0.69, "learning_rate": 1.3826258082653922e-05, "loss": 2.1276, "step": 2460 }, { "epoch": 0.7, "learning_rate": 1.3994939555805456e-05, "loss": 1.9495, "step": 2490 }, { "epoch": 0.71, "learning_rate": 1.4163621028956985e-05, "loss": 1.7862, "step": 2520 }, { "epoch": 0.72, "learning_rate": 1.433230250210852e-05, "loss": 1.6618, "step": 2550 }, { "epoch": 0.73, "learning_rate": 1.4500983975260052e-05, "loss": 1.5095, "step": 2580 }, { "epoch": 0.73, "learning_rate": 1.4669665448411586e-05, "loss": 1.4625, "step": 2610 }, { "epoch": 0.74, "learning_rate": 1.4838346921563114e-05, "loss": 1.3446, "step": 2640 }, { "epoch": 0.75, "learning_rate": 1.5007028394714648e-05, "loss": 1.2631, "step": 2670 }, { "epoch": 0.76, "learning_rate": 1.517570986786618e-05, "loss": 1.2598, "step": 2700 }, { "epoch": 0.77, "learning_rate": 1.534439134101771e-05, "loss": 1.1956, "step": 2730 }, { "epoch": 0.78, "learning_rate": 1.5513072814169244e-05, "loss": 1.1249, "step": 2760 }, { "epoch": 0.78, "learning_rate": 1.5681754287320776e-05, "loss": 1.1259, "step": 2790 }, { "epoch": 0.79, "learning_rate": 1.5850435760472308e-05, "loss": 1.0686, "step": 2820 }, { "epoch": 0.8, "learning_rate": 1.601911723362384e-05, "loss": 1.0721, "step": 2850 }, { "epoch": 0.81, "learning_rate": 1.6187798706775373e-05, "loss": 1.0029, "step": 2880 }, { "epoch": 0.82, "learning_rate": 1.6356480179926905e-05, "loss": 1.0331, "step": 2910 }, { "epoch": 0.83, "learning_rate": 1.6525161653078437e-05, "loss": 0.9962, "step": 2940 }, { "epoch": 0.83, "learning_rate": 1.669384312622997e-05, "loss": 0.9536, "step": 2970 }, { "epoch": 0.84, "learning_rate": 1.6862524599381502e-05, "loss": 0.9659, "step": 3000 }, { "epoch": 0.85, "learning_rate": 1.7031206072533034e-05, "loss": 0.8696, "step": 3030 }, { "epoch": 0.86, "learning_rate": 1.7199887545684566e-05, "loss": 0.9237, "step": 3060 }, { "epoch": 0.87, "learning_rate": 1.73685690188361e-05, "loss": 0.8709, "step": 3090 }, { "epoch": 0.88, "learning_rate": 1.753725049198763e-05, "loss": 0.8687, "step": 3120 }, { "epoch": 0.89, "learning_rate": 1.7705931965139163e-05, "loss": 0.8936, "step": 3150 }, { "epoch": 0.89, "learning_rate": 1.7874613438290696e-05, "loss": 0.8026, "step": 3180 }, { "epoch": 0.9, "learning_rate": 1.8043294911442228e-05, "loss": 0.8476, "step": 3210 }, { "epoch": 0.91, "learning_rate": 1.821197638459376e-05, "loss": 0.7849, "step": 3240 }, { "epoch": 0.92, "learning_rate": 1.8380657857745292e-05, "loss": 0.7881, "step": 3270 }, { "epoch": 0.93, "learning_rate": 1.854933933089682e-05, "loss": 0.8008, "step": 3300 }, { "epoch": 0.94, "learning_rate": 1.8718020804048357e-05, "loss": 0.7813, "step": 3330 }, { "epoch": 0.94, "learning_rate": 1.888670227719989e-05, "loss": 0.7709, "step": 3360 }, { "epoch": 0.95, "learning_rate": 1.905538375035142e-05, "loss": 0.7513, "step": 3390 }, { "epoch": 0.96, "learning_rate": 1.922406522350295e-05, "loss": 0.7527, "step": 3420 }, { "epoch": 0.97, "learning_rate": 1.9392746696654486e-05, "loss": 0.7578, "step": 3450 }, { "epoch": 0.98, "learning_rate": 1.956142816980602e-05, "loss": 0.692, "step": 3480 }, { "epoch": 0.99, "learning_rate": 1.973010964295755e-05, "loss": 0.7196, "step": 3510 }, { "epoch": 1.0, "learning_rate": 1.989879111610908e-05, "loss": 0.6827, "step": 3540 }, { "epoch": 1.0, "eval_loss": 0.6694612503051758, "eval_runtime": 479.6772, "eval_samples_per_second": 33.425, "eval_steps_per_second": 1.047, "eval_wer": 0.6247048708255428, "step": 3557 }, { "epoch": 1.0, "learning_rate": 2.0067472589260615e-05, "loss": 0.7322, "step": 3570 }, { "epoch": 1.01, "learning_rate": 2.0236154062412148e-05, "loss": 0.6911, "step": 3600 }, { "epoch": 1.02, "learning_rate": 2.040483553556368e-05, "loss": 0.6838, "step": 3630 }, { "epoch": 1.03, "learning_rate": 2.057351700871521e-05, "loss": 0.7403, "step": 3660 }, { "epoch": 1.04, "learning_rate": 2.074219848186674e-05, "loss": 0.6329, "step": 3690 }, { "epoch": 1.05, "learning_rate": 2.0910879955018277e-05, "loss": 0.7176, "step": 3720 }, { "epoch": 1.05, "learning_rate": 2.107956142816981e-05, "loss": 0.6629, "step": 3750 }, { "epoch": 1.06, "learning_rate": 2.1248242901321338e-05, "loss": 0.6463, "step": 3780 }, { "epoch": 1.07, "learning_rate": 2.141692437447287e-05, "loss": 0.6654, "step": 3810 }, { "epoch": 1.08, "learning_rate": 2.1585605847624406e-05, "loss": 0.6117, "step": 3840 }, { "epoch": 1.09, "learning_rate": 2.1754287320775935e-05, "loss": 0.6467, "step": 3870 }, { "epoch": 1.1, "learning_rate": 2.1922968793927467e-05, "loss": 0.6177, "step": 3900 }, { "epoch": 1.1, "learning_rate": 2.2091650267079e-05, "loss": 0.6371, "step": 3930 }, { "epoch": 1.11, "learning_rate": 2.2260331740230535e-05, "loss": 0.6435, "step": 3960 }, { "epoch": 1.12, "learning_rate": 2.2429013213382064e-05, "loss": 0.5747, "step": 3990 }, { "epoch": 1.13, "learning_rate": 2.2597694686533596e-05, "loss": 0.6323, "step": 4020 }, { "epoch": 1.14, "learning_rate": 2.276637615968513e-05, "loss": 0.5872, "step": 4050 }, { "epoch": 1.15, "learning_rate": 2.293505763283666e-05, "loss": 0.6117, "step": 4080 }, { "epoch": 1.16, "learning_rate": 2.3103739105988193e-05, "loss": 0.6378, "step": 4110 }, { "epoch": 1.16, "learning_rate": 2.3272420579139725e-05, "loss": 0.5582, "step": 4140 }, { "epoch": 1.17, "learning_rate": 2.3441102052291258e-05, "loss": 0.5966, "step": 4170 }, { "epoch": 1.18, "learning_rate": 2.360978352544279e-05, "loss": 0.5798, "step": 4200 }, { "epoch": 1.19, "learning_rate": 2.3778464998594322e-05, "loss": 0.5712, "step": 4230 }, { "epoch": 1.2, "learning_rate": 2.3947146471745854e-05, "loss": 0.6294, "step": 4260 }, { "epoch": 1.21, "learning_rate": 2.4115827944897387e-05, "loss": 0.5199, "step": 4290 }, { "epoch": 1.21, "learning_rate": 2.428450941804892e-05, "loss": 0.5899, "step": 4320 }, { "epoch": 1.22, "learning_rate": 2.445319089120045e-05, "loss": 0.5548, "step": 4350 }, { "epoch": 1.23, "learning_rate": 2.4621872364351984e-05, "loss": 0.5549, "step": 4380 }, { "epoch": 1.24, "learning_rate": 2.4790553837503516e-05, "loss": 0.5868, "step": 4410 }, { "epoch": 1.25, "learning_rate": 2.4959235310655048e-05, "loss": 0.5235, "step": 4440 }, { "epoch": 1.26, "learning_rate": 2.5127916783806584e-05, "loss": 0.554, "step": 4470 }, { "epoch": 1.27, "learning_rate": 2.529659825695811e-05, "loss": 0.5417, "step": 4500 }, { "epoch": 1.27, "learning_rate": 2.546527973010964e-05, "loss": 0.5507, "step": 4530 }, { "epoch": 1.28, "learning_rate": 2.5633961203261174e-05, "loss": 0.553, "step": 4560 }, { "epoch": 1.29, "learning_rate": 2.580264267641271e-05, "loss": 0.5236, "step": 4590 }, { "epoch": 1.3, "learning_rate": 2.5971324149564242e-05, "loss": 0.539, "step": 4620 }, { "epoch": 1.31, "learning_rate": 2.6140005622715774e-05, "loss": 0.5365, "step": 4650 }, { "epoch": 1.32, "learning_rate": 2.6308687095867306e-05, "loss": 0.5051, "step": 4680 }, { "epoch": 1.32, "learning_rate": 2.647736856901884e-05, "loss": 0.5507, "step": 4710 }, { "epoch": 1.33, "learning_rate": 2.6646050042170368e-05, "loss": 0.4849, "step": 4740 }, { "epoch": 1.34, "learning_rate": 2.68147315153219e-05, "loss": 0.5283, "step": 4770 }, { "epoch": 1.35, "learning_rate": 2.6983412988473432e-05, "loss": 0.5033, "step": 4800 }, { "epoch": 1.36, "learning_rate": 2.7152094461624968e-05, "loss": 0.4936, "step": 4830 }, { "epoch": 1.37, "learning_rate": 2.73207759347765e-05, "loss": 0.5279, "step": 4860 }, { "epoch": 1.37, "learning_rate": 2.7489457407928032e-05, "loss": 0.4744, "step": 4890 }, { "epoch": 1.38, "learning_rate": 2.7658138881079565e-05, "loss": 0.5037, "step": 4920 }, { "epoch": 1.39, "learning_rate": 2.7826820354231094e-05, "loss": 0.4915, "step": 4950 }, { "epoch": 1.4, "learning_rate": 2.7995501827382626e-05, "loss": 0.4876, "step": 4980 }, { "epoch": 1.41, "learning_rate": 2.8164183300534158e-05, "loss": 0.5335, "step": 5010 }, { "epoch": 1.42, "learning_rate": 2.833286477368569e-05, "loss": 0.4636, "step": 5040 }, { "epoch": 1.43, "learning_rate": 2.8501546246837223e-05, "loss": 0.5002, "step": 5070 }, { "epoch": 1.43, "learning_rate": 2.867022771998876e-05, "loss": 0.4758, "step": 5100 }, { "epoch": 1.44, "learning_rate": 2.883890919314029e-05, "loss": 0.4738, "step": 5130 }, { "epoch": 1.45, "learning_rate": 2.9007590666291823e-05, "loss": 0.5203, "step": 5160 }, { "epoch": 1.46, "learning_rate": 2.9176272139443352e-05, "loss": 0.443, "step": 5190 }, { "epoch": 1.47, "learning_rate": 2.9344953612594884e-05, "loss": 0.4962, "step": 5220 }, { "epoch": 1.48, "learning_rate": 2.9513635085746416e-05, "loss": 0.4682, "step": 5250 }, { "epoch": 1.48, "learning_rate": 2.968231655889795e-05, "loss": 0.457, "step": 5280 }, { "epoch": 1.49, "learning_rate": 2.985099803204948e-05, "loss": 0.5142, "step": 5310 }, { "epoch": 1.5, "learning_rate": 3.0019679505201017e-05, "loss": 0.4314, "step": 5340 }, { "epoch": 1.51, "learning_rate": 3.018836097835255e-05, "loss": 0.4743, "step": 5370 }, { "epoch": 1.52, "learning_rate": 3.0357042451504074e-05, "loss": 0.4578, "step": 5400 }, { "epoch": 1.53, "learning_rate": 3.052572392465561e-05, "loss": 0.4509, "step": 5430 }, { "epoch": 1.53, "learning_rate": 3.069440539780714e-05, "loss": 0.4864, "step": 5460 }, { "epoch": 1.54, "learning_rate": 3.0863086870958675e-05, "loss": 0.4256, "step": 5490 }, { "epoch": 1.55, "learning_rate": 3.103176834411021e-05, "loss": 0.4903, "step": 5520 }, { "epoch": 1.56, "learning_rate": 3.120044981726174e-05, "loss": 0.4521, "step": 5550 }, { "epoch": 1.57, "learning_rate": 3.136913129041327e-05, "loss": 0.4468, "step": 5580 }, { "epoch": 1.58, "learning_rate": 3.1537812763564804e-05, "loss": 0.4822, "step": 5610 }, { "epoch": 1.59, "learning_rate": 3.1706494236716336e-05, "loss": 0.4293, "step": 5640 }, { "epoch": 1.59, "learning_rate": 3.187517570986787e-05, "loss": 0.4591, "step": 5670 }, { "epoch": 1.6, "learning_rate": 3.20438571830194e-05, "loss": 0.4288, "step": 5700 }, { "epoch": 1.61, "learning_rate": 3.221253865617093e-05, "loss": 0.4464, "step": 5730 }, { "epoch": 1.62, "learning_rate": 3.2381220129322465e-05, "loss": 0.4698, "step": 5760 }, { "epoch": 1.63, "learning_rate": 3.2549901602474e-05, "loss": 0.4046, "step": 5790 }, { "epoch": 1.64, "learning_rate": 3.271858307562553e-05, "loss": 0.4578, "step": 5820 }, { "epoch": 1.64, "learning_rate": 3.288726454877706e-05, "loss": 0.4225, "step": 5850 }, { "epoch": 1.65, "learning_rate": 3.3055946021928594e-05, "loss": 0.4364, "step": 5880 }, { "epoch": 1.66, "learning_rate": 3.3224627495080127e-05, "loss": 0.4601, "step": 5910 }, { "epoch": 1.67, "learning_rate": 3.339330896823166e-05, "loss": 0.4043, "step": 5940 }, { "epoch": 1.68, "learning_rate": 3.356199044138319e-05, "loss": 0.4533, "step": 5970 }, { "epoch": 1.69, "learning_rate": 3.3730671914534723e-05, "loss": 0.4269, "step": 6000 }, { "epoch": 1.7, "learning_rate": 3.3899353387686256e-05, "loss": 0.4232, "step": 6030 }, { "epoch": 1.7, "learning_rate": 3.406803486083779e-05, "loss": 0.4536, "step": 6060 }, { "epoch": 1.71, "learning_rate": 3.4236716333989314e-05, "loss": 0.3908, "step": 6090 }, { "epoch": 1.72, "learning_rate": 3.4405397807140846e-05, "loss": 0.4204, "step": 6120 }, { "epoch": 1.73, "learning_rate": 3.4574079280292385e-05, "loss": 0.4227, "step": 6150 }, { "epoch": 1.74, "learning_rate": 3.474276075344392e-05, "loss": 0.4017, "step": 6180 }, { "epoch": 1.75, "learning_rate": 3.491144222659545e-05, "loss": 0.4394, "step": 6210 }, { "epoch": 1.75, "learning_rate": 3.508012369974698e-05, "loss": 0.3858, "step": 6240 }, { "epoch": 1.76, "learning_rate": 3.5248805172898514e-05, "loss": 0.4235, "step": 6270 }, { "epoch": 1.77, "learning_rate": 3.5417486646050046e-05, "loss": 0.4025, "step": 6300 }, { "epoch": 1.78, "learning_rate": 3.558616811920157e-05, "loss": 0.4115, "step": 6330 }, { "epoch": 1.79, "learning_rate": 3.5754849592353104e-05, "loss": 0.4366, "step": 6360 }, { "epoch": 1.8, "learning_rate": 3.592353106550464e-05, "loss": 0.3796, "step": 6390 }, { "epoch": 1.8, "learning_rate": 3.6092212538656175e-05, "loss": 0.4116, "step": 6420 }, { "epoch": 1.81, "learning_rate": 3.625527129603599e-05, "loss": 0.3995, "step": 6450 }, { "epoch": 1.82, "learning_rate": 3.642395276918752e-05, "loss": 0.3909, "step": 6480 }, { "epoch": 1.83, "learning_rate": 3.659263424233905e-05, "loss": 0.4251, "step": 6510 }, { "epoch": 1.84, "learning_rate": 3.6761315715490585e-05, "loss": 0.378, "step": 6540 }, { "epoch": 1.85, "learning_rate": 3.692999718864212e-05, "loss": 0.4189, "step": 6570 }, { "epoch": 1.86, "learning_rate": 3.709867866179364e-05, "loss": 0.3978, "step": 6600 }, { "epoch": 1.86, "learning_rate": 3.726736013494518e-05, "loss": 0.3937, "step": 6630 }, { "epoch": 1.87, "learning_rate": 3.7436041608096714e-05, "loss": 0.4173, "step": 6660 }, { "epoch": 1.88, "learning_rate": 3.7604723081248246e-05, "loss": 0.3611, "step": 6690 }, { "epoch": 1.89, "learning_rate": 3.777340455439978e-05, "loss": 0.415, "step": 6720 }, { "epoch": 1.9, "learning_rate": 3.794208602755131e-05, "loss": 0.3909, "step": 6750 }, { "epoch": 1.91, "learning_rate": 3.811076750070284e-05, "loss": 0.398, "step": 6780 }, { "epoch": 1.91, "learning_rate": 3.8279448973854375e-05, "loss": 0.4173, "step": 6810 }, { "epoch": 1.92, "learning_rate": 3.84481304470059e-05, "loss": 0.3814, "step": 6840 }, { "epoch": 1.93, "learning_rate": 3.861681192015743e-05, "loss": 0.4008, "step": 6870 }, { "epoch": 1.94, "learning_rate": 3.878549339330897e-05, "loss": 0.3793, "step": 6900 }, { "epoch": 1.95, "learning_rate": 3.8954174866460504e-05, "loss": 0.3828, "step": 6930 }, { "epoch": 1.96, "learning_rate": 3.912285633961204e-05, "loss": 0.4004, "step": 6960 }, { "epoch": 1.97, "learning_rate": 3.929153781276357e-05, "loss": 0.3492, "step": 6990 }, { "epoch": 1.97, "learning_rate": 3.94602192859151e-05, "loss": 0.4091, "step": 7020 }, { "epoch": 1.98, "learning_rate": 3.962890075906663e-05, "loss": 0.3959, "step": 7050 }, { "epoch": 1.99, "learning_rate": 3.979758223221816e-05, "loss": 0.3989, "step": 7080 }, { "epoch": 2.0, "learning_rate": 3.996626370536969e-05, "loss": 0.3992, "step": 7110 }, { "epoch": 2.0, "eval_loss": 0.3737587332725525, "eval_runtime": 480.2975, "eval_samples_per_second": 33.381, "eval_steps_per_second": 1.045, "eval_wer": 0.39358972609283094, "step": 7114 }, { "epoch": 2.01, "learning_rate": 4.013494517852123e-05, "loss": 0.3616, "step": 7140 }, { "epoch": 2.02, "learning_rate": 4.030362665167276e-05, "loss": 0.3869, "step": 7170 }, { "epoch": 2.02, "learning_rate": 4.0472308124824295e-05, "loss": 0.344, "step": 7200 }, { "epoch": 2.03, "learning_rate": 4.064098959797583e-05, "loss": 0.3751, "step": 7230 }, { "epoch": 2.04, "learning_rate": 4.080967107112736e-05, "loss": 0.3755, "step": 7260 }, { "epoch": 2.05, "learning_rate": 4.0978352544278885e-05, "loss": 0.3529, "step": 7290 }, { "epoch": 2.06, "learning_rate": 4.114703401743042e-05, "loss": 0.3805, "step": 7320 }, { "epoch": 2.07, "learning_rate": 4.131571549058195e-05, "loss": 0.3421, "step": 7350 }, { "epoch": 2.07, "learning_rate": 4.148439696373348e-05, "loss": 0.3584, "step": 7380 }, { "epoch": 2.08, "learning_rate": 4.165307843688502e-05, "loss": 0.3639, "step": 7410 }, { "epoch": 2.09, "learning_rate": 4.182175991003655e-05, "loss": 0.3447, "step": 7440 }, { "epoch": 2.1, "learning_rate": 4.1990441383188086e-05, "loss": 0.3812, "step": 7470 }, { "epoch": 2.11, "learning_rate": 4.215912285633962e-05, "loss": 0.342, "step": 7500 }, { "epoch": 2.12, "learning_rate": 4.232780432949114e-05, "loss": 0.3811, "step": 7530 }, { "epoch": 2.13, "learning_rate": 4.2496485802642676e-05, "loss": 0.3631, "step": 7560 }, { "epoch": 2.13, "learning_rate": 4.266516727579421e-05, "loss": 0.338, "step": 7590 }, { "epoch": 2.14, "learning_rate": 4.283384874894574e-05, "loss": 0.3733, "step": 7620 }, { "epoch": 2.15, "learning_rate": 4.300253022209727e-05, "loss": 0.3247, "step": 7650 }, { "epoch": 2.16, "learning_rate": 4.317121169524881e-05, "loss": 0.3573, "step": 7680 }, { "epoch": 2.17, "learning_rate": 4.3339893168400344e-05, "loss": 0.3536, "step": 7710 }, { "epoch": 2.18, "learning_rate": 4.350857464155187e-05, "loss": 0.336, "step": 7740 }, { "epoch": 2.18, "learning_rate": 4.36772561147034e-05, "loss": 0.3805, "step": 7770 }, { "epoch": 2.19, "learning_rate": 4.3845937587854934e-05, "loss": 0.3219, "step": 7800 }, { "epoch": 2.2, "learning_rate": 4.4014619061006466e-05, "loss": 0.3488, "step": 7830 }, { "epoch": 2.21, "learning_rate": 4.4183300534158e-05, "loss": 0.3505, "step": 7860 }, { "epoch": 2.22, "learning_rate": 4.435198200730953e-05, "loss": 0.3363, "step": 7890 }, { "epoch": 2.23, "learning_rate": 4.452066348046107e-05, "loss": 0.3674, "step": 7920 }, { "epoch": 2.23, "learning_rate": 4.46893449536126e-05, "loss": 0.3187, "step": 7950 }, { "epoch": 2.24, "learning_rate": 4.485802642676413e-05, "loss": 0.342, "step": 7980 }, { "epoch": 2.25, "learning_rate": 4.502670789991566e-05, "loss": 0.3452, "step": 8010 }, { "epoch": 2.26, "learning_rate": 4.519538937306719e-05, "loss": 0.3259, "step": 8040 }, { "epoch": 2.27, "learning_rate": 4.5364070846218724e-05, "loss": 0.365, "step": 8070 }, { "epoch": 2.28, "learning_rate": 4.553275231937026e-05, "loss": 0.3086, "step": 8100 }, { "epoch": 2.29, "learning_rate": 4.570143379252179e-05, "loss": 0.347, "step": 8130 }, { "epoch": 2.29, "learning_rate": 4.587011526567332e-05, "loss": 0.3502, "step": 8160 }, { "epoch": 2.3, "learning_rate": 4.6038796738824854e-05, "loss": 0.3292, "step": 8190 }, { "epoch": 2.31, "learning_rate": 4.6207478211976386e-05, "loss": 0.3591, "step": 8220 }, { "epoch": 2.32, "learning_rate": 4.637615968512792e-05, "loss": 0.3107, "step": 8250 }, { "epoch": 2.33, "learning_rate": 4.654484115827945e-05, "loss": 0.3472, "step": 8280 }, { "epoch": 2.34, "learning_rate": 4.671352263143098e-05, "loss": 0.3508, "step": 8310 }, { "epoch": 2.34, "learning_rate": 4.6882204104582515e-05, "loss": 0.3302, "step": 8340 }, { "epoch": 2.35, "learning_rate": 4.705088557773405e-05, "loss": 0.3546, "step": 8370 }, { "epoch": 2.36, "learning_rate": 4.721956705088558e-05, "loss": 0.3139, "step": 8400 }, { "epoch": 2.37, "learning_rate": 4.738824852403711e-05, "loss": 0.3369, "step": 8430 }, { "epoch": 2.38, "learning_rate": 4.7556929997188644e-05, "loss": 0.3388, "step": 8460 }, { "epoch": 2.39, "learning_rate": 4.7725611470340176e-05, "loss": 0.3249, "step": 8490 }, { "epoch": 2.4, "learning_rate": 4.789429294349171e-05, "loss": 0.3521, "step": 8520 }, { "epoch": 2.4, "learning_rate": 4.806297441664324e-05, "loss": 0.3098, "step": 8550 }, { "epoch": 2.41, "learning_rate": 4.823165588979477e-05, "loss": 0.3394, "step": 8580 }, { "epoch": 2.42, "learning_rate": 4.8400337362946306e-05, "loss": 0.3332, "step": 8610 }, { "epoch": 2.43, "learning_rate": 4.856901883609784e-05, "loss": 0.3176, "step": 8640 }, { "epoch": 2.44, "learning_rate": 4.873770030924937e-05, "loss": 0.3477, "step": 8670 }, { "epoch": 2.45, "learning_rate": 4.89063817824009e-05, "loss": 0.2996, "step": 8700 }, { "epoch": 2.45, "learning_rate": 4.9075063255552435e-05, "loss": 0.3392, "step": 8730 }, { "epoch": 2.46, "learning_rate": 4.924374472870397e-05, "loss": 0.3182, "step": 8760 }, { "epoch": 2.47, "learning_rate": 4.94124262018555e-05, "loss": 0.3102, "step": 8790 }, { "epoch": 2.48, "learning_rate": 4.958110767500703e-05, "loss": 0.3393, "step": 8820 }, { "epoch": 2.49, "learning_rate": 4.9749789148158564e-05, "loss": 0.3018, "step": 8850 }, { "epoch": 2.5, "learning_rate": 4.9918470621310096e-05, "loss": 0.3248, "step": 8880 }, { "epoch": 2.5, "learning_rate": 5.008715209446163e-05, "loss": 0.3333, "step": 8910 }, { "epoch": 2.51, "learning_rate": 5.025021085184144e-05, "loss": 0.3293, "step": 8940 }, { "epoch": 2.52, "learning_rate": 5.041889232499297e-05, "loss": 0.3295, "step": 8970 }, { "epoch": 2.53, "learning_rate": 5.0587573798144506e-05, "loss": 0.305, "step": 9000 }, { "epoch": 2.54, "learning_rate": 5.075625527129604e-05, "loss": 0.3299, "step": 9030 }, { "epoch": 2.55, "learning_rate": 5.092493674444757e-05, "loss": 0.3191, "step": 9060 }, { "epoch": 2.56, "learning_rate": 5.10936182175991e-05, "loss": 0.3088, "step": 9090 }, { "epoch": 2.56, "learning_rate": 5.1262299690750635e-05, "loss": 0.3358, "step": 9120 }, { "epoch": 2.57, "learning_rate": 5.143098116390217e-05, "loss": 0.2975, "step": 9150 }, { "epoch": 2.58, "learning_rate": 5.1599662637053706e-05, "loss": 0.3194, "step": 9180 }, { "epoch": 2.59, "learning_rate": 5.176834411020524e-05, "loss": 0.315, "step": 9210 }, { "epoch": 2.6, "learning_rate": 5.193702558335677e-05, "loss": 0.3019, "step": 9240 }, { "epoch": 2.61, "learning_rate": 5.210570705650829e-05, "loss": 0.341, "step": 9270 }, { "epoch": 2.61, "learning_rate": 5.227438852965982e-05, "loss": 0.2915, "step": 9300 }, { "epoch": 2.62, "learning_rate": 5.2443070002811354e-05, "loss": 0.3036, "step": 9330 }, { "epoch": 2.63, "learning_rate": 5.2611751475962886e-05, "loss": 0.3123, "step": 9360 }, { "epoch": 2.64, "learning_rate": 5.2780432949114425e-05, "loss": 0.2926, "step": 9390 }, { "epoch": 2.65, "learning_rate": 5.294911442226596e-05, "loss": 0.3263, "step": 9420 }, { "epoch": 2.66, "learning_rate": 5.311779589541749e-05, "loss": 0.2841, "step": 9450 }, { "epoch": 2.67, "learning_rate": 5.328647736856902e-05, "loss": 0.3243, "step": 9480 }, { "epoch": 2.67, "learning_rate": 5.3455158841720554e-05, "loss": 0.3091, "step": 9510 }, { "epoch": 2.68, "learning_rate": 5.3623840314872087e-05, "loss": 0.3011, "step": 9540 }, { "epoch": 2.69, "learning_rate": 5.379252178802362e-05, "loss": 0.3216, "step": 9570 }, { "epoch": 2.7, "learning_rate": 5.396120326117515e-05, "loss": 0.2834, "step": 9600 }, { "epoch": 2.71, "learning_rate": 5.4129884734326683e-05, "loss": 0.3174, "step": 9630 }, { "epoch": 2.72, "learning_rate": 5.4298566207478216e-05, "loss": 0.2969, "step": 9660 }, { "epoch": 2.72, "learning_rate": 5.4467247680629755e-05, "loss": 0.2896, "step": 9690 }, { "epoch": 2.73, "learning_rate": 5.463592915378129e-05, "loss": 0.3153, "step": 9720 }, { "epoch": 2.74, "learning_rate": 5.4804610626932806e-05, "loss": 0.2767, "step": 9750 }, { "epoch": 2.75, "learning_rate": 5.497329210008434e-05, "loss": 0.3188, "step": 9780 }, { "epoch": 2.76, "learning_rate": 5.514197357323587e-05, "loss": 0.3092, "step": 9810 }, { "epoch": 2.77, "learning_rate": 5.53106550463874e-05, "loss": 0.2959, "step": 9840 }, { "epoch": 2.77, "learning_rate": 5.5479336519538935e-05, "loss": 0.3283, "step": 9870 }, { "epoch": 2.78, "learning_rate": 5.5648017992690474e-05, "loss": 0.2868, "step": 9900 }, { "epoch": 2.79, "learning_rate": 5.5816699465842006e-05, "loss": 0.3149, "step": 9930 }, { "epoch": 2.8, "learning_rate": 5.598538093899354e-05, "loss": 0.304, "step": 9960 }, { "epoch": 2.81, "learning_rate": 5.615406241214507e-05, "loss": 0.2867, "step": 9990 }, { "epoch": 2.82, "learning_rate": 5.63227438852966e-05, "loss": 0.321, "step": 10020 }, { "epoch": 2.83, "learning_rate": 5.6491425358448135e-05, "loss": 0.2739, "step": 10050 }, { "epoch": 2.83, "learning_rate": 5.666010683159967e-05, "loss": 0.3268, "step": 10080 }, { "epoch": 2.84, "learning_rate": 5.68287883047512e-05, "loss": 0.3024, "step": 10110 }, { "epoch": 2.85, "learning_rate": 5.699746977790273e-05, "loss": 0.2842, "step": 10140 }, { "epoch": 2.86, "learning_rate": 5.7166151251054265e-05, "loss": 0.3249, "step": 10170 }, { "epoch": 2.87, "learning_rate": 5.733483272420579e-05, "loss": 0.2767, "step": 10200 }, { "epoch": 2.88, "learning_rate": 5.750351419735732e-05, "loss": 0.3021, "step": 10230 }, { "epoch": 2.88, "learning_rate": 5.7672195670508855e-05, "loss": 0.3049, "step": 10260 }, { "epoch": 2.89, "learning_rate": 5.784087714366039e-05, "loss": 0.2757, "step": 10290 }, { "epoch": 2.9, "learning_rate": 5.800955861681192e-05, "loss": 0.3065, "step": 10320 }, { "epoch": 2.91, "learning_rate": 5.817824008996345e-05, "loss": 0.2667, "step": 10350 }, { "epoch": 2.92, "learning_rate": 5.8346921563114984e-05, "loss": 0.3008, "step": 10380 }, { "epoch": 2.93, "learning_rate": 5.851560303626652e-05, "loss": 0.2879, "step": 10410 }, { "epoch": 2.93, "learning_rate": 5.8684284509418055e-05, "loss": 0.2768, "step": 10440 }, { "epoch": 2.94, "learning_rate": 5.885296598256959e-05, "loss": 0.3082, "step": 10470 }, { "epoch": 2.95, "learning_rate": 5.902164745572112e-05, "loss": 0.2627, "step": 10500 }, { "epoch": 2.96, "learning_rate": 5.919032892887265e-05, "loss": 0.3004, "step": 10530 }, { "epoch": 2.97, "learning_rate": 5.9359010402024184e-05, "loss": 0.2858, "step": 10560 }, { "epoch": 2.98, "learning_rate": 5.9527691875175717e-05, "loss": 0.2808, "step": 10590 }, { "epoch": 2.99, "learning_rate": 5.969637334832725e-05, "loss": 0.299, "step": 10620 }, { "epoch": 2.99, "learning_rate": 5.9865054821478774e-05, "loss": 0.2611, "step": 10650 }, { "epoch": 3.0, "eval_loss": 0.30112308263778687, "eval_runtime": 481.9568, "eval_samples_per_second": 33.266, "eval_steps_per_second": 1.042, "eval_wer": 0.3177432342063243, "step": 10671 }, { "epoch": 3.0, "learning_rate": 6.003373629463031e-05, "loss": 0.3151, "step": 10680 }, { "epoch": 3.01, "learning_rate": 6.020241776778184e-05, "loss": 0.2666, "step": 10710 }, { "epoch": 3.02, "learning_rate": 6.037109924093337e-05, "loss": 0.278, "step": 10740 }, { "epoch": 3.03, "learning_rate": 6.0539780714084903e-05, "loss": 0.2873, "step": 10770 }, { "epoch": 3.04, "learning_rate": 6.0708462187236436e-05, "loss": 0.2838, "step": 10800 }, { "epoch": 3.04, "learning_rate": 6.087714366038797e-05, "loss": 0.2901, "step": 10830 }, { "epoch": 3.05, "learning_rate": 6.104582513353951e-05, "loss": 0.2606, "step": 10860 }, { "epoch": 3.06, "learning_rate": 6.121450660669103e-05, "loss": 0.2811, "step": 10890 }, { "epoch": 3.07, "learning_rate": 6.138318807984257e-05, "loss": 0.2904, "step": 10920 }, { "epoch": 3.08, "learning_rate": 6.15518695529941e-05, "loss": 0.2569, "step": 10950 }, { "epoch": 3.09, "learning_rate": 6.172055102614564e-05, "loss": 0.2859, "step": 10980 }, { "epoch": 3.1, "learning_rate": 6.188923249929716e-05, "loss": 0.2584, "step": 11010 }, { "epoch": 3.1, "learning_rate": 6.20579139724487e-05, "loss": 0.2834, "step": 11040 }, { "epoch": 3.11, "learning_rate": 6.222659544560024e-05, "loss": 0.2814, "step": 11070 }, { "epoch": 3.12, "learning_rate": 6.239527691875175e-05, "loss": 0.2533, "step": 11100 }, { "epoch": 3.13, "learning_rate": 6.256395839190329e-05, "loss": 0.2884, "step": 11130 }, { "epoch": 3.14, "learning_rate": 6.273263986505482e-05, "loss": 0.2633, "step": 11160 }, { "epoch": 3.15, "learning_rate": 6.290132133820636e-05, "loss": 0.2737, "step": 11190 }, { "epoch": 3.15, "learning_rate": 6.307000281135788e-05, "loss": 0.2805, "step": 11220 }, { "epoch": 3.16, "learning_rate": 6.323868428450942e-05, "loss": 0.2478, "step": 11250 }, { "epoch": 3.17, "learning_rate": 6.340736575766096e-05, "loss": 0.2918, "step": 11280 }, { "epoch": 3.18, "learning_rate": 6.357604723081248e-05, "loss": 0.2566, "step": 11310 }, { "epoch": 3.19, "learning_rate": 6.374472870396402e-05, "loss": 0.2685, "step": 11340 }, { "epoch": 3.2, "learning_rate": 6.391341017711555e-05, "loss": 0.2871, "step": 11370 }, { "epoch": 3.2, "learning_rate": 6.408209165026709e-05, "loss": 0.2461, "step": 11400 }, { "epoch": 3.21, "learning_rate": 6.425077312341861e-05, "loss": 0.2769, "step": 11430 }, { "epoch": 3.22, "learning_rate": 6.441945459657015e-05, "loss": 0.2561, "step": 11460 }, { "epoch": 3.23, "learning_rate": 6.458813606972168e-05, "loss": 0.2703, "step": 11490 }, { "epoch": 3.24, "learning_rate": 6.475681754287322e-05, "loss": 0.28, "step": 11520 }, { "epoch": 3.25, "learning_rate": 6.492549901602474e-05, "loss": 0.2409, "step": 11550 }, { "epoch": 3.26, "learning_rate": 6.509418048917627e-05, "loss": 0.2825, "step": 11580 }, { "epoch": 3.26, "learning_rate": 6.526286196232781e-05, "loss": 0.255, "step": 11610 }, { "epoch": 3.27, "learning_rate": 6.543154343547933e-05, "loss": 0.2633, "step": 11640 }, { "epoch": 3.28, "learning_rate": 6.560022490863087e-05, "loss": 0.2806, "step": 11670 }, { "epoch": 3.29, "learning_rate": 6.57689063817824e-05, "loss": 0.2471, "step": 11700 }, { "epoch": 3.3, "learning_rate": 6.593758785493394e-05, "loss": 0.2886, "step": 11730 }, { "epoch": 3.31, "learning_rate": 6.610626932808546e-05, "loss": 0.2501, "step": 11760 }, { "epoch": 3.31, "learning_rate": 6.626932808546529e-05, "loss": 0.2899, "step": 11790 }, { "epoch": 3.32, "learning_rate": 6.643800955861683e-05, "loss": 0.2852, "step": 11820 }, { "epoch": 3.33, "learning_rate": 6.660669103176834e-05, "loss": 0.2445, "step": 11850 }, { "epoch": 3.34, "learning_rate": 6.677537250491988e-05, "loss": 0.2772, "step": 11880 }, { "epoch": 3.35, "learning_rate": 6.69440539780714e-05, "loss": 0.2438, "step": 11910 }, { "epoch": 3.36, "learning_rate": 6.711273545122294e-05, "loss": 0.2682, "step": 11940 }, { "epoch": 3.37, "learning_rate": 6.728141692437447e-05, "loss": 0.2745, "step": 11970 }, { "epoch": 3.37, "learning_rate": 6.745009839752601e-05, "loss": 0.2412, "step": 12000 }, { "epoch": 3.38, "learning_rate": 6.761877987067755e-05, "loss": 0.2704, "step": 12030 }, { "epoch": 3.39, "learning_rate": 6.778746134382907e-05, "loss": 0.2515, "step": 12060 }, { "epoch": 3.4, "learning_rate": 6.795614281698061e-05, "loss": 0.2614, "step": 12090 }, { "epoch": 3.41, "learning_rate": 6.812482429013214e-05, "loss": 0.2673, "step": 12120 }, { "epoch": 3.42, "learning_rate": 6.829350576328368e-05, "loss": 0.2377, "step": 12150 }, { "epoch": 3.42, "learning_rate": 6.84621872364352e-05, "loss": 0.2801, "step": 12180 }, { "epoch": 3.43, "learning_rate": 6.863086870958674e-05, "loss": 0.2468, "step": 12210 }, { "epoch": 3.44, "learning_rate": 6.879955018273827e-05, "loss": 0.263, "step": 12240 }, { "epoch": 3.45, "learning_rate": 6.89682316558898e-05, "loss": 0.2722, "step": 12270 }, { "epoch": 3.46, "learning_rate": 6.913691312904133e-05, "loss": 0.2458, "step": 12300 }, { "epoch": 3.47, "learning_rate": 6.930559460219286e-05, "loss": 0.2719, "step": 12330 }, { "epoch": 3.47, "learning_rate": 6.94742760753444e-05, "loss": 0.2646, "step": 12360 }, { "epoch": 3.48, "learning_rate": 6.964295754849592e-05, "loss": 0.2577, "step": 12390 }, { "epoch": 3.49, "learning_rate": 6.981163902164746e-05, "loss": 0.2693, "step": 12420 }, { "epoch": 3.5, "learning_rate": 6.998032049479898e-05, "loss": 0.2399, "step": 12450 }, { "epoch": 3.51, "learning_rate": 7.014900196795052e-05, "loss": 0.2699, "step": 12480 }, { "epoch": 3.52, "learning_rate": 7.031768344110205e-05, "loss": 0.2454, "step": 12510 }, { "epoch": 3.53, "learning_rate": 7.048636491425359e-05, "loss": 0.2598, "step": 12540 }, { "epoch": 3.53, "learning_rate": 7.065504638740513e-05, "loss": 0.2643, "step": 12570 }, { "epoch": 3.54, "learning_rate": 7.082372786055665e-05, "loss": 0.2328, "step": 12600 }, { "epoch": 3.55, "learning_rate": 7.099240933370819e-05, "loss": 0.2691, "step": 12630 }, { "epoch": 3.56, "learning_rate": 7.116109080685972e-05, "loss": 0.233, "step": 12660 }, { "epoch": 3.57, "learning_rate": 7.132977228001126e-05, "loss": 0.2597, "step": 12690 }, { "epoch": 3.58, "learning_rate": 7.149845375316278e-05, "loss": 0.2666, "step": 12720 }, { "epoch": 3.58, "learning_rate": 7.166713522631431e-05, "loss": 0.2254, "step": 12750 }, { "epoch": 3.59, "learning_rate": 7.183581669946585e-05, "loss": 0.2699, "step": 12780 }, { "epoch": 3.6, "learning_rate": 7.200449817261737e-05, "loss": 0.2374, "step": 12810 }, { "epoch": 3.61, "learning_rate": 7.217317964576891e-05, "loss": 0.2505, "step": 12840 }, { "epoch": 3.62, "learning_rate": 7.234186111892044e-05, "loss": 0.2685, "step": 12870 }, { "epoch": 3.63, "learning_rate": 7.251054259207198e-05, "loss": 0.2371, "step": 12900 }, { "epoch": 3.63, "learning_rate": 7.26792240652235e-05, "loss": 0.2573, "step": 12930 }, { "epoch": 3.64, "learning_rate": 7.284790553837504e-05, "loss": 0.2376, "step": 12960 }, { "epoch": 3.65, "learning_rate": 7.301658701152657e-05, "loss": 0.2575, "step": 12990 }, { "epoch": 3.66, "learning_rate": 7.31852684846781e-05, "loss": 0.2615, "step": 13020 }, { "epoch": 3.67, "learning_rate": 7.335394995782964e-05, "loss": 0.2391, "step": 13050 }, { "epoch": 3.68, "learning_rate": 7.352263143098117e-05, "loss": 0.2535, "step": 13080 }, { "epoch": 3.69, "learning_rate": 7.369131290413271e-05, "loss": 0.237, "step": 13110 }, { "epoch": 3.69, "learning_rate": 7.385999437728423e-05, "loss": 0.2592, "step": 13140 }, { "epoch": 3.7, "learning_rate": 7.402867585043577e-05, "loss": 0.2529, "step": 13170 }, { "epoch": 3.71, "learning_rate": 7.419735732358729e-05, "loss": 0.2341, "step": 13200 }, { "epoch": 3.72, "learning_rate": 7.436603879673882e-05, "loss": 0.2643, "step": 13230 }, { "epoch": 3.73, "learning_rate": 7.453472026989036e-05, "loss": 0.2348, "step": 13260 }, { "epoch": 3.74, "learning_rate": 7.470340174304189e-05, "loss": 0.2549, "step": 13290 }, { "epoch": 3.74, "learning_rate": 7.487208321619343e-05, "loss": 0.2583, "step": 13320 }, { "epoch": 3.75, "learning_rate": 7.504076468934495e-05, "loss": 0.2319, "step": 13350 }, { "epoch": 3.76, "learning_rate": 7.520944616249649e-05, "loss": 0.2575, "step": 13380 }, { "epoch": 3.77, "learning_rate": 7.537812763564802e-05, "loss": 0.2378, "step": 13410 }, { "epoch": 3.78, "learning_rate": 7.554680910879956e-05, "loss": 0.2515, "step": 13440 }, { "epoch": 3.79, "learning_rate": 7.571549058195108e-05, "loss": 0.2695, "step": 13470 }, { "epoch": 3.8, "learning_rate": 7.588417205510262e-05, "loss": 0.2304, "step": 13500 }, { "epoch": 3.8, "learning_rate": 7.605285352825415e-05, "loss": 0.2562, "step": 13530 }, { "epoch": 3.81, "learning_rate": 7.622153500140569e-05, "loss": 0.2263, "step": 13560 }, { "epoch": 3.82, "learning_rate": 7.639021647455723e-05, "loss": 0.2499, "step": 13590 }, { "epoch": 3.83, "learning_rate": 7.655889794770875e-05, "loss": 0.2728, "step": 13620 }, { "epoch": 3.84, "learning_rate": 7.672757942086028e-05, "loss": 0.2294, "step": 13650 }, { "epoch": 3.85, "learning_rate": 7.68962608940118e-05, "loss": 0.2573, "step": 13680 }, { "epoch": 3.85, "learning_rate": 7.706494236716334e-05, "loss": 0.2317, "step": 13710 }, { "epoch": 3.86, "learning_rate": 7.723362384031487e-05, "loss": 0.251, "step": 13740 }, { "epoch": 3.87, "learning_rate": 7.74023053134664e-05, "loss": 0.2668, "step": 13770 }, { "epoch": 3.88, "learning_rate": 7.757098678661794e-05, "loss": 0.2297, "step": 13800 }, { "epoch": 3.89, "learning_rate": 7.773966825976947e-05, "loss": 0.2567, "step": 13830 }, { "epoch": 3.9, "learning_rate": 7.790834973292101e-05, "loss": 0.2354, "step": 13860 }, { "epoch": 3.9, "learning_rate": 7.807703120607253e-05, "loss": 0.2504, "step": 13890 }, { "epoch": 3.91, "learning_rate": 7.824571267922407e-05, "loss": 0.256, "step": 13920 }, { "epoch": 3.92, "learning_rate": 7.84143941523756e-05, "loss": 0.256, "step": 13950 }, { "epoch": 3.93, "learning_rate": 7.858307562552714e-05, "loss": 0.2575, "step": 13980 }, { "epoch": 3.94, "learning_rate": 7.875175709867866e-05, "loss": 0.2254, "step": 14010 }, { "epoch": 3.95, "learning_rate": 7.89204385718302e-05, "loss": 0.2451, "step": 14040 }, { "epoch": 3.96, "learning_rate": 7.908912004498173e-05, "loss": 0.258, "step": 14070 }, { "epoch": 3.96, "learning_rate": 7.925780151813325e-05, "loss": 0.2254, "step": 14100 }, { "epoch": 3.97, "learning_rate": 7.942648299128479e-05, "loss": 0.2545, "step": 14130 }, { "epoch": 3.98, "learning_rate": 7.959516446443632e-05, "loss": 0.2294, "step": 14160 }, { "epoch": 3.99, "learning_rate": 7.976384593758786e-05, "loss": 0.2423, "step": 14190 }, { "epoch": 4.0, "learning_rate": 7.993252741073938e-05, "loss": 0.2536, "step": 14220 }, { "epoch": 4.0, "eval_loss": 0.2671508193016052, "eval_runtime": 482.3902, "eval_samples_per_second": 33.237, "eval_steps_per_second": 1.041, "eval_wer": 0.27493073847119676, "step": 14228 }, { "epoch": 4.01, "learning_rate": 8.010120888389092e-05, "loss": 0.2218, "step": 14250 }, { "epoch": 4.01, "learning_rate": 8.026989035704246e-05, "loss": 0.2506, "step": 14280 }, { "epoch": 4.02, "learning_rate": 8.043857183019399e-05, "loss": 0.2084, "step": 14310 }, { "epoch": 4.03, "learning_rate": 8.060725330334553e-05, "loss": 0.2442, "step": 14340 }, { "epoch": 4.04, "learning_rate": 8.077593477649705e-05, "loss": 0.2309, "step": 14370 }, { "epoch": 4.05, "learning_rate": 8.094461624964859e-05, "loss": 0.235, "step": 14400 }, { "epoch": 4.06, "learning_rate": 8.111329772280012e-05, "loss": 0.2574, "step": 14430 }, { "epoch": 4.07, "learning_rate": 8.128197919595165e-05, "loss": 0.2079, "step": 14460 }, { "epoch": 4.07, "learning_rate": 8.145066066910318e-05, "loss": 0.2396, "step": 14490 }, { "epoch": 4.08, "learning_rate": 8.161934214225472e-05, "loss": 0.2266, "step": 14520 }, { "epoch": 4.09, "learning_rate": 8.178802361540624e-05, "loss": 0.2359, "step": 14550 }, { "epoch": 4.1, "learning_rate": 8.195670508855777e-05, "loss": 0.2542, "step": 14580 }, { "epoch": 4.11, "learning_rate": 8.212538656170931e-05, "loss": 0.2034, "step": 14610 }, { "epoch": 4.12, "learning_rate": 8.229406803486083e-05, "loss": 0.2437, "step": 14640 }, { "epoch": 4.12, "learning_rate": 8.246274950801237e-05, "loss": 0.2173, "step": 14670 }, { "epoch": 4.13, "learning_rate": 8.26314309811639e-05, "loss": 0.2339, "step": 14700 }, { "epoch": 4.14, "learning_rate": 8.280011245431544e-05, "loss": 0.2409, "step": 14730 }, { "epoch": 4.15, "learning_rate": 8.296879392746696e-05, "loss": 0.2086, "step": 14760 }, { "epoch": 4.16, "learning_rate": 8.31374754006185e-05, "loss": 0.2382, "step": 14790 }, { "epoch": 4.17, "learning_rate": 8.330615687377004e-05, "loss": 0.2231, "step": 14820 }, { "epoch": 4.17, "learning_rate": 8.347483834692157e-05, "loss": 0.2237, "step": 14850 }, { "epoch": 4.18, "learning_rate": 8.36435198200731e-05, "loss": 0.2468, "step": 14880 }, { "epoch": 4.19, "learning_rate": 8.381220129322463e-05, "loss": 0.2035, "step": 14910 }, { "epoch": 4.2, "learning_rate": 8.398088276637617e-05, "loss": 0.2326, "step": 14940 }, { "epoch": 4.21, "learning_rate": 8.41495642395277e-05, "loss": 0.2307, "step": 14970 }, { "epoch": 4.22, "learning_rate": 8.431824571267924e-05, "loss": 0.2215, "step": 15000 }, { "epoch": 4.23, "learning_rate": 8.448692718583076e-05, "loss": 0.2467, "step": 15030 }, { "epoch": 4.23, "learning_rate": 8.465560865898229e-05, "loss": 0.2137, "step": 15060 }, { "epoch": 4.24, "learning_rate": 8.482429013213383e-05, "loss": 0.2265, "step": 15090 }, { "epoch": 4.25, "learning_rate": 8.499297160528535e-05, "loss": 0.2221, "step": 15120 }, { "epoch": 4.26, "learning_rate": 8.516165307843689e-05, "loss": 0.2279, "step": 15150 }, { "epoch": 4.27, "learning_rate": 8.533033455158842e-05, "loss": 0.2438, "step": 15180 }, { "epoch": 4.28, "learning_rate": 8.549901602473995e-05, "loss": 0.2015, "step": 15210 }, { "epoch": 4.28, "learning_rate": 8.566769749789148e-05, "loss": 0.2331, "step": 15240 }, { "epoch": 4.29, "learning_rate": 8.583637897104302e-05, "loss": 0.2249, "step": 15270 }, { "epoch": 4.3, "learning_rate": 8.600506044419455e-05, "loss": 0.2211, "step": 15300 }, { "epoch": 4.31, "learning_rate": 8.617374191734608e-05, "loss": 0.2383, "step": 15330 }, { "epoch": 4.32, "learning_rate": 8.634242339049762e-05, "loss": 0.2055, "step": 15360 }, { "epoch": 4.33, "learning_rate": 8.651110486364915e-05, "loss": 0.2317, "step": 15390 }, { "epoch": 4.34, "learning_rate": 8.667978633680069e-05, "loss": 0.2153, "step": 15420 }, { "epoch": 4.34, "learning_rate": 8.684846780995221e-05, "loss": 0.2264, "step": 15450 }, { "epoch": 4.35, "learning_rate": 8.701714928310374e-05, "loss": 0.2393, "step": 15480 }, { "epoch": 4.36, "learning_rate": 8.718583075625528e-05, "loss": 0.2047, "step": 15510 }, { "epoch": 4.37, "learning_rate": 8.73545122294068e-05, "loss": 0.2277, "step": 15540 }, { "epoch": 4.38, "learning_rate": 8.752319370255834e-05, "loss": 0.2107, "step": 15570 }, { "epoch": 4.39, "learning_rate": 8.769187517570987e-05, "loss": 0.2283, "step": 15600 }, { "epoch": 4.39, "learning_rate": 8.786055664886141e-05, "loss": 0.2457, "step": 15630 }, { "epoch": 4.4, "learning_rate": 8.802923812201293e-05, "loss": 0.1963, "step": 15660 }, { "epoch": 4.41, "learning_rate": 8.819791959516447e-05, "loss": 0.2371, "step": 15690 }, { "epoch": 4.42, "learning_rate": 8.8366601068316e-05, "loss": 0.2193, "step": 15720 }, { "epoch": 4.43, "learning_rate": 8.853528254146754e-05, "loss": 0.2212, "step": 15750 }, { "epoch": 4.44, "learning_rate": 8.870396401461906e-05, "loss": 0.2679, "step": 15780 }, { "epoch": 4.44, "learning_rate": 8.88726454877706e-05, "loss": 0.2074, "step": 15810 }, { "epoch": 4.45, "learning_rate": 8.903570424515041e-05, "loss": 0.2531, "step": 15840 }, { "epoch": 4.46, "learning_rate": 8.920438571830194e-05, "loss": 0.2107, "step": 15870 }, { "epoch": 4.47, "learning_rate": 8.937306719145348e-05, "loss": 0.2273, "step": 15900 }, { "epoch": 4.48, "learning_rate": 8.9541748664605e-05, "loss": 0.237, "step": 15930 }, { "epoch": 4.49, "learning_rate": 8.971043013775654e-05, "loss": 0.2008, "step": 15960 }, { "epoch": 4.5, "learning_rate": 8.987911161090807e-05, "loss": 0.2249, "step": 15990 }, { "epoch": 4.5, "learning_rate": 9.004779308405961e-05, "loss": 0.2184, "step": 16020 }, { "epoch": 4.51, "learning_rate": 9.021647455721115e-05, "loss": 0.2237, "step": 16050 }, { "epoch": 4.52, "learning_rate": 9.038515603036267e-05, "loss": 0.2461, "step": 16080 }, { "epoch": 4.53, "learning_rate": 9.055383750351421e-05, "loss": 0.2031, "step": 16110 }, { "epoch": 4.54, "learning_rate": 9.072251897666574e-05, "loss": 0.2328, "step": 16140 }, { "epoch": 4.55, "learning_rate": 9.089120044981728e-05, "loss": 0.2092, "step": 16170 }, { "epoch": 4.55, "learning_rate": 9.10598819229688e-05, "loss": 0.2176, "step": 16200 }, { "epoch": 4.56, "learning_rate": 9.122856339612033e-05, "loss": 0.2333, "step": 16230 }, { "epoch": 4.57, "learning_rate": 9.139724486927187e-05, "loss": 0.1933, "step": 16260 }, { "epoch": 4.58, "learning_rate": 9.156592634242339e-05, "loss": 0.2253, "step": 16290 }, { "epoch": 4.59, "learning_rate": 9.173460781557493e-05, "loss": 0.2157, "step": 16320 }, { "epoch": 4.6, "learning_rate": 9.190328928872646e-05, "loss": 0.2216, "step": 16350 }, { "epoch": 4.6, "learning_rate": 9.2071970761878e-05, "loss": 0.2463, "step": 16380 }, { "epoch": 4.61, "learning_rate": 9.224065223502952e-05, "loss": 0.1942, "step": 16410 }, { "epoch": 4.62, "learning_rate": 9.240933370818106e-05, "loss": 0.2332, "step": 16440 }, { "epoch": 4.63, "learning_rate": 9.257801518133258e-05, "loss": 0.2105, "step": 16470 }, { "epoch": 4.64, "learning_rate": 9.274669665448412e-05, "loss": 0.2198, "step": 16500 }, { "epoch": 4.65, "learning_rate": 9.291537812763565e-05, "loss": 0.2386, "step": 16530 }, { "epoch": 4.66, "learning_rate": 9.308405960078719e-05, "loss": 0.2008, "step": 16560 }, { "epoch": 4.66, "learning_rate": 9.325274107393873e-05, "loss": 0.2357, "step": 16590 }, { "epoch": 4.67, "learning_rate": 9.342142254709025e-05, "loss": 0.2182, "step": 16620 }, { "epoch": 4.68, "learning_rate": 9.359010402024179e-05, "loss": 0.2139, "step": 16650 }, { "epoch": 4.69, "learning_rate": 9.375316277762159e-05, "loss": 0.2395, "step": 16680 }, { "epoch": 4.7, "learning_rate": 9.392184425077313e-05, "loss": 0.1978, "step": 16710 }, { "epoch": 4.71, "learning_rate": 9.408490300815294e-05, "loss": 0.238, "step": 16740 }, { "epoch": 4.71, "learning_rate": 9.425358448130448e-05, "loss": 0.2058, "step": 16770 }, { "epoch": 4.72, "learning_rate": 9.4422265954456e-05, "loss": 0.2152, "step": 16800 }, { "epoch": 4.73, "learning_rate": 9.459094742760753e-05, "loss": 0.2404, "step": 16830 }, { "epoch": 4.74, "learning_rate": 9.475962890075907e-05, "loss": 0.1975, "step": 16860 }, { "epoch": 4.75, "learning_rate": 9.49283103739106e-05, "loss": 0.2275, "step": 16890 }, { "epoch": 4.76, "learning_rate": 9.509699184706214e-05, "loss": 0.2064, "step": 16920 }, { "epoch": 4.77, "learning_rate": 9.526567332021366e-05, "loss": 0.2191, "step": 16950 }, { "epoch": 4.77, "learning_rate": 9.54343547933652e-05, "loss": 0.2312, "step": 16980 }, { "epoch": 4.78, "learning_rate": 9.560303626651673e-05, "loss": 0.1969, "step": 17010 }, { "epoch": 4.79, "learning_rate": 9.577171773966826e-05, "loss": 0.2319, "step": 17040 }, { "epoch": 4.8, "learning_rate": 9.59403992128198e-05, "loss": 0.2196, "step": 17070 }, { "epoch": 4.81, "learning_rate": 9.610908068597133e-05, "loss": 0.2149, "step": 17100 }, { "epoch": 4.82, "learning_rate": 9.627776215912287e-05, "loss": 0.238, "step": 17130 }, { "epoch": 4.82, "learning_rate": 9.64464436322744e-05, "loss": 0.1979, "step": 17160 }, { "epoch": 4.83, "learning_rate": 9.661512510542593e-05, "loss": 0.2254, "step": 17190 }, { "epoch": 4.84, "learning_rate": 9.678380657857746e-05, "loss": 0.2059, "step": 17220 }, { "epoch": 4.85, "learning_rate": 9.695248805172898e-05, "loss": 0.2144, "step": 17250 }, { "epoch": 4.86, "learning_rate": 9.712116952488052e-05, "loss": 0.2367, "step": 17280 }, { "epoch": 4.87, "learning_rate": 9.728985099803205e-05, "loss": 0.1976, "step": 17310 }, { "epoch": 4.87, "learning_rate": 9.745853247118359e-05, "loss": 0.2329, "step": 17340 }, { "epoch": 4.88, "learning_rate": 9.762721394433511e-05, "loss": 0.2366, "step": 17370 }, { "epoch": 4.89, "learning_rate": 9.779589541748665e-05, "loss": 0.2181, "step": 17400 }, { "epoch": 4.9, "learning_rate": 9.796457689063818e-05, "loss": 0.2285, "step": 17430 }, { "epoch": 4.91, "learning_rate": 9.813325836378972e-05, "loss": 0.188, "step": 17460 }, { "epoch": 4.92, "learning_rate": 9.830193983694124e-05, "loss": 0.2252, "step": 17490 }, { "epoch": 4.93, "learning_rate": 9.847062131009278e-05, "loss": 0.2112, "step": 17520 }, { "epoch": 4.93, "learning_rate": 9.863930278324432e-05, "loss": 0.216, "step": 17550 }, { "epoch": 4.94, "learning_rate": 9.880798425639585e-05, "loss": 0.2321, "step": 17580 }, { "epoch": 4.95, "learning_rate": 9.897666572954739e-05, "loss": 0.1984, "step": 17610 }, { "epoch": 4.96, "learning_rate": 9.914534720269891e-05, "loss": 0.2293, "step": 17640 }, { "epoch": 4.97, "learning_rate": 9.931402867585045e-05, "loss": 0.2077, "step": 17670 }, { "epoch": 4.98, "learning_rate": 9.948271014900196e-05, "loss": 0.2105, "step": 17700 }, { "epoch": 4.98, "learning_rate": 9.96513916221535e-05, "loss": 0.2451, "step": 17730 }, { "epoch": 4.99, "learning_rate": 9.982007309530504e-05, "loss": 0.1943, "step": 17760 }, { "epoch": 5.0, "eval_loss": 0.24867025017738342, "eval_runtime": 481.4061, "eval_samples_per_second": 33.305, "eval_steps_per_second": 1.043, "eval_wer": 0.24798356829937357, "step": 17785 }, { "epoch": 5.0, "learning_rate": 9.998875456845657e-05, "loss": 0.2282, "step": 17790 }, { "epoch": 5.01, "learning_rate": 9.9982507106488e-05, "loss": 0.1934, "step": 17820 }, { "epoch": 5.02, "learning_rate": 9.996376472058226e-05, "loss": 0.2085, "step": 17850 }, { "epoch": 5.03, "learning_rate": 9.994502233467654e-05, "loss": 0.1973, "step": 17880 }, { "epoch": 5.04, "learning_rate": 9.992627994877082e-05, "loss": 0.1986, "step": 17910 }, { "epoch": 5.04, "learning_rate": 9.990753756286509e-05, "loss": 0.2231, "step": 17940 }, { "epoch": 5.05, "learning_rate": 9.988879517695936e-05, "loss": 0.187, "step": 17970 }, { "epoch": 5.06, "learning_rate": 9.987005279105364e-05, "loss": 0.2081, "step": 18000 }, { "epoch": 5.07, "learning_rate": 9.985131040514792e-05, "loss": 0.2039, "step": 18030 }, { "epoch": 5.08, "learning_rate": 9.983256801924219e-05, "loss": 0.1983, "step": 18060 }, { "epoch": 5.09, "learning_rate": 9.981382563333647e-05, "loss": 0.2192, "step": 18090 }, { "epoch": 5.09, "learning_rate": 9.979508324743073e-05, "loss": 0.1883, "step": 18120 }, { "epoch": 5.1, "learning_rate": 9.977634086152502e-05, "loss": 0.2088, "step": 18150 }, { "epoch": 5.11, "learning_rate": 9.975759847561928e-05, "loss": 0.2058, "step": 18180 }, { "epoch": 5.12, "learning_rate": 9.973885608971356e-05, "loss": 0.1956, "step": 18210 }, { "epoch": 5.13, "learning_rate": 9.972011370380784e-05, "loss": 0.23, "step": 18240 }, { "epoch": 5.14, "learning_rate": 9.97013713179021e-05, "loss": 0.1872, "step": 18270 }, { "epoch": 5.14, "learning_rate": 9.968262893199638e-05, "loss": 0.2122, "step": 18300 }, { "epoch": 5.15, "learning_rate": 9.966388654609066e-05, "loss": 0.2017, "step": 18330 }, { "epoch": 5.16, "learning_rate": 9.964514416018493e-05, "loss": 0.1956, "step": 18360 }, { "epoch": 5.17, "learning_rate": 9.96264017742792e-05, "loss": 0.2146, "step": 18390 }, { "epoch": 5.18, "learning_rate": 9.960765938837348e-05, "loss": 0.1876, "step": 18420 }, { "epoch": 5.19, "learning_rate": 9.958891700246776e-05, "loss": 0.2131, "step": 18450 }, { "epoch": 5.2, "learning_rate": 9.957017461656202e-05, "loss": 0.1991, "step": 18480 }, { "epoch": 5.2, "learning_rate": 9.95514322306563e-05, "loss": 0.2035, "step": 18510 }, { "epoch": 5.21, "learning_rate": 9.953268984475057e-05, "loss": 0.2284, "step": 18540 }, { "epoch": 5.22, "learning_rate": 9.951394745884485e-05, "loss": 0.1843, "step": 18570 }, { "epoch": 5.23, "learning_rate": 9.949520507293912e-05, "loss": 0.206, "step": 18600 }, { "epoch": 5.24, "learning_rate": 9.94764626870334e-05, "loss": 0.1995, "step": 18630 }, { "epoch": 5.25, "learning_rate": 9.945772030112768e-05, "loss": 0.1975, "step": 18660 }, { "epoch": 5.25, "learning_rate": 9.943897791522194e-05, "loss": 0.2307, "step": 18690 }, { "epoch": 5.26, "learning_rate": 9.942023552931622e-05, "loss": 0.184, "step": 18720 }, { "epoch": 5.27, "learning_rate": 9.94014931434105e-05, "loss": 0.1995, "step": 18750 }, { "epoch": 5.28, "learning_rate": 9.938275075750477e-05, "loss": 0.1945, "step": 18780 }, { "epoch": 5.29, "learning_rate": 9.936400837159903e-05, "loss": 0.1972, "step": 18810 }, { "epoch": 5.3, "learning_rate": 9.934526598569331e-05, "loss": 0.2212, "step": 18840 }, { "epoch": 5.3, "learning_rate": 9.93265235997876e-05, "loss": 0.1812, "step": 18870 }, { "epoch": 5.31, "learning_rate": 9.930778121388186e-05, "loss": 0.2027, "step": 18900 }, { "epoch": 5.32, "learning_rate": 9.928903882797614e-05, "loss": 0.2014, "step": 18930 }, { "epoch": 5.33, "learning_rate": 9.927029644207041e-05, "loss": 0.2044, "step": 18960 }, { "epoch": 5.34, "learning_rate": 9.925155405616469e-05, "loss": 0.2154, "step": 18990 }, { "epoch": 5.35, "learning_rate": 9.923281167025896e-05, "loss": 0.1867, "step": 19020 }, { "epoch": 5.36, "learning_rate": 9.921406928435324e-05, "loss": 0.2095, "step": 19050 }, { "epoch": 5.36, "learning_rate": 9.919532689844752e-05, "loss": 0.2086, "step": 19080 }, { "epoch": 5.37, "learning_rate": 9.917658451254178e-05, "loss": 0.1861, "step": 19110 }, { "epoch": 5.38, "learning_rate": 9.915784212663606e-05, "loss": 0.2321, "step": 19140 }, { "epoch": 5.39, "learning_rate": 9.913909974073034e-05, "loss": 0.1855, "step": 19170 }, { "epoch": 5.4, "learning_rate": 9.91203573548246e-05, "loss": 0.208, "step": 19200 }, { "epoch": 5.41, "learning_rate": 9.910161496891887e-05, "loss": 0.1986, "step": 19230 }, { "epoch": 5.41, "learning_rate": 9.908287258301315e-05, "loss": 0.1984, "step": 19260 }, { "epoch": 5.42, "learning_rate": 9.906413019710743e-05, "loss": 0.2198, "step": 19290 }, { "epoch": 5.43, "learning_rate": 9.90453878112017e-05, "loss": 0.1778, "step": 19320 }, { "epoch": 5.44, "learning_rate": 9.902664542529598e-05, "loss": 0.2127, "step": 19350 }, { "epoch": 5.45, "learning_rate": 9.900790303939025e-05, "loss": 0.1995, "step": 19380 }, { "epoch": 5.46, "learning_rate": 9.898916065348453e-05, "loss": 0.194, "step": 19410 }, { "epoch": 5.47, "learning_rate": 9.89704182675788e-05, "loss": 0.2109, "step": 19440 }, { "epoch": 5.47, "learning_rate": 9.895167588167308e-05, "loss": 0.1722, "step": 19470 }, { "epoch": 5.48, "learning_rate": 9.893293349576735e-05, "loss": 0.2064, "step": 19500 }, { "epoch": 5.49, "learning_rate": 9.891419110986161e-05, "loss": 0.1981, "step": 19530 }, { "epoch": 5.5, "learning_rate": 9.88954487239559e-05, "loss": 0.19, "step": 19560 }, { "epoch": 5.51, "learning_rate": 9.887670633805018e-05, "loss": 0.219, "step": 19590 }, { "epoch": 5.52, "learning_rate": 9.885796395214444e-05, "loss": 0.176, "step": 19620 }, { "epoch": 5.52, "learning_rate": 9.883922156623871e-05, "loss": 0.2065, "step": 19650 }, { "epoch": 5.53, "learning_rate": 9.882047918033299e-05, "loss": 0.195, "step": 19680 }, { "epoch": 5.54, "learning_rate": 9.880173679442727e-05, "loss": 0.1915, "step": 19710 }, { "epoch": 5.55, "learning_rate": 9.878299440852154e-05, "loss": 0.2066, "step": 19740 }, { "epoch": 5.56, "learning_rate": 9.876425202261582e-05, "loss": 0.1802, "step": 19770 }, { "epoch": 5.57, "learning_rate": 9.874550963671009e-05, "loss": 0.2033, "step": 19800 }, { "epoch": 5.57, "learning_rate": 9.872676725080437e-05, "loss": 0.1952, "step": 19830 }, { "epoch": 5.58, "learning_rate": 9.870802486489864e-05, "loss": 0.195, "step": 19860 }, { "epoch": 5.59, "learning_rate": 9.868928247899292e-05, "loss": 0.2103, "step": 19890 }, { "epoch": 5.6, "learning_rate": 9.867054009308719e-05, "loss": 0.1803, "step": 19920 }, { "epoch": 5.61, "learning_rate": 9.865179770718145e-05, "loss": 0.2008, "step": 19950 }, { "epoch": 5.62, "learning_rate": 9.863305532127573e-05, "loss": 0.2135, "step": 19980 }, { "epoch": 5.63, "learning_rate": 9.861431293537001e-05, "loss": 0.1886, "step": 20010 }, { "epoch": 5.63, "learning_rate": 9.859557054946428e-05, "loss": 0.2032, "step": 20040 }, { "epoch": 5.64, "learning_rate": 9.857682816355855e-05, "loss": 0.182, "step": 20070 }, { "epoch": 5.65, "learning_rate": 9.855808577765283e-05, "loss": 0.2084, "step": 20100 }, { "epoch": 5.66, "learning_rate": 9.853934339174711e-05, "loss": 0.2042, "step": 20130 }, { "epoch": 5.67, "learning_rate": 9.852060100584138e-05, "loss": 0.1928, "step": 20160 }, { "epoch": 5.68, "learning_rate": 9.850185861993566e-05, "loss": 0.2089, "step": 20190 }, { "epoch": 5.68, "learning_rate": 9.848311623402993e-05, "loss": 0.1816, "step": 20220 }, { "epoch": 5.69, "learning_rate": 9.846437384812421e-05, "loss": 0.2145, "step": 20250 }, { "epoch": 5.7, "learning_rate": 9.844563146221848e-05, "loss": 0.1957, "step": 20280 }, { "epoch": 5.71, "learning_rate": 9.842688907631276e-05, "loss": 0.1906, "step": 20310 }, { "epoch": 5.72, "learning_rate": 9.840814669040702e-05, "loss": 0.2095, "step": 20340 }, { "epoch": 5.73, "learning_rate": 9.838940430450129e-05, "loss": 0.1812, "step": 20370 }, { "epoch": 5.74, "learning_rate": 9.837066191859557e-05, "loss": 0.2028, "step": 20400 }, { "epoch": 5.74, "learning_rate": 9.835191953268985e-05, "loss": 0.1893, "step": 20430 }, { "epoch": 5.75, "learning_rate": 9.833317714678413e-05, "loss": 0.1979, "step": 20460 }, { "epoch": 5.76, "learning_rate": 9.831443476087839e-05, "loss": 0.2088, "step": 20490 }, { "epoch": 5.77, "learning_rate": 9.829569237497267e-05, "loss": 0.1761, "step": 20520 }, { "epoch": 5.78, "learning_rate": 9.827694998906695e-05, "loss": 0.1947, "step": 20550 }, { "epoch": 5.79, "learning_rate": 9.825820760316122e-05, "loss": 0.2022, "step": 20580 }, { "epoch": 5.79, "learning_rate": 9.82394652172555e-05, "loss": 0.1878, "step": 20610 }, { "epoch": 5.8, "learning_rate": 9.822072283134977e-05, "loss": 0.209, "step": 20640 }, { "epoch": 5.81, "learning_rate": 9.820198044544405e-05, "loss": 0.1745, "step": 20670 }, { "epoch": 5.82, "learning_rate": 9.818323805953831e-05, "loss": 0.2038, "step": 20700 }, { "epoch": 5.83, "learning_rate": 9.81644956736326e-05, "loss": 0.1929, "step": 20730 }, { "epoch": 5.84, "learning_rate": 9.814575328772686e-05, "loss": 0.1853, "step": 20760 }, { "epoch": 5.84, "learning_rate": 9.812701090182113e-05, "loss": 0.209, "step": 20790 }, { "epoch": 5.85, "learning_rate": 9.810826851591541e-05, "loss": 0.1737, "step": 20820 }, { "epoch": 5.86, "learning_rate": 9.808952613000969e-05, "loss": 0.1993, "step": 20850 }, { "epoch": 5.87, "learning_rate": 9.807078374410397e-05, "loss": 0.1926, "step": 20880 }, { "epoch": 5.88, "learning_rate": 9.805204135819823e-05, "loss": 0.184, "step": 20910 }, { "epoch": 5.89, "learning_rate": 9.803329897229251e-05, "loss": 0.2172, "step": 20940 }, { "epoch": 5.9, "learning_rate": 9.801455658638679e-05, "loss": 0.1867, "step": 20970 }, { "epoch": 5.9, "learning_rate": 9.799581420048106e-05, "loss": 0.1985, "step": 21000 }, { "epoch": 5.91, "learning_rate": 9.797707181457534e-05, "loss": 0.1884, "step": 21030 }, { "epoch": 5.92, "learning_rate": 9.79583294286696e-05, "loss": 0.1902, "step": 21060 }, { "epoch": 5.93, "learning_rate": 9.793958704276389e-05, "loss": 0.2094, "step": 21090 }, { "epoch": 5.94, "learning_rate": 9.792084465685815e-05, "loss": 0.1748, "step": 21120 }, { "epoch": 5.95, "learning_rate": 9.790210227095243e-05, "loss": 0.2104, "step": 21150 }, { "epoch": 5.95, "learning_rate": 9.78833598850467e-05, "loss": 0.1953, "step": 21180 }, { "epoch": 5.96, "learning_rate": 9.786461749914098e-05, "loss": 0.1853, "step": 21210 }, { "epoch": 5.97, "learning_rate": 9.784587511323525e-05, "loss": 0.1937, "step": 21240 }, { "epoch": 5.98, "learning_rate": 9.782713272732953e-05, "loss": 0.1741, "step": 21270 }, { "epoch": 5.99, "learning_rate": 9.780839034142381e-05, "loss": 0.2014, "step": 21300 }, { "epoch": 6.0, "learning_rate": 9.778964795551807e-05, "loss": 0.2004, "step": 21330 }, { "epoch": 6.0, "eval_loss": 0.22455841302871704, "eval_runtime": 479.6485, "eval_samples_per_second": 33.427, "eval_steps_per_second": 1.047, "eval_wer": 0.2267956819019284, "step": 21342 }, { "epoch": 6.01, "learning_rate": 9.777090556961235e-05, "loss": 0.189, "step": 21360 }, { "epoch": 6.01, "learning_rate": 9.775216318370663e-05, "loss": 0.1862, "step": 21390 }, { "epoch": 6.02, "learning_rate": 9.77334207978009e-05, "loss": 0.178, "step": 21420 }, { "epoch": 6.03, "learning_rate": 9.771467841189518e-05, "loss": 0.1925, "step": 21450 }, { "epoch": 6.04, "learning_rate": 9.769593602598944e-05, "loss": 0.171, "step": 21480 }, { "epoch": 6.05, "learning_rate": 9.767719364008372e-05, "loss": 0.1871, "step": 21510 }, { "epoch": 6.06, "learning_rate": 9.765845125417799e-05, "loss": 0.186, "step": 21540 }, { "epoch": 6.06, "learning_rate": 9.763970886827227e-05, "loss": 0.1691, "step": 21570 }, { "epoch": 6.07, "learning_rate": 9.762096648236654e-05, "loss": 0.1968, "step": 21600 }, { "epoch": 6.08, "learning_rate": 9.760222409646082e-05, "loss": 0.1729, "step": 21630 }, { "epoch": 6.09, "learning_rate": 9.758348171055509e-05, "loss": 0.1882, "step": 21660 }, { "epoch": 6.1, "learning_rate": 9.756473932464937e-05, "loss": 0.1836, "step": 21690 }, { "epoch": 6.11, "learning_rate": 9.754599693874365e-05, "loss": 0.1704, "step": 21720 }, { "epoch": 6.11, "learning_rate": 9.75272545528379e-05, "loss": 0.1932, "step": 21750 }, { "epoch": 6.12, "learning_rate": 9.750851216693219e-05, "loss": 0.1824, "step": 21780 }, { "epoch": 6.13, "learning_rate": 9.748976978102647e-05, "loss": 0.1855, "step": 21810 }, { "epoch": 6.14, "learning_rate": 9.747102739512073e-05, "loss": 0.1903, "step": 21840 }, { "epoch": 6.15, "learning_rate": 9.745290975541187e-05, "loss": 0.1735, "step": 21870 }, { "epoch": 6.16, "learning_rate": 9.743416736950614e-05, "loss": 0.1922, "step": 21900 }, { "epoch": 6.17, "learning_rate": 9.741542498360041e-05, "loss": 0.168, "step": 21930 }, { "epoch": 6.17, "learning_rate": 9.739668259769469e-05, "loss": 0.1856, "step": 21960 }, { "epoch": 6.18, "learning_rate": 9.737794021178897e-05, "loss": 0.1876, "step": 21990 }, { "epoch": 6.19, "learning_rate": 9.735919782588324e-05, "loss": 0.1738, "step": 22020 }, { "epoch": 6.2, "learning_rate": 9.734045543997752e-05, "loss": 0.196, "step": 22050 }, { "epoch": 6.21, "learning_rate": 9.732171305407179e-05, "loss": 0.1711, "step": 22080 }, { "epoch": 6.22, "learning_rate": 9.730297066816605e-05, "loss": 0.1895, "step": 22110 }, { "epoch": 6.22, "learning_rate": 9.728422828226034e-05, "loss": 0.1879, "step": 22140 }, { "epoch": 6.23, "learning_rate": 9.726548589635462e-05, "loss": 0.1935, "step": 22170 }, { "epoch": 6.24, "learning_rate": 9.724674351044888e-05, "loss": 0.1967, "step": 22200 }, { "epoch": 6.25, "learning_rate": 9.722800112454315e-05, "loss": 0.1687, "step": 22230 }, { "epoch": 6.26, "learning_rate": 9.720925873863743e-05, "loss": 0.1852, "step": 22260 }, { "epoch": 6.27, "learning_rate": 9.719051635273171e-05, "loss": 0.1916, "step": 22290 }, { "epoch": 6.27, "learning_rate": 9.717177396682598e-05, "loss": 0.1701, "step": 22320 }, { "epoch": 6.28, "learning_rate": 9.715303158092025e-05, "loss": 0.2169, "step": 22350 }, { "epoch": 6.29, "learning_rate": 9.713428919501453e-05, "loss": 0.1695, "step": 22380 }, { "epoch": 6.3, "learning_rate": 9.711554680910881e-05, "loss": 0.1891, "step": 22410 }, { "epoch": 6.31, "learning_rate": 9.709680442320308e-05, "loss": 0.1845, "step": 22440 }, { "epoch": 6.32, "learning_rate": 9.707806203729736e-05, "loss": 0.1811, "step": 22470 }, { "epoch": 6.33, "learning_rate": 9.705931965139163e-05, "loss": 0.1991, "step": 22500 }, { "epoch": 6.33, "learning_rate": 9.70405772654859e-05, "loss": 0.1663, "step": 22530 }, { "epoch": 6.34, "learning_rate": 9.702183487958017e-05, "loss": 0.1848, "step": 22560 }, { "epoch": 6.35, "learning_rate": 9.700309249367446e-05, "loss": 0.188, "step": 22590 }, { "epoch": 6.36, "learning_rate": 9.698435010776872e-05, "loss": 0.1712, "step": 22620 }, { "epoch": 6.37, "learning_rate": 9.696560772186299e-05, "loss": 0.1949, "step": 22650 }, { "epoch": 6.38, "learning_rate": 9.694686533595727e-05, "loss": 0.1711, "step": 22680 }, { "epoch": 6.38, "learning_rate": 9.692812295005155e-05, "loss": 0.1781, "step": 22710 }, { "epoch": 6.39, "learning_rate": 9.690938056414582e-05, "loss": 0.1853, "step": 22740 }, { "epoch": 6.4, "learning_rate": 9.689063817824009e-05, "loss": 0.1683, "step": 22770 }, { "epoch": 6.41, "learning_rate": 9.687189579233437e-05, "loss": 0.2022, "step": 22800 }, { "epoch": 6.42, "learning_rate": 9.685315340642865e-05, "loss": 0.1749, "step": 22830 }, { "epoch": 6.43, "learning_rate": 9.683441102052292e-05, "loss": 0.1827, "step": 22860 }, { "epoch": 6.44, "learning_rate": 9.68156686346172e-05, "loss": 0.196, "step": 22890 }, { "epoch": 6.44, "learning_rate": 9.679692624871146e-05, "loss": 0.1645, "step": 22920 }, { "epoch": 6.45, "learning_rate": 9.677818386280573e-05, "loss": 0.1914, "step": 22950 }, { "epoch": 6.46, "learning_rate": 9.675944147690001e-05, "loss": 0.1651, "step": 22980 }, { "epoch": 6.47, "learning_rate": 9.67406990909943e-05, "loss": 0.1829, "step": 23010 }, { "epoch": 6.48, "learning_rate": 9.672195670508856e-05, "loss": 0.1873, "step": 23040 }, { "epoch": 6.49, "learning_rate": 9.670321431918283e-05, "loss": 0.1705, "step": 23070 }, { "epoch": 6.49, "learning_rate": 9.668447193327711e-05, "loss": 0.1941, "step": 23100 }, { "epoch": 6.5, "learning_rate": 9.666635429356824e-05, "loss": 0.1662, "step": 23130 }, { "epoch": 6.51, "learning_rate": 9.664761190766252e-05, "loss": 0.1801, "step": 23160 }, { "epoch": 6.52, "learning_rate": 9.66288695217568e-05, "loss": 0.1801, "step": 23190 }, { "epoch": 6.53, "learning_rate": 9.661012713585107e-05, "loss": 0.1699, "step": 23220 }, { "epoch": 6.54, "learning_rate": 9.659138474994533e-05, "loss": 0.1854, "step": 23250 }, { "epoch": 6.54, "learning_rate": 9.657264236403961e-05, "loss": 0.1731, "step": 23280 }, { "epoch": 6.55, "learning_rate": 9.655389997813388e-05, "loss": 0.1813, "step": 23310 }, { "epoch": 6.56, "learning_rate": 9.653515759222816e-05, "loss": 0.1832, "step": 23340 }, { "epoch": 6.57, "learning_rate": 9.651641520632244e-05, "loss": 0.1711, "step": 23370 }, { "epoch": 6.58, "learning_rate": 9.649767282041671e-05, "loss": 0.1868, "step": 23400 }, { "epoch": 6.59, "learning_rate": 9.647893043451098e-05, "loss": 0.1687, "step": 23430 }, { "epoch": 6.6, "learning_rate": 9.646018804860526e-05, "loss": 0.1852, "step": 23460 }, { "epoch": 6.6, "learning_rate": 9.644144566269954e-05, "loss": 0.1929, "step": 23490 }, { "epoch": 6.61, "learning_rate": 9.642270327679381e-05, "loss": 0.1647, "step": 23520 }, { "epoch": 6.62, "learning_rate": 9.640396089088808e-05, "loss": 0.1908, "step": 23550 }, { "epoch": 6.63, "learning_rate": 9.638521850498236e-05, "loss": 0.1694, "step": 23580 }, { "epoch": 6.64, "learning_rate": 9.636647611907664e-05, "loss": 0.1826, "step": 23610 }, { "epoch": 6.65, "learning_rate": 9.63477337331709e-05, "loss": 0.1811, "step": 23640 }, { "epoch": 6.65, "learning_rate": 9.632899134726517e-05, "loss": 0.1694, "step": 23670 }, { "epoch": 6.66, "learning_rate": 9.631024896135945e-05, "loss": 0.1822, "step": 23700 }, { "epoch": 6.67, "learning_rate": 9.629150657545372e-05, "loss": 0.1716, "step": 23730 }, { "epoch": 6.68, "learning_rate": 9.6272764189548e-05, "loss": 0.1766, "step": 23760 }, { "epoch": 6.69, "learning_rate": 9.625402180364228e-05, "loss": 0.1839, "step": 23790 }, { "epoch": 6.7, "learning_rate": 9.623527941773655e-05, "loss": 0.1729, "step": 23820 }, { "epoch": 6.7, "learning_rate": 9.621653703183082e-05, "loss": 0.185, "step": 23850 }, { "epoch": 6.71, "learning_rate": 9.61977946459251e-05, "loss": 0.167, "step": 23880 }, { "epoch": 6.72, "learning_rate": 9.617905226001938e-05, "loss": 0.1695, "step": 23910 }, { "epoch": 6.73, "learning_rate": 9.616030987411365e-05, "loss": 0.1803, "step": 23940 }, { "epoch": 6.74, "learning_rate": 9.614156748820791e-05, "loss": 0.1726, "step": 23970 }, { "epoch": 6.75, "learning_rate": 9.61228251023022e-05, "loss": 0.1836, "step": 24000 }, { "epoch": 6.76, "learning_rate": 9.610408271639648e-05, "loss": 0.1595, "step": 24030 }, { "epoch": 6.76, "learning_rate": 9.608534033049074e-05, "loss": 0.1787, "step": 24060 }, { "epoch": 6.77, "learning_rate": 9.606659794458501e-05, "loss": 0.1775, "step": 24090 }, { "epoch": 6.78, "learning_rate": 9.604785555867929e-05, "loss": 0.1698, "step": 24120 }, { "epoch": 6.79, "learning_rate": 9.602911317277356e-05, "loss": 0.1858, "step": 24150 }, { "epoch": 6.8, "learning_rate": 9.601037078686784e-05, "loss": 0.1682, "step": 24180 }, { "epoch": 6.81, "learning_rate": 9.599162840096212e-05, "loss": 0.181, "step": 24210 }, { "epoch": 6.81, "learning_rate": 9.597288601505639e-05, "loss": 0.1774, "step": 24240 }, { "epoch": 6.82, "learning_rate": 9.595414362915066e-05, "loss": 0.1743, "step": 24270 }, { "epoch": 6.83, "learning_rate": 9.593540124324494e-05, "loss": 0.1867, "step": 24300 }, { "epoch": 6.84, "learning_rate": 9.591665885733922e-05, "loss": 0.1672, "step": 24330 }, { "epoch": 6.85, "learning_rate": 9.589791647143349e-05, "loss": 0.1817, "step": 24360 }, { "epoch": 6.86, "learning_rate": 9.587917408552775e-05, "loss": 0.1774, "step": 24390 }, { "epoch": 6.87, "learning_rate": 9.586043169962203e-05, "loss": 0.1679, "step": 24420 }, { "epoch": 6.87, "learning_rate": 9.584168931371632e-05, "loss": 0.1908, "step": 24450 }, { "epoch": 6.88, "learning_rate": 9.582294692781058e-05, "loss": 0.1584, "step": 24480 }, { "epoch": 6.89, "learning_rate": 9.580420454190485e-05, "loss": 0.1763, "step": 24510 }, { "epoch": 6.9, "learning_rate": 9.578546215599913e-05, "loss": 0.184, "step": 24540 }, { "epoch": 6.91, "learning_rate": 9.57667197700934e-05, "loss": 0.1639, "step": 24570 }, { "epoch": 6.92, "learning_rate": 9.574797738418768e-05, "loss": 0.1887, "step": 24600 }, { "epoch": 6.92, "learning_rate": 9.572923499828196e-05, "loss": 0.1645, "step": 24630 }, { "epoch": 6.93, "learning_rate": 9.571049261237623e-05, "loss": 0.1768, "step": 24660 }, { "epoch": 6.94, "learning_rate": 9.56917502264705e-05, "loss": 0.1916, "step": 24690 }, { "epoch": 6.95, "learning_rate": 9.567300784056478e-05, "loss": 0.1623, "step": 24720 }, { "epoch": 6.96, "learning_rate": 9.565426545465906e-05, "loss": 0.2004, "step": 24750 }, { "epoch": 6.97, "learning_rate": 9.563552306875332e-05, "loss": 0.1615, "step": 24780 }, { "epoch": 6.97, "learning_rate": 9.561678068284759e-05, "loss": 0.1826, "step": 24810 }, { "epoch": 6.98, "learning_rate": 9.559803829694187e-05, "loss": 0.1842, "step": 24840 }, { "epoch": 6.99, "learning_rate": 9.557929591103615e-05, "loss": 0.1605, "step": 24870 }, { "epoch": 7.0, "eval_loss": 0.2175769805908203, "eval_runtime": 478.6384, "eval_samples_per_second": 33.497, "eval_steps_per_second": 1.049, "eval_wer": 0.21197439711762858, "step": 24899 }, { "epoch": 7.0, "learning_rate": 9.556055352513042e-05, "loss": 0.1973, "step": 24900 }, { "epoch": 7.01, "learning_rate": 9.554181113922469e-05, "loss": 0.1446, "step": 24930 }, { "epoch": 7.02, "learning_rate": 9.552306875331897e-05, "loss": 0.172, "step": 24960 }, { "epoch": 7.03, "learning_rate": 9.550432636741324e-05, "loss": 0.1592, "step": 24990 }, { "epoch": 7.03, "learning_rate": 9.548558398150752e-05, "loss": 0.1663, "step": 25020 }, { "epoch": 7.04, "learning_rate": 9.546684159560179e-05, "loss": 0.194, "step": 25050 }, { "epoch": 7.05, "learning_rate": 9.544809920969607e-05, "loss": 0.1514, "step": 25080 }, { "epoch": 7.06, "learning_rate": 9.542935682379033e-05, "loss": 0.1735, "step": 25110 }, { "epoch": 7.07, "learning_rate": 9.541061443788461e-05, "loss": 0.1586, "step": 25140 }, { "epoch": 7.08, "learning_rate": 9.53918720519789e-05, "loss": 0.1807, "step": 25170 }, { "epoch": 7.08, "learning_rate": 9.537312966607316e-05, "loss": 0.1757, "step": 25200 }, { "epoch": 7.09, "learning_rate": 9.535438728016743e-05, "loss": 0.145, "step": 25230 }, { "epoch": 7.1, "learning_rate": 9.533564489426171e-05, "loss": 0.1695, "step": 25260 }, { "epoch": 7.11, "learning_rate": 9.531690250835599e-05, "loss": 0.1631, "step": 25290 }, { "epoch": 7.12, "learning_rate": 9.529816012245026e-05, "loss": 0.1638, "step": 25320 }, { "epoch": 7.13, "learning_rate": 9.527941773654453e-05, "loss": 0.1766, "step": 25350 }, { "epoch": 7.14, "learning_rate": 9.526067535063881e-05, "loss": 0.1464, "step": 25380 }, { "epoch": 7.14, "learning_rate": 9.524193296473309e-05, "loss": 0.1746, "step": 25410 }, { "epoch": 7.15, "learning_rate": 9.522319057882736e-05, "loss": 0.1564, "step": 25440 }, { "epoch": 7.16, "learning_rate": 9.520444819292162e-05, "loss": 0.1598, "step": 25470 }, { "epoch": 7.17, "learning_rate": 9.51857058070159e-05, "loss": 0.1798, "step": 25500 }, { "epoch": 7.18, "learning_rate": 9.516696342111017e-05, "loss": 0.1506, "step": 25530 }, { "epoch": 7.19, "learning_rate": 9.514822103520445e-05, "loss": 0.1717, "step": 25560 }, { "epoch": 7.19, "learning_rate": 9.512947864929873e-05, "loss": 0.1586, "step": 25590 }, { "epoch": 7.2, "learning_rate": 9.5110736263393e-05, "loss": 0.1695, "step": 25620 }, { "epoch": 7.21, "learning_rate": 9.509199387748727e-05, "loss": 0.173, "step": 25650 }, { "epoch": 7.22, "learning_rate": 9.507325149158155e-05, "loss": 0.1468, "step": 25680 }, { "epoch": 7.23, "learning_rate": 9.505450910567583e-05, "loss": 0.1749, "step": 25710 }, { "epoch": 7.24, "learning_rate": 9.50357667197701e-05, "loss": 0.1609, "step": 25740 }, { "epoch": 7.24, "learning_rate": 9.501702433386437e-05, "loss": 0.1712, "step": 25770 }, { "epoch": 7.25, "learning_rate": 9.499828194795865e-05, "loss": 0.1844, "step": 25800 }, { "epoch": 7.26, "learning_rate": 9.497953956205293e-05, "loss": 0.1508, "step": 25830 }, { "epoch": 7.27, "learning_rate": 9.49607971761472e-05, "loss": 0.1767, "step": 25860 }, { "epoch": 7.28, "learning_rate": 9.494205479024146e-05, "loss": 0.1609, "step": 25890 }, { "epoch": 7.29, "learning_rate": 9.492331240433574e-05, "loss": 0.1644, "step": 25920 }, { "epoch": 7.3, "learning_rate": 9.490457001843001e-05, "loss": 0.1788, "step": 25950 }, { "epoch": 7.3, "learning_rate": 9.488582763252429e-05, "loss": 0.1519, "step": 25980 }, { "epoch": 7.31, "learning_rate": 9.486708524661857e-05, "loss": 0.1708, "step": 26010 }, { "epoch": 7.32, "learning_rate": 9.484834286071284e-05, "loss": 0.1571, "step": 26040 }, { "epoch": 7.33, "learning_rate": 9.482960047480711e-05, "loss": 0.1727, "step": 26070 }, { "epoch": 7.34, "learning_rate": 9.481085808890139e-05, "loss": 0.1843, "step": 26100 }, { "epoch": 7.35, "learning_rate": 9.479211570299567e-05, "loss": 0.1489, "step": 26130 }, { "epoch": 7.35, "learning_rate": 9.477337331708994e-05, "loss": 0.1675, "step": 26160 }, { "epoch": 7.36, "learning_rate": 9.47546309311842e-05, "loss": 0.1596, "step": 26190 }, { "epoch": 7.37, "learning_rate": 9.473588854527849e-05, "loss": 0.1626, "step": 26220 }, { "epoch": 7.38, "learning_rate": 9.471714615937277e-05, "loss": 0.1838, "step": 26250 }, { "epoch": 7.39, "learning_rate": 9.469840377346703e-05, "loss": 0.1511, "step": 26280 }, { "epoch": 7.4, "learning_rate": 9.46796613875613e-05, "loss": 0.183, "step": 26310 }, { "epoch": 7.41, "learning_rate": 9.466091900165558e-05, "loss": 0.1619, "step": 26340 }, { "epoch": 7.41, "learning_rate": 9.464217661574985e-05, "loss": 0.1685, "step": 26370 }, { "epoch": 7.42, "learning_rate": 9.462343422984413e-05, "loss": 0.1724, "step": 26400 }, { "epoch": 7.43, "learning_rate": 9.460469184393841e-05, "loss": 0.1478, "step": 26430 }, { "epoch": 7.44, "learning_rate": 9.458594945803268e-05, "loss": 0.1795, "step": 26460 }, { "epoch": 7.45, "learning_rate": 9.456720707212695e-05, "loss": 0.157, "step": 26490 }, { "epoch": 7.46, "learning_rate": 9.454846468622123e-05, "loss": 0.1705, "step": 26520 }, { "epoch": 7.46, "learning_rate": 9.452972230031551e-05, "loss": 0.1815, "step": 26550 }, { "epoch": 7.47, "learning_rate": 9.451097991440978e-05, "loss": 0.1459, "step": 26580 }, { "epoch": 7.48, "learning_rate": 9.449223752850404e-05, "loss": 0.1747, "step": 26610 }, { "epoch": 7.49, "learning_rate": 9.447349514259832e-05, "loss": 0.1625, "step": 26640 }, { "epoch": 7.5, "learning_rate": 9.44547527566926e-05, "loss": 0.1675, "step": 26670 }, { "epoch": 7.51, "learning_rate": 9.443601037078687e-05, "loss": 0.1816, "step": 26700 }, { "epoch": 7.51, "learning_rate": 9.441726798488114e-05, "loss": 0.1526, "step": 26730 }, { "epoch": 7.52, "learning_rate": 9.439852559897542e-05, "loss": 0.1826, "step": 26760 }, { "epoch": 7.53, "learning_rate": 9.437978321306969e-05, "loss": 0.1595, "step": 26790 }, { "epoch": 7.54, "learning_rate": 9.436104082716397e-05, "loss": 0.1705, "step": 26820 }, { "epoch": 7.55, "learning_rate": 9.434229844125825e-05, "loss": 0.1778, "step": 26850 }, { "epoch": 7.56, "learning_rate": 9.432355605535252e-05, "loss": 0.1514, "step": 26880 }, { "epoch": 7.57, "learning_rate": 9.430481366944679e-05, "loss": 0.1749, "step": 26910 }, { "epoch": 7.57, "learning_rate": 9.428607128354107e-05, "loss": 0.159, "step": 26940 }, { "epoch": 7.58, "learning_rate": 9.426732889763535e-05, "loss": 0.167, "step": 26970 }, { "epoch": 7.59, "learning_rate": 9.424858651172961e-05, "loss": 0.1819, "step": 27000 }, { "epoch": 7.6, "learning_rate": 9.422984412582388e-05, "loss": 0.1506, "step": 27030 }, { "epoch": 7.61, "learning_rate": 9.421110173991816e-05, "loss": 0.1736, "step": 27060 }, { "epoch": 7.62, "learning_rate": 9.419235935401244e-05, "loss": 0.1546, "step": 27090 }, { "epoch": 7.62, "learning_rate": 9.417361696810671e-05, "loss": 0.1667, "step": 27120 }, { "epoch": 7.63, "learning_rate": 9.415487458220098e-05, "loss": 0.1817, "step": 27150 }, { "epoch": 7.64, "learning_rate": 9.413613219629526e-05, "loss": 0.1571, "step": 27180 }, { "epoch": 7.65, "learning_rate": 9.411738981038953e-05, "loss": 0.1728, "step": 27210 }, { "epoch": 7.66, "learning_rate": 9.409864742448381e-05, "loss": 0.1586, "step": 27240 }, { "epoch": 7.67, "learning_rate": 9.407990503857809e-05, "loss": 0.1627, "step": 27270 }, { "epoch": 7.67, "learning_rate": 9.406116265267236e-05, "loss": 0.1711, "step": 27300 }, { "epoch": 7.68, "learning_rate": 9.404242026676662e-05, "loss": 0.149, "step": 27330 }, { "epoch": 7.69, "learning_rate": 9.40236778808609e-05, "loss": 0.1698, "step": 27360 }, { "epoch": 7.7, "learning_rate": 9.400493549495519e-05, "loss": 0.1562, "step": 27390 }, { "epoch": 7.71, "learning_rate": 9.398619310904945e-05, "loss": 0.1595, "step": 27420 }, { "epoch": 7.72, "learning_rate": 9.396745072314372e-05, "loss": 0.1754, "step": 27450 }, { "epoch": 7.73, "learning_rate": 9.3948708337238e-05, "loss": 0.1469, "step": 27480 }, { "epoch": 7.73, "learning_rate": 9.392996595133228e-05, "loss": 0.1762, "step": 27510 }, { "epoch": 7.74, "learning_rate": 9.391122356542655e-05, "loss": 0.1586, "step": 27540 }, { "epoch": 7.75, "learning_rate": 9.389248117952082e-05, "loss": 0.1669, "step": 27570 }, { "epoch": 7.76, "learning_rate": 9.38737387936151e-05, "loss": 0.1792, "step": 27600 }, { "epoch": 7.77, "learning_rate": 9.385499640770937e-05, "loss": 0.1467, "step": 27630 }, { "epoch": 7.78, "learning_rate": 9.383625402180365e-05, "loss": 0.1749, "step": 27660 }, { "epoch": 7.78, "learning_rate": 9.381751163589793e-05, "loss": 0.1577, "step": 27690 }, { "epoch": 7.79, "learning_rate": 9.37987692499922e-05, "loss": 0.1676, "step": 27720 }, { "epoch": 7.8, "learning_rate": 9.378002686408646e-05, "loss": 0.1791, "step": 27750 }, { "epoch": 7.81, "learning_rate": 9.376128447818074e-05, "loss": 0.1508, "step": 27780 }, { "epoch": 7.82, "learning_rate": 9.374254209227502e-05, "loss": 0.1746, "step": 27810 }, { "epoch": 7.83, "learning_rate": 9.372379970636929e-05, "loss": 0.1564, "step": 27840 }, { "epoch": 7.84, "learning_rate": 9.370505732046356e-05, "loss": 0.1633, "step": 27870 }, { "epoch": 7.84, "learning_rate": 9.368631493455784e-05, "loss": 0.1766, "step": 27900 }, { "epoch": 7.85, "learning_rate": 9.366757254865212e-05, "loss": 0.147, "step": 27930 }, { "epoch": 7.86, "learning_rate": 9.364883016274639e-05, "loss": 0.1762, "step": 27960 }, { "epoch": 7.87, "learning_rate": 9.363008777684066e-05, "loss": 0.1618, "step": 27990 }, { "epoch": 7.88, "learning_rate": 9.361134539093494e-05, "loss": 0.1721, "step": 28020 }, { "epoch": 7.89, "learning_rate": 9.359260300502922e-05, "loss": 0.1843, "step": 28050 }, { "epoch": 7.89, "learning_rate": 9.357386061912349e-05, "loss": 0.151, "step": 28080 }, { "epoch": 7.9, "learning_rate": 9.355511823321777e-05, "loss": 0.1718, "step": 28110 }, { "epoch": 7.91, "learning_rate": 9.353637584731203e-05, "loss": 0.1575, "step": 28140 }, { "epoch": 7.92, "learning_rate": 9.35176334614063e-05, "loss": 0.1578, "step": 28170 }, { "epoch": 7.93, "learning_rate": 9.349889107550058e-05, "loss": 0.1781, "step": 28200 }, { "epoch": 7.94, "learning_rate": 9.348014868959486e-05, "loss": 0.1412, "step": 28230 }, { "epoch": 7.94, "learning_rate": 9.346140630368913e-05, "loss": 0.1711, "step": 28260 }, { "epoch": 7.95, "learning_rate": 9.34426639177834e-05, "loss": 0.1557, "step": 28290 }, { "epoch": 7.96, "learning_rate": 9.342392153187768e-05, "loss": 0.1607, "step": 28320 }, { "epoch": 7.97, "learning_rate": 9.340517914597196e-05, "loss": 0.1763, "step": 28350 }, { "epoch": 7.98, "learning_rate": 9.338643676006623e-05, "loss": 0.1441, "step": 28380 }, { "epoch": 7.99, "learning_rate": 9.33676943741605e-05, "loss": 0.1739, "step": 28410 }, { "epoch": 8.0, "learning_rate": 9.334895198825478e-05, "loss": 0.1579, "step": 28440 }, { "epoch": 8.0, "eval_loss": 0.20457884669303894, "eval_runtime": 477.673, "eval_samples_per_second": 33.565, "eval_steps_per_second": 1.051, "eval_wer": 0.20240743520805754, "step": 28456 }, { "epoch": 8.0, "learning_rate": 9.333020960234906e-05, "loss": 0.1691, "step": 28470 }, { "epoch": 8.01, "learning_rate": 9.331146721644332e-05, "loss": 0.1501, "step": 28500 }, { "epoch": 8.02, "learning_rate": 9.32927248305376e-05, "loss": 0.1653, "step": 28530 }, { "epoch": 8.03, "learning_rate": 9.327398244463187e-05, "loss": 0.1736, "step": 28560 }, { "epoch": 8.04, "learning_rate": 9.325524005872614e-05, "loss": 0.1407, "step": 28590 }, { "epoch": 8.05, "learning_rate": 9.323649767282042e-05, "loss": 0.1634, "step": 28620 }, { "epoch": 8.05, "learning_rate": 9.32177552869147e-05, "loss": 0.151, "step": 28650 }, { "epoch": 8.06, "learning_rate": 9.319901290100897e-05, "loss": 0.1583, "step": 28680 }, { "epoch": 8.07, "learning_rate": 9.318027051510324e-05, "loss": 0.1657, "step": 28710 }, { "epoch": 8.08, "learning_rate": 9.316152812919752e-05, "loss": 0.1443, "step": 28740 }, { "epoch": 8.09, "learning_rate": 9.31427857432918e-05, "loss": 0.1535, "step": 28770 }, { "epoch": 8.1, "learning_rate": 9.312404335738607e-05, "loss": 0.1491, "step": 28800 }, { "epoch": 8.11, "learning_rate": 9.310530097148033e-05, "loss": 0.1525, "step": 28830 }, { "epoch": 8.11, "learning_rate": 9.308655858557461e-05, "loss": 0.1651, "step": 28860 }, { "epoch": 8.12, "learning_rate": 9.30678161996689e-05, "loss": 0.1411, "step": 28890 }, { "epoch": 8.13, "learning_rate": 9.304907381376316e-05, "loss": 0.1585, "step": 28920 }, { "epoch": 8.14, "learning_rate": 9.303033142785744e-05, "loss": 0.1506, "step": 28950 }, { "epoch": 8.15, "learning_rate": 9.301158904195171e-05, "loss": 0.1455, "step": 28980 }, { "epoch": 8.16, "learning_rate": 9.299284665604598e-05, "loss": 0.1692, "step": 29010 }, { "epoch": 8.16, "learning_rate": 9.297410427014026e-05, "loss": 0.1419, "step": 29040 }, { "epoch": 8.17, "learning_rate": 9.295536188423454e-05, "loss": 0.16, "step": 29070 }, { "epoch": 8.18, "learning_rate": 9.293661949832881e-05, "loss": 0.1529, "step": 29100 }, { "epoch": 8.19, "learning_rate": 9.291787711242308e-05, "loss": 0.16, "step": 29130 }, { "epoch": 8.2, "learning_rate": 9.289913472651736e-05, "loss": 0.1715, "step": 29160 }, { "epoch": 8.21, "learning_rate": 9.288039234061164e-05, "loss": 0.1412, "step": 29190 }, { "epoch": 8.21, "learning_rate": 9.28616499547059e-05, "loss": 0.1558, "step": 29220 }, { "epoch": 8.22, "learning_rate": 9.284290756880017e-05, "loss": 0.1502, "step": 29250 }, { "epoch": 8.23, "learning_rate": 9.282416518289445e-05, "loss": 0.1461, "step": 29280 }, { "epoch": 8.24, "learning_rate": 9.280542279698873e-05, "loss": 0.1623, "step": 29310 }, { "epoch": 8.25, "learning_rate": 9.2786680411083e-05, "loss": 0.1414, "step": 29340 }, { "epoch": 8.26, "learning_rate": 9.276793802517728e-05, "loss": 0.1583, "step": 29370 }, { "epoch": 8.27, "learning_rate": 9.274919563927155e-05, "loss": 0.1536, "step": 29400 }, { "epoch": 8.27, "learning_rate": 9.273045325336582e-05, "loss": 0.1542, "step": 29430 }, { "epoch": 8.28, "learning_rate": 9.27117108674601e-05, "loss": 0.1768, "step": 29460 }, { "epoch": 8.29, "learning_rate": 9.269296848155438e-05, "loss": 0.138, "step": 29490 }, { "epoch": 8.3, "learning_rate": 9.267422609564865e-05, "loss": 0.1596, "step": 29520 }, { "epoch": 8.31, "learning_rate": 9.265548370974291e-05, "loss": 0.1612, "step": 29550 }, { "epoch": 8.32, "learning_rate": 9.263736607003406e-05, "loss": 0.1545, "step": 29580 }, { "epoch": 8.32, "learning_rate": 9.261862368412832e-05, "loss": 0.1678, "step": 29610 }, { "epoch": 8.33, "learning_rate": 9.25998812982226e-05, "loss": 0.1419, "step": 29640 }, { "epoch": 8.34, "learning_rate": 9.258113891231688e-05, "loss": 0.1613, "step": 29670 }, { "epoch": 8.35, "learning_rate": 9.256239652641115e-05, "loss": 0.1547, "step": 29700 }, { "epoch": 8.36, "learning_rate": 9.254365414050542e-05, "loss": 0.1518, "step": 29730 }, { "epoch": 8.37, "learning_rate": 9.25249117545997e-05, "loss": 0.1679, "step": 29760 }, { "epoch": 8.37, "learning_rate": 9.250616936869397e-05, "loss": 0.1399, "step": 29790 }, { "epoch": 8.38, "learning_rate": 9.248742698278825e-05, "loss": 0.1626, "step": 29820 }, { "epoch": 8.39, "learning_rate": 9.246868459688252e-05, "loss": 0.1491, "step": 29850 }, { "epoch": 8.4, "learning_rate": 9.24499422109768e-05, "loss": 0.1552, "step": 29880 }, { "epoch": 8.41, "learning_rate": 9.243119982507106e-05, "loss": 0.167, "step": 29910 }, { "epoch": 8.42, "learning_rate": 9.241245743916535e-05, "loss": 0.1427, "step": 29940 }, { "epoch": 8.43, "learning_rate": 9.239371505325963e-05, "loss": 0.1594, "step": 29970 }, { "epoch": 8.43, "learning_rate": 9.23749726673539e-05, "loss": 0.1584, "step": 30000 }, { "epoch": 8.44, "learning_rate": 9.235623028144816e-05, "loss": 0.163, "step": 30030 }, { "epoch": 8.45, "learning_rate": 9.233748789554244e-05, "loss": 0.1628, "step": 30060 }, { "epoch": 8.46, "learning_rate": 9.231874550963672e-05, "loss": 0.1366, "step": 30090 }, { "epoch": 8.47, "learning_rate": 9.230000312373099e-05, "loss": 0.1564, "step": 30120 }, { "epoch": 8.48, "learning_rate": 9.228126073782526e-05, "loss": 0.1532, "step": 30150 }, { "epoch": 8.48, "learning_rate": 9.226251835191954e-05, "loss": 0.1561, "step": 30180 }, { "epoch": 8.49, "learning_rate": 9.22437759660138e-05, "loss": 0.1672, "step": 30210 }, { "epoch": 8.5, "learning_rate": 9.222503358010809e-05, "loss": 0.1394, "step": 30240 }, { "epoch": 8.51, "learning_rate": 9.220629119420235e-05, "loss": 0.154, "step": 30270 }, { "epoch": 8.52, "learning_rate": 9.218754880829664e-05, "loss": 0.1488, "step": 30300 }, { "epoch": 8.53, "learning_rate": 9.21688064223909e-05, "loss": 0.1608, "step": 30330 }, { "epoch": 8.54, "learning_rate": 9.215006403648518e-05, "loss": 0.1753, "step": 30360 }, { "epoch": 8.54, "learning_rate": 9.213132165057946e-05, "loss": 0.1395, "step": 30390 }, { "epoch": 8.55, "learning_rate": 9.211257926467373e-05, "loss": 0.1618, "step": 30420 }, { "epoch": 8.56, "learning_rate": 9.2093836878768e-05, "loss": 0.1517, "step": 30450 }, { "epoch": 8.57, "learning_rate": 9.207509449286228e-05, "loss": 0.1575, "step": 30480 }, { "epoch": 8.58, "learning_rate": 9.205635210695656e-05, "loss": 0.1733, "step": 30510 }, { "epoch": 8.59, "learning_rate": 9.203760972105083e-05, "loss": 0.1354, "step": 30540 }, { "epoch": 8.59, "learning_rate": 9.20188673351451e-05, "loss": 0.1627, "step": 30570 }, { "epoch": 8.6, "learning_rate": 9.200012494923938e-05, "loss": 0.1507, "step": 30600 }, { "epoch": 8.61, "learning_rate": 9.198138256333364e-05, "loss": 0.1558, "step": 30630 }, { "epoch": 8.62, "learning_rate": 9.196264017742793e-05, "loss": 0.1705, "step": 30660 }, { "epoch": 8.63, "learning_rate": 9.19438977915222e-05, "loss": 0.145, "step": 30690 }, { "epoch": 8.64, "learning_rate": 9.192515540561647e-05, "loss": 0.1545, "step": 30720 }, { "epoch": 8.64, "learning_rate": 9.190641301971074e-05, "loss": 0.1529, "step": 30750 }, { "epoch": 8.65, "learning_rate": 9.188767063380502e-05, "loss": 0.1532, "step": 30780 }, { "epoch": 8.66, "learning_rate": 9.18689282478993e-05, "loss": 0.1758, "step": 30810 }, { "epoch": 8.67, "learning_rate": 9.185018586199357e-05, "loss": 0.1431, "step": 30840 }, { "epoch": 8.68, "learning_rate": 9.183144347608784e-05, "loss": 0.1601, "step": 30870 }, { "epoch": 8.69, "learning_rate": 9.181270109018212e-05, "loss": 0.1566, "step": 30900 }, { "epoch": 8.7, "learning_rate": 9.17939587042764e-05, "loss": 0.1508, "step": 30930 }, { "epoch": 8.7, "learning_rate": 9.177521631837067e-05, "loss": 0.1649, "step": 30960 }, { "epoch": 8.71, "learning_rate": 9.175647393246494e-05, "loss": 0.1384, "step": 30990 }, { "epoch": 8.72, "learning_rate": 9.173773154655922e-05, "loss": 0.1627, "step": 31020 }, { "epoch": 8.73, "learning_rate": 9.171898916065348e-05, "loss": 0.1521, "step": 31050 }, { "epoch": 8.74, "learning_rate": 9.170024677474776e-05, "loss": 0.1704, "step": 31080 }, { "epoch": 8.75, "learning_rate": 9.168150438884203e-05, "loss": 0.1703, "step": 31110 }, { "epoch": 8.75, "learning_rate": 9.166276200293631e-05, "loss": 0.1414, "step": 31140 }, { "epoch": 8.76, "learning_rate": 9.164401961703058e-05, "loss": 0.1608, "step": 31170 }, { "epoch": 8.77, "learning_rate": 9.162527723112486e-05, "loss": 0.1476, "step": 31200 }, { "epoch": 8.78, "learning_rate": 9.160653484521914e-05, "loss": 0.1512, "step": 31230 }, { "epoch": 8.79, "learning_rate": 9.158779245931341e-05, "loss": 0.163, "step": 31260 }, { "epoch": 8.8, "learning_rate": 9.156905007340768e-05, "loss": 0.138, "step": 31290 }, { "epoch": 8.81, "learning_rate": 9.155030768750196e-05, "loss": 0.1663, "step": 31320 }, { "epoch": 8.81, "learning_rate": 9.153156530159624e-05, "loss": 0.1562, "step": 31350 }, { "epoch": 8.82, "learning_rate": 9.15128229156905e-05, "loss": 0.1519, "step": 31380 }, { "epoch": 8.83, "learning_rate": 9.149408052978477e-05, "loss": 0.1659, "step": 31410 }, { "epoch": 8.84, "learning_rate": 9.147533814387905e-05, "loss": 0.1398, "step": 31440 }, { "epoch": 8.85, "learning_rate": 9.145659575797332e-05, "loss": 0.1624, "step": 31470 }, { "epoch": 8.86, "learning_rate": 9.14378533720676e-05, "loss": 0.1481, "step": 31500 }, { "epoch": 8.86, "learning_rate": 9.141911098616187e-05, "loss": 0.1516, "step": 31530 }, { "epoch": 8.87, "learning_rate": 9.140036860025615e-05, "loss": 0.1661, "step": 31560 }, { "epoch": 8.88, "learning_rate": 9.138162621435042e-05, "loss": 0.133, "step": 31590 }, { "epoch": 8.89, "learning_rate": 9.13628838284447e-05, "loss": 0.1653, "step": 31620 }, { "epoch": 8.9, "learning_rate": 9.134414144253898e-05, "loss": 0.1572, "step": 31650 }, { "epoch": 8.91, "learning_rate": 9.132539905663325e-05, "loss": 0.1493, "step": 31680 }, { "epoch": 8.91, "learning_rate": 9.130665667072752e-05, "loss": 0.1715, "step": 31710 }, { "epoch": 8.92, "learning_rate": 9.12879142848218e-05, "loss": 0.1434, "step": 31740 }, { "epoch": 8.93, "learning_rate": 9.126917189891608e-05, "loss": 0.165, "step": 31770 }, { "epoch": 8.94, "learning_rate": 9.125042951301035e-05, "loss": 0.1505, "step": 31800 }, { "epoch": 8.95, "learning_rate": 9.123168712710461e-05, "loss": 0.1466, "step": 31830 }, { "epoch": 8.96, "learning_rate": 9.12129447411989e-05, "loss": 0.1676, "step": 31860 }, { "epoch": 8.97, "learning_rate": 9.119420235529317e-05, "loss": 0.143, "step": 31890 }, { "epoch": 8.97, "learning_rate": 9.117545996938744e-05, "loss": 0.1589, "step": 31920 }, { "epoch": 8.98, "learning_rate": 9.115671758348171e-05, "loss": 0.1529, "step": 31950 }, { "epoch": 8.99, "learning_rate": 9.113797519757599e-05, "loss": 0.1491, "step": 31980 }, { "epoch": 9.0, "learning_rate": 9.111923281167026e-05, "loss": 0.1668, "step": 32010 }, { "epoch": 9.0, "eval_loss": 0.20271660387516022, "eval_runtime": 480.4264, "eval_samples_per_second": 33.372, "eval_steps_per_second": 1.045, "eval_wer": 0.19443724154872874, "step": 32013 }, { "epoch": 9.01, "learning_rate": 9.110049042576454e-05, "loss": 0.1419, "step": 32040 }, { "epoch": 9.02, "learning_rate": 9.108174803985882e-05, "loss": 0.1552, "step": 32070 }, { "epoch": 9.02, "learning_rate": 9.106300565395309e-05, "loss": 0.1401, "step": 32100 }, { "epoch": 9.03, "learning_rate": 9.104426326804735e-05, "loss": 0.1473, "step": 32130 }, { "epoch": 9.04, "learning_rate": 9.102552088214164e-05, "loss": 0.1431, "step": 32160 }, { "epoch": 9.05, "learning_rate": 9.100740324243276e-05, "loss": 0.1363, "step": 32190 }, { "epoch": 9.06, "learning_rate": 9.098866085652704e-05, "loss": 0.1572, "step": 32220 }, { "epoch": 9.07, "learning_rate": 9.096991847062132e-05, "loss": 0.1328, "step": 32250 }, { "epoch": 9.08, "learning_rate": 9.095117608471558e-05, "loss": 0.1498, "step": 32280 }, { "epoch": 9.08, "learning_rate": 9.093243369880986e-05, "loss": 0.1395, "step": 32310 }, { "epoch": 9.09, "learning_rate": 9.091369131290414e-05, "loss": 0.1405, "step": 32340 }, { "epoch": 9.1, "learning_rate": 9.089494892699841e-05, "loss": 0.1531, "step": 32370 }, { "epoch": 9.11, "learning_rate": 9.087620654109269e-05, "loss": 0.143, "step": 32400 }, { "epoch": 9.12, "learning_rate": 9.085746415518696e-05, "loss": 0.1493, "step": 32430 }, { "epoch": 9.13, "learning_rate": 9.083872176928124e-05, "loss": 0.1452, "step": 32460 }, { "epoch": 9.13, "learning_rate": 9.08199793833755e-05, "loss": 0.1398, "step": 32490 }, { "epoch": 9.14, "learning_rate": 9.080123699746979e-05, "loss": 0.1479, "step": 32520 }, { "epoch": 9.15, "learning_rate": 9.078249461156407e-05, "loss": 0.1371, "step": 32550 }, { "epoch": 9.16, "learning_rate": 9.076375222565832e-05, "loss": 0.1589, "step": 32580 }, { "epoch": 9.17, "learning_rate": 9.07450098397526e-05, "loss": 0.1518, "step": 32610 }, { "epoch": 9.18, "learning_rate": 9.072626745384688e-05, "loss": 0.1395, "step": 32640 }, { "epoch": 9.18, "learning_rate": 9.070752506794116e-05, "loss": 0.1503, "step": 32670 }, { "epoch": 9.19, "learning_rate": 9.068878268203542e-05, "loss": 0.1312, "step": 32700 }, { "epoch": 9.2, "learning_rate": 9.06700402961297e-05, "loss": 0.1455, "step": 32730 }, { "epoch": 9.21, "learning_rate": 9.065129791022398e-05, "loss": 0.154, "step": 32760 }, { "epoch": 9.22, "learning_rate": 9.063255552431825e-05, "loss": 0.1488, "step": 32790 }, { "epoch": 9.23, "learning_rate": 9.061381313841253e-05, "loss": 0.1592, "step": 32820 }, { "epoch": 9.24, "learning_rate": 9.05950707525068e-05, "loss": 0.1328, "step": 32850 }, { "epoch": 9.24, "learning_rate": 9.057632836660108e-05, "loss": 0.1484, "step": 32880 }, { "epoch": 9.25, "learning_rate": 9.055758598069534e-05, "loss": 0.15, "step": 32910 }, { "epoch": 9.26, "learning_rate": 9.053884359478962e-05, "loss": 0.1398, "step": 32940 }, { "epoch": 9.27, "learning_rate": 9.05201012088839e-05, "loss": 0.1523, "step": 32970 }, { "epoch": 9.28, "learning_rate": 9.050135882297817e-05, "loss": 0.1337, "step": 33000 }, { "epoch": 9.29, "learning_rate": 9.048261643707244e-05, "loss": 0.1517, "step": 33030 }, { "epoch": 9.29, "learning_rate": 9.046449879736357e-05, "loss": 0.1507, "step": 33060 }, { "epoch": 9.3, "learning_rate": 9.044575641145785e-05, "loss": 0.1424, "step": 33090 }, { "epoch": 9.31, "learning_rate": 9.042701402555213e-05, "loss": 0.1612, "step": 33120 }, { "epoch": 9.32, "learning_rate": 9.04082716396464e-05, "loss": 0.1389, "step": 33150 }, { "epoch": 9.33, "learning_rate": 9.038952925374066e-05, "loss": 0.1519, "step": 33180 }, { "epoch": 9.34, "learning_rate": 9.037078686783495e-05, "loss": 0.1426, "step": 33210 }, { "epoch": 9.34, "learning_rate": 9.035204448192923e-05, "loss": 0.1386, "step": 33240 }, { "epoch": 9.35, "learning_rate": 9.03333020960235e-05, "loss": 0.1566, "step": 33270 }, { "epoch": 9.36, "learning_rate": 9.031455971011777e-05, "loss": 0.1354, "step": 33300 }, { "epoch": 9.37, "learning_rate": 9.029581732421204e-05, "loss": 0.1502, "step": 33330 }, { "epoch": 9.38, "learning_rate": 9.027707493830632e-05, "loss": 0.1536, "step": 33360 }, { "epoch": 9.39, "learning_rate": 9.025833255240059e-05, "loss": 0.1453, "step": 33390 }, { "epoch": 9.4, "learning_rate": 9.023959016649487e-05, "loss": 0.1602, "step": 33420 }, { "epoch": 9.4, "learning_rate": 9.022084778058914e-05, "loss": 0.1344, "step": 33450 }, { "epoch": 9.41, "learning_rate": 9.02021053946834e-05, "loss": 0.152, "step": 33480 }, { "epoch": 9.42, "learning_rate": 9.018336300877769e-05, "loss": 0.1545, "step": 33510 }, { "epoch": 9.43, "learning_rate": 9.016462062287197e-05, "loss": 0.1418, "step": 33540 }, { "epoch": 9.44, "learning_rate": 9.014587823696624e-05, "loss": 0.1589, "step": 33570 }, { "epoch": 9.45, "learning_rate": 9.01271358510605e-05, "loss": 0.1331, "step": 33600 }, { "epoch": 9.45, "learning_rate": 9.010839346515478e-05, "loss": 0.1476, "step": 33630 }, { "epoch": 9.46, "learning_rate": 9.008965107924906e-05, "loss": 0.1456, "step": 33660 }, { "epoch": 9.47, "learning_rate": 9.007090869334333e-05, "loss": 0.1427, "step": 33690 }, { "epoch": 9.48, "learning_rate": 9.005216630743761e-05, "loss": 0.1528, "step": 33720 }, { "epoch": 9.49, "learning_rate": 9.003342392153188e-05, "loss": 0.1328, "step": 33750 }, { "epoch": 9.5, "learning_rate": 9.001468153562616e-05, "loss": 0.147, "step": 33780 }, { "epoch": 9.51, "learning_rate": 8.999593914972043e-05, "loss": 0.1503, "step": 33810 }, { "epoch": 9.51, "learning_rate": 8.997719676381471e-05, "loss": 0.1416, "step": 33840 }, { "epoch": 9.52, "learning_rate": 8.995845437790898e-05, "loss": 0.1699, "step": 33870 }, { "epoch": 9.53, "learning_rate": 8.993971199200324e-05, "loss": 0.1438, "step": 33900 }, { "epoch": 9.54, "learning_rate": 8.992096960609753e-05, "loss": 0.1845, "step": 33930 }, { "epoch": 9.55, "learning_rate": 8.990222722019181e-05, "loss": 0.1453, "step": 33960 }, { "epoch": 9.56, "learning_rate": 8.988348483428607e-05, "loss": 0.1379, "step": 33990 }, { "epoch": 9.56, "learning_rate": 8.986474244838034e-05, "loss": 0.1605, "step": 34020 }, { "epoch": 9.57, "learning_rate": 8.984600006247462e-05, "loss": 0.1322, "step": 34050 }, { "epoch": 9.58, "learning_rate": 8.98272576765689e-05, "loss": 0.1483, "step": 34080 }, { "epoch": 9.59, "learning_rate": 8.980851529066317e-05, "loss": 0.1529, "step": 34110 }, { "epoch": 9.6, "learning_rate": 8.978977290475745e-05, "loss": 0.1424, "step": 34140 }, { "epoch": 9.61, "learning_rate": 8.977103051885172e-05, "loss": 0.1585, "step": 34170 }, { "epoch": 9.61, "learning_rate": 8.9752288132946e-05, "loss": 0.1332, "step": 34200 }, { "epoch": 9.62, "learning_rate": 8.973354574704027e-05, "loss": 0.1488, "step": 34230 }, { "epoch": 9.63, "learning_rate": 8.971480336113455e-05, "loss": 0.1484, "step": 34260 }, { "epoch": 9.64, "learning_rate": 8.969606097522882e-05, "loss": 0.1382, "step": 34290 }, { "epoch": 9.65, "learning_rate": 8.967731858932308e-05, "loss": 0.1565, "step": 34320 }, { "epoch": 9.66, "learning_rate": 8.965857620341736e-05, "loss": 0.1494, "step": 34350 }, { "epoch": 9.67, "learning_rate": 8.963983381751165e-05, "loss": 0.1682, "step": 34380 }, { "epoch": 9.67, "learning_rate": 8.962109143160591e-05, "loss": 0.1465, "step": 34410 }, { "epoch": 9.68, "learning_rate": 8.960234904570018e-05, "loss": 0.1334, "step": 34440 }, { "epoch": 9.69, "learning_rate": 8.958360665979446e-05, "loss": 0.154, "step": 34470 }, { "epoch": 9.7, "learning_rate": 8.956486427388874e-05, "loss": 0.1351, "step": 34500 }, { "epoch": 9.71, "learning_rate": 8.954612188798301e-05, "loss": 0.1512, "step": 34530 }, { "epoch": 9.72, "learning_rate": 8.952737950207728e-05, "loss": 0.1509, "step": 34560 }, { "epoch": 9.72, "learning_rate": 8.950863711617156e-05, "loss": 0.1423, "step": 34590 }, { "epoch": 9.73, "learning_rate": 8.948989473026584e-05, "loss": 0.1546, "step": 34620 }, { "epoch": 9.74, "learning_rate": 8.94711523443601e-05, "loss": 0.1358, "step": 34650 }, { "epoch": 9.75, "learning_rate": 8.945240995845439e-05, "loss": 0.1512, "step": 34680 }, { "epoch": 9.76, "learning_rate": 8.943366757254865e-05, "loss": 0.1478, "step": 34710 }, { "epoch": 9.77, "learning_rate": 8.941492518664292e-05, "loss": 0.1393, "step": 34740 }, { "epoch": 9.77, "learning_rate": 8.93961828007372e-05, "loss": 0.1501, "step": 34770 }, { "epoch": 9.78, "learning_rate": 8.937744041483148e-05, "loss": 0.1328, "step": 34800 }, { "epoch": 9.79, "learning_rate": 8.935869802892575e-05, "loss": 0.1516, "step": 34830 }, { "epoch": 9.8, "learning_rate": 8.933995564302002e-05, "loss": 0.148, "step": 34860 }, { "epoch": 9.81, "learning_rate": 8.93212132571143e-05, "loss": 0.1357, "step": 34890 }, { "epoch": 9.82, "learning_rate": 8.930247087120858e-05, "loss": 0.161, "step": 34920 }, { "epoch": 9.83, "learning_rate": 8.928372848530285e-05, "loss": 0.1379, "step": 34950 }, { "epoch": 9.83, "learning_rate": 8.926498609939712e-05, "loss": 0.1554, "step": 34980 }, { "epoch": 9.84, "learning_rate": 8.92462437134914e-05, "loss": 0.1519, "step": 35010 }, { "epoch": 9.85, "learning_rate": 8.922750132758568e-05, "loss": 0.1393, "step": 35040 }, { "epoch": 9.86, "learning_rate": 8.920875894167995e-05, "loss": 0.1578, "step": 35070 }, { "epoch": 9.87, "learning_rate": 8.919001655577423e-05, "loss": 0.1331, "step": 35100 }, { "epoch": 9.88, "learning_rate": 8.91712741698685e-05, "loss": 0.1481, "step": 35130 }, { "epoch": 9.88, "learning_rate": 8.915253178396276e-05, "loss": 0.1467, "step": 35160 }, { "epoch": 9.89, "learning_rate": 8.913378939805704e-05, "loss": 0.1447, "step": 35190 }, { "epoch": 9.9, "learning_rate": 8.911504701215132e-05, "loss": 0.1507, "step": 35220 }, { "epoch": 9.91, "learning_rate": 8.909630462624559e-05, "loss": 0.1358, "step": 35250 }, { "epoch": 9.92, "learning_rate": 8.907756224033986e-05, "loss": 0.1411, "step": 35280 }, { "epoch": 9.93, "learning_rate": 8.905881985443414e-05, "loss": 0.145, "step": 35310 }, { "epoch": 9.94, "learning_rate": 8.904007746852842e-05, "loss": 0.14, "step": 35340 }, { "epoch": 9.94, "learning_rate": 8.902133508262269e-05, "loss": 0.1562, "step": 35370 }, { "epoch": 9.95, "learning_rate": 8.900259269671695e-05, "loss": 0.1337, "step": 35400 }, { "epoch": 9.96, "learning_rate": 8.898385031081124e-05, "loss": 0.1455, "step": 35430 }, { "epoch": 9.97, "learning_rate": 8.896510792490552e-05, "loss": 0.1489, "step": 35460 }, { "epoch": 9.98, "learning_rate": 8.894636553899978e-05, "loss": 0.1385, "step": 35490 }, { "epoch": 9.99, "learning_rate": 8.892762315309406e-05, "loss": 0.1525, "step": 35520 }, { "epoch": 9.99, "learning_rate": 8.890888076718833e-05, "loss": 0.1338, "step": 35550 }, { "epoch": 10.0, "eval_loss": 0.19677478075027466, "eval_runtime": 480.2192, "eval_samples_per_second": 33.387, "eval_steps_per_second": 1.045, "eval_wer": 0.18540253572257176, "step": 35570 }, { "epoch": 10.0, "learning_rate": 8.88901383812826e-05, "loss": 0.1577, "step": 35580 }, { "epoch": 10.01, "learning_rate": 8.887139599537688e-05, "loss": 0.126, "step": 35610 }, { "epoch": 10.02, "learning_rate": 8.885265360947116e-05, "loss": 0.1397, "step": 35640 }, { "epoch": 10.03, "learning_rate": 8.883391122356544e-05, "loss": 0.1469, "step": 35670 }, { "epoch": 10.04, "learning_rate": 8.88151688376597e-05, "loss": 0.1223, "step": 35700 }, { "epoch": 10.04, "learning_rate": 8.879642645175398e-05, "loss": 0.1476, "step": 35730 }, { "epoch": 10.05, "learning_rate": 8.877768406584826e-05, "loss": 0.1295, "step": 35760 }, { "epoch": 10.06, "learning_rate": 8.875894167994253e-05, "loss": 0.1416, "step": 35790 }, { "epoch": 10.07, "learning_rate": 8.874019929403679e-05, "loss": 0.1501, "step": 35820 }, { "epoch": 10.08, "learning_rate": 8.872145690813107e-05, "loss": 0.1268, "step": 35850 }, { "epoch": 10.09, "learning_rate": 8.870271452222536e-05, "loss": 0.1408, "step": 35880 }, { "epoch": 10.1, "learning_rate": 8.868397213631962e-05, "loss": 0.1251, "step": 35910 }, { "epoch": 10.1, "learning_rate": 8.86652297504139e-05, "loss": 0.1372, "step": 35940 }, { "epoch": 10.11, "learning_rate": 8.864648736450817e-05, "loss": 0.1599, "step": 35970 }, { "epoch": 10.12, "learning_rate": 8.862774497860244e-05, "loss": 0.1254, "step": 36000 }, { "epoch": 10.13, "learning_rate": 8.860900259269672e-05, "loss": 0.1437, "step": 36030 }, { "epoch": 10.14, "learning_rate": 8.8590260206791e-05, "loss": 0.1295, "step": 36060 }, { "epoch": 10.15, "learning_rate": 8.857214256708213e-05, "loss": 0.1405, "step": 36090 }, { "epoch": 10.15, "learning_rate": 8.855340018117641e-05, "loss": 0.1457, "step": 36120 }, { "epoch": 10.16, "learning_rate": 8.853465779527068e-05, "loss": 0.1312, "step": 36150 }, { "epoch": 10.17, "learning_rate": 8.851591540936494e-05, "loss": 0.1476, "step": 36180 }, { "epoch": 10.18, "learning_rate": 8.849717302345922e-05, "loss": 0.1384, "step": 36210 }, { "epoch": 10.19, "learning_rate": 8.84784306375535e-05, "loss": 0.1427, "step": 36240 }, { "epoch": 10.2, "learning_rate": 8.845968825164777e-05, "loss": 0.1544, "step": 36270 }, { "epoch": 10.21, "learning_rate": 8.844094586574204e-05, "loss": 0.1251, "step": 36300 }, { "epoch": 10.21, "learning_rate": 8.842220347983632e-05, "loss": 0.1529, "step": 36330 }, { "epoch": 10.22, "learning_rate": 8.840346109393059e-05, "loss": 0.1352, "step": 36360 }, { "epoch": 10.23, "learning_rate": 8.838471870802487e-05, "loss": 0.1373, "step": 36390 }, { "epoch": 10.24, "learning_rate": 8.836597632211915e-05, "loss": 0.1523, "step": 36420 }, { "epoch": 10.25, "learning_rate": 8.834723393621342e-05, "loss": 0.125, "step": 36450 }, { "epoch": 10.26, "learning_rate": 8.832849155030769e-05, "loss": 0.1466, "step": 36480 }, { "epoch": 10.26, "learning_rate": 8.830974916440197e-05, "loss": 0.1257, "step": 36510 }, { "epoch": 10.27, "learning_rate": 8.829100677849625e-05, "loss": 0.1424, "step": 36540 }, { "epoch": 10.28, "learning_rate": 8.827226439259051e-05, "loss": 0.1519, "step": 36570 }, { "epoch": 10.29, "learning_rate": 8.825352200668478e-05, "loss": 0.1251, "step": 36600 }, { "epoch": 10.3, "learning_rate": 8.823477962077906e-05, "loss": 0.1453, "step": 36630 }, { "epoch": 10.31, "learning_rate": 8.821603723487334e-05, "loss": 0.1313, "step": 36660 }, { "epoch": 10.31, "learning_rate": 8.819729484896761e-05, "loss": 0.1441, "step": 36690 }, { "epoch": 10.32, "learning_rate": 8.817855246306188e-05, "loss": 0.1528, "step": 36720 }, { "epoch": 10.33, "learning_rate": 8.815981007715616e-05, "loss": 0.1278, "step": 36750 }, { "epoch": 10.34, "learning_rate": 8.814106769125044e-05, "loss": 0.1456, "step": 36780 }, { "epoch": 10.35, "learning_rate": 8.812232530534471e-05, "loss": 0.1373, "step": 36810 }, { "epoch": 10.36, "learning_rate": 8.810358291943899e-05, "loss": 0.146, "step": 36840 }, { "epoch": 10.37, "learning_rate": 8.808484053353326e-05, "loss": 0.1453, "step": 36870 }, { "epoch": 10.37, "learning_rate": 8.806609814762752e-05, "loss": 0.1258, "step": 36900 }, { "epoch": 10.38, "learning_rate": 8.80473557617218e-05, "loss": 0.1607, "step": 36930 }, { "epoch": 10.39, "learning_rate": 8.802861337581609e-05, "loss": 0.1325, "step": 36960 }, { "epoch": 10.4, "learning_rate": 8.800987098991035e-05, "loss": 0.1382, "step": 36990 }, { "epoch": 10.41, "learning_rate": 8.799112860400462e-05, "loss": 0.1456, "step": 37020 }, { "epoch": 10.42, "learning_rate": 8.79723862180989e-05, "loss": 0.1236, "step": 37050 }, { "epoch": 10.42, "learning_rate": 8.795364383219318e-05, "loss": 0.1515, "step": 37080 }, { "epoch": 10.43, "learning_rate": 8.793490144628745e-05, "loss": 0.1295, "step": 37110 }, { "epoch": 10.44, "learning_rate": 8.791615906038172e-05, "loss": 0.1371, "step": 37140 }, { "epoch": 10.45, "learning_rate": 8.7897416674476e-05, "loss": 0.151, "step": 37170 }, { "epoch": 10.46, "learning_rate": 8.787867428857028e-05, "loss": 0.122, "step": 37200 }, { "epoch": 10.47, "learning_rate": 8.785993190266455e-05, "loss": 0.1449, "step": 37230 }, { "epoch": 10.48, "learning_rate": 8.784118951675883e-05, "loss": 0.1325, "step": 37260 }, { "epoch": 10.48, "learning_rate": 8.78224471308531e-05, "loss": 0.1402, "step": 37290 }, { "epoch": 10.49, "learning_rate": 8.780370474494736e-05, "loss": 0.1541, "step": 37320 }, { "epoch": 10.5, "learning_rate": 8.778496235904164e-05, "loss": 0.1226, "step": 37350 }, { "epoch": 10.51, "learning_rate": 8.776621997313592e-05, "loss": 0.1441, "step": 37380 }, { "epoch": 10.52, "learning_rate": 8.774747758723019e-05, "loss": 0.1264, "step": 37410 }, { "epoch": 10.53, "learning_rate": 8.772873520132446e-05, "loss": 0.1375, "step": 37440 }, { "epoch": 10.53, "learning_rate": 8.770999281541874e-05, "loss": 0.1486, "step": 37470 }, { "epoch": 10.54, "learning_rate": 8.769125042951302e-05, "loss": 0.1249, "step": 37500 }, { "epoch": 10.55, "learning_rate": 8.767250804360729e-05, "loss": 0.1508, "step": 37530 }, { "epoch": 10.56, "learning_rate": 8.765376565770156e-05, "loss": 0.1286, "step": 37560 }, { "epoch": 10.57, "learning_rate": 8.763502327179584e-05, "loss": 0.1402, "step": 37590 }, { "epoch": 10.58, "learning_rate": 8.761628088589012e-05, "loss": 0.1529, "step": 37620 }, { "epoch": 10.58, "learning_rate": 8.759753849998439e-05, "loss": 0.1225, "step": 37650 }, { "epoch": 10.59, "learning_rate": 8.757879611407867e-05, "loss": 0.1485, "step": 37680 }, { "epoch": 10.6, "learning_rate": 8.756005372817293e-05, "loss": 0.1306, "step": 37710 }, { "epoch": 10.61, "learning_rate": 8.75413113422672e-05, "loss": 0.1424, "step": 37740 }, { "epoch": 10.62, "learning_rate": 8.752256895636148e-05, "loss": 0.1507, "step": 37770 }, { "epoch": 10.63, "learning_rate": 8.750382657045576e-05, "loss": 0.1254, "step": 37800 }, { "epoch": 10.64, "learning_rate": 8.748508418455003e-05, "loss": 0.1455, "step": 37830 }, { "epoch": 10.64, "learning_rate": 8.74663417986443e-05, "loss": 0.134, "step": 37860 }, { "epoch": 10.65, "learning_rate": 8.744759941273858e-05, "loss": 0.1381, "step": 37890 }, { "epoch": 10.66, "learning_rate": 8.742885702683286e-05, "loss": 0.149, "step": 37920 }, { "epoch": 10.67, "learning_rate": 8.741011464092713e-05, "loss": 0.1205, "step": 37950 }, { "epoch": 10.68, "learning_rate": 8.73913722550214e-05, "loss": 0.1481, "step": 37980 }, { "epoch": 10.69, "learning_rate": 8.737262986911568e-05, "loss": 0.1385, "step": 38010 }, { "epoch": 10.69, "learning_rate": 8.735388748320996e-05, "loss": 0.1368, "step": 38040 }, { "epoch": 10.7, "learning_rate": 8.733514509730422e-05, "loss": 0.151, "step": 38070 }, { "epoch": 10.71, "learning_rate": 8.73164027113985e-05, "loss": 0.1279, "step": 38100 }, { "epoch": 10.72, "learning_rate": 8.729766032549277e-05, "loss": 0.1501, "step": 38130 }, { "epoch": 10.73, "learning_rate": 8.727891793958704e-05, "loss": 0.142, "step": 38160 }, { "epoch": 10.74, "learning_rate": 8.726017555368132e-05, "loss": 0.1391, "step": 38190 }, { "epoch": 10.74, "learning_rate": 8.72414331677756e-05, "loss": 0.1548, "step": 38220 }, { "epoch": 10.75, "learning_rate": 8.722269078186987e-05, "loss": 0.1266, "step": 38250 }, { "epoch": 10.76, "learning_rate": 8.720394839596414e-05, "loss": 0.1479, "step": 38280 }, { "epoch": 10.77, "learning_rate": 8.718520601005842e-05, "loss": 0.1385, "step": 38310 }, { "epoch": 10.78, "learning_rate": 8.71664636241527e-05, "loss": 0.1431, "step": 38340 }, { "epoch": 10.79, "learning_rate": 8.714772123824697e-05, "loss": 0.1527, "step": 38370 }, { "epoch": 10.8, "learning_rate": 8.712897885234123e-05, "loss": 0.1253, "step": 38400 }, { "epoch": 10.8, "learning_rate": 8.711023646643551e-05, "loss": 0.1533, "step": 38430 }, { "epoch": 10.81, "learning_rate": 8.70914940805298e-05, "loss": 0.1286, "step": 38460 }, { "epoch": 10.82, "learning_rate": 8.707275169462406e-05, "loss": 0.1318, "step": 38490 }, { "epoch": 10.83, "learning_rate": 8.705463405491519e-05, "loss": 0.1631, "step": 38520 }, { "epoch": 10.84, "learning_rate": 8.703589166900947e-05, "loss": 0.1207, "step": 38550 }, { "epoch": 10.85, "learning_rate": 8.701714928310374e-05, "loss": 0.1482, "step": 38580 }, { "epoch": 10.85, "learning_rate": 8.699840689719802e-05, "loss": 0.1333, "step": 38610 }, { "epoch": 10.86, "learning_rate": 8.697966451129229e-05, "loss": 0.144, "step": 38640 }, { "epoch": 10.87, "learning_rate": 8.696092212538657e-05, "loss": 0.1588, "step": 38670 }, { "epoch": 10.88, "learning_rate": 8.694217973948085e-05, "loss": 0.1212, "step": 38700 }, { "epoch": 10.89, "learning_rate": 8.692343735357512e-05, "loss": 0.1465, "step": 38730 }, { "epoch": 10.9, "learning_rate": 8.690469496766938e-05, "loss": 0.1286, "step": 38760 }, { "epoch": 10.91, "learning_rate": 8.688595258176366e-05, "loss": 0.146, "step": 38790 }, { "epoch": 10.91, "learning_rate": 8.686721019585795e-05, "loss": 0.1503, "step": 38820 }, { "epoch": 10.92, "learning_rate": 8.684846780995221e-05, "loss": 0.1341, "step": 38850 }, { "epoch": 10.93, "learning_rate": 8.682972542404648e-05, "loss": 0.1495, "step": 38880 }, { "epoch": 10.94, "learning_rate": 8.681098303814076e-05, "loss": 0.1285, "step": 38910 }, { "epoch": 10.95, "learning_rate": 8.679224065223503e-05, "loss": 0.1437, "step": 38940 }, { "epoch": 10.96, "learning_rate": 8.677349826632931e-05, "loss": 0.1519, "step": 38970 }, { "epoch": 10.96, "learning_rate": 8.675475588042358e-05, "loss": 0.1245, "step": 39000 }, { "epoch": 10.97, "learning_rate": 8.673601349451786e-05, "loss": 0.1472, "step": 39030 }, { "epoch": 10.98, "learning_rate": 8.671727110861213e-05, "loss": 0.1323, "step": 39060 }, { "epoch": 10.99, "learning_rate": 8.66985287227064e-05, "loss": 0.1388, "step": 39090 }, { "epoch": 11.0, "learning_rate": 8.667978633680069e-05, "loss": 0.1478, "step": 39120 }, { "epoch": 11.0, "eval_loss": 0.1963042914867401, "eval_runtime": 479.3311, "eval_samples_per_second": 33.449, "eval_steps_per_second": 1.047, "eval_wer": 0.18230453236526414, "step": 39127 }, { "epoch": 11.01, "learning_rate": 8.666104395089496e-05, "loss": 0.1225, "step": 39150 }, { "epoch": 11.01, "learning_rate": 8.664230156498922e-05, "loss": 0.1408, "step": 39180 }, { "epoch": 11.02, "learning_rate": 8.66235591790835e-05, "loss": 0.1196, "step": 39210 }, { "epoch": 11.03, "learning_rate": 8.660481679317778e-05, "loss": 0.135, "step": 39240 }, { "epoch": 11.04, "learning_rate": 8.658607440727205e-05, "loss": 0.1295, "step": 39270 }, { "epoch": 11.05, "learning_rate": 8.656733202136632e-05, "loss": 0.1283, "step": 39300 }, { "epoch": 11.06, "learning_rate": 8.65485896354606e-05, "loss": 0.1426, "step": 39330 }, { "epoch": 11.07, "learning_rate": 8.652984724955487e-05, "loss": 0.1163, "step": 39360 }, { "epoch": 11.07, "learning_rate": 8.651110486364915e-05, "loss": 0.1324, "step": 39390 }, { "epoch": 11.08, "learning_rate": 8.649236247774342e-05, "loss": 0.1245, "step": 39420 }, { "epoch": 11.09, "learning_rate": 8.64736200918377e-05, "loss": 0.1335, "step": 39450 }, { "epoch": 11.1, "learning_rate": 8.645487770593196e-05, "loss": 0.1421, "step": 39480 }, { "epoch": 11.11, "learning_rate": 8.643613532002625e-05, "loss": 0.119, "step": 39510 }, { "epoch": 11.12, "learning_rate": 8.641739293412053e-05, "loss": 0.1411, "step": 39540 }, { "epoch": 11.12, "learning_rate": 8.63986505482148e-05, "loss": 0.1278, "step": 39570 }, { "epoch": 11.13, "learning_rate": 8.637990816230906e-05, "loss": 0.1336, "step": 39600 }, { "epoch": 11.14, "learning_rate": 8.636116577640334e-05, "loss": 0.143, "step": 39630 }, { "epoch": 11.15, "learning_rate": 8.634242339049762e-05, "loss": 0.1256, "step": 39660 }, { "epoch": 11.16, "learning_rate": 8.632368100459189e-05, "loss": 0.1332, "step": 39690 }, { "epoch": 11.17, "learning_rate": 8.630493861868616e-05, "loss": 0.1258, "step": 39720 }, { "epoch": 11.18, "learning_rate": 8.628619623278044e-05, "loss": 0.1286, "step": 39750 }, { "epoch": 11.18, "learning_rate": 8.62674538468747e-05, "loss": 0.1467, "step": 39780 }, { "epoch": 11.19, "learning_rate": 8.624871146096899e-05, "loss": 0.1143, "step": 39810 }, { "epoch": 11.2, "learning_rate": 8.622996907506325e-05, "loss": 0.1353, "step": 39840 }, { "epoch": 11.21, "learning_rate": 8.621122668915754e-05, "loss": 0.1315, "step": 39870 }, { "epoch": 11.22, "learning_rate": 8.61924843032518e-05, "loss": 0.1311, "step": 39900 }, { "epoch": 11.23, "learning_rate": 8.617374191734608e-05, "loss": 0.1403, "step": 39930 }, { "epoch": 11.23, "learning_rate": 8.615499953144037e-05, "loss": 0.1215, "step": 39960 }, { "epoch": 11.24, "learning_rate": 8.613625714553463e-05, "loss": 0.1423, "step": 39990 }, { "epoch": 11.25, "learning_rate": 8.61175147596289e-05, "loss": 0.1286, "step": 40020 }, { "epoch": 11.26, "learning_rate": 8.609877237372318e-05, "loss": 0.1436, "step": 40050 }, { "epoch": 11.27, "learning_rate": 8.608002998781746e-05, "loss": 0.1448, "step": 40080 }, { "epoch": 11.28, "learning_rate": 8.606128760191172e-05, "loss": 0.1137, "step": 40110 }, { "epoch": 11.28, "learning_rate": 8.6042545216006e-05, "loss": 0.1395, "step": 40140 }, { "epoch": 11.29, "learning_rate": 8.602380283010028e-05, "loss": 0.129, "step": 40170 }, { "epoch": 11.3, "learning_rate": 8.600506044419455e-05, "loss": 0.1381, "step": 40200 }, { "epoch": 11.31, "learning_rate": 8.598631805828883e-05, "loss": 0.1547, "step": 40230 }, { "epoch": 11.32, "learning_rate": 8.59675756723831e-05, "loss": 0.1182, "step": 40260 }, { "epoch": 11.33, "learning_rate": 8.594883328647737e-05, "loss": 0.1422, "step": 40290 }, { "epoch": 11.34, "learning_rate": 8.593009090057164e-05, "loss": 0.1323, "step": 40320 }, { "epoch": 11.34, "learning_rate": 8.591134851466592e-05, "loss": 0.1241, "step": 40350 }, { "epoch": 11.35, "learning_rate": 8.58926061287602e-05, "loss": 0.1451, "step": 40380 }, { "epoch": 11.36, "learning_rate": 8.587386374285447e-05, "loss": 0.1225, "step": 40410 }, { "epoch": 11.37, "learning_rate": 8.585512135694874e-05, "loss": 0.1381, "step": 40440 }, { "epoch": 11.38, "learning_rate": 8.583637897104302e-05, "loss": 0.1275, "step": 40470 }, { "epoch": 11.39, "learning_rate": 8.58176365851373e-05, "loss": 0.1301, "step": 40500 }, { "epoch": 11.39, "learning_rate": 8.579889419923155e-05, "loss": 0.1473, "step": 40530 }, { "epoch": 11.4, "learning_rate": 8.578015181332584e-05, "loss": 0.1212, "step": 40560 }, { "epoch": 11.41, "learning_rate": 8.576140942742012e-05, "loss": 0.1399, "step": 40590 }, { "epoch": 11.42, "learning_rate": 8.57426670415144e-05, "loss": 0.1206, "step": 40620 }, { "epoch": 11.43, "learning_rate": 8.572392465560866e-05, "loss": 0.1391, "step": 40650 }, { "epoch": 11.44, "learning_rate": 8.570518226970293e-05, "loss": 0.1464, "step": 40680 }, { "epoch": 11.44, "learning_rate": 8.568643988379721e-05, "loss": 0.1203, "step": 40710 }, { "epoch": 11.45, "learning_rate": 8.566769749789148e-05, "loss": 0.1393, "step": 40740 }, { "epoch": 11.46, "learning_rate": 8.564895511198576e-05, "loss": 0.1302, "step": 40770 }, { "epoch": 11.47, "learning_rate": 8.563021272608004e-05, "loss": 0.1356, "step": 40800 }, { "epoch": 11.48, "learning_rate": 8.561147034017431e-05, "loss": 0.1402, "step": 40830 }, { "epoch": 11.49, "learning_rate": 8.559272795426858e-05, "loss": 0.1223, "step": 40860 }, { "epoch": 11.5, "learning_rate": 8.557398556836286e-05, "loss": 0.1409, "step": 40890 }, { "epoch": 11.5, "learning_rate": 8.555524318245714e-05, "loss": 0.1258, "step": 40920 }, { "epoch": 11.51, "learning_rate": 8.55365007965514e-05, "loss": 0.1279, "step": 40950 }, { "epoch": 11.52, "learning_rate": 8.551775841064567e-05, "loss": 0.1434, "step": 40980 }, { "epoch": 11.53, "learning_rate": 8.549901602473995e-05, "loss": 0.1148, "step": 41010 }, { "epoch": 11.54, "learning_rate": 8.548027363883424e-05, "loss": 0.1429, "step": 41040 }, { "epoch": 11.55, "learning_rate": 8.54615312529285e-05, "loss": 0.1257, "step": 41070 }, { "epoch": 11.55, "learning_rate": 8.544278886702277e-05, "loss": 0.1344, "step": 41100 }, { "epoch": 11.56, "learning_rate": 8.542404648111705e-05, "loss": 0.1427, "step": 41130 }, { "epoch": 11.57, "learning_rate": 8.540530409521132e-05, "loss": 0.1237, "step": 41160 }, { "epoch": 11.58, "learning_rate": 8.53865617093056e-05, "loss": 0.1369, "step": 41190 }, { "epoch": 11.59, "learning_rate": 8.536781932339988e-05, "loss": 0.129, "step": 41220 }, { "epoch": 11.6, "learning_rate": 8.534907693749415e-05, "loss": 0.1385, "step": 41250 }, { "epoch": 11.61, "learning_rate": 8.533033455158842e-05, "loss": 0.1428, "step": 41280 }, { "epoch": 11.61, "learning_rate": 8.53115921656827e-05, "loss": 0.1188, "step": 41310 }, { "epoch": 11.62, "learning_rate": 8.529284977977698e-05, "loss": 0.1442, "step": 41340 }, { "epoch": 11.63, "learning_rate": 8.527410739387125e-05, "loss": 0.132, "step": 41370 }, { "epoch": 11.64, "learning_rate": 8.525536500796551e-05, "loss": 0.137, "step": 41400 }, { "epoch": 11.65, "learning_rate": 8.52366226220598e-05, "loss": 0.1439, "step": 41430 }, { "epoch": 11.66, "learning_rate": 8.521788023615407e-05, "loss": 0.1165, "step": 41460 }, { "epoch": 11.66, "learning_rate": 8.519913785024834e-05, "loss": 0.1331, "step": 41490 }, { "epoch": 11.67, "learning_rate": 8.518039546434261e-05, "loss": 0.1333, "step": 41520 }, { "epoch": 11.68, "learning_rate": 8.516165307843689e-05, "loss": 0.1305, "step": 41550 }, { "epoch": 11.69, "learning_rate": 8.514291069253116e-05, "loss": 0.1469, "step": 41580 }, { "epoch": 11.7, "learning_rate": 8.512416830662544e-05, "loss": 0.1196, "step": 41610 }, { "epoch": 11.71, "learning_rate": 8.510542592071972e-05, "loss": 0.1409, "step": 41640 }, { "epoch": 11.71, "learning_rate": 8.508668353481399e-05, "loss": 0.1287, "step": 41670 }, { "epoch": 11.72, "learning_rate": 8.506794114890825e-05, "loss": 0.1311, "step": 41700 }, { "epoch": 11.73, "learning_rate": 8.504919876300254e-05, "loss": 0.1521, "step": 41730 }, { "epoch": 11.74, "learning_rate": 8.503045637709682e-05, "loss": 0.1193, "step": 41760 }, { "epoch": 11.75, "learning_rate": 8.501171399119108e-05, "loss": 0.1292, "step": 41790 }, { "epoch": 11.76, "learning_rate": 8.499297160528535e-05, "loss": 0.1316, "step": 41820 }, { "epoch": 11.77, "learning_rate": 8.497422921937963e-05, "loss": 0.1282, "step": 41850 }, { "epoch": 11.77, "learning_rate": 8.495548683347391e-05, "loss": 0.1428, "step": 41880 }, { "epoch": 11.78, "learning_rate": 8.493674444756818e-05, "loss": 0.1231, "step": 41910 }, { "epoch": 11.79, "learning_rate": 8.491800206166245e-05, "loss": 0.1375, "step": 41940 }, { "epoch": 11.8, "learning_rate": 8.489925967575673e-05, "loss": 0.1259, "step": 41970 }, { "epoch": 11.81, "learning_rate": 8.4880517289851e-05, "loss": 0.1291, "step": 42000 }, { "epoch": 11.82, "learning_rate": 8.486177490394528e-05, "loss": 0.1446, "step": 42030 }, { "epoch": 11.82, "learning_rate": 8.484303251803956e-05, "loss": 0.12, "step": 42060 }, { "epoch": 11.83, "learning_rate": 8.482429013213383e-05, "loss": 0.1332, "step": 42090 }, { "epoch": 11.84, "learning_rate": 8.480617249242495e-05, "loss": 0.1232, "step": 42120 }, { "epoch": 11.85, "learning_rate": 8.478743010651923e-05, "loss": 0.1266, "step": 42150 }, { "epoch": 11.86, "learning_rate": 8.47686877206135e-05, "loss": 0.1501, "step": 42180 }, { "epoch": 11.87, "learning_rate": 8.474994533470778e-05, "loss": 0.1221, "step": 42210 }, { "epoch": 11.88, "learning_rate": 8.473120294880206e-05, "loss": 0.1365, "step": 42240 }, { "epoch": 11.88, "learning_rate": 8.471246056289632e-05, "loss": 0.1262, "step": 42270 }, { "epoch": 11.89, "learning_rate": 8.46937181769906e-05, "loss": 0.1313, "step": 42300 }, { "epoch": 11.9, "learning_rate": 8.467497579108488e-05, "loss": 0.1452, "step": 42330 }, { "epoch": 11.91, "learning_rate": 8.465623340517915e-05, "loss": 0.1246, "step": 42360 }, { "epoch": 11.92, "learning_rate": 8.463749101927343e-05, "loss": 0.1378, "step": 42390 }, { "epoch": 11.93, "learning_rate": 8.46187486333677e-05, "loss": 0.1265, "step": 42420 }, { "epoch": 11.93, "learning_rate": 8.460000624746198e-05, "loss": 0.1343, "step": 42450 }, { "epoch": 11.94, "learning_rate": 8.458126386155624e-05, "loss": 0.1391, "step": 42480 }, { "epoch": 11.95, "learning_rate": 8.456252147565052e-05, "loss": 0.1157, "step": 42510 }, { "epoch": 11.96, "learning_rate": 8.454377908974479e-05, "loss": 0.1359, "step": 42540 }, { "epoch": 11.97, "learning_rate": 8.452503670383907e-05, "loss": 0.1298, "step": 42570 }, { "epoch": 11.98, "learning_rate": 8.450629431793334e-05, "loss": 0.1291, "step": 42600 }, { "epoch": 11.98, "learning_rate": 8.448755193202762e-05, "loss": 0.1352, "step": 42630 }, { "epoch": 11.99, "learning_rate": 8.44688095461219e-05, "loss": 0.1177, "step": 42660 }, { "epoch": 12.0, "eval_loss": 0.19564659893512726, "eval_runtime": 478.632, "eval_samples_per_second": 33.498, "eval_steps_per_second": 1.049, "eval_wer": 0.17997079415337164, "step": 42684 }, { "epoch": 12.0, "learning_rate": 8.445006716021616e-05, "loss": 0.1475, "step": 42690 }, { "epoch": 12.01, "learning_rate": 8.443132477431044e-05, "loss": 0.1208, "step": 42720 }, { "epoch": 12.02, "learning_rate": 8.441258238840472e-05, "loss": 0.1224, "step": 42750 }, { "epoch": 12.03, "learning_rate": 8.439384000249899e-05, "loss": 0.1231, "step": 42780 }, { "epoch": 12.04, "learning_rate": 8.437509761659327e-05, "loss": 0.1231, "step": 42810 }, { "epoch": 12.04, "learning_rate": 8.435635523068753e-05, "loss": 0.1325, "step": 42840 }, { "epoch": 12.05, "learning_rate": 8.433761284478181e-05, "loss": 0.1167, "step": 42870 }, { "epoch": 12.06, "learning_rate": 8.431887045887608e-05, "loss": 0.1336, "step": 42900 }, { "epoch": 12.07, "learning_rate": 8.430012807297036e-05, "loss": 0.1248, "step": 42930 }, { "epoch": 12.08, "learning_rate": 8.428138568706463e-05, "loss": 0.1246, "step": 42960 }, { "epoch": 12.09, "learning_rate": 8.426264330115891e-05, "loss": 0.1269, "step": 42990 }, { "epoch": 12.09, "learning_rate": 8.424390091525318e-05, "loss": 0.1137, "step": 43020 }, { "epoch": 12.1, "learning_rate": 8.422515852934746e-05, "loss": 0.1239, "step": 43050 }, { "epoch": 12.11, "learning_rate": 8.420641614344174e-05, "loss": 0.1295, "step": 43080 }, { "epoch": 12.12, "learning_rate": 8.4187673757536e-05, "loss": 0.1244, "step": 43110 }, { "epoch": 12.13, "learning_rate": 8.416893137163028e-05, "loss": 0.136, "step": 43140 }, { "epoch": 12.14, "learning_rate": 8.415018898572456e-05, "loss": 0.1142, "step": 43170 }, { "epoch": 12.15, "learning_rate": 8.413144659981882e-05, "loss": 0.1349, "step": 43200 }, { "epoch": 12.15, "learning_rate": 8.41127042139131e-05, "loss": 0.1246, "step": 43230 }, { "epoch": 12.16, "learning_rate": 8.409396182800737e-05, "loss": 0.1244, "step": 43260 }, { "epoch": 12.17, "learning_rate": 8.407521944210165e-05, "loss": 0.1357, "step": 43290 }, { "epoch": 12.18, "learning_rate": 8.405647705619592e-05, "loss": 0.1175, "step": 43320 }, { "epoch": 12.19, "learning_rate": 8.40377346702902e-05, "loss": 0.1322, "step": 43350 }, { "epoch": 12.2, "learning_rate": 8.401899228438447e-05, "loss": 0.1274, "step": 43380 }, { "epoch": 12.2, "learning_rate": 8.400024989847875e-05, "loss": 0.1226, "step": 43410 }, { "epoch": 12.21, "learning_rate": 8.398150751257302e-05, "loss": 0.1399, "step": 43440 }, { "epoch": 12.22, "learning_rate": 8.39627651266673e-05, "loss": 0.1195, "step": 43470 }, { "epoch": 12.23, "learning_rate": 8.394402274076158e-05, "loss": 0.13, "step": 43500 }, { "epoch": 12.24, "learning_rate": 8.392528035485583e-05, "loss": 0.1324, "step": 43530 }, { "epoch": 12.25, "learning_rate": 8.390653796895011e-05, "loss": 0.1257, "step": 43560 }, { "epoch": 12.25, "learning_rate": 8.38877955830444e-05, "loss": 0.1363, "step": 43590 }, { "epoch": 12.26, "learning_rate": 8.386905319713866e-05, "loss": 0.1137, "step": 43620 }, { "epoch": 12.27, "learning_rate": 8.385031081123294e-05, "loss": 0.1262, "step": 43650 }, { "epoch": 12.28, "learning_rate": 8.383156842532721e-05, "loss": 0.1309, "step": 43680 }, { "epoch": 12.29, "learning_rate": 8.381282603942149e-05, "loss": 0.1266, "step": 43710 }, { "epoch": 12.3, "learning_rate": 8.379408365351576e-05, "loss": 0.1372, "step": 43740 }, { "epoch": 12.31, "learning_rate": 8.377534126761004e-05, "loss": 0.1164, "step": 43770 }, { "epoch": 12.31, "learning_rate": 8.375659888170431e-05, "loss": 0.1326, "step": 43800 }, { "epoch": 12.32, "learning_rate": 8.373785649579859e-05, "loss": 0.1297, "step": 43830 }, { "epoch": 12.33, "learning_rate": 8.371911410989286e-05, "loss": 0.1234, "step": 43860 }, { "epoch": 12.34, "learning_rate": 8.370037172398714e-05, "loss": 0.1377, "step": 43890 }, { "epoch": 12.35, "learning_rate": 8.368162933808142e-05, "loss": 0.1154, "step": 43920 }, { "epoch": 12.36, "learning_rate": 8.366288695217567e-05, "loss": 0.1382, "step": 43950 }, { "epoch": 12.36, "learning_rate": 8.364414456626995e-05, "loss": 0.1308, "step": 43980 }, { "epoch": 12.37, "learning_rate": 8.362540218036423e-05, "loss": 0.1279, "step": 44010 }, { "epoch": 12.38, "learning_rate": 8.360665979445851e-05, "loss": 0.1345, "step": 44040 }, { "epoch": 12.39, "learning_rate": 8.358791740855278e-05, "loss": 0.1167, "step": 44070 }, { "epoch": 12.4, "learning_rate": 8.356917502264705e-05, "loss": 0.1296, "step": 44100 }, { "epoch": 12.41, "learning_rate": 8.355043263674133e-05, "loss": 0.1288, "step": 44130 }, { "epoch": 12.41, "learning_rate": 8.35316902508356e-05, "loss": 0.121, "step": 44160 }, { "epoch": 12.42, "learning_rate": 8.351294786492988e-05, "loss": 0.1304, "step": 44190 }, { "epoch": 12.43, "learning_rate": 8.349420547902415e-05, "loss": 0.1198, "step": 44220 }, { "epoch": 12.44, "learning_rate": 8.347546309311843e-05, "loss": 0.1348, "step": 44250 }, { "epoch": 12.45, "learning_rate": 8.34567207072127e-05, "loss": 0.1269, "step": 44280 }, { "epoch": 12.46, "learning_rate": 8.343797832130698e-05, "loss": 0.1216, "step": 44310 }, { "epoch": 12.47, "learning_rate": 8.341923593540126e-05, "loss": 0.1321, "step": 44340 }, { "epoch": 12.47, "learning_rate": 8.340049354949551e-05, "loss": 0.1204, "step": 44370 }, { "epoch": 12.48, "learning_rate": 8.338175116358979e-05, "loss": 0.1322, "step": 44400 }, { "epoch": 12.49, "learning_rate": 8.336300877768407e-05, "loss": 0.1259, "step": 44430 }, { "epoch": 12.5, "learning_rate": 8.334426639177835e-05, "loss": 0.1233, "step": 44460 }, { "epoch": 12.51, "learning_rate": 8.332552400587261e-05, "loss": 0.1342, "step": 44490 }, { "epoch": 12.52, "learning_rate": 8.330678161996689e-05, "loss": 0.1143, "step": 44520 }, { "epoch": 12.52, "learning_rate": 8.328803923406117e-05, "loss": 0.1335, "step": 44550 }, { "epoch": 12.53, "learning_rate": 8.326929684815544e-05, "loss": 0.1285, "step": 44580 }, { "epoch": 12.54, "learning_rate": 8.325055446224972e-05, "loss": 0.1218, "step": 44610 }, { "epoch": 12.55, "learning_rate": 8.323181207634399e-05, "loss": 0.1364, "step": 44640 }, { "epoch": 12.56, "learning_rate": 8.321306969043827e-05, "loss": 0.1171, "step": 44670 }, { "epoch": 12.57, "learning_rate": 8.319432730453253e-05, "loss": 0.1374, "step": 44700 }, { "epoch": 12.58, "learning_rate": 8.317558491862681e-05, "loss": 0.1288, "step": 44730 }, { "epoch": 12.58, "learning_rate": 8.31568425327211e-05, "loss": 0.126, "step": 44760 }, { "epoch": 12.59, "learning_rate": 8.313810014681536e-05, "loss": 0.1404, "step": 44790 }, { "epoch": 12.6, "learning_rate": 8.311935776090963e-05, "loss": 0.1171, "step": 44820 }, { "epoch": 12.61, "learning_rate": 8.310061537500391e-05, "loss": 0.1304, "step": 44850 }, { "epoch": 12.62, "learning_rate": 8.308187298909819e-05, "loss": 0.1322, "step": 44880 }, { "epoch": 12.63, "learning_rate": 8.306313060319245e-05, "loss": 0.1237, "step": 44910 }, { "epoch": 12.63, "learning_rate": 8.304438821728673e-05, "loss": 0.1353, "step": 44940 }, { "epoch": 12.64, "learning_rate": 8.302564583138101e-05, "loss": 0.1161, "step": 44970 }, { "epoch": 12.65, "learning_rate": 8.300690344547528e-05, "loss": 0.1297, "step": 45000 }, { "epoch": 12.66, "learning_rate": 8.298816105956956e-05, "loss": 0.1286, "step": 45030 }, { "epoch": 12.67, "learning_rate": 8.296941867366382e-05, "loss": 0.1245, "step": 45060 }, { "epoch": 12.68, "learning_rate": 8.29506762877581e-05, "loss": 0.1329, "step": 45090 }, { "epoch": 12.68, "learning_rate": 8.293193390185237e-05, "loss": 0.1151, "step": 45120 }, { "epoch": 12.69, "learning_rate": 8.291319151594665e-05, "loss": 0.1302, "step": 45150 }, { "epoch": 12.7, "learning_rate": 8.289444913004093e-05, "loss": 0.1284, "step": 45180 }, { "epoch": 12.71, "learning_rate": 8.28757067441352e-05, "loss": 0.1236, "step": 45210 }, { "epoch": 12.72, "learning_rate": 8.285696435822947e-05, "loss": 0.1403, "step": 45240 }, { "epoch": 12.73, "learning_rate": 8.283822197232375e-05, "loss": 0.112, "step": 45270 }, { "epoch": 12.74, "learning_rate": 8.281947958641803e-05, "loss": 0.1292, "step": 45300 }, { "epoch": 12.74, "learning_rate": 8.280073720051228e-05, "loss": 0.1273, "step": 45330 }, { "epoch": 12.75, "learning_rate": 8.278199481460657e-05, "loss": 0.1233, "step": 45360 }, { "epoch": 12.76, "learning_rate": 8.276325242870085e-05, "loss": 0.1404, "step": 45390 }, { "epoch": 12.77, "learning_rate": 8.274451004279511e-05, "loss": 0.1222, "step": 45420 }, { "epoch": 12.78, "learning_rate": 8.27257676568894e-05, "loss": 0.1301, "step": 45450 }, { "epoch": 12.79, "learning_rate": 8.270702527098366e-05, "loss": 0.1326, "step": 45480 }, { "epoch": 12.79, "learning_rate": 8.268828288507794e-05, "loss": 0.1243, "step": 45510 }, { "epoch": 12.8, "learning_rate": 8.266954049917221e-05, "loss": 0.1403, "step": 45540 }, { "epoch": 12.81, "learning_rate": 8.265079811326649e-05, "loss": 0.1198, "step": 45570 }, { "epoch": 12.82, "learning_rate": 8.263205572736077e-05, "loss": 0.1254, "step": 45600 }, { "epoch": 12.83, "learning_rate": 8.261331334145504e-05, "loss": 0.1306, "step": 45630 }, { "epoch": 12.84, "learning_rate": 8.259457095554931e-05, "loss": 0.1267, "step": 45660 }, { "epoch": 12.84, "learning_rate": 8.257582856964359e-05, "loss": 0.139, "step": 45690 }, { "epoch": 12.85, "learning_rate": 8.255708618373787e-05, "loss": 0.1106, "step": 45720 }, { "epoch": 12.86, "learning_rate": 8.2538968544029e-05, "loss": 0.1351, "step": 45750 }, { "epoch": 12.87, "learning_rate": 8.252022615812326e-05, "loss": 0.1265, "step": 45780 }, { "epoch": 12.88, "learning_rate": 8.250148377221753e-05, "loss": 0.1185, "step": 45810 }, { "epoch": 12.89, "learning_rate": 8.248274138631181e-05, "loss": 0.1317, "step": 45840 }, { "epoch": 12.9, "learning_rate": 8.24639990004061e-05, "loss": 0.1265, "step": 45870 }, { "epoch": 12.9, "learning_rate": 8.244525661450036e-05, "loss": 0.1248, "step": 45900 }, { "epoch": 12.91, "learning_rate": 8.242651422859464e-05, "loss": 0.1273, "step": 45930 }, { "epoch": 12.92, "learning_rate": 8.240777184268891e-05, "loss": 0.1254, "step": 45960 }, { "epoch": 12.93, "learning_rate": 8.238902945678319e-05, "loss": 0.1422, "step": 45990 }, { "epoch": 12.94, "learning_rate": 8.237028707087746e-05, "loss": 0.1225, "step": 46020 }, { "epoch": 12.95, "learning_rate": 8.235154468497174e-05, "loss": 0.1304, "step": 46050 }, { "epoch": 12.95, "learning_rate": 8.2332802299066e-05, "loss": 0.1287, "step": 46080 }, { "epoch": 12.96, "learning_rate": 8.231405991316027e-05, "loss": 0.1254, "step": 46110 }, { "epoch": 12.97, "learning_rate": 8.229531752725455e-05, "loss": 0.1448, "step": 46140 }, { "epoch": 12.98, "learning_rate": 8.227657514134884e-05, "loss": 0.117, "step": 46170 }, { "epoch": 12.99, "learning_rate": 8.22578327554431e-05, "loss": 0.1298, "step": 46200 }, { "epoch": 13.0, "learning_rate": 8.223909036953737e-05, "loss": 0.1245, "step": 46230 }, { "epoch": 13.0, "eval_loss": 0.1889359951019287, "eval_runtime": 478.3965, "eval_samples_per_second": 33.514, "eval_steps_per_second": 1.049, "eval_wer": 0.17316746959998908, "step": 46241 }, { "epoch": 13.01, "learning_rate": 8.222034798363165e-05, "loss": 0.1197, "step": 46260 }, { "epoch": 13.01, "learning_rate": 8.220160559772593e-05, "loss": 0.1297, "step": 46290 }, { "epoch": 13.02, "learning_rate": 8.21828632118202e-05, "loss": 0.1108, "step": 46320 }, { "epoch": 13.03, "learning_rate": 8.216412082591448e-05, "loss": 0.1317, "step": 46350 }, { "epoch": 13.04, "learning_rate": 8.214537844000875e-05, "loss": 0.1133, "step": 46380 }, { "epoch": 13.05, "learning_rate": 8.212663605410303e-05, "loss": 0.1236, "step": 46410 }, { "epoch": 13.06, "learning_rate": 8.21078936681973e-05, "loss": 0.1254, "step": 46440 }, { "epoch": 13.06, "learning_rate": 8.208915128229158e-05, "loss": 0.1126, "step": 46470 }, { "epoch": 13.07, "learning_rate": 8.207040889638585e-05, "loss": 0.1321, "step": 46500 }, { "epoch": 13.08, "learning_rate": 8.205166651048011e-05, "loss": 0.1185, "step": 46530 }, { "epoch": 13.09, "learning_rate": 8.20329241245744e-05, "loss": 0.1262, "step": 46560 }, { "epoch": 13.1, "learning_rate": 8.201418173866867e-05, "loss": 0.1228, "step": 46590 }, { "epoch": 13.11, "learning_rate": 8.199543935276294e-05, "loss": 0.1105, "step": 46620 }, { "epoch": 13.11, "learning_rate": 8.197669696685721e-05, "loss": 0.1295, "step": 46650 }, { "epoch": 13.12, "learning_rate": 8.195795458095149e-05, "loss": 0.1089, "step": 46680 }, { "epoch": 13.13, "learning_rate": 8.193921219504577e-05, "loss": 0.1168, "step": 46710 }, { "epoch": 13.14, "learning_rate": 8.192046980914004e-05, "loss": 0.1319, "step": 46740 }, { "epoch": 13.15, "learning_rate": 8.190172742323432e-05, "loss": 0.1141, "step": 46770 }, { "epoch": 13.16, "learning_rate": 8.188298503732859e-05, "loss": 0.1327, "step": 46800 }, { "epoch": 13.17, "learning_rate": 8.186424265142287e-05, "loss": 0.1142, "step": 46830 }, { "epoch": 13.17, "learning_rate": 8.184550026551714e-05, "loss": 0.1268, "step": 46860 }, { "epoch": 13.18, "learning_rate": 8.182675787961142e-05, "loss": 0.1296, "step": 46890 }, { "epoch": 13.19, "learning_rate": 8.180801549370568e-05, "loss": 0.1103, "step": 46920 }, { "epoch": 13.2, "learning_rate": 8.178927310779995e-05, "loss": 0.1404, "step": 46950 }, { "epoch": 13.21, "learning_rate": 8.177053072189423e-05, "loss": 0.1145, "step": 46980 }, { "epoch": 13.22, "learning_rate": 8.175178833598851e-05, "loss": 0.1248, "step": 47010 }, { "epoch": 13.22, "learning_rate": 8.173304595008278e-05, "loss": 0.123, "step": 47040 }, { "epoch": 13.23, "learning_rate": 8.171430356417705e-05, "loss": 0.11, "step": 47070 }, { "epoch": 13.24, "learning_rate": 8.169556117827133e-05, "loss": 0.1269, "step": 47100 }, { "epoch": 13.25, "learning_rate": 8.167681879236561e-05, "loss": 0.118, "step": 47130 }, { "epoch": 13.26, "learning_rate": 8.165807640645988e-05, "loss": 0.1306, "step": 47160 }, { "epoch": 13.27, "learning_rate": 8.163933402055416e-05, "loss": 0.1242, "step": 47190 }, { "epoch": 13.28, "learning_rate": 8.162059163464843e-05, "loss": 0.1105, "step": 47220 }, { "epoch": 13.28, "learning_rate": 8.16018492487427e-05, "loss": 0.1311, "step": 47250 }, { "epoch": 13.29, "learning_rate": 8.158310686283697e-05, "loss": 0.1116, "step": 47280 }, { "epoch": 13.3, "learning_rate": 8.156436447693125e-05, "loss": 0.1219, "step": 47310 }, { "epoch": 13.31, "learning_rate": 8.154562209102552e-05, "loss": 0.1371, "step": 47340 }, { "epoch": 13.32, "learning_rate": 8.152687970511979e-05, "loss": 0.1145, "step": 47370 }, { "epoch": 13.33, "learning_rate": 8.150813731921407e-05, "loss": 0.1321, "step": 47400 }, { "epoch": 13.33, "learning_rate": 8.148939493330835e-05, "loss": 0.1164, "step": 47430 }, { "epoch": 13.34, "learning_rate": 8.147065254740263e-05, "loss": 0.1286, "step": 47460 }, { "epoch": 13.35, "learning_rate": 8.145191016149689e-05, "loss": 0.1307, "step": 47490 }, { "epoch": 13.36, "learning_rate": 8.143316777559117e-05, "loss": 0.1099, "step": 47520 }, { "epoch": 13.37, "learning_rate": 8.141442538968545e-05, "loss": 0.1275, "step": 47550 }, { "epoch": 13.38, "learning_rate": 8.139568300377972e-05, "loss": 0.1101, "step": 47580 }, { "epoch": 13.38, "learning_rate": 8.1376940617874e-05, "loss": 0.1284, "step": 47610 }, { "epoch": 13.39, "learning_rate": 8.135819823196826e-05, "loss": 0.1295, "step": 47640 }, { "epoch": 13.4, "learning_rate": 8.133945584606255e-05, "loss": 0.1114, "step": 47670 }, { "epoch": 13.41, "learning_rate": 8.132071346015681e-05, "loss": 0.1311, "step": 47700 }, { "epoch": 13.42, "learning_rate": 8.13019710742511e-05, "loss": 0.1133, "step": 47730 }, { "epoch": 13.43, "learning_rate": 8.128322868834536e-05, "loss": 0.1211, "step": 47760 }, { "epoch": 13.44, "learning_rate": 8.126448630243963e-05, "loss": 0.1273, "step": 47790 }, { "epoch": 13.44, "learning_rate": 8.124574391653391e-05, "loss": 0.1107, "step": 47820 }, { "epoch": 13.45, "learning_rate": 8.122700153062819e-05, "loss": 0.1235, "step": 47850 }, { "epoch": 13.46, "learning_rate": 8.120825914472247e-05, "loss": 0.1126, "step": 47880 }, { "epoch": 13.47, "learning_rate": 8.118951675881673e-05, "loss": 0.1345, "step": 47910 }, { "epoch": 13.48, "learning_rate": 8.1170774372911e-05, "loss": 0.1258, "step": 47940 }, { "epoch": 13.49, "learning_rate": 8.115203198700529e-05, "loss": 0.1151, "step": 47970 }, { "epoch": 13.49, "learning_rate": 8.113328960109955e-05, "loss": 0.1267, "step": 48000 }, { "epoch": 13.5, "learning_rate": 8.111454721519384e-05, "loss": 0.115, "step": 48030 }, { "epoch": 13.51, "learning_rate": 8.10958048292881e-05, "loss": 0.1229, "step": 48060 }, { "epoch": 13.52, "learning_rate": 8.107706244338238e-05, "loss": 0.1356, "step": 48090 }, { "epoch": 13.53, "learning_rate": 8.105832005747665e-05, "loss": 0.1159, "step": 48120 }, { "epoch": 13.54, "learning_rate": 8.103957767157093e-05, "loss": 0.1342, "step": 48150 }, { "epoch": 13.55, "learning_rate": 8.10208352856652e-05, "loss": 0.1118, "step": 48180 }, { "epoch": 13.55, "learning_rate": 8.100209289975948e-05, "loss": 0.1213, "step": 48210 }, { "epoch": 13.56, "learning_rate": 8.098335051385375e-05, "loss": 0.1283, "step": 48240 }, { "epoch": 13.57, "learning_rate": 8.096460812794803e-05, "loss": 0.1207, "step": 48270 }, { "epoch": 13.58, "learning_rate": 8.094649048823916e-05, "loss": 0.1269, "step": 48300 }, { "epoch": 13.59, "learning_rate": 8.092774810233344e-05, "loss": 0.1162, "step": 48330 }, { "epoch": 13.6, "learning_rate": 8.09090057164277e-05, "loss": 0.1253, "step": 48360 }, { "epoch": 13.6, "learning_rate": 8.089026333052197e-05, "loss": 0.1266, "step": 48390 }, { "epoch": 13.61, "learning_rate": 8.087152094461625e-05, "loss": 0.1125, "step": 48420 }, { "epoch": 13.62, "learning_rate": 8.085277855871053e-05, "loss": 0.125, "step": 48450 }, { "epoch": 13.63, "learning_rate": 8.08340361728048e-05, "loss": 0.1151, "step": 48480 }, { "epoch": 13.64, "learning_rate": 8.081529378689907e-05, "loss": 0.1226, "step": 48510 }, { "epoch": 13.65, "learning_rate": 8.079655140099335e-05, "loss": 0.1302, "step": 48540 }, { "epoch": 13.65, "learning_rate": 8.077780901508763e-05, "loss": 0.115, "step": 48570 }, { "epoch": 13.66, "learning_rate": 8.07590666291819e-05, "loss": 0.1313, "step": 48600 }, { "epoch": 13.67, "learning_rate": 8.074032424327618e-05, "loss": 0.1105, "step": 48630 }, { "epoch": 13.68, "learning_rate": 8.072158185737045e-05, "loss": 0.125, "step": 48660 }, { "epoch": 13.69, "learning_rate": 8.070283947146471e-05, "loss": 0.1268, "step": 48690 }, { "epoch": 13.7, "learning_rate": 8.0684097085559e-05, "loss": 0.1144, "step": 48720 }, { "epoch": 13.71, "learning_rate": 8.066535469965328e-05, "loss": 0.128, "step": 48750 }, { "epoch": 13.71, "learning_rate": 8.064661231374754e-05, "loss": 0.1158, "step": 48780 }, { "epoch": 13.72, "learning_rate": 8.062786992784181e-05, "loss": 0.1235, "step": 48810 }, { "epoch": 13.73, "learning_rate": 8.060912754193609e-05, "loss": 0.1263, "step": 48840 }, { "epoch": 13.74, "learning_rate": 8.059038515603037e-05, "loss": 0.1115, "step": 48870 }, { "epoch": 13.75, "learning_rate": 8.057164277012464e-05, "loss": 0.1304, "step": 48900 }, { "epoch": 13.76, "learning_rate": 8.055290038421891e-05, "loss": 0.1208, "step": 48930 }, { "epoch": 13.76, "learning_rate": 8.053415799831319e-05, "loss": 0.117, "step": 48960 }, { "epoch": 13.77, "learning_rate": 8.051541561240747e-05, "loss": 0.1305, "step": 48990 }, { "epoch": 13.78, "learning_rate": 8.049667322650174e-05, "loss": 0.1103, "step": 49020 }, { "epoch": 13.79, "learning_rate": 8.047793084059602e-05, "loss": 0.1299, "step": 49050 }, { "epoch": 13.8, "learning_rate": 8.045918845469029e-05, "loss": 0.1135, "step": 49080 }, { "epoch": 13.81, "learning_rate": 8.044044606878455e-05, "loss": 0.1247, "step": 49110 }, { "epoch": 13.81, "learning_rate": 8.042170368287883e-05, "loss": 0.1263, "step": 49140 }, { "epoch": 13.82, "learning_rate": 8.040296129697311e-05, "loss": 0.1101, "step": 49170 }, { "epoch": 13.83, "learning_rate": 8.038421891106738e-05, "loss": 0.1288, "step": 49200 }, { "epoch": 13.84, "learning_rate": 8.036547652516165e-05, "loss": 0.1181, "step": 49230 }, { "epoch": 13.85, "learning_rate": 8.034673413925593e-05, "loss": 0.1241, "step": 49260 }, { "epoch": 13.86, "learning_rate": 8.032799175335021e-05, "loss": 0.1287, "step": 49290 }, { "epoch": 13.87, "learning_rate": 8.030924936744448e-05, "loss": 0.1149, "step": 49320 }, { "epoch": 13.87, "learning_rate": 8.029050698153875e-05, "loss": 0.1251, "step": 49350 }, { "epoch": 13.88, "learning_rate": 8.027176459563303e-05, "loss": 0.1163, "step": 49380 }, { "epoch": 13.89, "learning_rate": 8.025302220972731e-05, "loss": 0.1359, "step": 49410 }, { "epoch": 13.9, "learning_rate": 8.023427982382158e-05, "loss": 0.1242, "step": 49440 }, { "epoch": 13.91, "learning_rate": 8.021553743791586e-05, "loss": 0.1106, "step": 49470 }, { "epoch": 13.92, "learning_rate": 8.019679505201012e-05, "loss": 0.1297, "step": 49500 }, { "epoch": 13.92, "learning_rate": 8.017805266610439e-05, "loss": 0.1153, "step": 49530 }, { "epoch": 13.93, "learning_rate": 8.015931028019867e-05, "loss": 0.1262, "step": 49560 }, { "epoch": 13.94, "learning_rate": 8.014056789429295e-05, "loss": 0.124, "step": 49590 }, { "epoch": 13.95, "learning_rate": 8.012182550838722e-05, "loss": 0.1129, "step": 49620 }, { "epoch": 13.96, "learning_rate": 8.010308312248149e-05, "loss": 0.1315, "step": 49650 }, { "epoch": 13.97, "learning_rate": 8.008434073657577e-05, "loss": 0.1142, "step": 49680 }, { "epoch": 13.98, "learning_rate": 8.006559835067005e-05, "loss": 0.1238, "step": 49710 }, { "epoch": 13.98, "learning_rate": 8.004685596476432e-05, "loss": 0.1246, "step": 49740 }, { "epoch": 13.99, "learning_rate": 8.002811357885859e-05, "loss": 0.1124, "step": 49770 }, { "epoch": 14.0, "eval_loss": 0.18678802251815796, "eval_runtime": 477.9923, "eval_samples_per_second": 33.542, "eval_steps_per_second": 1.05, "eval_wer": 0.17144104922686393, "step": 49798 }, { "epoch": 14.0, "learning_rate": 8.000937119295287e-05, "loss": 0.1446, "step": 49800 }, { "epoch": 14.01, "learning_rate": 7.999062880704715e-05, "loss": 0.1044, "step": 49830 }, { "epoch": 14.02, "learning_rate": 7.997188642114141e-05, "loss": 0.1248, "step": 49860 }, { "epoch": 14.03, "learning_rate": 7.99531440352357e-05, "loss": 0.1121, "step": 49890 }, { "epoch": 14.03, "learning_rate": 7.993440164932996e-05, "loss": 0.1138, "step": 49920 }, { "epoch": 14.04, "learning_rate": 7.991565926342423e-05, "loss": 0.1254, "step": 49950 }, { "epoch": 14.05, "learning_rate": 7.989691687751851e-05, "loss": 0.1065, "step": 49980 }, { "epoch": 14.06, "learning_rate": 7.987817449161279e-05, "loss": 0.121, "step": 50010 }, { "epoch": 14.07, "learning_rate": 7.985943210570706e-05, "loss": 0.1147, "step": 50040 }, { "epoch": 14.08, "learning_rate": 7.984068971980133e-05, "loss": 0.1176, "step": 50070 }, { "epoch": 14.08, "learning_rate": 7.982194733389561e-05, "loss": 0.1235, "step": 50100 }, { "epoch": 14.09, "learning_rate": 7.980320494798989e-05, "loss": 0.1075, "step": 50130 }, { "epoch": 14.1, "learning_rate": 7.978446256208416e-05, "loss": 0.1209, "step": 50160 }, { "epoch": 14.11, "learning_rate": 7.976572017617842e-05, "loss": 0.1125, "step": 50190 }, { "epoch": 14.12, "learning_rate": 7.97469777902727e-05, "loss": 0.116, "step": 50220 }, { "epoch": 14.13, "learning_rate": 7.972823540436699e-05, "loss": 0.1269, "step": 50250 }, { "epoch": 14.14, "learning_rate": 7.970949301846125e-05, "loss": 0.1052, "step": 50280 }, { "epoch": 14.14, "learning_rate": 7.969075063255553e-05, "loss": 0.1191, "step": 50310 }, { "epoch": 14.15, "learning_rate": 7.96720082466498e-05, "loss": 0.1106, "step": 50340 }, { "epoch": 14.16, "learning_rate": 7.965326586074407e-05, "loss": 0.1185, "step": 50370 }, { "epoch": 14.17, "learning_rate": 7.963452347483835e-05, "loss": 0.1263, "step": 50400 }, { "epoch": 14.18, "learning_rate": 7.961578108893263e-05, "loss": 0.102, "step": 50430 }, { "epoch": 14.19, "learning_rate": 7.95970387030269e-05, "loss": 0.1217, "step": 50460 }, { "epoch": 14.19, "learning_rate": 7.957829631712117e-05, "loss": 0.1099, "step": 50490 }, { "epoch": 14.2, "learning_rate": 7.955955393121545e-05, "loss": 0.1166, "step": 50520 }, { "epoch": 14.21, "learning_rate": 7.954081154530973e-05, "loss": 0.1237, "step": 50550 }, { "epoch": 14.22, "learning_rate": 7.9522069159404e-05, "loss": 0.1172, "step": 50580 }, { "epoch": 14.23, "learning_rate": 7.950332677349826e-05, "loss": 0.134, "step": 50610 }, { "epoch": 14.24, "learning_rate": 7.948458438759254e-05, "loss": 0.1155, "step": 50640 }, { "epoch": 14.25, "learning_rate": 7.946584200168682e-05, "loss": 0.1188, "step": 50670 }, { "epoch": 14.25, "learning_rate": 7.944709961578109e-05, "loss": 0.1204, "step": 50700 }, { "epoch": 14.26, "learning_rate": 7.942835722987537e-05, "loss": 0.1074, "step": 50730 }, { "epoch": 14.27, "learning_rate": 7.940961484396964e-05, "loss": 0.1268, "step": 50760 }, { "epoch": 14.28, "learning_rate": 7.939087245806391e-05, "loss": 0.1134, "step": 50790 }, { "epoch": 14.29, "learning_rate": 7.937213007215819e-05, "loss": 0.1181, "step": 50820 }, { "epoch": 14.3, "learning_rate": 7.935338768625247e-05, "loss": 0.1254, "step": 50850 }, { "epoch": 14.3, "learning_rate": 7.933464530034674e-05, "loss": 0.1021, "step": 50880 }, { "epoch": 14.31, "learning_rate": 7.9315902914441e-05, "loss": 0.1252, "step": 50910 }, { "epoch": 14.32, "learning_rate": 7.929716052853529e-05, "loss": 0.1114, "step": 50940 }, { "epoch": 14.33, "learning_rate": 7.927904288882641e-05, "loss": 0.1214, "step": 50970 }, { "epoch": 14.34, "learning_rate": 7.92603005029207e-05, "loss": 0.1237, "step": 51000 }, { "epoch": 14.35, "learning_rate": 7.924155811701497e-05, "loss": 0.1001, "step": 51030 }, { "epoch": 14.35, "learning_rate": 7.922281573110924e-05, "loss": 0.1224, "step": 51060 }, { "epoch": 14.36, "learning_rate": 7.920407334520351e-05, "loss": 0.1115, "step": 51090 }, { "epoch": 14.37, "learning_rate": 7.918533095929779e-05, "loss": 0.1233, "step": 51120 }, { "epoch": 14.38, "learning_rate": 7.916658857339206e-05, "loss": 0.1283, "step": 51150 }, { "epoch": 14.39, "learning_rate": 7.914784618748634e-05, "loss": 0.1084, "step": 51180 }, { "epoch": 14.4, "learning_rate": 7.91291038015806e-05, "loss": 0.1236, "step": 51210 }, { "epoch": 14.41, "learning_rate": 7.911036141567489e-05, "loss": 0.1153, "step": 51240 }, { "epoch": 14.41, "learning_rate": 7.909161902976915e-05, "loss": 0.1201, "step": 51270 }, { "epoch": 14.42, "learning_rate": 7.907287664386344e-05, "loss": 0.1267, "step": 51300 }, { "epoch": 14.43, "learning_rate": 7.905413425795772e-05, "loss": 0.1054, "step": 51330 }, { "epoch": 14.44, "learning_rate": 7.903539187205198e-05, "loss": 0.1218, "step": 51360 }, { "epoch": 14.45, "learning_rate": 7.901664948614625e-05, "loss": 0.1168, "step": 51390 }, { "epoch": 14.46, "learning_rate": 7.899790710024053e-05, "loss": 0.1181, "step": 51420 }, { "epoch": 14.46, "learning_rate": 7.897916471433481e-05, "loss": 0.1348, "step": 51450 }, { "epoch": 14.47, "learning_rate": 7.896042232842908e-05, "loss": 0.108, "step": 51480 }, { "epoch": 14.48, "learning_rate": 7.894167994252335e-05, "loss": 0.128, "step": 51510 }, { "epoch": 14.49, "learning_rate": 7.892293755661763e-05, "loss": 0.1127, "step": 51540 }, { "epoch": 14.5, "learning_rate": 7.89041951707119e-05, "loss": 0.1173, "step": 51570 }, { "epoch": 14.51, "learning_rate": 7.888545278480618e-05, "loss": 0.1281, "step": 51600 }, { "epoch": 14.51, "learning_rate": 7.886671039890044e-05, "loss": 0.105, "step": 51630 }, { "epoch": 14.52, "learning_rate": 7.884796801299473e-05, "loss": 0.1245, "step": 51660 }, { "epoch": 14.53, "learning_rate": 7.8829225627089e-05, "loss": 0.1153, "step": 51690 }, { "epoch": 14.54, "learning_rate": 7.881048324118327e-05, "loss": 0.1195, "step": 51720 }, { "epoch": 14.55, "learning_rate": 7.879174085527756e-05, "loss": 0.1238, "step": 51750 }, { "epoch": 14.56, "learning_rate": 7.877299846937182e-05, "loss": 0.1054, "step": 51780 }, { "epoch": 14.57, "learning_rate": 7.875425608346609e-05, "loss": 0.1259, "step": 51810 }, { "epoch": 14.57, "learning_rate": 7.873551369756037e-05, "loss": 0.1233, "step": 51840 }, { "epoch": 14.58, "learning_rate": 7.871677131165465e-05, "loss": 0.1216, "step": 51870 }, { "epoch": 14.59, "learning_rate": 7.869802892574892e-05, "loss": 0.1265, "step": 51900 }, { "epoch": 14.6, "learning_rate": 7.867928653984319e-05, "loss": 0.1006, "step": 51930 }, { "epoch": 14.61, "learning_rate": 7.866054415393747e-05, "loss": 0.1201, "step": 51960 }, { "epoch": 14.62, "learning_rate": 7.864180176803175e-05, "loss": 0.11, "step": 51990 }, { "epoch": 14.62, "learning_rate": 7.862305938212602e-05, "loss": 0.1239, "step": 52020 }, { "epoch": 14.63, "learning_rate": 7.860431699622028e-05, "loss": 0.1289, "step": 52050 }, { "epoch": 14.64, "learning_rate": 7.858557461031456e-05, "loss": 0.1077, "step": 52080 }, { "epoch": 14.65, "learning_rate": 7.856683222440883e-05, "loss": 0.1233, "step": 52110 }, { "epoch": 14.66, "learning_rate": 7.854808983850311e-05, "loss": 0.1114, "step": 52140 }, { "epoch": 14.67, "learning_rate": 7.85293474525974e-05, "loss": 0.1144, "step": 52170 }, { "epoch": 14.68, "learning_rate": 7.851060506669166e-05, "loss": 0.1286, "step": 52200 }, { "epoch": 14.68, "learning_rate": 7.849186268078593e-05, "loss": 0.107, "step": 52230 }, { "epoch": 14.69, "learning_rate": 7.847312029488021e-05, "loss": 0.1249, "step": 52260 }, { "epoch": 14.7, "learning_rate": 7.845437790897449e-05, "loss": 0.1106, "step": 52290 }, { "epoch": 14.71, "learning_rate": 7.843563552306876e-05, "loss": 0.1197, "step": 52320 }, { "epoch": 14.72, "learning_rate": 7.841689313716303e-05, "loss": 0.1247, "step": 52350 }, { "epoch": 14.73, "learning_rate": 7.83981507512573e-05, "loss": 0.1042, "step": 52380 }, { "epoch": 14.73, "learning_rate": 7.837940836535159e-05, "loss": 0.1233, "step": 52410 }, { "epoch": 14.74, "learning_rate": 7.836066597944585e-05, "loss": 0.1105, "step": 52440 }, { "epoch": 14.75, "learning_rate": 7.834192359354012e-05, "loss": 0.1189, "step": 52470 }, { "epoch": 14.76, "learning_rate": 7.83231812076344e-05, "loss": 0.1251, "step": 52500 }, { "epoch": 14.77, "learning_rate": 7.830443882172867e-05, "loss": 0.1052, "step": 52530 }, { "epoch": 14.78, "learning_rate": 7.828569643582295e-05, "loss": 0.1214, "step": 52560 }, { "epoch": 14.78, "learning_rate": 7.826695404991723e-05, "loss": 0.1133, "step": 52590 }, { "epoch": 14.79, "learning_rate": 7.82482116640115e-05, "loss": 0.1126, "step": 52620 }, { "epoch": 14.8, "learning_rate": 7.822946927810577e-05, "loss": 0.1238, "step": 52650 }, { "epoch": 14.81, "learning_rate": 7.821072689220005e-05, "loss": 0.1031, "step": 52680 }, { "epoch": 14.82, "learning_rate": 7.819198450629433e-05, "loss": 0.1207, "step": 52710 }, { "epoch": 14.83, "learning_rate": 7.81732421203886e-05, "loss": 0.1115, "step": 52740 }, { "epoch": 14.84, "learning_rate": 7.815449973448286e-05, "loss": 0.1096, "step": 52770 }, { "epoch": 14.84, "learning_rate": 7.813575734857715e-05, "loss": 0.1262, "step": 52800 }, { "epoch": 14.85, "learning_rate": 7.811701496267143e-05, "loss": 0.1025, "step": 52830 }, { "epoch": 14.86, "learning_rate": 7.80982725767657e-05, "loss": 0.1263, "step": 52860 }, { "epoch": 14.87, "learning_rate": 7.807953019085996e-05, "loss": 0.1144, "step": 52890 }, { "epoch": 14.88, "learning_rate": 7.806078780495424e-05, "loss": 0.1192, "step": 52920 }, { "epoch": 14.89, "learning_rate": 7.804204541904851e-05, "loss": 0.1352, "step": 52950 }, { "epoch": 14.89, "learning_rate": 7.802330303314279e-05, "loss": 0.1102, "step": 52980 }, { "epoch": 14.9, "learning_rate": 7.800456064723707e-05, "loss": 0.1233, "step": 53010 }, { "epoch": 14.91, "learning_rate": 7.798581826133134e-05, "loss": 0.1162, "step": 53040 }, { "epoch": 14.92, "learning_rate": 7.79670758754256e-05, "loss": 0.1214, "step": 53070 }, { "epoch": 14.93, "learning_rate": 7.794833348951989e-05, "loss": 0.1302, "step": 53100 }, { "epoch": 14.94, "learning_rate": 7.792959110361417e-05, "loss": 0.1029, "step": 53130 }, { "epoch": 14.95, "learning_rate": 7.791084871770844e-05, "loss": 0.1164, "step": 53160 }, { "epoch": 14.95, "learning_rate": 7.78921063318027e-05, "loss": 0.1147, "step": 53190 }, { "epoch": 14.96, "learning_rate": 7.787336394589698e-05, "loss": 0.1186, "step": 53220 }, { "epoch": 14.97, "learning_rate": 7.785462155999126e-05, "loss": 0.1225, "step": 53250 }, { "epoch": 14.98, "learning_rate": 7.783587917408553e-05, "loss": 0.1043, "step": 53280 }, { "epoch": 14.99, "learning_rate": 7.78171367881798e-05, "loss": 0.1225, "step": 53310 }, { "epoch": 15.0, "learning_rate": 7.779839440227408e-05, "loss": 0.1112, "step": 53340 }, { "epoch": 15.0, "eval_loss": 0.18052412569522858, "eval_runtime": 480.525, "eval_samples_per_second": 33.366, "eval_steps_per_second": 1.045, "eval_wer": 0.16497209067460047, "step": 53355 }, { "epoch": 15.0, "learning_rate": 7.777965201636835e-05, "loss": 0.1152, "step": 53370 }, { "epoch": 15.01, "learning_rate": 7.776090963046263e-05, "loss": 0.1118, "step": 53400 }, { "epoch": 15.02, "learning_rate": 7.774216724455691e-05, "loss": 0.1098, "step": 53430 }, { "epoch": 15.03, "learning_rate": 7.772342485865118e-05, "loss": 0.1218, "step": 53460 }, { "epoch": 15.04, "learning_rate": 7.770468247274544e-05, "loss": 0.1046, "step": 53490 }, { "epoch": 15.05, "learning_rate": 7.768594008683973e-05, "loss": 0.1181, "step": 53520 }, { "epoch": 15.05, "learning_rate": 7.7667197700934e-05, "loss": 0.11, "step": 53550 }, { "epoch": 15.06, "learning_rate": 7.764845531502827e-05, "loss": 0.1103, "step": 53580 }, { "epoch": 15.07, "learning_rate": 7.762971292912254e-05, "loss": 0.1236, "step": 53610 }, { "epoch": 15.08, "learning_rate": 7.761097054321682e-05, "loss": 0.1036, "step": 53640 }, { "epoch": 15.09, "learning_rate": 7.75922281573111e-05, "loss": 0.1174, "step": 53670 }, { "epoch": 15.1, "learning_rate": 7.757348577140537e-05, "loss": 0.1093, "step": 53700 }, { "epoch": 15.11, "learning_rate": 7.755474338549964e-05, "loss": 0.1113, "step": 53730 }, { "epoch": 15.11, "learning_rate": 7.753600099959392e-05, "loss": 0.1227, "step": 53760 }, { "epoch": 15.12, "learning_rate": 7.751725861368819e-05, "loss": 0.1027, "step": 53790 }, { "epoch": 15.13, "learning_rate": 7.749851622778247e-05, "loss": 0.1183, "step": 53820 }, { "epoch": 15.14, "learning_rate": 7.747977384187675e-05, "loss": 0.109, "step": 53850 }, { "epoch": 15.15, "learning_rate": 7.746103145597102e-05, "loss": 0.1085, "step": 53880 }, { "epoch": 15.16, "learning_rate": 7.744228907006528e-05, "loss": 0.1211, "step": 53910 }, { "epoch": 15.16, "learning_rate": 7.742354668415956e-05, "loss": 0.1044, "step": 53940 }, { "epoch": 15.17, "learning_rate": 7.740480429825385e-05, "loss": 0.1217, "step": 53970 }, { "epoch": 15.18, "learning_rate": 7.738606191234811e-05, "loss": 0.116, "step": 54000 }, { "epoch": 15.19, "learning_rate": 7.736731952644238e-05, "loss": 0.1133, "step": 54030 }, { "epoch": 15.2, "learning_rate": 7.734857714053666e-05, "loss": 0.1236, "step": 54060 }, { "epoch": 15.21, "learning_rate": 7.732983475463094e-05, "loss": 0.1054, "step": 54090 }, { "epoch": 15.22, "learning_rate": 7.731109236872521e-05, "loss": 0.1137, "step": 54120 }, { "epoch": 15.22, "learning_rate": 7.729234998281948e-05, "loss": 0.1101, "step": 54150 }, { "epoch": 15.23, "learning_rate": 7.727360759691376e-05, "loss": 0.1095, "step": 54180 }, { "epoch": 15.24, "learning_rate": 7.725486521100803e-05, "loss": 0.125, "step": 54210 }, { "epoch": 15.25, "learning_rate": 7.72361228251023e-05, "loss": 0.1027, "step": 54240 }, { "epoch": 15.26, "learning_rate": 7.721738043919659e-05, "loss": 0.1194, "step": 54270 }, { "epoch": 15.27, "learning_rate": 7.719863805329085e-05, "loss": 0.1073, "step": 54300 }, { "epoch": 15.27, "learning_rate": 7.717989566738512e-05, "loss": 0.1084, "step": 54330 }, { "epoch": 15.28, "learning_rate": 7.71611532814794e-05, "loss": 0.123, "step": 54360 }, { "epoch": 15.29, "learning_rate": 7.714241089557368e-05, "loss": 0.1038, "step": 54390 }, { "epoch": 15.3, "learning_rate": 7.712366850966795e-05, "loss": 0.1195, "step": 54420 }, { "epoch": 15.31, "learning_rate": 7.710492612376222e-05, "loss": 0.1125, "step": 54450 }, { "epoch": 15.32, "learning_rate": 7.70861837378565e-05, "loss": 0.1089, "step": 54480 }, { "epoch": 15.32, "learning_rate": 7.706744135195078e-05, "loss": 0.1225, "step": 54510 }, { "epoch": 15.33, "learning_rate": 7.704869896604505e-05, "loss": 0.1016, "step": 54540 }, { "epoch": 15.34, "learning_rate": 7.702995658013932e-05, "loss": 0.1209, "step": 54570 }, { "epoch": 15.35, "learning_rate": 7.70112141942336e-05, "loss": 0.1101, "step": 54600 }, { "epoch": 15.36, "learning_rate": 7.699247180832786e-05, "loss": 0.1126, "step": 54630 }, { "epoch": 15.37, "learning_rate": 7.697372942242214e-05, "loss": 0.1198, "step": 54660 }, { "epoch": 15.38, "learning_rate": 7.695498703651643e-05, "loss": 0.1039, "step": 54690 }, { "epoch": 15.38, "learning_rate": 7.69362446506107e-05, "loss": 0.1164, "step": 54720 }, { "epoch": 15.39, "learning_rate": 7.691750226470496e-05, "loss": 0.1102, "step": 54750 }, { "epoch": 15.4, "learning_rate": 7.689875987879924e-05, "loss": 0.1078, "step": 54780 }, { "epoch": 15.41, "learning_rate": 7.688001749289352e-05, "loss": 0.1205, "step": 54810 }, { "epoch": 15.42, "learning_rate": 7.686127510698779e-05, "loss": 0.1061, "step": 54840 }, { "epoch": 15.43, "learning_rate": 7.684253272108206e-05, "loss": 0.1205, "step": 54870 }, { "epoch": 15.43, "learning_rate": 7.682379033517634e-05, "loss": 0.1128, "step": 54900 }, { "epoch": 15.44, "learning_rate": 7.680504794927062e-05, "loss": 0.109, "step": 54930 }, { "epoch": 15.45, "learning_rate": 7.678630556336489e-05, "loss": 0.1243, "step": 54960 }, { "epoch": 15.46, "learning_rate": 7.676756317745915e-05, "loss": 0.1044, "step": 54990 }, { "epoch": 15.47, "learning_rate": 7.674882079155344e-05, "loss": 0.1143, "step": 55020 }, { "epoch": 15.48, "learning_rate": 7.673007840564772e-05, "loss": 0.1105, "step": 55050 }, { "epoch": 15.48, "learning_rate": 7.671133601974198e-05, "loss": 0.1089, "step": 55080 }, { "epoch": 15.49, "learning_rate": 7.669259363383626e-05, "loss": 0.1214, "step": 55110 }, { "epoch": 15.5, "learning_rate": 7.667385124793053e-05, "loss": 0.1021, "step": 55140 }, { "epoch": 15.51, "learning_rate": 7.66551088620248e-05, "loss": 0.124, "step": 55170 }, { "epoch": 15.52, "learning_rate": 7.663636647611908e-05, "loss": 0.1125, "step": 55200 }, { "epoch": 15.53, "learning_rate": 7.661762409021336e-05, "loss": 0.1154, "step": 55230 }, { "epoch": 15.54, "learning_rate": 7.659888170430763e-05, "loss": 0.125, "step": 55260 }, { "epoch": 15.54, "learning_rate": 7.65801393184019e-05, "loss": 0.1042, "step": 55290 }, { "epoch": 15.55, "learning_rate": 7.656139693249618e-05, "loss": 0.1173, "step": 55320 }, { "epoch": 15.56, "learning_rate": 7.654265454659046e-05, "loss": 0.1201, "step": 55350 }, { "epoch": 15.57, "learning_rate": 7.652391216068473e-05, "loss": 0.1115, "step": 55380 }, { "epoch": 15.58, "learning_rate": 7.650516977477899e-05, "loss": 0.1237, "step": 55410 }, { "epoch": 15.59, "learning_rate": 7.648642738887327e-05, "loss": 0.11, "step": 55440 }, { "epoch": 15.59, "learning_rate": 7.64683097491644e-05, "loss": 0.1174, "step": 55470 }, { "epoch": 15.6, "learning_rate": 7.644956736325868e-05, "loss": 0.1106, "step": 55500 }, { "epoch": 15.61, "learning_rate": 7.643082497735295e-05, "loss": 0.1088, "step": 55530 }, { "epoch": 15.62, "learning_rate": 7.641208259144723e-05, "loss": 0.1248, "step": 55560 }, { "epoch": 15.63, "learning_rate": 7.63933402055415e-05, "loss": 0.1051, "step": 55590 }, { "epoch": 15.64, "learning_rate": 7.637459781963578e-05, "loss": 0.121, "step": 55620 }, { "epoch": 15.65, "learning_rate": 7.635585543373005e-05, "loss": 0.1185, "step": 55650 }, { "epoch": 15.65, "learning_rate": 7.633711304782433e-05, "loss": 0.1174, "step": 55680 }, { "epoch": 15.66, "learning_rate": 7.631837066191861e-05, "loss": 0.1173, "step": 55710 }, { "epoch": 15.67, "learning_rate": 7.629962827601286e-05, "loss": 0.1022, "step": 55740 }, { "epoch": 15.68, "learning_rate": 7.628088589010714e-05, "loss": 0.1189, "step": 55770 }, { "epoch": 15.69, "learning_rate": 7.626214350420142e-05, "loss": 0.1106, "step": 55800 }, { "epoch": 15.7, "learning_rate": 7.62434011182957e-05, "loss": 0.1096, "step": 55830 }, { "epoch": 15.7, "learning_rate": 7.622465873238997e-05, "loss": 0.122, "step": 55860 }, { "epoch": 15.71, "learning_rate": 7.620591634648424e-05, "loss": 0.1078, "step": 55890 }, { "epoch": 15.72, "learning_rate": 7.618717396057852e-05, "loss": 0.1106, "step": 55920 }, { "epoch": 15.73, "learning_rate": 7.616843157467279e-05, "loss": 0.1087, "step": 55950 }, { "epoch": 15.74, "learning_rate": 7.614968918876707e-05, "loss": 0.115, "step": 55980 }, { "epoch": 15.75, "learning_rate": 7.613094680286134e-05, "loss": 0.1257, "step": 56010 }, { "epoch": 15.75, "learning_rate": 7.611220441695562e-05, "loss": 0.1011, "step": 56040 }, { "epoch": 15.76, "learning_rate": 7.609346203104989e-05, "loss": 0.1181, "step": 56070 }, { "epoch": 15.77, "learning_rate": 7.607471964514417e-05, "loss": 0.1134, "step": 56100 }, { "epoch": 15.78, "learning_rate": 7.605597725923845e-05, "loss": 0.1146, "step": 56130 }, { "epoch": 15.79, "learning_rate": 7.603723487333271e-05, "loss": 0.1225, "step": 56160 }, { "epoch": 15.8, "learning_rate": 7.601849248742698e-05, "loss": 0.1049, "step": 56190 }, { "epoch": 15.81, "learning_rate": 7.599975010152126e-05, "loss": 0.1238, "step": 56220 }, { "epoch": 15.81, "learning_rate": 7.598100771561554e-05, "loss": 0.1097, "step": 56250 }, { "epoch": 15.82, "learning_rate": 7.596226532970981e-05, "loss": 0.1109, "step": 56280 }, { "epoch": 15.83, "learning_rate": 7.594352294380408e-05, "loss": 0.1233, "step": 56310 }, { "epoch": 15.84, "learning_rate": 7.592478055789836e-05, "loss": 0.0993, "step": 56340 }, { "epoch": 15.85, "learning_rate": 7.590603817199263e-05, "loss": 0.1169, "step": 56370 }, { "epoch": 15.86, "learning_rate": 7.588729578608691e-05, "loss": 0.1185, "step": 56400 }, { "epoch": 15.86, "learning_rate": 7.586855340018118e-05, "loss": 0.1075, "step": 56430 }, { "epoch": 15.87, "learning_rate": 7.584981101427546e-05, "loss": 0.1231, "step": 56460 }, { "epoch": 15.88, "learning_rate": 7.583106862836972e-05, "loss": 0.1021, "step": 56490 }, { "epoch": 15.89, "learning_rate": 7.5812326242464e-05, "loss": 0.1184, "step": 56520 }, { "epoch": 15.9, "learning_rate": 7.579358385655829e-05, "loss": 0.1124, "step": 56550 }, { "epoch": 15.91, "learning_rate": 7.577484147065255e-05, "loss": 0.1109, "step": 56580 }, { "epoch": 15.91, "learning_rate": 7.575609908474682e-05, "loss": 0.1229, "step": 56610 }, { "epoch": 15.92, "learning_rate": 7.57373566988411e-05, "loss": 0.106, "step": 56640 }, { "epoch": 15.93, "learning_rate": 7.571861431293538e-05, "loss": 0.1108, "step": 56670 }, { "epoch": 15.94, "learning_rate": 7.569987192702965e-05, "loss": 0.1108, "step": 56700 }, { "epoch": 15.95, "learning_rate": 7.568112954112392e-05, "loss": 0.1114, "step": 56730 }, { "epoch": 15.96, "learning_rate": 7.56623871552182e-05, "loss": 0.1179, "step": 56760 }, { "epoch": 15.97, "learning_rate": 7.564364476931247e-05, "loss": 0.1047, "step": 56790 }, { "epoch": 15.97, "learning_rate": 7.562490238340675e-05, "loss": 0.1134, "step": 56820 }, { "epoch": 15.98, "learning_rate": 7.560615999750101e-05, "loss": 0.1205, "step": 56850 }, { "epoch": 15.99, "learning_rate": 7.55874176115953e-05, "loss": 0.1121, "step": 56880 }, { "epoch": 16.0, "learning_rate": 7.556867522568956e-05, "loss": 0.1209, "step": 56910 }, { "epoch": 16.0, "eval_loss": 0.18599531054496765, "eval_runtime": 482.85, "eval_samples_per_second": 33.205, "eval_steps_per_second": 1.04, "eval_wer": 0.16138959780546722, "step": 56912 }, { "epoch": 16.01, "learning_rate": 7.554993283978384e-05, "loss": 0.1057, "step": 56940 }, { "epoch": 16.02, "learning_rate": 7.553119045387812e-05, "loss": 0.1149, "step": 56970 }, { "epoch": 16.02, "learning_rate": 7.551244806797239e-05, "loss": 0.104, "step": 57000 }, { "epoch": 16.03, "learning_rate": 7.549370568206666e-05, "loss": 0.1114, "step": 57030 }, { "epoch": 16.04, "learning_rate": 7.547496329616094e-05, "loss": 0.1081, "step": 57060 }, { "epoch": 16.05, "learning_rate": 7.545622091025522e-05, "loss": 0.1041, "step": 57090 }, { "epoch": 16.06, "learning_rate": 7.543747852434949e-05, "loss": 0.1169, "step": 57120 }, { "epoch": 16.07, "learning_rate": 7.541873613844376e-05, "loss": 0.0974, "step": 57150 }, { "epoch": 16.08, "learning_rate": 7.539999375253804e-05, "loss": 0.1164, "step": 57180 }, { "epoch": 16.08, "learning_rate": 7.53812513666323e-05, "loss": 0.1173, "step": 57210 }, { "epoch": 16.09, "learning_rate": 7.536250898072659e-05, "loss": 0.1016, "step": 57240 }, { "epoch": 16.1, "learning_rate": 7.534376659482085e-05, "loss": 0.1165, "step": 57270 }, { "epoch": 16.11, "learning_rate": 7.532502420891513e-05, "loss": 0.102, "step": 57300 }, { "epoch": 16.12, "learning_rate": 7.53062818230094e-05, "loss": 0.1141, "step": 57330 }, { "epoch": 16.13, "learning_rate": 7.528753943710368e-05, "loss": 0.1121, "step": 57360 }, { "epoch": 16.13, "learning_rate": 7.526879705119796e-05, "loss": 0.104, "step": 57390 }, { "epoch": 16.14, "learning_rate": 7.525005466529223e-05, "loss": 0.1166, "step": 57420 }, { "epoch": 16.15, "learning_rate": 7.52313122793865e-05, "loss": 0.104, "step": 57450 }, { "epoch": 16.16, "learning_rate": 7.521256989348078e-05, "loss": 0.113, "step": 57480 }, { "epoch": 16.17, "learning_rate": 7.519382750757506e-05, "loss": 0.1123, "step": 57510 }, { "epoch": 16.18, "learning_rate": 7.517508512166933e-05, "loss": 0.1082, "step": 57540 }, { "epoch": 16.18, "learning_rate": 7.51563427357636e-05, "loss": 0.1162, "step": 57570 }, { "epoch": 16.19, "learning_rate": 7.513760034985788e-05, "loss": 0.104, "step": 57600 }, { "epoch": 16.2, "learning_rate": 7.511885796395214e-05, "loss": 0.1072, "step": 57630 }, { "epoch": 16.21, "learning_rate": 7.510011557804642e-05, "loss": 0.1094, "step": 57660 }, { "epoch": 16.22, "learning_rate": 7.508137319214069e-05, "loss": 0.1076, "step": 57690 }, { "epoch": 16.23, "learning_rate": 7.506263080623497e-05, "loss": 0.113, "step": 57720 }, { "epoch": 16.24, "learning_rate": 7.504388842032924e-05, "loss": 0.0999, "step": 57750 }, { "epoch": 16.24, "learning_rate": 7.502514603442352e-05, "loss": 0.1131, "step": 57780 }, { "epoch": 16.25, "learning_rate": 7.50064036485178e-05, "loss": 0.1118, "step": 57810 }, { "epoch": 16.26, "learning_rate": 7.498766126261207e-05, "loss": 0.1039, "step": 57840 }, { "epoch": 16.27, "learning_rate": 7.496891887670634e-05, "loss": 0.1186, "step": 57870 }, { "epoch": 16.28, "learning_rate": 7.495017649080062e-05, "loss": 0.1026, "step": 57900 }, { "epoch": 16.29, "learning_rate": 7.49314341048949e-05, "loss": 0.1134, "step": 57930 }, { "epoch": 16.29, "learning_rate": 7.491269171898917e-05, "loss": 0.1138, "step": 57960 }, { "epoch": 16.3, "learning_rate": 7.489394933308343e-05, "loss": 0.1086, "step": 57990 }, { "epoch": 16.31, "learning_rate": 7.487520694717771e-05, "loss": 0.1149, "step": 58020 }, { "epoch": 16.32, "learning_rate": 7.485646456127198e-05, "loss": 0.1041, "step": 58050 }, { "epoch": 16.33, "learning_rate": 7.483772217536626e-05, "loss": 0.132, "step": 58080 }, { "epoch": 16.34, "learning_rate": 7.481897978946053e-05, "loss": 0.114, "step": 58110 }, { "epoch": 16.35, "learning_rate": 7.480086214975167e-05, "loss": 0.1066, "step": 58140 }, { "epoch": 16.35, "learning_rate": 7.478211976384594e-05, "loss": 0.1142, "step": 58170 }, { "epoch": 16.36, "learning_rate": 7.476337737794022e-05, "loss": 0.1037, "step": 58200 }, { "epoch": 16.37, "learning_rate": 7.474463499203449e-05, "loss": 0.1154, "step": 58230 }, { "epoch": 16.38, "learning_rate": 7.472589260612877e-05, "loss": 0.109, "step": 58260 }, { "epoch": 16.39, "learning_rate": 7.470715022022305e-05, "loss": 0.1069, "step": 58290 }, { "epoch": 16.4, "learning_rate": 7.46884078343173e-05, "loss": 0.118, "step": 58320 }, { "epoch": 16.4, "learning_rate": 7.466966544841158e-05, "loss": 0.1016, "step": 58350 }, { "epoch": 16.41, "learning_rate": 7.465092306250586e-05, "loss": 0.1086, "step": 58380 }, { "epoch": 16.42, "learning_rate": 7.463218067660013e-05, "loss": 0.1108, "step": 58410 }, { "epoch": 16.43, "learning_rate": 7.46134382906944e-05, "loss": 0.1, "step": 58440 }, { "epoch": 16.44, "learning_rate": 7.459469590478868e-05, "loss": 0.1183, "step": 58470 }, { "epoch": 16.45, "learning_rate": 7.457595351888296e-05, "loss": 0.1011, "step": 58500 }, { "epoch": 16.45, "learning_rate": 7.455721113297723e-05, "loss": 0.1147, "step": 58530 }, { "epoch": 16.46, "learning_rate": 7.453846874707151e-05, "loss": 0.1079, "step": 58560 }, { "epoch": 16.47, "learning_rate": 7.451972636116578e-05, "loss": 0.1054, "step": 58590 }, { "epoch": 16.48, "learning_rate": 7.450098397526006e-05, "loss": 0.1135, "step": 58620 }, { "epoch": 16.49, "learning_rate": 7.448224158935433e-05, "loss": 0.1066, "step": 58650 }, { "epoch": 16.5, "learning_rate": 7.44634992034486e-05, "loss": 0.1149, "step": 58680 }, { "epoch": 16.51, "learning_rate": 7.444475681754289e-05, "loss": 0.1198, "step": 58710 }, { "epoch": 16.51, "learning_rate": 7.442601443163714e-05, "loss": 0.1022, "step": 58740 }, { "epoch": 16.52, "learning_rate": 7.440727204573142e-05, "loss": 0.1136, "step": 58770 }, { "epoch": 16.53, "learning_rate": 7.43885296598257e-05, "loss": 0.1034, "step": 58800 }, { "epoch": 16.54, "learning_rate": 7.436978727391997e-05, "loss": 0.1126, "step": 58830 }, { "epoch": 16.55, "learning_rate": 7.435104488801424e-05, "loss": 0.1137, "step": 58860 }, { "epoch": 16.56, "learning_rate": 7.433230250210852e-05, "loss": 0.102, "step": 58890 }, { "epoch": 16.56, "learning_rate": 7.43135601162028e-05, "loss": 0.1154, "step": 58920 }, { "epoch": 16.57, "learning_rate": 7.429481773029707e-05, "loss": 0.098, "step": 58950 }, { "epoch": 16.58, "learning_rate": 7.427607534439135e-05, "loss": 0.1214, "step": 58980 }, { "epoch": 16.59, "learning_rate": 7.425733295848562e-05, "loss": 0.1157, "step": 59010 }, { "epoch": 16.6, "learning_rate": 7.42385905725799e-05, "loss": 0.1017, "step": 59040 }, { "epoch": 16.61, "learning_rate": 7.421984818667416e-05, "loss": 0.1129, "step": 59070 }, { "epoch": 16.62, "learning_rate": 7.420110580076845e-05, "loss": 0.1024, "step": 59100 }, { "epoch": 16.62, "learning_rate": 7.418236341486273e-05, "loss": 0.1134, "step": 59130 }, { "epoch": 16.63, "learning_rate": 7.416362102895698e-05, "loss": 0.1085, "step": 59160 }, { "epoch": 16.64, "learning_rate": 7.414487864305126e-05, "loss": 0.1083, "step": 59190 }, { "epoch": 16.65, "learning_rate": 7.412613625714554e-05, "loss": 0.1192, "step": 59220 }, { "epoch": 16.66, "learning_rate": 7.410739387123982e-05, "loss": 0.1021, "step": 59250 }, { "epoch": 16.67, "learning_rate": 7.408865148533408e-05, "loss": 0.1139, "step": 59280 }, { "epoch": 16.67, "learning_rate": 7.406990909942836e-05, "loss": 0.1098, "step": 59310 }, { "epoch": 16.68, "learning_rate": 7.405116671352264e-05, "loss": 0.1042, "step": 59340 }, { "epoch": 16.69, "learning_rate": 7.40324243276169e-05, "loss": 0.1161, "step": 59370 }, { "epoch": 16.7, "learning_rate": 7.401368194171119e-05, "loss": 0.104, "step": 59400 }, { "epoch": 16.71, "learning_rate": 7.399493955580545e-05, "loss": 0.1136, "step": 59430 }, { "epoch": 16.72, "learning_rate": 7.397619716989974e-05, "loss": 0.1141, "step": 59460 }, { "epoch": 16.72, "learning_rate": 7.3957454783994e-05, "loss": 0.1043, "step": 59490 }, { "epoch": 16.73, "learning_rate": 7.393871239808828e-05, "loss": 0.1129, "step": 59520 }, { "epoch": 16.74, "learning_rate": 7.391997001218255e-05, "loss": 0.1023, "step": 59550 }, { "epoch": 16.75, "learning_rate": 7.390185237247369e-05, "loss": 0.1085, "step": 59580 }, { "epoch": 16.76, "learning_rate": 7.388310998656796e-05, "loss": 0.1074, "step": 59610 }, { "epoch": 16.77, "learning_rate": 7.386436760066223e-05, "loss": 0.1013, "step": 59640 }, { "epoch": 16.78, "learning_rate": 7.384562521475651e-05, "loss": 0.1198, "step": 59670 }, { "epoch": 16.78, "learning_rate": 7.382688282885079e-05, "loss": 0.0998, "step": 59700 }, { "epoch": 16.79, "learning_rate": 7.380814044294506e-05, "loss": 0.1151, "step": 59730 }, { "epoch": 16.8, "learning_rate": 7.378939805703932e-05, "loss": 0.11, "step": 59760 }, { "epoch": 16.81, "learning_rate": 7.37706556711336e-05, "loss": 0.1066, "step": 59790 }, { "epoch": 16.82, "learning_rate": 7.375191328522789e-05, "loss": 0.1179, "step": 59820 }, { "epoch": 16.83, "learning_rate": 7.373317089932215e-05, "loss": 0.0971, "step": 59850 }, { "epoch": 16.83, "learning_rate": 7.371442851341643e-05, "loss": 0.1134, "step": 59880 }, { "epoch": 16.84, "learning_rate": 7.36956861275107e-05, "loss": 0.1158, "step": 59910 }, { "epoch": 16.85, "learning_rate": 7.367694374160497e-05, "loss": 0.1018, "step": 59940 }, { "epoch": 16.86, "learning_rate": 7.365820135569925e-05, "loss": 0.1129, "step": 59970 }, { "epoch": 16.87, "learning_rate": 7.363945896979353e-05, "loss": 0.1013, "step": 60000 }, { "epoch": 16.88, "learning_rate": 7.36207165838878e-05, "loss": 0.1144, "step": 60030 }, { "epoch": 16.88, "learning_rate": 7.360197419798207e-05, "loss": 0.1108, "step": 60060 }, { "epoch": 16.89, "learning_rate": 7.358323181207635e-05, "loss": 0.1038, "step": 60090 }, { "epoch": 16.9, "learning_rate": 7.356448942617063e-05, "loss": 0.1161, "step": 60120 }, { "epoch": 16.91, "learning_rate": 7.35457470402649e-05, "loss": 0.1002, "step": 60150 }, { "epoch": 16.92, "learning_rate": 7.352700465435916e-05, "loss": 0.1178, "step": 60180 }, { "epoch": 16.93, "learning_rate": 7.350826226845344e-05, "loss": 0.1102, "step": 60210 }, { "epoch": 16.94, "learning_rate": 7.348951988254772e-05, "loss": 0.1, "step": 60240 }, { "epoch": 16.94, "learning_rate": 7.347077749664199e-05, "loss": 0.1173, "step": 60270 }, { "epoch": 16.95, "learning_rate": 7.345203511073626e-05, "loss": 0.1006, "step": 60300 }, { "epoch": 16.96, "learning_rate": 7.343329272483054e-05, "loss": 0.107, "step": 60330 }, { "epoch": 16.97, "learning_rate": 7.341455033892482e-05, "loss": 0.1133, "step": 60360 }, { "epoch": 16.98, "learning_rate": 7.339580795301909e-05, "loss": 0.1079, "step": 60390 }, { "epoch": 16.99, "learning_rate": 7.337706556711337e-05, "loss": 0.1203, "step": 60420 }, { "epoch": 16.99, "learning_rate": 7.335832318120764e-05, "loss": 0.1002, "step": 60450 }, { "epoch": 17.0, "eval_loss": 0.18275776505470276, "eval_runtime": 488.8565, "eval_samples_per_second": 32.797, "eval_steps_per_second": 1.027, "eval_wer": 0.16040697118993352, "step": 60469 }, { "epoch": 17.0, "learning_rate": 7.33395807953019e-05, "loss": 0.1185, "step": 60480 }, { "epoch": 17.01, "learning_rate": 7.332083840939619e-05, "loss": 0.1053, "step": 60510 }, { "epoch": 17.02, "learning_rate": 7.330209602349047e-05, "loss": 0.1076, "step": 60540 }, { "epoch": 17.03, "learning_rate": 7.328335363758473e-05, "loss": 0.1197, "step": 60570 }, { "epoch": 17.04, "learning_rate": 7.3264611251679e-05, "loss": 0.0961, "step": 60600 }, { "epoch": 17.05, "learning_rate": 7.324586886577328e-05, "loss": 0.1129, "step": 60630 }, { "epoch": 17.05, "learning_rate": 7.322712647986756e-05, "loss": 0.1, "step": 60660 }, { "epoch": 17.06, "learning_rate": 7.320838409396183e-05, "loss": 0.1019, "step": 60690 }, { "epoch": 17.07, "learning_rate": 7.31896417080561e-05, "loss": 0.1202, "step": 60720 }, { "epoch": 17.08, "learning_rate": 7.317089932215038e-05, "loss": 0.0919, "step": 60750 }, { "epoch": 17.09, "learning_rate": 7.315215693624466e-05, "loss": 0.1064, "step": 60780 }, { "epoch": 17.1, "learning_rate": 7.313341455033893e-05, "loss": 0.0991, "step": 60810 }, { "epoch": 17.1, "learning_rate": 7.311467216443321e-05, "loss": 0.1061, "step": 60840 }, { "epoch": 17.11, "learning_rate": 7.309592977852748e-05, "loss": 0.1117, "step": 60870 }, { "epoch": 17.12, "learning_rate": 7.307718739262174e-05, "loss": 0.0942, "step": 60900 }, { "epoch": 17.13, "learning_rate": 7.305844500671602e-05, "loss": 0.111, "step": 60930 }, { "epoch": 17.14, "learning_rate": 7.30397026208103e-05, "loss": 0.1044, "step": 60960 }, { "epoch": 17.15, "learning_rate": 7.302096023490457e-05, "loss": 0.1077, "step": 60990 }, { "epoch": 17.15, "learning_rate": 7.300221784899884e-05, "loss": 0.1103, "step": 61020 }, { "epoch": 17.16, "learning_rate": 7.298347546309312e-05, "loss": 0.094, "step": 61050 }, { "epoch": 17.17, "learning_rate": 7.29647330771874e-05, "loss": 0.1097, "step": 61080 }, { "epoch": 17.18, "learning_rate": 7.294599069128167e-05, "loss": 0.0986, "step": 61110 }, { "epoch": 17.19, "learning_rate": 7.292724830537594e-05, "loss": 0.1039, "step": 61140 }, { "epoch": 17.2, "learning_rate": 7.290850591947022e-05, "loss": 0.1066, "step": 61170 }, { "epoch": 17.21, "learning_rate": 7.28897635335645e-05, "loss": 0.0945, "step": 61200 }, { "epoch": 17.21, "learning_rate": 7.287102114765877e-05, "loss": 0.1213, "step": 61230 }, { "epoch": 17.22, "learning_rate": 7.285227876175305e-05, "loss": 0.1002, "step": 61260 }, { "epoch": 17.23, "learning_rate": 7.283353637584731e-05, "loss": 0.11, "step": 61290 }, { "epoch": 17.24, "learning_rate": 7.281479398994158e-05, "loss": 0.1133, "step": 61320 }, { "epoch": 17.25, "learning_rate": 7.279605160403586e-05, "loss": 0.0981, "step": 61350 }, { "epoch": 17.26, "learning_rate": 7.277730921813014e-05, "loss": 0.1163, "step": 61380 }, { "epoch": 17.26, "learning_rate": 7.275856683222441e-05, "loss": 0.0986, "step": 61410 }, { "epoch": 17.27, "learning_rate": 7.273982444631868e-05, "loss": 0.1054, "step": 61440 }, { "epoch": 17.28, "learning_rate": 7.272108206041296e-05, "loss": 0.1176, "step": 61470 }, { "epoch": 17.29, "learning_rate": 7.270233967450724e-05, "loss": 0.0973, "step": 61500 }, { "epoch": 17.3, "learning_rate": 7.268359728860151e-05, "loss": 0.1126, "step": 61530 }, { "epoch": 17.31, "learning_rate": 7.266485490269578e-05, "loss": 0.1053, "step": 61560 }, { "epoch": 17.32, "learning_rate": 7.264611251679006e-05, "loss": 0.1058, "step": 61590 }, { "epoch": 17.32, "learning_rate": 7.262737013088434e-05, "loss": 0.1189, "step": 61620 }, { "epoch": 17.33, "learning_rate": 7.26086277449786e-05, "loss": 0.0924, "step": 61650 }, { "epoch": 17.34, "learning_rate": 7.258988535907289e-05, "loss": 0.1132, "step": 61680 }, { "epoch": 17.35, "learning_rate": 7.257114297316715e-05, "loss": 0.1037, "step": 61710 }, { "epoch": 17.36, "learning_rate": 7.255240058726142e-05, "loss": 0.1031, "step": 61740 }, { "epoch": 17.37, "learning_rate": 7.25336582013557e-05, "loss": 0.1161, "step": 61770 }, { "epoch": 17.37, "learning_rate": 7.251491581544998e-05, "loss": 0.0959, "step": 61800 }, { "epoch": 17.38, "learning_rate": 7.249617342954425e-05, "loss": 0.111, "step": 61830 }, { "epoch": 17.39, "learning_rate": 7.247743104363852e-05, "loss": 0.1024, "step": 61860 }, { "epoch": 17.4, "learning_rate": 7.24586886577328e-05, "loss": 0.1058, "step": 61890 }, { "epoch": 17.41, "learning_rate": 7.243994627182708e-05, "loss": 0.1188, "step": 61920 }, { "epoch": 17.42, "learning_rate": 7.242120388592135e-05, "loss": 0.097, "step": 61950 }, { "epoch": 17.42, "learning_rate": 7.240246150001561e-05, "loss": 0.1079, "step": 61980 }, { "epoch": 17.43, "learning_rate": 7.23837191141099e-05, "loss": 0.0996, "step": 62010 }, { "epoch": 17.44, "learning_rate": 7.236497672820418e-05, "loss": 0.1152, "step": 62040 }, { "epoch": 17.45, "learning_rate": 7.234623434229844e-05, "loss": 0.1167, "step": 62070 }, { "epoch": 17.46, "learning_rate": 7.232749195639272e-05, "loss": 0.0957, "step": 62100 }, { "epoch": 17.47, "learning_rate": 7.230874957048699e-05, "loss": 0.1087, "step": 62130 }, { "epoch": 17.48, "learning_rate": 7.229000718458126e-05, "loss": 0.1013, "step": 62160 }, { "epoch": 17.48, "learning_rate": 7.227126479867554e-05, "loss": 0.1123, "step": 62190 }, { "epoch": 17.49, "learning_rate": 7.225252241276982e-05, "loss": 0.1183, "step": 62220 }, { "epoch": 17.5, "learning_rate": 7.223378002686409e-05, "loss": 0.0954, "step": 62250 }, { "epoch": 17.51, "learning_rate": 7.221503764095836e-05, "loss": 0.1181, "step": 62280 }, { "epoch": 17.52, "learning_rate": 7.219629525505264e-05, "loss": 0.1007, "step": 62310 }, { "epoch": 17.53, "learning_rate": 7.217755286914692e-05, "loss": 0.106, "step": 62340 }, { "epoch": 17.53, "learning_rate": 7.215881048324119e-05, "loss": 0.1131, "step": 62370 }, { "epoch": 17.54, "learning_rate": 7.214006809733545e-05, "loss": 0.0923, "step": 62400 }, { "epoch": 17.55, "learning_rate": 7.21219504576266e-05, "loss": 0.1169, "step": 62430 }, { "epoch": 17.56, "learning_rate": 7.210320807172086e-05, "loss": 0.1009, "step": 62460 }, { "epoch": 17.57, "learning_rate": 7.208446568581514e-05, "loss": 0.1042, "step": 62490 }, { "epoch": 17.58, "learning_rate": 7.206572329990941e-05, "loss": 0.1077, "step": 62520 }, { "epoch": 17.58, "learning_rate": 7.204698091400369e-05, "loss": 0.0955, "step": 62550 }, { "epoch": 17.59, "learning_rate": 7.202823852809797e-05, "loss": 0.1196, "step": 62580 }, { "epoch": 17.6, "learning_rate": 7.200949614219224e-05, "loss": 0.1006, "step": 62610 }, { "epoch": 17.61, "learning_rate": 7.19907537562865e-05, "loss": 0.1077, "step": 62640 }, { "epoch": 17.62, "learning_rate": 7.197201137038079e-05, "loss": 0.1178, "step": 62670 }, { "epoch": 17.63, "learning_rate": 7.195326898447507e-05, "loss": 0.0981, "step": 62700 }, { "epoch": 17.64, "learning_rate": 7.193452659856934e-05, "loss": 0.1185, "step": 62730 }, { "epoch": 17.64, "learning_rate": 7.19157842126636e-05, "loss": 0.1058, "step": 62760 }, { "epoch": 17.65, "learning_rate": 7.189704182675788e-05, "loss": 0.1062, "step": 62790 }, { "epoch": 17.66, "learning_rate": 7.187829944085216e-05, "loss": 0.1159, "step": 62820 }, { "epoch": 17.67, "learning_rate": 7.185955705494643e-05, "loss": 0.0978, "step": 62850 }, { "epoch": 17.68, "learning_rate": 7.18408146690407e-05, "loss": 0.1161, "step": 62880 }, { "epoch": 17.69, "learning_rate": 7.182207228313498e-05, "loss": 0.104, "step": 62910 }, { "epoch": 17.69, "learning_rate": 7.180332989722925e-05, "loss": 0.1077, "step": 62940 }, { "epoch": 17.7, "learning_rate": 7.178458751132353e-05, "loss": 0.1148, "step": 62970 }, { "epoch": 17.71, "learning_rate": 7.176584512541781e-05, "loss": 0.1019, "step": 63000 }, { "epoch": 17.72, "learning_rate": 7.174710273951208e-05, "loss": 0.1124, "step": 63030 }, { "epoch": 17.73, "learning_rate": 7.172836035360634e-05, "loss": 0.102, "step": 63060 }, { "epoch": 17.74, "learning_rate": 7.170961796770063e-05, "loss": 0.1031, "step": 63090 }, { "epoch": 17.75, "learning_rate": 7.169087558179491e-05, "loss": 0.1219, "step": 63120 }, { "epoch": 17.75, "learning_rate": 7.167213319588917e-05, "loss": 0.096, "step": 63150 }, { "epoch": 17.76, "learning_rate": 7.165339080998344e-05, "loss": 0.1223, "step": 63180 }, { "epoch": 17.77, "learning_rate": 7.163464842407772e-05, "loss": 0.1004, "step": 63210 }, { "epoch": 17.78, "learning_rate": 7.1615906038172e-05, "loss": 0.1006, "step": 63240 }, { "epoch": 17.79, "learning_rate": 7.159716365226627e-05, "loss": 0.1104, "step": 63270 }, { "epoch": 17.8, "learning_rate": 7.157842126636054e-05, "loss": 0.0967, "step": 63300 }, { "epoch": 17.8, "learning_rate": 7.155967888045482e-05, "loss": 0.1117, "step": 63330 }, { "epoch": 17.81, "learning_rate": 7.154093649454909e-05, "loss": 0.1049, "step": 63360 }, { "epoch": 17.82, "learning_rate": 7.152219410864337e-05, "loss": 0.1011, "step": 63390 }, { "epoch": 17.83, "learning_rate": 7.150345172273765e-05, "loss": 0.1216, "step": 63420 }, { "epoch": 17.84, "learning_rate": 7.148470933683192e-05, "loss": 0.0968, "step": 63450 }, { "epoch": 17.85, "learning_rate": 7.146596695092618e-05, "loss": 0.1151, "step": 63480 }, { "epoch": 17.85, "learning_rate": 7.144722456502046e-05, "loss": 0.1018, "step": 63510 }, { "epoch": 17.86, "learning_rate": 7.142848217911475e-05, "loss": 0.1079, "step": 63540 }, { "epoch": 17.87, "learning_rate": 7.140973979320901e-05, "loss": 0.1129, "step": 63570 }, { "epoch": 17.88, "learning_rate": 7.139099740730328e-05, "loss": 0.0953, "step": 63600 }, { "epoch": 17.89, "learning_rate": 7.137225502139756e-05, "loss": 0.1147, "step": 63630 }, { "epoch": 17.9, "learning_rate": 7.135351263549184e-05, "loss": 0.1023, "step": 63660 }, { "epoch": 17.91, "learning_rate": 7.133477024958611e-05, "loss": 0.106, "step": 63690 }, { "epoch": 17.91, "learning_rate": 7.131602786368038e-05, "loss": 0.1124, "step": 63720 }, { "epoch": 17.92, "learning_rate": 7.129728547777466e-05, "loss": 0.1036, "step": 63750 }, { "epoch": 17.93, "learning_rate": 7.127854309186894e-05, "loss": 0.1174, "step": 63780 }, { "epoch": 17.94, "learning_rate": 7.12598007059632e-05, "loss": 0.1006, "step": 63810 }, { "epoch": 17.95, "learning_rate": 7.124105832005749e-05, "loss": 0.1088, "step": 63840 }, { "epoch": 17.96, "learning_rate": 7.122231593415175e-05, "loss": 0.1132, "step": 63870 }, { "epoch": 17.96, "learning_rate": 7.120357354824602e-05, "loss": 0.0997, "step": 63900 }, { "epoch": 17.97, "learning_rate": 7.11848311623403e-05, "loss": 0.1125, "step": 63930 }, { "epoch": 17.98, "learning_rate": 7.116608877643458e-05, "loss": 0.0998, "step": 63960 }, { "epoch": 17.99, "learning_rate": 7.114734639052885e-05, "loss": 0.1046, "step": 63990 }, { "epoch": 18.0, "learning_rate": 7.112860400462312e-05, "loss": 0.118, "step": 64020 }, { "epoch": 18.0, "eval_loss": 0.18319498002529144, "eval_runtime": 490.7803, "eval_samples_per_second": 32.668, "eval_steps_per_second": 1.023, "eval_wer": 0.15797769983486415, "step": 64026 }, { "epoch": 18.01, "learning_rate": 7.11098616187174e-05, "loss": 0.0957, "step": 64050 }, { "epoch": 18.02, "learning_rate": 7.109111923281168e-05, "loss": 0.1128, "step": 64080 }, { "epoch": 18.02, "learning_rate": 7.107237684690595e-05, "loss": 0.0958, "step": 64110 }, { "epoch": 18.03, "learning_rate": 7.105363446100022e-05, "loss": 0.1036, "step": 64140 }, { "epoch": 18.04, "learning_rate": 7.10348920750945e-05, "loss": 0.0984, "step": 64170 }, { "epoch": 18.05, "learning_rate": 7.101614968918878e-05, "loss": 0.0978, "step": 64200 }, { "epoch": 18.06, "learning_rate": 7.099740730328305e-05, "loss": 0.1047, "step": 64230 }, { "epoch": 18.07, "learning_rate": 7.097866491737733e-05, "loss": 0.0965, "step": 64260 }, { "epoch": 18.07, "learning_rate": 7.09599225314716e-05, "loss": 0.1093, "step": 64290 }, { "epoch": 18.08, "learning_rate": 7.094118014556586e-05, "loss": 0.0999, "step": 64320 }, { "epoch": 18.09, "learning_rate": 7.092243775966014e-05, "loss": 0.1039, "step": 64350 }, { "epoch": 18.1, "learning_rate": 7.090369537375442e-05, "loss": 0.113, "step": 64380 }, { "epoch": 18.11, "learning_rate": 7.088495298784869e-05, "loss": 0.0963, "step": 64410 }, { "epoch": 18.12, "learning_rate": 7.086621060194296e-05, "loss": 0.1074, "step": 64440 }, { "epoch": 18.12, "learning_rate": 7.084746821603724e-05, "loss": 0.1056, "step": 64470 }, { "epoch": 18.13, "learning_rate": 7.082872583013152e-05, "loss": 0.1032, "step": 64500 }, { "epoch": 18.14, "learning_rate": 7.080998344422579e-05, "loss": 0.113, "step": 64530 }, { "epoch": 18.15, "learning_rate": 7.079124105832005e-05, "loss": 0.092, "step": 64560 }, { "epoch": 18.16, "learning_rate": 7.077249867241434e-05, "loss": 0.1066, "step": 64590 }, { "epoch": 18.17, "learning_rate": 7.075375628650862e-05, "loss": 0.0995, "step": 64620 }, { "epoch": 18.18, "learning_rate": 7.073501390060288e-05, "loss": 0.106, "step": 64650 }, { "epoch": 18.18, "learning_rate": 7.071627151469715e-05, "loss": 0.1113, "step": 64680 }, { "epoch": 18.19, "learning_rate": 7.069752912879143e-05, "loss": 0.0944, "step": 64710 }, { "epoch": 18.2, "learning_rate": 7.06787867428857e-05, "loss": 0.1118, "step": 64740 }, { "epoch": 18.21, "learning_rate": 7.066004435697998e-05, "loss": 0.1007, "step": 64770 }, { "epoch": 18.22, "learning_rate": 7.064130197107426e-05, "loss": 0.0998, "step": 64800 }, { "epoch": 18.23, "learning_rate": 7.062255958516853e-05, "loss": 0.1093, "step": 64830 }, { "epoch": 18.23, "learning_rate": 7.06038171992628e-05, "loss": 0.095, "step": 64860 }, { "epoch": 18.24, "learning_rate": 7.058507481335708e-05, "loss": 0.1087, "step": 64890 }, { "epoch": 18.25, "learning_rate": 7.056633242745136e-05, "loss": 0.101, "step": 64920 }, { "epoch": 18.26, "learning_rate": 7.054759004154563e-05, "loss": 0.1046, "step": 64950 }, { "epoch": 18.27, "learning_rate": 7.052884765563989e-05, "loss": 0.1116, "step": 64980 }, { "epoch": 18.28, "learning_rate": 7.051010526973417e-05, "loss": 0.0912, "step": 65010 }, { "epoch": 18.29, "learning_rate": 7.049136288382845e-05, "loss": 0.1096, "step": 65040 }, { "epoch": 18.29, "learning_rate": 7.047262049792272e-05, "loss": 0.1093, "step": 65070 }, { "epoch": 18.3, "learning_rate": 7.045387811201699e-05, "loss": 0.0976, "step": 65100 }, { "epoch": 18.31, "learning_rate": 7.043513572611127e-05, "loss": 0.1079, "step": 65130 }, { "epoch": 18.32, "learning_rate": 7.041639334020554e-05, "loss": 0.0989, "step": 65160 }, { "epoch": 18.33, "learning_rate": 7.039765095429982e-05, "loss": 0.1051, "step": 65190 }, { "epoch": 18.34, "learning_rate": 7.03789085683941e-05, "loss": 0.1016, "step": 65220 }, { "epoch": 18.34, "learning_rate": 7.036016618248837e-05, "loss": 0.1046, "step": 65250 }, { "epoch": 18.35, "learning_rate": 7.034142379658263e-05, "loss": 0.11, "step": 65280 }, { "epoch": 18.36, "learning_rate": 7.032268141067692e-05, "loss": 0.0949, "step": 65310 }, { "epoch": 18.37, "learning_rate": 7.03039390247712e-05, "loss": 0.1015, "step": 65340 }, { "epoch": 18.38, "learning_rate": 7.028519663886546e-05, "loss": 0.0995, "step": 65370 }, { "epoch": 18.39, "learning_rate": 7.026645425295973e-05, "loss": 0.1011, "step": 65400 }, { "epoch": 18.39, "learning_rate": 7.024771186705401e-05, "loss": 0.1081, "step": 65430 }, { "epoch": 18.4, "learning_rate": 7.02289694811483e-05, "loss": 0.0955, "step": 65460 }, { "epoch": 18.41, "learning_rate": 7.021022709524256e-05, "loss": 0.1054, "step": 65490 }, { "epoch": 18.42, "learning_rate": 7.019148470933683e-05, "loss": 0.0987, "step": 65520 }, { "epoch": 18.43, "learning_rate": 7.017274232343111e-05, "loss": 0.1082, "step": 65550 }, { "epoch": 18.44, "learning_rate": 7.015399993752538e-05, "loss": 0.116, "step": 65580 }, { "epoch": 18.45, "learning_rate": 7.013525755161966e-05, "loss": 0.0965, "step": 65610 }, { "epoch": 18.45, "learning_rate": 7.011651516571394e-05, "loss": 0.1075, "step": 65640 }, { "epoch": 18.46, "learning_rate": 7.00977727798082e-05, "loss": 0.0992, "step": 65670 }, { "epoch": 18.47, "learning_rate": 7.007903039390247e-05, "loss": 0.1035, "step": 65700 }, { "epoch": 18.48, "learning_rate": 7.006028800799675e-05, "loss": 0.1175, "step": 65730 }, { "epoch": 18.49, "learning_rate": 7.004154562209104e-05, "loss": 0.1027, "step": 65760 }, { "epoch": 18.5, "learning_rate": 7.00228032361853e-05, "loss": 0.1049, "step": 65790 }, { "epoch": 18.5, "learning_rate": 7.000406085027957e-05, "loss": 0.096, "step": 65820 }, { "epoch": 18.51, "learning_rate": 6.998531846437385e-05, "loss": 0.0972, "step": 65850 }, { "epoch": 18.52, "learning_rate": 6.996657607846813e-05, "loss": 0.1071, "step": 65880 }, { "epoch": 18.53, "learning_rate": 6.99478336925624e-05, "loss": 0.0942, "step": 65910 }, { "epoch": 18.54, "learning_rate": 6.992909130665667e-05, "loss": 0.1089, "step": 65940 }, { "epoch": 18.55, "learning_rate": 6.991034892075095e-05, "loss": 0.0967, "step": 65970 }, { "epoch": 18.55, "learning_rate": 6.989160653484522e-05, "loss": 0.1021, "step": 66000 }, { "epoch": 18.56, "learning_rate": 6.98728641489395e-05, "loss": 0.1093, "step": 66030 }, { "epoch": 18.57, "learning_rate": 6.985412176303378e-05, "loss": 0.0913, "step": 66060 }, { "epoch": 18.58, "learning_rate": 6.983537937712804e-05, "loss": 0.1137, "step": 66090 }, { "epoch": 18.59, "learning_rate": 6.981663699122231e-05, "loss": 0.0984, "step": 66120 }, { "epoch": 18.6, "learning_rate": 6.97978946053166e-05, "loss": 0.1054, "step": 66150 }, { "epoch": 18.61, "learning_rate": 6.977915221941087e-05, "loss": 0.1143, "step": 66180 }, { "epoch": 18.61, "learning_rate": 6.976040983350514e-05, "loss": 0.09, "step": 66210 }, { "epoch": 18.62, "learning_rate": 6.974166744759941e-05, "loss": 0.1103, "step": 66240 }, { "epoch": 18.63, "learning_rate": 6.972292506169369e-05, "loss": 0.0995, "step": 66270 }, { "epoch": 18.64, "learning_rate": 6.970418267578797e-05, "loss": 0.1061, "step": 66300 }, { "epoch": 18.65, "learning_rate": 6.968544028988224e-05, "loss": 0.1125, "step": 66330 }, { "epoch": 18.66, "learning_rate": 6.96666979039765e-05, "loss": 0.0972, "step": 66360 }, { "epoch": 18.66, "learning_rate": 6.964795551807079e-05, "loss": 0.1121, "step": 66390 }, { "epoch": 18.67, "learning_rate": 6.962921313216505e-05, "loss": 0.1064, "step": 66420 }, { "epoch": 18.68, "learning_rate": 6.961047074625934e-05, "loss": 0.1025, "step": 66450 }, { "epoch": 18.69, "learning_rate": 6.959172836035362e-05, "loss": 0.1122, "step": 66480 }, { "epoch": 18.7, "learning_rate": 6.957298597444788e-05, "loss": 0.0927, "step": 66510 }, { "epoch": 18.71, "learning_rate": 6.955424358854215e-05, "loss": 0.1043, "step": 66540 }, { "epoch": 18.72, "learning_rate": 6.953550120263643e-05, "loss": 0.1014, "step": 66570 }, { "epoch": 18.72, "learning_rate": 6.951675881673071e-05, "loss": 0.1046, "step": 66600 }, { "epoch": 18.73, "learning_rate": 6.949801643082498e-05, "loss": 0.1095, "step": 66630 }, { "epoch": 18.74, "learning_rate": 6.947927404491925e-05, "loss": 0.0927, "step": 66660 }, { "epoch": 18.75, "learning_rate": 6.946053165901353e-05, "loss": 0.1151, "step": 66690 }, { "epoch": 18.76, "learning_rate": 6.944178927310781e-05, "loss": 0.0999, "step": 66720 }, { "epoch": 18.77, "learning_rate": 6.942304688720208e-05, "loss": 0.1028, "step": 66750 }, { "epoch": 18.77, "learning_rate": 6.940430450129634e-05, "loss": 0.1076, "step": 66780 }, { "epoch": 18.78, "learning_rate": 6.938556211539063e-05, "loss": 0.0961, "step": 66810 }, { "epoch": 18.79, "learning_rate": 6.93668197294849e-05, "loss": 0.1088, "step": 66840 }, { "epoch": 18.8, "learning_rate": 6.934807734357917e-05, "loss": 0.1009, "step": 66870 }, { "epoch": 18.81, "learning_rate": 6.932933495767345e-05, "loss": 0.0993, "step": 66900 }, { "epoch": 18.82, "learning_rate": 6.931059257176772e-05, "loss": 0.1104, "step": 66930 }, { "epoch": 18.82, "learning_rate": 6.929185018586199e-05, "loss": 0.093, "step": 66960 }, { "epoch": 18.83, "learning_rate": 6.927310779995627e-05, "loss": 0.1068, "step": 66990 }, { "epoch": 18.84, "learning_rate": 6.925436541405055e-05, "loss": 0.1026, "step": 67020 }, { "epoch": 18.85, "learning_rate": 6.923562302814482e-05, "loss": 0.1081, "step": 67050 }, { "epoch": 18.86, "learning_rate": 6.921688064223909e-05, "loss": 0.1129, "step": 67080 }, { "epoch": 18.87, "learning_rate": 6.919813825633337e-05, "loss": 0.0944, "step": 67110 }, { "epoch": 18.88, "learning_rate": 6.917939587042765e-05, "loss": 0.1052, "step": 67140 }, { "epoch": 18.88, "learning_rate": 6.916065348452192e-05, "loss": 0.1053, "step": 67170 }, { "epoch": 18.89, "learning_rate": 6.914191109861618e-05, "loss": 0.0995, "step": 67200 }, { "epoch": 18.9, "learning_rate": 6.912316871271046e-05, "loss": 0.1094, "step": 67230 }, { "epoch": 18.91, "learning_rate": 6.910442632680475e-05, "loss": 0.0939, "step": 67260 }, { "epoch": 18.92, "learning_rate": 6.908568394089901e-05, "loss": 0.1072, "step": 67290 }, { "epoch": 18.93, "learning_rate": 6.90669415549933e-05, "loss": 0.1008, "step": 67320 }, { "epoch": 18.93, "learning_rate": 6.904819916908756e-05, "loss": 0.0974, "step": 67350 }, { "epoch": 18.94, "learning_rate": 6.902945678318183e-05, "loss": 0.1133, "step": 67380 }, { "epoch": 18.95, "learning_rate": 6.901071439727611e-05, "loss": 0.0942, "step": 67410 }, { "epoch": 18.96, "learning_rate": 6.899197201137039e-05, "loss": 0.1098, "step": 67440 }, { "epoch": 18.97, "learning_rate": 6.897322962546466e-05, "loss": 0.1027, "step": 67470 }, { "epoch": 18.98, "learning_rate": 6.895448723955893e-05, "loss": 0.0993, "step": 67500 }, { "epoch": 18.98, "learning_rate": 6.89357448536532e-05, "loss": 0.1138, "step": 67530 }, { "epoch": 18.99, "learning_rate": 6.891700246774749e-05, "loss": 0.0974, "step": 67560 }, { "epoch": 19.0, "eval_loss": 0.1771358996629715, "eval_runtime": 488.1062, "eval_samples_per_second": 32.847, "eval_steps_per_second": 1.028, "eval_wer": 0.15545289533661785, "step": 67583 }, { "epoch": 19.0, "learning_rate": 6.889826008184175e-05, "loss": 0.1123, "step": 67590 }, { "epoch": 19.01, "learning_rate": 6.887951769593602e-05, "loss": 0.0894, "step": 67620 }, { "epoch": 19.02, "learning_rate": 6.886140005622716e-05, "loss": 0.0998, "step": 67650 }, { "epoch": 19.03, "learning_rate": 6.884265767032143e-05, "loss": 0.0999, "step": 67680 }, { "epoch": 19.04, "learning_rate": 6.882391528441571e-05, "loss": 0.093, "step": 67710 }, { "epoch": 19.04, "learning_rate": 6.880517289850998e-05, "loss": 0.111, "step": 67740 }, { "epoch": 19.05, "learning_rate": 6.878643051260426e-05, "loss": 0.0922, "step": 67770 }, { "epoch": 19.06, "learning_rate": 6.876768812669854e-05, "loss": 0.1035, "step": 67800 }, { "epoch": 19.07, "learning_rate": 6.874894574079281e-05, "loss": 0.1017, "step": 67830 }, { "epoch": 19.08, "learning_rate": 6.873020335488708e-05, "loss": 0.0932, "step": 67860 }, { "epoch": 19.09, "learning_rate": 6.871146096898136e-05, "loss": 0.1098, "step": 67890 }, { "epoch": 19.09, "learning_rate": 6.869271858307564e-05, "loss": 0.0905, "step": 67920 }, { "epoch": 19.1, "learning_rate": 6.867460094336676e-05, "loss": 0.1092, "step": 67950 }, { "epoch": 19.11, "learning_rate": 6.865585855746105e-05, "loss": 0.108, "step": 67980 }, { "epoch": 19.12, "learning_rate": 6.86371161715553e-05, "loss": 0.0963, "step": 68010 }, { "epoch": 19.13, "learning_rate": 6.861837378564958e-05, "loss": 0.105, "step": 68040 }, { "epoch": 19.14, "learning_rate": 6.859963139974386e-05, "loss": 0.0944, "step": 68070 }, { "epoch": 19.15, "learning_rate": 6.858088901383813e-05, "loss": 0.099, "step": 68100 }, { "epoch": 19.15, "learning_rate": 6.856214662793241e-05, "loss": 0.1086, "step": 68130 }, { "epoch": 19.16, "learning_rate": 6.854340424202668e-05, "loss": 0.0993, "step": 68160 }, { "epoch": 19.17, "learning_rate": 6.852466185612096e-05, "loss": 0.1077, "step": 68190 }, { "epoch": 19.18, "learning_rate": 6.850591947021523e-05, "loss": 0.0953, "step": 68220 }, { "epoch": 19.19, "learning_rate": 6.84871770843095e-05, "loss": 0.1038, "step": 68250 }, { "epoch": 19.2, "learning_rate": 6.846843469840377e-05, "loss": 0.1011, "step": 68280 }, { "epoch": 19.2, "learning_rate": 6.844969231249806e-05, "loss": 0.0969, "step": 68310 }, { "epoch": 19.21, "learning_rate": 6.843094992659232e-05, "loss": 0.1042, "step": 68340 }, { "epoch": 19.22, "learning_rate": 6.84122075406866e-05, "loss": 0.0889, "step": 68370 }, { "epoch": 19.23, "learning_rate": 6.839346515478088e-05, "loss": 0.1036, "step": 68400 }, { "epoch": 19.24, "learning_rate": 6.837472276887514e-05, "loss": 0.101, "step": 68430 }, { "epoch": 19.25, "learning_rate": 6.835598038296942e-05, "loss": 0.0987, "step": 68460 }, { "epoch": 19.25, "learning_rate": 6.83372379970637e-05, "loss": 0.106, "step": 68490 }, { "epoch": 19.26, "learning_rate": 6.831849561115797e-05, "loss": 0.0906, "step": 68520 }, { "epoch": 19.27, "learning_rate": 6.829975322525225e-05, "loss": 0.099, "step": 68550 }, { "epoch": 19.28, "learning_rate": 6.828101083934652e-05, "loss": 0.1017, "step": 68580 }, { "epoch": 19.29, "learning_rate": 6.82622684534408e-05, "loss": 0.102, "step": 68610 }, { "epoch": 19.3, "learning_rate": 6.824352606753506e-05, "loss": 0.1098, "step": 68640 }, { "epoch": 19.31, "learning_rate": 6.822478368162935e-05, "loss": 0.1002, "step": 68670 }, { "epoch": 19.31, "learning_rate": 6.820604129572361e-05, "loss": 0.1032, "step": 68700 }, { "epoch": 19.32, "learning_rate": 6.81872989098179e-05, "loss": 0.1009, "step": 68730 }, { "epoch": 19.33, "learning_rate": 6.816855652391216e-05, "loss": 0.094, "step": 68760 }, { "epoch": 19.34, "learning_rate": 6.814981413800644e-05, "loss": 0.1047, "step": 68790 }, { "epoch": 19.35, "learning_rate": 6.813107175210072e-05, "loss": 0.0919, "step": 68820 }, { "epoch": 19.36, "learning_rate": 6.811232936619498e-05, "loss": 0.1049, "step": 68850 }, { "epoch": 19.36, "learning_rate": 6.809358698028926e-05, "loss": 0.0989, "step": 68880 }, { "epoch": 19.37, "learning_rate": 6.807484459438354e-05, "loss": 0.0982, "step": 68910 }, { "epoch": 19.38, "learning_rate": 6.80561022084778e-05, "loss": 0.1088, "step": 68940 }, { "epoch": 19.39, "learning_rate": 6.803735982257209e-05, "loss": 0.0919, "step": 68970 }, { "epoch": 19.4, "learning_rate": 6.801861743666635e-05, "loss": 0.1043, "step": 69000 }, { "epoch": 19.41, "learning_rate": 6.799987505076064e-05, "loss": 0.1, "step": 69030 }, { "epoch": 19.42, "learning_rate": 6.79811326648549e-05, "loss": 0.0997, "step": 69060 }, { "epoch": 19.42, "learning_rate": 6.796239027894918e-05, "loss": 0.1081, "step": 69090 }, { "epoch": 19.43, "learning_rate": 6.794364789304345e-05, "loss": 0.0879, "step": 69120 }, { "epoch": 19.44, "learning_rate": 6.792490550713773e-05, "loss": 0.1077, "step": 69150 }, { "epoch": 19.45, "learning_rate": 6.7906163121232e-05, "loss": 0.1, "step": 69180 }, { "epoch": 19.46, "learning_rate": 6.788742073532628e-05, "loss": 0.0995, "step": 69210 }, { "epoch": 19.47, "learning_rate": 6.786867834942056e-05, "loss": 0.1106, "step": 69240 }, { "epoch": 19.47, "learning_rate": 6.784993596351482e-05, "loss": 0.0973, "step": 69270 }, { "epoch": 19.48, "learning_rate": 6.78311935776091e-05, "loss": 0.102, "step": 69300 }, { "epoch": 19.49, "learning_rate": 6.781245119170338e-05, "loss": 0.1005, "step": 69330 }, { "epoch": 19.5, "learning_rate": 6.779370880579764e-05, "loss": 0.0957, "step": 69360 }, { "epoch": 19.51, "learning_rate": 6.777496641989193e-05, "loss": 0.1084, "step": 69390 }, { "epoch": 19.52, "learning_rate": 6.77562240339862e-05, "loss": 0.0951, "step": 69420 }, { "epoch": 19.52, "learning_rate": 6.773748164808047e-05, "loss": 0.1102, "step": 69450 }, { "epoch": 19.53, "learning_rate": 6.771873926217474e-05, "loss": 0.1024, "step": 69480 }, { "epoch": 19.54, "learning_rate": 6.769999687626902e-05, "loss": 0.0908, "step": 69510 }, { "epoch": 19.55, "learning_rate": 6.768125449036329e-05, "loss": 0.1097, "step": 69540 }, { "epoch": 19.56, "learning_rate": 6.766251210445757e-05, "loss": 0.0884, "step": 69570 }, { "epoch": 19.57, "learning_rate": 6.764376971855184e-05, "loss": 0.1043, "step": 69600 }, { "epoch": 19.58, "learning_rate": 6.762502733264612e-05, "loss": 0.1006, "step": 69630 }, { "epoch": 19.58, "learning_rate": 6.76062849467404e-05, "loss": 0.0977, "step": 69660 }, { "epoch": 19.59, "learning_rate": 6.758754256083465e-05, "loss": 0.1091, "step": 69690 }, { "epoch": 19.6, "learning_rate": 6.756880017492894e-05, "loss": 0.0919, "step": 69720 }, { "epoch": 19.61, "learning_rate": 6.755005778902322e-05, "loss": 0.1035, "step": 69750 }, { "epoch": 19.62, "learning_rate": 6.753131540311748e-05, "loss": 0.0988, "step": 69780 }, { "epoch": 19.63, "learning_rate": 6.751257301721175e-05, "loss": 0.0976, "step": 69810 }, { "epoch": 19.63, "learning_rate": 6.749383063130603e-05, "loss": 0.1107, "step": 69840 }, { "epoch": 19.64, "learning_rate": 6.747508824540031e-05, "loss": 0.0914, "step": 69870 }, { "epoch": 19.65, "learning_rate": 6.745634585949458e-05, "loss": 0.103, "step": 69900 }, { "epoch": 19.66, "learning_rate": 6.743760347358886e-05, "loss": 0.1086, "step": 69930 }, { "epoch": 19.67, "learning_rate": 6.741886108768313e-05, "loss": 0.0938, "step": 69960 }, { "epoch": 19.68, "learning_rate": 6.740011870177741e-05, "loss": 0.1071, "step": 69990 }, { "epoch": 19.69, "learning_rate": 6.738137631587168e-05, "loss": 0.093, "step": 70020 }, { "epoch": 19.69, "learning_rate": 6.736263392996596e-05, "loss": 0.1046, "step": 70050 }, { "epoch": 19.7, "learning_rate": 6.734389154406024e-05, "loss": 0.1021, "step": 70080 }, { "epoch": 19.71, "learning_rate": 6.732514915815449e-05, "loss": 0.0982, "step": 70110 }, { "epoch": 19.72, "learning_rate": 6.730640677224877e-05, "loss": 0.1069, "step": 70140 }, { "epoch": 19.73, "learning_rate": 6.728766438634305e-05, "loss": 0.0912, "step": 70170 }, { "epoch": 19.74, "learning_rate": 6.726892200043732e-05, "loss": 0.1036, "step": 70200 }, { "epoch": 19.74, "learning_rate": 6.725017961453159e-05, "loss": 0.1075, "step": 70230 }, { "epoch": 19.75, "learning_rate": 6.723143722862587e-05, "loss": 0.0996, "step": 70260 }, { "epoch": 19.76, "learning_rate": 6.721269484272015e-05, "loss": 0.1122, "step": 70290 }, { "epoch": 19.77, "learning_rate": 6.719395245681442e-05, "loss": 0.0951, "step": 70320 }, { "epoch": 19.78, "learning_rate": 6.71752100709087e-05, "loss": 0.1156, "step": 70350 }, { "epoch": 19.79, "learning_rate": 6.715646768500297e-05, "loss": 0.1007, "step": 70380 }, { "epoch": 19.79, "learning_rate": 6.713772529909725e-05, "loss": 0.0958, "step": 70410 }, { "epoch": 19.8, "learning_rate": 6.711898291319152e-05, "loss": 0.1101, "step": 70440 }, { "epoch": 19.81, "learning_rate": 6.71002405272858e-05, "loss": 0.0887, "step": 70470 }, { "epoch": 19.82, "learning_rate": 6.708149814138008e-05, "loss": 0.1066, "step": 70500 }, { "epoch": 19.83, "learning_rate": 6.706275575547433e-05, "loss": 0.0971, "step": 70530 }, { "epoch": 19.84, "learning_rate": 6.704401336956861e-05, "loss": 0.0976, "step": 70560 }, { "epoch": 19.85, "learning_rate": 6.70252709836629e-05, "loss": 0.1099, "step": 70590 }, { "epoch": 19.85, "learning_rate": 6.700652859775717e-05, "loss": 0.091, "step": 70620 }, { "epoch": 19.86, "learning_rate": 6.698778621185143e-05, "loss": 0.1028, "step": 70650 }, { "epoch": 19.87, "learning_rate": 6.696904382594571e-05, "loss": 0.0995, "step": 70680 }, { "epoch": 19.88, "learning_rate": 6.695030144003999e-05, "loss": 0.0949, "step": 70710 }, { "epoch": 19.89, "learning_rate": 6.693155905413426e-05, "loss": 0.1015, "step": 70740 }, { "epoch": 19.9, "learning_rate": 6.691281666822854e-05, "loss": 0.0958, "step": 70770 }, { "epoch": 19.9, "learning_rate": 6.68940742823228e-05, "loss": 0.107, "step": 70800 }, { "epoch": 19.91, "learning_rate": 6.687533189641709e-05, "loss": 0.1014, "step": 70830 }, { "epoch": 19.92, "learning_rate": 6.685658951051135e-05, "loss": 0.0955, "step": 70860 }, { "epoch": 19.93, "learning_rate": 6.683784712460564e-05, "loss": 0.1046, "step": 70890 }, { "epoch": 19.94, "learning_rate": 6.681910473869992e-05, "loss": 0.0939, "step": 70920 }, { "epoch": 19.95, "learning_rate": 6.680036235279417e-05, "loss": 0.1079, "step": 70950 }, { "epoch": 19.95, "learning_rate": 6.678161996688845e-05, "loss": 0.1017, "step": 70980 }, { "epoch": 19.96, "learning_rate": 6.676287758098273e-05, "loss": 0.0968, "step": 71010 }, { "epoch": 19.97, "learning_rate": 6.674413519507701e-05, "loss": 0.1056, "step": 71040 }, { "epoch": 19.98, "learning_rate": 6.672539280917127e-05, "loss": 0.094, "step": 71070 }, { "epoch": 19.99, "learning_rate": 6.670665042326555e-05, "loss": 0.1013, "step": 71100 }, { "epoch": 20.0, "learning_rate": 6.668790803735983e-05, "loss": 0.1007, "step": 71130 }, { "epoch": 20.0, "eval_loss": 0.18122704327106476, "eval_runtime": 490.4096, "eval_samples_per_second": 32.693, "eval_steps_per_second": 1.024, "eval_wer": 0.1531873950841374, "step": 71140 }, { "epoch": 20.01, "learning_rate": 6.66691656514541e-05, "loss": 0.0832, "step": 71160 }, { "epoch": 20.01, "learning_rate": 6.665042326554838e-05, "loss": 0.1068, "step": 71190 }, { "epoch": 20.02, "learning_rate": 6.663168087964264e-05, "loss": 0.0816, "step": 71220 }, { "epoch": 20.03, "learning_rate": 6.661293849373693e-05, "loss": 0.1002, "step": 71250 }, { "epoch": 20.04, "learning_rate": 6.659419610783119e-05, "loss": 0.087, "step": 71280 }, { "epoch": 20.05, "learning_rate": 6.657545372192547e-05, "loss": 0.0935, "step": 71310 }, { "epoch": 20.06, "learning_rate": 6.655671133601976e-05, "loss": 0.1067, "step": 71340 }, { "epoch": 20.06, "learning_rate": 6.653796895011402e-05, "loss": 0.0843, "step": 71370 }, { "epoch": 20.07, "learning_rate": 6.651922656420829e-05, "loss": 0.0997, "step": 71400 }, { "epoch": 20.08, "learning_rate": 6.650048417830257e-05, "loss": 0.0902, "step": 71430 }, { "epoch": 20.09, "learning_rate": 6.648174179239685e-05, "loss": 0.0941, "step": 71460 }, { "epoch": 20.1, "learning_rate": 6.64629994064911e-05, "loss": 0.1033, "step": 71490 }, { "epoch": 20.11, "learning_rate": 6.644425702058539e-05, "loss": 0.0856, "step": 71520 }, { "epoch": 20.12, "learning_rate": 6.642551463467967e-05, "loss": 0.1067, "step": 71550 }, { "epoch": 20.12, "learning_rate": 6.640677224877394e-05, "loss": 0.0924, "step": 71580 }, { "epoch": 20.13, "learning_rate": 6.638802986286822e-05, "loss": 0.0941, "step": 71610 }, { "epoch": 20.14, "learning_rate": 6.636928747696248e-05, "loss": 0.1004, "step": 71640 }, { "epoch": 20.15, "learning_rate": 6.635054509105676e-05, "loss": 0.0873, "step": 71670 }, { "epoch": 20.16, "learning_rate": 6.633180270515103e-05, "loss": 0.1021, "step": 71700 }, { "epoch": 20.17, "learning_rate": 6.631306031924531e-05, "loss": 0.0882, "step": 71730 }, { "epoch": 20.17, "learning_rate": 6.62943179333396e-05, "loss": 0.0968, "step": 71760 }, { "epoch": 20.18, "learning_rate": 6.627557554743386e-05, "loss": 0.1072, "step": 71790 }, { "epoch": 20.19, "learning_rate": 6.625683316152813e-05, "loss": 0.0872, "step": 71820 }, { "epoch": 20.2, "learning_rate": 6.623809077562241e-05, "loss": 0.1014, "step": 71850 }, { "epoch": 20.21, "learning_rate": 6.621934838971669e-05, "loss": 0.0874, "step": 71880 }, { "epoch": 20.22, "learning_rate": 6.620060600381094e-05, "loss": 0.0957, "step": 71910 }, { "epoch": 20.22, "learning_rate": 6.618186361790523e-05, "loss": 0.1076, "step": 71940 }, { "epoch": 20.23, "learning_rate": 6.61631212319995e-05, "loss": 0.0835, "step": 71970 }, { "epoch": 20.24, "learning_rate": 6.614437884609377e-05, "loss": 0.0982, "step": 72000 }, { "epoch": 20.25, "learning_rate": 6.612563646018805e-05, "loss": 0.0887, "step": 72030 }, { "epoch": 20.26, "learning_rate": 6.610689407428232e-05, "loss": 0.095, "step": 72060 }, { "epoch": 20.27, "learning_rate": 6.60881516883766e-05, "loss": 0.1108, "step": 72090 }, { "epoch": 20.28, "learning_rate": 6.606940930247087e-05, "loss": 0.0951, "step": 72120 }, { "epoch": 20.28, "learning_rate": 6.605066691656515e-05, "loss": 0.1091, "step": 72150 }, { "epoch": 20.29, "learning_rate": 6.603192453065943e-05, "loss": 0.0897, "step": 72180 }, { "epoch": 20.3, "learning_rate": 6.60131821447537e-05, "loss": 0.0941, "step": 72210 }, { "epoch": 20.31, "learning_rate": 6.599443975884797e-05, "loss": 0.1009, "step": 72240 }, { "epoch": 20.32, "learning_rate": 6.597569737294225e-05, "loss": 0.0877, "step": 72270 }, { "epoch": 20.33, "learning_rate": 6.595695498703653e-05, "loss": 0.1032, "step": 72300 }, { "epoch": 20.33, "learning_rate": 6.593821260113078e-05, "loss": 0.0901, "step": 72330 }, { "epoch": 20.34, "learning_rate": 6.591947021522506e-05, "loss": 0.0985, "step": 72360 }, { "epoch": 20.35, "learning_rate": 6.590072782931934e-05, "loss": 0.1042, "step": 72390 }, { "epoch": 20.36, "learning_rate": 6.588198544341361e-05, "loss": 0.0863, "step": 72420 }, { "epoch": 20.37, "learning_rate": 6.586386780370475e-05, "loss": 0.0994, "step": 72450 }, { "epoch": 20.38, "learning_rate": 6.584512541779902e-05, "loss": 0.09, "step": 72480 }, { "epoch": 20.39, "learning_rate": 6.58263830318933e-05, "loss": 0.0919, "step": 72510 }, { "epoch": 20.39, "learning_rate": 6.580764064598757e-05, "loss": 0.1083, "step": 72540 }, { "epoch": 20.4, "learning_rate": 6.578889826008185e-05, "loss": 0.0856, "step": 72570 }, { "epoch": 20.41, "learning_rate": 6.577015587417612e-05, "loss": 0.1011, "step": 72600 }, { "epoch": 20.42, "learning_rate": 6.57514134882704e-05, "loss": 0.0931, "step": 72630 }, { "epoch": 20.43, "learning_rate": 6.573267110236467e-05, "loss": 0.1012, "step": 72660 }, { "epoch": 20.44, "learning_rate": 6.571392871645893e-05, "loss": 0.1066, "step": 72690 }, { "epoch": 20.44, "learning_rate": 6.569518633055321e-05, "loss": 0.0876, "step": 72720 }, { "epoch": 20.45, "learning_rate": 6.56764439446475e-05, "loss": 0.1006, "step": 72750 }, { "epoch": 20.46, "learning_rate": 6.565770155874176e-05, "loss": 0.0882, "step": 72780 }, { "epoch": 20.47, "learning_rate": 6.563895917283603e-05, "loss": 0.0945, "step": 72810 }, { "epoch": 20.48, "learning_rate": 6.562021678693031e-05, "loss": 0.1038, "step": 72840 }, { "epoch": 20.49, "learning_rate": 6.560147440102459e-05, "loss": 0.0908, "step": 72870 }, { "epoch": 20.49, "learning_rate": 6.558273201511886e-05, "loss": 0.0993, "step": 72900 }, { "epoch": 20.5, "learning_rate": 6.556398962921314e-05, "loss": 0.087, "step": 72930 }, { "epoch": 20.51, "learning_rate": 6.554524724330741e-05, "loss": 0.1007, "step": 72960 }, { "epoch": 20.52, "learning_rate": 6.552650485740169e-05, "loss": 0.1041, "step": 72990 }, { "epoch": 20.53, "learning_rate": 6.550776247149596e-05, "loss": 0.0845, "step": 73020 }, { "epoch": 20.54, "learning_rate": 6.548902008559024e-05, "loss": 0.0989, "step": 73050 }, { "epoch": 20.55, "learning_rate": 6.54702776996845e-05, "loss": 0.085, "step": 73080 }, { "epoch": 20.55, "learning_rate": 6.545153531377877e-05, "loss": 0.098, "step": 73110 }, { "epoch": 20.56, "learning_rate": 6.543279292787305e-05, "loss": 0.1048, "step": 73140 }, { "epoch": 20.57, "learning_rate": 6.541405054196733e-05, "loss": 0.0855, "step": 73170 }, { "epoch": 20.58, "learning_rate": 6.53953081560616e-05, "loss": 0.0995, "step": 73200 }, { "epoch": 20.59, "learning_rate": 6.537656577015587e-05, "loss": 0.0978, "step": 73230 }, { "epoch": 20.6, "learning_rate": 6.535782338425015e-05, "loss": 0.1018, "step": 73260 }, { "epoch": 20.6, "learning_rate": 6.533908099834443e-05, "loss": 0.1015, "step": 73290 }, { "epoch": 20.61, "learning_rate": 6.53203386124387e-05, "loss": 0.0896, "step": 73320 }, { "epoch": 20.62, "learning_rate": 6.530159622653298e-05, "loss": 0.1, "step": 73350 }, { "epoch": 20.63, "learning_rate": 6.528285384062725e-05, "loss": 0.0872, "step": 73380 }, { "epoch": 20.64, "learning_rate": 6.526411145472153e-05, "loss": 0.1023, "step": 73410 }, { "epoch": 20.65, "learning_rate": 6.52453690688158e-05, "loss": 0.106, "step": 73440 }, { "epoch": 20.65, "learning_rate": 6.522662668291008e-05, "loss": 0.0848, "step": 73470 }, { "epoch": 20.66, "learning_rate": 6.520788429700434e-05, "loss": 0.0971, "step": 73500 }, { "epoch": 20.67, "learning_rate": 6.518914191109861e-05, "loss": 0.0956, "step": 73530 }, { "epoch": 20.68, "learning_rate": 6.517039952519289e-05, "loss": 0.0994, "step": 73560 }, { "epoch": 20.69, "learning_rate": 6.515165713928717e-05, "loss": 0.1042, "step": 73590 }, { "epoch": 20.7, "learning_rate": 6.513291475338144e-05, "loss": 0.0823, "step": 73620 }, { "epoch": 20.71, "learning_rate": 6.511417236747571e-05, "loss": 0.0984, "step": 73650 }, { "epoch": 20.71, "learning_rate": 6.509542998156999e-05, "loss": 0.0931, "step": 73680 }, { "epoch": 20.72, "learning_rate": 6.507668759566427e-05, "loss": 0.1084, "step": 73710 }, { "epoch": 20.73, "learning_rate": 6.505794520975854e-05, "loss": 0.1032, "step": 73740 }, { "epoch": 20.74, "learning_rate": 6.503920282385282e-05, "loss": 0.0868, "step": 73770 }, { "epoch": 20.75, "learning_rate": 6.502046043794709e-05, "loss": 0.1069, "step": 73800 }, { "epoch": 20.76, "learning_rate": 6.500171805204137e-05, "loss": 0.0901, "step": 73830 }, { "epoch": 20.76, "learning_rate": 6.498297566613563e-05, "loss": 0.1024, "step": 73860 }, { "epoch": 20.77, "learning_rate": 6.496423328022991e-05, "loss": 0.1037, "step": 73890 }, { "epoch": 20.78, "learning_rate": 6.494549089432418e-05, "loss": 0.0885, "step": 73920 }, { "epoch": 20.79, "learning_rate": 6.492674850841845e-05, "loss": 0.1046, "step": 73950 }, { "epoch": 20.8, "learning_rate": 6.490800612251273e-05, "loss": 0.0902, "step": 73980 }, { "epoch": 20.81, "learning_rate": 6.488926373660701e-05, "loss": 0.0999, "step": 74010 }, { "epoch": 20.82, "learning_rate": 6.487052135070128e-05, "loss": 0.1074, "step": 74040 }, { "epoch": 20.82, "learning_rate": 6.485177896479555e-05, "loss": 0.0874, "step": 74070 }, { "epoch": 20.83, "learning_rate": 6.483303657888983e-05, "loss": 0.1052, "step": 74100 }, { "epoch": 20.84, "learning_rate": 6.481429419298411e-05, "loss": 0.093, "step": 74130 }, { "epoch": 20.85, "learning_rate": 6.479555180707838e-05, "loss": 0.0919, "step": 74160 }, { "epoch": 20.86, "learning_rate": 6.477680942117264e-05, "loss": 0.1047, "step": 74190 }, { "epoch": 20.87, "learning_rate": 6.475806703526692e-05, "loss": 0.0858, "step": 74220 }, { "epoch": 20.87, "learning_rate": 6.47393246493612e-05, "loss": 0.1063, "step": 74250 }, { "epoch": 20.88, "learning_rate": 6.472058226345547e-05, "loss": 0.0914, "step": 74280 }, { "epoch": 20.89, "learning_rate": 6.470183987754975e-05, "loss": 0.0996, "step": 74310 }, { "epoch": 20.9, "learning_rate": 6.468309749164402e-05, "loss": 0.1036, "step": 74340 }, { "epoch": 20.91, "learning_rate": 6.466435510573829e-05, "loss": 0.0895, "step": 74370 }, { "epoch": 20.92, "learning_rate": 6.464561271983257e-05, "loss": 0.1012, "step": 74400 }, { "epoch": 20.92, "learning_rate": 6.462687033392685e-05, "loss": 0.0939, "step": 74430 }, { "epoch": 20.93, "learning_rate": 6.460812794802113e-05, "loss": 0.0999, "step": 74460 }, { "epoch": 20.94, "learning_rate": 6.458938556211538e-05, "loss": 0.1043, "step": 74490 }, { "epoch": 20.95, "learning_rate": 6.457064317620967e-05, "loss": 0.0844, "step": 74520 }, { "epoch": 20.96, "learning_rate": 6.455190079030395e-05, "loss": 0.098, "step": 74550 }, { "epoch": 20.97, "learning_rate": 6.453315840439821e-05, "loss": 0.0859, "step": 74580 }, { "epoch": 20.98, "learning_rate": 6.451441601849248e-05, "loss": 0.0982, "step": 74610 }, { "epoch": 20.98, "learning_rate": 6.449567363258676e-05, "loss": 0.1069, "step": 74640 }, { "epoch": 20.99, "learning_rate": 6.447693124668104e-05, "loss": 0.0866, "step": 74670 }, { "epoch": 21.0, "eval_loss": 0.17515245079994202, "eval_runtime": 503.7384, "eval_samples_per_second": 31.828, "eval_steps_per_second": 0.997, "eval_wer": 0.1504169339320077, "step": 74697 }, { "epoch": 21.0, "learning_rate": 6.445818886077531e-05, "loss": 0.11, "step": 74700 }, { "epoch": 21.01, "learning_rate": 6.443944647486959e-05, "loss": 0.0902, "step": 74730 }, { "epoch": 21.02, "learning_rate": 6.442132883516072e-05, "loss": 0.1021, "step": 74760 }, { "epoch": 21.03, "learning_rate": 6.4402586449255e-05, "loss": 0.0912, "step": 74790 }, { "epoch": 21.03, "learning_rate": 6.438384406334927e-05, "loss": 0.0911, "step": 74820 }, { "epoch": 21.04, "learning_rate": 6.436510167744354e-05, "loss": 0.0956, "step": 74850 }, { "epoch": 21.05, "learning_rate": 6.434635929153782e-05, "loss": 0.0848, "step": 74880 }, { "epoch": 21.06, "learning_rate": 6.43276169056321e-05, "loss": 0.0995, "step": 74910 }, { "epoch": 21.07, "learning_rate": 6.430887451972636e-05, "loss": 0.0897, "step": 74940 }, { "epoch": 21.08, "learning_rate": 6.429013213382063e-05, "loss": 0.0911, "step": 74970 }, { "epoch": 21.09, "learning_rate": 6.427138974791491e-05, "loss": 0.0971, "step": 75000 }, { "epoch": 21.09, "learning_rate": 6.42526473620092e-05, "loss": 0.084, "step": 75030 }, { "epoch": 21.1, "learning_rate": 6.423390497610346e-05, "loss": 0.098, "step": 75060 }, { "epoch": 21.11, "learning_rate": 6.421516259019773e-05, "loss": 0.0882, "step": 75090 }, { "epoch": 21.12, "learning_rate": 6.419642020429201e-05, "loss": 0.0931, "step": 75120 }, { "epoch": 21.13, "learning_rate": 6.417767781838628e-05, "loss": 0.0954, "step": 75150 }, { "epoch": 21.14, "learning_rate": 6.415893543248056e-05, "loss": 0.0813, "step": 75180 }, { "epoch": 21.14, "learning_rate": 6.414019304657484e-05, "loss": 0.0998, "step": 75210 }, { "epoch": 21.15, "learning_rate": 6.41214506606691e-05, "loss": 0.0874, "step": 75240 }, { "epoch": 21.16, "learning_rate": 6.410270827476337e-05, "loss": 0.0928, "step": 75270 }, { "epoch": 21.17, "learning_rate": 6.408396588885765e-05, "loss": 0.097, "step": 75300 }, { "epoch": 21.18, "learning_rate": 6.406522350295194e-05, "loss": 0.0841, "step": 75330 }, { "epoch": 21.19, "learning_rate": 6.40464811170462e-05, "loss": 0.0913, "step": 75360 }, { "epoch": 21.19, "learning_rate": 6.402773873114047e-05, "loss": 0.0924, "step": 75390 }, { "epoch": 21.2, "learning_rate": 6.400899634523475e-05, "loss": 0.0949, "step": 75420 }, { "epoch": 21.21, "learning_rate": 6.399025395932903e-05, "loss": 0.1002, "step": 75450 }, { "epoch": 21.22, "learning_rate": 6.39715115734233e-05, "loss": 0.0857, "step": 75480 }, { "epoch": 21.23, "learning_rate": 6.395276918751757e-05, "loss": 0.0921, "step": 75510 }, { "epoch": 21.24, "learning_rate": 6.393402680161185e-05, "loss": 0.1005, "step": 75540 }, { "epoch": 21.25, "learning_rate": 6.391528441570613e-05, "loss": 0.097, "step": 75570 }, { "epoch": 21.25, "learning_rate": 6.38965420298004e-05, "loss": 0.098, "step": 75600 }, { "epoch": 21.26, "learning_rate": 6.387779964389468e-05, "loss": 0.0828, "step": 75630 }, { "epoch": 21.27, "learning_rate": 6.385905725798894e-05, "loss": 0.0935, "step": 75660 }, { "epoch": 21.28, "learning_rate": 6.384031487208321e-05, "loss": 0.0942, "step": 75690 }, { "epoch": 21.29, "learning_rate": 6.38215724861775e-05, "loss": 0.0906, "step": 75720 }, { "epoch": 21.3, "learning_rate": 6.380283010027177e-05, "loss": 0.1015, "step": 75750 }, { "epoch": 21.3, "learning_rate": 6.378408771436604e-05, "loss": 0.0827, "step": 75780 }, { "epoch": 21.31, "learning_rate": 6.376534532846031e-05, "loss": 0.0985, "step": 75810 }, { "epoch": 21.32, "learning_rate": 6.374660294255459e-05, "loss": 0.0928, "step": 75840 }, { "epoch": 21.33, "learning_rate": 6.372786055664887e-05, "loss": 0.0897, "step": 75870 }, { "epoch": 21.34, "learning_rate": 6.370911817074314e-05, "loss": 0.0953, "step": 75900 }, { "epoch": 21.35, "learning_rate": 6.36903757848374e-05, "loss": 0.0837, "step": 75930 }, { "epoch": 21.36, "learning_rate": 6.367163339893169e-05, "loss": 0.0935, "step": 75960 }, { "epoch": 21.36, "learning_rate": 6.365289101302597e-05, "loss": 0.0962, "step": 75990 }, { "epoch": 21.37, "learning_rate": 6.363414862712024e-05, "loss": 0.0919, "step": 76020 }, { "epoch": 21.38, "learning_rate": 6.361540624121452e-05, "loss": 0.0988, "step": 76050 }, { "epoch": 21.39, "learning_rate": 6.359666385530878e-05, "loss": 0.0867, "step": 76080 }, { "epoch": 21.4, "learning_rate": 6.357792146940305e-05, "loss": 0.0975, "step": 76110 }, { "epoch": 21.41, "learning_rate": 6.355917908349733e-05, "loss": 0.0979, "step": 76140 }, { "epoch": 21.41, "learning_rate": 6.354043669759161e-05, "loss": 0.0924, "step": 76170 }, { "epoch": 21.42, "learning_rate": 6.352169431168588e-05, "loss": 0.1027, "step": 76200 }, { "epoch": 21.43, "learning_rate": 6.350295192578015e-05, "loss": 0.0862, "step": 76230 }, { "epoch": 21.44, "learning_rate": 6.348420953987443e-05, "loss": 0.1067, "step": 76260 }, { "epoch": 21.45, "learning_rate": 6.346546715396871e-05, "loss": 0.0912, "step": 76290 }, { "epoch": 21.46, "learning_rate": 6.344672476806298e-05, "loss": 0.0943, "step": 76320 }, { "epoch": 21.46, "learning_rate": 6.342860712835412e-05, "loss": 0.1022, "step": 76350 }, { "epoch": 21.47, "learning_rate": 6.340986474244839e-05, "loss": 0.0851, "step": 76380 }, { "epoch": 21.48, "learning_rate": 6.339112235654265e-05, "loss": 0.0982, "step": 76410 }, { "epoch": 21.49, "learning_rate": 6.337237997063693e-05, "loss": 0.09, "step": 76440 }, { "epoch": 21.5, "learning_rate": 6.33536375847312e-05, "loss": 0.0955, "step": 76470 }, { "epoch": 21.51, "learning_rate": 6.333489519882548e-05, "loss": 0.0966, "step": 76500 }, { "epoch": 21.52, "learning_rate": 6.331615281291975e-05, "loss": 0.083, "step": 76530 }, { "epoch": 21.52, "learning_rate": 6.329741042701403e-05, "loss": 0.093, "step": 76560 }, { "epoch": 21.53, "learning_rate": 6.32786680411083e-05, "loss": 0.0922, "step": 76590 }, { "epoch": 21.54, "learning_rate": 6.325992565520258e-05, "loss": 0.0881, "step": 76620 }, { "epoch": 21.55, "learning_rate": 6.324118326929686e-05, "loss": 0.1021, "step": 76650 }, { "epoch": 21.56, "learning_rate": 6.322244088339113e-05, "loss": 0.0838, "step": 76680 }, { "epoch": 21.57, "learning_rate": 6.32036984974854e-05, "loss": 0.1031, "step": 76710 }, { "epoch": 21.57, "learning_rate": 6.318495611157968e-05, "loss": 0.0905, "step": 76740 }, { "epoch": 21.58, "learning_rate": 6.316621372567396e-05, "loss": 0.0944, "step": 76770 }, { "epoch": 21.59, "learning_rate": 6.314747133976822e-05, "loss": 0.0957, "step": 76800 }, { "epoch": 21.6, "learning_rate": 6.312872895386249e-05, "loss": 0.0841, "step": 76830 }, { "epoch": 21.61, "learning_rate": 6.310998656795677e-05, "loss": 0.0977, "step": 76860 }, { "epoch": 21.62, "learning_rate": 6.309124418205104e-05, "loss": 0.0896, "step": 76890 }, { "epoch": 21.62, "learning_rate": 6.307250179614532e-05, "loss": 0.0899, "step": 76920 }, { "epoch": 21.63, "learning_rate": 6.305375941023959e-05, "loss": 0.1022, "step": 76950 }, { "epoch": 21.64, "learning_rate": 6.303501702433387e-05, "loss": 0.0867, "step": 76980 }, { "epoch": 21.65, "learning_rate": 6.301627463842814e-05, "loss": 0.0982, "step": 77010 }, { "epoch": 21.66, "learning_rate": 6.299753225252242e-05, "loss": 0.0916, "step": 77040 }, { "epoch": 21.67, "learning_rate": 6.29787898666167e-05, "loss": 0.094, "step": 77070 }, { "epoch": 21.68, "learning_rate": 6.296004748071097e-05, "loss": 0.1011, "step": 77100 }, { "epoch": 21.68, "learning_rate": 6.294130509480523e-05, "loss": 0.0869, "step": 77130 }, { "epoch": 21.69, "learning_rate": 6.292256270889951e-05, "loss": 0.0969, "step": 77160 }, { "epoch": 21.7, "learning_rate": 6.29038203229938e-05, "loss": 0.0958, "step": 77190 }, { "epoch": 21.71, "learning_rate": 6.288507793708806e-05, "loss": 0.091, "step": 77220 }, { "epoch": 21.72, "learning_rate": 6.286633555118233e-05, "loss": 0.0994, "step": 77250 }, { "epoch": 21.73, "learning_rate": 6.284759316527661e-05, "loss": 0.0838, "step": 77280 }, { "epoch": 21.73, "learning_rate": 6.282885077937088e-05, "loss": 0.1009, "step": 77310 }, { "epoch": 21.74, "learning_rate": 6.281010839346516e-05, "loss": 0.0908, "step": 77340 }, { "epoch": 21.75, "learning_rate": 6.279136600755943e-05, "loss": 0.0974, "step": 77370 }, { "epoch": 21.76, "learning_rate": 6.277262362165371e-05, "loss": 0.1025, "step": 77400 }, { "epoch": 21.77, "learning_rate": 6.275388123574798e-05, "loss": 0.0836, "step": 77430 }, { "epoch": 21.78, "learning_rate": 6.273513884984226e-05, "loss": 0.0997, "step": 77460 }, { "epoch": 21.79, "learning_rate": 6.271639646393654e-05, "loss": 0.0941, "step": 77490 }, { "epoch": 21.79, "learning_rate": 6.26976540780308e-05, "loss": 0.0985, "step": 77520 }, { "epoch": 21.8, "learning_rate": 6.267891169212507e-05, "loss": 0.1066, "step": 77550 }, { "epoch": 21.81, "learning_rate": 6.266016930621935e-05, "loss": 0.0851, "step": 77580 }, { "epoch": 21.82, "learning_rate": 6.264142692031363e-05, "loss": 0.1011, "step": 77610 }, { "epoch": 21.83, "learning_rate": 6.26226845344079e-05, "loss": 0.0937, "step": 77640 }, { "epoch": 21.84, "learning_rate": 6.260394214850217e-05, "loss": 0.0957, "step": 77670 }, { "epoch": 21.84, "learning_rate": 6.258519976259645e-05, "loss": 0.1, "step": 77700 }, { "epoch": 21.85, "learning_rate": 6.256645737669072e-05, "loss": 0.0842, "step": 77730 }, { "epoch": 21.86, "learning_rate": 6.2547714990785e-05, "loss": 0.1, "step": 77760 }, { "epoch": 21.87, "learning_rate": 6.252897260487927e-05, "loss": 0.0912, "step": 77790 }, { "epoch": 21.88, "learning_rate": 6.251023021897355e-05, "loss": 0.0992, "step": 77820 }, { "epoch": 21.89, "learning_rate": 6.249148783306781e-05, "loss": 0.1045, "step": 77850 }, { "epoch": 21.89, "learning_rate": 6.24727454471621e-05, "loss": 0.0867, "step": 77880 }, { "epoch": 21.9, "learning_rate": 6.245400306125638e-05, "loss": 0.1005, "step": 77910 }, { "epoch": 21.91, "learning_rate": 6.243526067535064e-05, "loss": 0.0901, "step": 77940 }, { "epoch": 21.92, "learning_rate": 6.241651828944491e-05, "loss": 0.0971, "step": 77970 }, { "epoch": 21.93, "learning_rate": 6.239777590353919e-05, "loss": 0.1068, "step": 78000 }, { "epoch": 21.94, "learning_rate": 6.237903351763347e-05, "loss": 0.0858, "step": 78030 }, { "epoch": 21.95, "learning_rate": 6.236029113172774e-05, "loss": 0.1032, "step": 78060 }, { "epoch": 21.95, "learning_rate": 6.234154874582201e-05, "loss": 0.0857, "step": 78090 }, { "epoch": 21.96, "learning_rate": 6.232280635991629e-05, "loss": 0.0954, "step": 78120 }, { "epoch": 21.97, "learning_rate": 6.230406397401056e-05, "loss": 0.0997, "step": 78150 }, { "epoch": 21.98, "learning_rate": 6.228532158810484e-05, "loss": 0.0838, "step": 78180 }, { "epoch": 21.99, "learning_rate": 6.22665792021991e-05, "loss": 0.0995, "step": 78210 }, { "epoch": 22.0, "learning_rate": 6.224783681629339e-05, "loss": 0.0901, "step": 78240 }, { "epoch": 22.0, "eval_loss": 0.1689508855342865, "eval_runtime": 503.8188, "eval_samples_per_second": 31.823, "eval_steps_per_second": 0.996, "eval_wer": 0.1476532965758192, "step": 78254 }, { "epoch": 22.0, "learning_rate": 6.222909443038765e-05, "loss": 0.0977, "step": 78270 }, { "epoch": 22.01, "learning_rate": 6.221035204448193e-05, "loss": 0.0944, "step": 78300 }, { "epoch": 22.02, "learning_rate": 6.219160965857621e-05, "loss": 0.0864, "step": 78330 }, { "epoch": 22.03, "learning_rate": 6.217286727267048e-05, "loss": 0.094, "step": 78360 }, { "epoch": 22.04, "learning_rate": 6.215412488676475e-05, "loss": 0.0862, "step": 78390 }, { "epoch": 22.05, "learning_rate": 6.213538250085903e-05, "loss": 0.0935, "step": 78420 }, { "epoch": 22.06, "learning_rate": 6.211664011495331e-05, "loss": 0.0925, "step": 78450 }, { "epoch": 22.06, "learning_rate": 6.209789772904758e-05, "loss": 0.0886, "step": 78480 }, { "epoch": 22.07, "learning_rate": 6.207915534314185e-05, "loss": 0.1043, "step": 78510 }, { "epoch": 22.08, "learning_rate": 6.206041295723613e-05, "loss": 0.0778, "step": 78540 }, { "epoch": 22.09, "learning_rate": 6.20416705713304e-05, "loss": 0.0892, "step": 78570 }, { "epoch": 22.1, "learning_rate": 6.202292818542468e-05, "loss": 0.0946, "step": 78600 }, { "epoch": 22.11, "learning_rate": 6.200418579951894e-05, "loss": 0.0867, "step": 78630 }, { "epoch": 22.11, "learning_rate": 6.198544341361322e-05, "loss": 0.0987, "step": 78660 }, { "epoch": 22.12, "learning_rate": 6.196670102770749e-05, "loss": 0.0858, "step": 78690 }, { "epoch": 22.13, "learning_rate": 6.194795864180177e-05, "loss": 0.0934, "step": 78720 }, { "epoch": 22.14, "learning_rate": 6.192921625589605e-05, "loss": 0.0866, "step": 78750 }, { "epoch": 22.15, "learning_rate": 6.191047386999032e-05, "loss": 0.0881, "step": 78780 }, { "epoch": 22.16, "learning_rate": 6.189173148408459e-05, "loss": 0.0925, "step": 78810 }, { "epoch": 22.16, "learning_rate": 6.187298909817887e-05, "loss": 0.0813, "step": 78840 }, { "epoch": 22.17, "learning_rate": 6.185424671227315e-05, "loss": 0.0971, "step": 78870 }, { "epoch": 22.18, "learning_rate": 6.183550432636742e-05, "loss": 0.09, "step": 78900 }, { "epoch": 22.19, "learning_rate": 6.181676194046169e-05, "loss": 0.087, "step": 78930 }, { "epoch": 22.2, "learning_rate": 6.179801955455597e-05, "loss": 0.0986, "step": 78960 }, { "epoch": 22.21, "learning_rate": 6.177927716865025e-05, "loss": 0.0811, "step": 78990 }, { "epoch": 22.22, "learning_rate": 6.176053478274451e-05, "loss": 0.0936, "step": 79020 }, { "epoch": 22.22, "learning_rate": 6.174179239683878e-05, "loss": 0.0894, "step": 79050 }, { "epoch": 22.23, "learning_rate": 6.172305001093306e-05, "loss": 0.088, "step": 79080 }, { "epoch": 22.24, "learning_rate": 6.170430762502733e-05, "loss": 0.0985, "step": 79110 }, { "epoch": 22.25, "learning_rate": 6.168556523912161e-05, "loss": 0.0785, "step": 79140 }, { "epoch": 22.26, "learning_rate": 6.166682285321589e-05, "loss": 0.0915, "step": 79170 }, { "epoch": 22.27, "learning_rate": 6.164808046731016e-05, "loss": 0.0902, "step": 79200 }, { "epoch": 22.27, "learning_rate": 6.162933808140443e-05, "loss": 0.0908, "step": 79230 }, { "epoch": 22.28, "learning_rate": 6.161059569549871e-05, "loss": 0.0902, "step": 79260 }, { "epoch": 22.29, "learning_rate": 6.159185330959299e-05, "loss": 0.0831, "step": 79290 }, { "epoch": 22.3, "learning_rate": 6.157311092368726e-05, "loss": 0.094, "step": 79320 }, { "epoch": 22.31, "learning_rate": 6.155436853778152e-05, "loss": 0.0895, "step": 79350 }, { "epoch": 22.32, "learning_rate": 6.15356261518758e-05, "loss": 0.0919, "step": 79380 }, { "epoch": 22.32, "learning_rate": 6.151688376597009e-05, "loss": 0.1012, "step": 79410 }, { "epoch": 22.33, "learning_rate": 6.149814138006435e-05, "loss": 0.0853, "step": 79440 }, { "epoch": 22.34, "learning_rate": 6.147939899415862e-05, "loss": 0.0983, "step": 79470 }, { "epoch": 22.35, "learning_rate": 6.14606566082529e-05, "loss": 0.0947, "step": 79500 }, { "epoch": 22.36, "learning_rate": 6.144191422234717e-05, "loss": 0.0862, "step": 79530 }, { "epoch": 22.37, "learning_rate": 6.142317183644145e-05, "loss": 0.1026, "step": 79560 }, { "epoch": 22.38, "learning_rate": 6.140442945053573e-05, "loss": 0.0817, "step": 79590 }, { "epoch": 22.38, "learning_rate": 6.138568706463e-05, "loss": 0.0901, "step": 79620 }, { "epoch": 22.39, "learning_rate": 6.136694467872427e-05, "loss": 0.0937, "step": 79650 }, { "epoch": 22.4, "learning_rate": 6.134820229281855e-05, "loss": 0.088, "step": 79680 }, { "epoch": 22.41, "learning_rate": 6.132945990691283e-05, "loss": 0.0966, "step": 79710 }, { "epoch": 22.42, "learning_rate": 6.13107175210071e-05, "loss": 0.0798, "step": 79740 }, { "epoch": 22.43, "learning_rate": 6.129197513510136e-05, "loss": 0.0895, "step": 79770 }, { "epoch": 22.43, "learning_rate": 6.127323274919564e-05, "loss": 0.0903, "step": 79800 }, { "epoch": 22.44, "learning_rate": 6.125449036328992e-05, "loss": 0.0902, "step": 79830 }, { "epoch": 22.45, "learning_rate": 6.123574797738419e-05, "loss": 0.1, "step": 79860 }, { "epoch": 22.46, "learning_rate": 6.121700559147846e-05, "loss": 0.0843, "step": 79890 }, { "epoch": 22.47, "learning_rate": 6.119826320557274e-05, "loss": 0.0924, "step": 79920 }, { "epoch": 22.48, "learning_rate": 6.117952081966701e-05, "loss": 0.0926, "step": 79950 }, { "epoch": 22.49, "learning_rate": 6.116077843376129e-05, "loss": 0.0866, "step": 79980 }, { "epoch": 22.49, "learning_rate": 6.114203604785557e-05, "loss": 0.0958, "step": 80010 }, { "epoch": 22.5, "learning_rate": 6.112329366194984e-05, "loss": 0.083, "step": 80040 }, { "epoch": 22.51, "learning_rate": 6.11045512760441e-05, "loss": 0.0946, "step": 80070 }, { "epoch": 22.52, "learning_rate": 6.108580889013839e-05, "loss": 0.0865, "step": 80100 }, { "epoch": 22.53, "learning_rate": 6.106706650423267e-05, "loss": 0.086, "step": 80130 }, { "epoch": 22.54, "learning_rate": 6.104832411832693e-05, "loss": 0.0981, "step": 80160 }, { "epoch": 22.54, "learning_rate": 6.10295817324212e-05, "loss": 0.0821, "step": 80190 }, { "epoch": 22.55, "learning_rate": 6.101083934651548e-05, "loss": 0.099, "step": 80220 }, { "epoch": 22.56, "learning_rate": 6.0992096960609756e-05, "loss": 0.0893, "step": 80250 }, { "epoch": 22.57, "learning_rate": 6.097335457470403e-05, "loss": 0.0876, "step": 80280 }, { "epoch": 22.58, "learning_rate": 6.09546121887983e-05, "loss": 0.0959, "step": 80310 }, { "epoch": 22.59, "learning_rate": 6.093586980289258e-05, "loss": 0.0838, "step": 80340 }, { "epoch": 22.59, "learning_rate": 6.091712741698685e-05, "loss": 0.0925, "step": 80370 }, { "epoch": 22.6, "learning_rate": 6.089838503108113e-05, "loss": 0.0904, "step": 80400 }, { "epoch": 22.61, "learning_rate": 6.087964264517541e-05, "loss": 0.0896, "step": 80430 }, { "epoch": 22.62, "learning_rate": 6.086090025926967e-05, "loss": 0.1, "step": 80460 }, { "epoch": 22.63, "learning_rate": 6.084215787336395e-05, "loss": 0.0886, "step": 80490 }, { "epoch": 22.64, "learning_rate": 6.082404023365508e-05, "loss": 0.095, "step": 80520 }, { "epoch": 22.65, "learning_rate": 6.080529784774935e-05, "loss": 0.0905, "step": 80550 }, { "epoch": 22.65, "learning_rate": 6.078655546184363e-05, "loss": 0.0882, "step": 80580 }, { "epoch": 22.66, "learning_rate": 6.0767813075937906e-05, "loss": 0.0944, "step": 80610 }, { "epoch": 22.67, "learning_rate": 6.0749070690032174e-05, "loss": 0.0856, "step": 80640 }, { "epoch": 22.68, "learning_rate": 6.073032830412645e-05, "loss": 0.0946, "step": 80670 }, { "epoch": 22.69, "learning_rate": 6.071158591822073e-05, "loss": 0.0964, "step": 80700 }, { "epoch": 22.7, "learning_rate": 6.0692843532315e-05, "loss": 0.0852, "step": 80730 }, { "epoch": 22.7, "learning_rate": 6.067410114640928e-05, "loss": 0.0985, "step": 80760 }, { "epoch": 22.71, "learning_rate": 6.0655358760503545e-05, "loss": 0.0888, "step": 80790 }, { "epoch": 22.72, "learning_rate": 6.063661637459782e-05, "loss": 0.0967, "step": 80820 }, { "epoch": 22.73, "learning_rate": 6.06178739886921e-05, "loss": 0.0974, "step": 80850 }, { "epoch": 22.74, "learning_rate": 6.0599131602786374e-05, "loss": 0.0877, "step": 80880 }, { "epoch": 22.75, "learning_rate": 6.058038921688064e-05, "loss": 0.108, "step": 80910 }, { "epoch": 22.76, "learning_rate": 6.0561646830974916e-05, "loss": 0.0797, "step": 80940 }, { "epoch": 22.76, "learning_rate": 6.054290444506919e-05, "loss": 0.0985, "step": 80970 }, { "epoch": 22.77, "learning_rate": 6.052416205916347e-05, "loss": 0.0904, "step": 81000 }, { "epoch": 22.78, "learning_rate": 6.0505419673257745e-05, "loss": 0.0913, "step": 81030 }, { "epoch": 22.79, "learning_rate": 6.048667728735201e-05, "loss": 0.1001, "step": 81060 }, { "epoch": 22.8, "learning_rate": 6.046793490144629e-05, "loss": 0.0899, "step": 81090 }, { "epoch": 22.81, "learning_rate": 6.044919251554057e-05, "loss": 0.0933, "step": 81120 }, { "epoch": 22.81, "learning_rate": 6.043045012963484e-05, "loss": 0.0877, "step": 81150 }, { "epoch": 22.82, "learning_rate": 6.0411707743729116e-05, "loss": 0.0882, "step": 81180 }, { "epoch": 22.83, "learning_rate": 6.0392965357823384e-05, "loss": 0.0974, "step": 81210 }, { "epoch": 22.84, "learning_rate": 6.037422297191766e-05, "loss": 0.0882, "step": 81240 }, { "epoch": 22.85, "learning_rate": 6.035548058601194e-05, "loss": 0.0925, "step": 81270 }, { "epoch": 22.86, "learning_rate": 6.033673820010621e-05, "loss": 0.0925, "step": 81300 }, { "epoch": 22.86, "learning_rate": 6.031799581420048e-05, "loss": 0.084, "step": 81330 }, { "epoch": 22.87, "learning_rate": 6.0299253428294754e-05, "loss": 0.0994, "step": 81360 }, { "epoch": 22.88, "learning_rate": 6.028051104238903e-05, "loss": 0.0873, "step": 81390 }, { "epoch": 22.89, "learning_rate": 6.026176865648331e-05, "loss": 0.098, "step": 81420 }, { "epoch": 22.9, "learning_rate": 6.0243026270577584e-05, "loss": 0.0902, "step": 81450 }, { "epoch": 22.91, "learning_rate": 6.022428388467185e-05, "loss": 0.0894, "step": 81480 }, { "epoch": 22.92, "learning_rate": 6.0205541498766125e-05, "loss": 0.0956, "step": 81510 }, { "epoch": 22.92, "learning_rate": 6.0186799112860406e-05, "loss": 0.0848, "step": 81540 }, { "epoch": 22.93, "learning_rate": 6.016805672695468e-05, "loss": 0.0961, "step": 81570 }, { "epoch": 22.94, "learning_rate": 6.0149314341048955e-05, "loss": 0.0908, "step": 81600 }, { "epoch": 22.95, "learning_rate": 6.013057195514322e-05, "loss": 0.0901, "step": 81630 }, { "epoch": 22.96, "learning_rate": 6.0111829569237496e-05, "loss": 0.1035, "step": 81660 }, { "epoch": 22.97, "learning_rate": 6.009308718333178e-05, "loss": 0.0859, "step": 81690 }, { "epoch": 22.97, "learning_rate": 6.007434479742605e-05, "loss": 0.0979, "step": 81720 }, { "epoch": 22.98, "learning_rate": 6.005560241152032e-05, "loss": 0.0898, "step": 81750 }, { "epoch": 22.99, "learning_rate": 6.003686002561459e-05, "loss": 0.0918, "step": 81780 }, { "epoch": 23.0, "learning_rate": 6.001811763970887e-05, "loss": 0.0964, "step": 81810 }, { "epoch": 23.0, "eval_loss": 0.17729832231998444, "eval_runtime": 539.2851, "eval_samples_per_second": 29.73, "eval_steps_per_second": 0.931, "eval_wer": 0.14893617021276595, "step": 81811 }, { "epoch": 23.01, "learning_rate": 5.999937525380315e-05, "loss": 0.0783, "step": 81840 }, { "epoch": 23.02, "learning_rate": 5.998063286789742e-05, "loss": 0.0958, "step": 81870 }, { "epoch": 23.03, "learning_rate": 5.996189048199169e-05, "loss": 0.0909, "step": 81900 }, { "epoch": 23.03, "learning_rate": 5.9943148096085964e-05, "loss": 0.0884, "step": 81930 }, { "epoch": 23.04, "learning_rate": 5.9924405710180245e-05, "loss": 0.0905, "step": 81960 }, { "epoch": 23.05, "learning_rate": 5.990566332427452e-05, "loss": 0.0843, "step": 81990 }, { "epoch": 23.06, "learning_rate": 5.9886920938368793e-05, "loss": 0.091, "step": 82020 }, { "epoch": 23.07, "learning_rate": 5.986817855246306e-05, "loss": 0.0833, "step": 82050 }, { "epoch": 23.08, "learning_rate": 5.9849436166557335e-05, "loss": 0.0912, "step": 82080 }, { "epoch": 23.08, "learning_rate": 5.9830693780651616e-05, "loss": 0.0961, "step": 82110 }, { "epoch": 23.09, "learning_rate": 5.981195139474589e-05, "loss": 0.0854, "step": 82140 }, { "epoch": 23.1, "learning_rate": 5.979320900884016e-05, "loss": 0.0906, "step": 82170 }, { "epoch": 23.11, "learning_rate": 5.977446662293443e-05, "loss": 0.0793, "step": 82200 }, { "epoch": 23.12, "learning_rate": 5.975572423702871e-05, "loss": 0.0893, "step": 82230 }, { "epoch": 23.13, "learning_rate": 5.973698185112299e-05, "loss": 0.0944, "step": 82260 }, { "epoch": 23.13, "learning_rate": 5.971823946521726e-05, "loss": 0.0794, "step": 82290 }, { "epoch": 23.14, "learning_rate": 5.969949707931153e-05, "loss": 0.0943, "step": 82320 }, { "epoch": 23.15, "learning_rate": 5.96807546934058e-05, "loss": 0.0816, "step": 82350 }, { "epoch": 23.16, "learning_rate": 5.9662012307500084e-05, "loss": 0.0886, "step": 82380 }, { "epoch": 23.17, "learning_rate": 5.964326992159436e-05, "loss": 0.0915, "step": 82410 }, { "epoch": 23.18, "learning_rate": 5.962452753568863e-05, "loss": 0.0844, "step": 82440 }, { "epoch": 23.19, "learning_rate": 5.96057851497829e-05, "loss": 0.0913, "step": 82470 }, { "epoch": 23.19, "learning_rate": 5.9587042763877174e-05, "loss": 0.0835, "step": 82500 }, { "epoch": 23.2, "learning_rate": 5.9568300377971455e-05, "loss": 0.0888, "step": 82530 }, { "epoch": 23.21, "learning_rate": 5.954955799206573e-05, "loss": 0.0953, "step": 82560 }, { "epoch": 23.22, "learning_rate": 5.9530815606159996e-05, "loss": 0.0812, "step": 82590 }, { "epoch": 23.23, "learning_rate": 5.951207322025427e-05, "loss": 0.0925, "step": 82620 }, { "epoch": 23.24, "learning_rate": 5.949333083434855e-05, "loss": 0.0802, "step": 82650 }, { "epoch": 23.24, "learning_rate": 5.9474588448442826e-05, "loss": 0.0954, "step": 82680 }, { "epoch": 23.25, "learning_rate": 5.94558460625371e-05, "loss": 0.0904, "step": 82710 }, { "epoch": 23.26, "learning_rate": 5.943710367663137e-05, "loss": 0.0817, "step": 82740 }, { "epoch": 23.27, "learning_rate": 5.941836129072564e-05, "loss": 0.0938, "step": 82770 }, { "epoch": 23.28, "learning_rate": 5.939961890481992e-05, "loss": 0.0842, "step": 82800 }, { "epoch": 23.29, "learning_rate": 5.9380876518914197e-05, "loss": 0.0955, "step": 82830 }, { "epoch": 23.29, "learning_rate": 5.936213413300847e-05, "loss": 0.0901, "step": 82860 }, { "epoch": 23.3, "learning_rate": 5.934339174710274e-05, "loss": 0.0798, "step": 82890 }, { "epoch": 23.31, "learning_rate": 5.932464936119701e-05, "loss": 0.0934, "step": 82920 }, { "epoch": 23.32, "learning_rate": 5.930590697529129e-05, "loss": 0.0869, "step": 82950 }, { "epoch": 23.33, "learning_rate": 5.928716458938557e-05, "loss": 0.0874, "step": 82980 }, { "epoch": 23.34, "learning_rate": 5.9268422203479835e-05, "loss": 0.0876, "step": 83010 }, { "epoch": 23.35, "learning_rate": 5.924967981757411e-05, "loss": 0.0826, "step": 83040 }, { "epoch": 23.35, "learning_rate": 5.923093743166839e-05, "loss": 0.0966, "step": 83070 }, { "epoch": 23.36, "learning_rate": 5.9212195045762664e-05, "loss": 0.0846, "step": 83100 }, { "epoch": 23.37, "learning_rate": 5.919345265985694e-05, "loss": 0.0957, "step": 83130 }, { "epoch": 23.38, "learning_rate": 5.917533502014807e-05, "loss": 0.0924, "step": 83160 }, { "epoch": 23.39, "learning_rate": 5.915659263424235e-05, "loss": 0.0834, "step": 83190 }, { "epoch": 23.4, "learning_rate": 5.9137850248336614e-05, "loss": 0.0944, "step": 83220 }, { "epoch": 23.4, "learning_rate": 5.911973260862774e-05, "loss": 0.0815, "step": 83250 }, { "epoch": 23.41, "learning_rate": 5.9100990222722016e-05, "loss": 0.0868, "step": 83280 }, { "epoch": 23.42, "learning_rate": 5.90822478368163e-05, "loss": 0.0916, "step": 83310 }, { "epoch": 23.43, "learning_rate": 5.906350545091057e-05, "loss": 0.0816, "step": 83340 }, { "epoch": 23.44, "learning_rate": 5.904476306500485e-05, "loss": 0.0977, "step": 83370 }, { "epoch": 23.45, "learning_rate": 5.902602067909911e-05, "loss": 0.0878, "step": 83400 }, { "epoch": 23.46, "learning_rate": 5.9007278293193394e-05, "loss": 0.0923, "step": 83430 }, { "epoch": 23.46, "learning_rate": 5.898853590728767e-05, "loss": 0.0945, "step": 83460 }, { "epoch": 23.47, "learning_rate": 5.896979352138194e-05, "loss": 0.0828, "step": 83490 }, { "epoch": 23.48, "learning_rate": 5.895105113547622e-05, "loss": 0.0895, "step": 83520 }, { "epoch": 23.49, "learning_rate": 5.8932308749570484e-05, "loss": 0.0831, "step": 83550 }, { "epoch": 23.5, "learning_rate": 5.8913566363664765e-05, "loss": 0.0948, "step": 83580 }, { "epoch": 23.51, "learning_rate": 5.889482397775904e-05, "loss": 0.093, "step": 83610 }, { "epoch": 23.51, "learning_rate": 5.887608159185331e-05, "loss": 0.0808, "step": 83640 }, { "epoch": 23.52, "learning_rate": 5.885733920594758e-05, "loss": 0.0978, "step": 83670 }, { "epoch": 23.53, "learning_rate": 5.883859682004186e-05, "loss": 0.0801, "step": 83700 }, { "epoch": 23.54, "learning_rate": 5.8819854434136136e-05, "loss": 0.0915, "step": 83730 }, { "epoch": 23.55, "learning_rate": 5.880111204823041e-05, "loss": 0.0922, "step": 83760 }, { "epoch": 23.56, "learning_rate": 5.878236966232469e-05, "loss": 0.0833, "step": 83790 }, { "epoch": 23.56, "learning_rate": 5.876362727641895e-05, "loss": 0.0937, "step": 83820 }, { "epoch": 23.57, "learning_rate": 5.874488489051323e-05, "loss": 0.0798, "step": 83850 }, { "epoch": 23.58, "learning_rate": 5.8726142504607506e-05, "loss": 0.0898, "step": 83880 }, { "epoch": 23.59, "learning_rate": 5.870740011870178e-05, "loss": 0.0969, "step": 83910 }, { "epoch": 23.6, "learning_rate": 5.868865773279606e-05, "loss": 0.0818, "step": 83940 }, { "epoch": 23.61, "learning_rate": 5.866991534689032e-05, "loss": 0.0928, "step": 83970 }, { "epoch": 23.62, "learning_rate": 5.86511729609846e-05, "loss": 0.0825, "step": 84000 }, { "epoch": 23.62, "learning_rate": 5.863243057507888e-05, "loss": 0.0906, "step": 84030 }, { "epoch": 23.63, "learning_rate": 5.861368818917315e-05, "loss": 0.0972, "step": 84060 }, { "epoch": 23.64, "learning_rate": 5.859494580326742e-05, "loss": 0.0819, "step": 84090 }, { "epoch": 23.65, "learning_rate": 5.85762034173617e-05, "loss": 0.0984, "step": 84120 }, { "epoch": 23.66, "learning_rate": 5.8557461031455974e-05, "loss": 0.0816, "step": 84150 }, { "epoch": 23.67, "learning_rate": 5.853871864555025e-05, "loss": 0.0893, "step": 84180 }, { "epoch": 23.67, "learning_rate": 5.851997625964453e-05, "loss": 0.0938, "step": 84210 }, { "epoch": 23.68, "learning_rate": 5.850123387373879e-05, "loss": 0.0804, "step": 84240 }, { "epoch": 23.69, "learning_rate": 5.848249148783307e-05, "loss": 0.0994, "step": 84270 }, { "epoch": 23.7, "learning_rate": 5.8463749101927345e-05, "loss": 0.0842, "step": 84300 }, { "epoch": 23.71, "learning_rate": 5.844500671602162e-05, "loss": 0.0933, "step": 84330 }, { "epoch": 23.72, "learning_rate": 5.84262643301159e-05, "loss": 0.0918, "step": 84360 }, { "epoch": 23.72, "learning_rate": 5.840752194421016e-05, "loss": 0.0801, "step": 84390 }, { "epoch": 23.73, "learning_rate": 5.838877955830444e-05, "loss": 0.0955, "step": 84420 }, { "epoch": 23.74, "learning_rate": 5.8370037172398716e-05, "loss": 0.0861, "step": 84450 }, { "epoch": 23.75, "learning_rate": 5.8351294786493e-05, "loss": 0.089, "step": 84480 }, { "epoch": 23.76, "learning_rate": 5.833255240058726e-05, "loss": 0.0879, "step": 84510 }, { "epoch": 23.77, "learning_rate": 5.831381001468154e-05, "loss": 0.0822, "step": 84540 }, { "epoch": 23.78, "learning_rate": 5.829506762877581e-05, "loss": 0.0994, "step": 84570 }, { "epoch": 23.78, "learning_rate": 5.827632524287009e-05, "loss": 0.0891, "step": 84600 }, { "epoch": 23.79, "learning_rate": 5.825758285696437e-05, "loss": 0.0924, "step": 84630 }, { "epoch": 23.8, "learning_rate": 5.823884047105863e-05, "loss": 0.0912, "step": 84660 }, { "epoch": 23.81, "learning_rate": 5.822009808515291e-05, "loss": 0.0844, "step": 84690 }, { "epoch": 23.82, "learning_rate": 5.8201355699247184e-05, "loss": 0.099, "step": 84720 }, { "epoch": 23.83, "learning_rate": 5.818261331334146e-05, "loss": 0.0802, "step": 84750 }, { "epoch": 23.83, "learning_rate": 5.816387092743574e-05, "loss": 0.0929, "step": 84780 }, { "epoch": 23.84, "learning_rate": 5.814512854153e-05, "loss": 0.095, "step": 84810 }, { "epoch": 23.85, "learning_rate": 5.812638615562428e-05, "loss": 0.083, "step": 84840 }, { "epoch": 23.86, "learning_rate": 5.8107643769718555e-05, "loss": 0.092, "step": 84870 }, { "epoch": 23.87, "learning_rate": 5.8088901383812836e-05, "loss": 0.0865, "step": 84900 }, { "epoch": 23.88, "learning_rate": 5.8070158997907096e-05, "loss": 0.0936, "step": 84930 }, { "epoch": 23.89, "learning_rate": 5.805141661200138e-05, "loss": 0.0945, "step": 84960 }, { "epoch": 23.89, "learning_rate": 5.803267422609565e-05, "loss": 0.0826, "step": 84990 }, { "epoch": 23.9, "learning_rate": 5.8013931840189926e-05, "loss": 0.0921, "step": 85020 }, { "epoch": 23.91, "learning_rate": 5.799518945428421e-05, "loss": 0.0818, "step": 85050 }, { "epoch": 23.92, "learning_rate": 5.797644706837847e-05, "loss": 0.0931, "step": 85080 }, { "epoch": 23.93, "learning_rate": 5.795770468247275e-05, "loss": 0.0912, "step": 85110 }, { "epoch": 23.94, "learning_rate": 5.793896229656702e-05, "loss": 0.0818, "step": 85140 }, { "epoch": 23.94, "learning_rate": 5.79202199106613e-05, "loss": 0.0919, "step": 85170 }, { "epoch": 23.95, "learning_rate": 5.790147752475558e-05, "loss": 0.0816, "step": 85200 }, { "epoch": 23.96, "learning_rate": 5.7882735138849845e-05, "loss": 0.0941, "step": 85230 }, { "epoch": 23.97, "learning_rate": 5.786399275294412e-05, "loss": 0.0885, "step": 85260 }, { "epoch": 23.98, "learning_rate": 5.7845250367038393e-05, "loss": 0.0825, "step": 85290 }, { "epoch": 23.99, "learning_rate": 5.7826507981132674e-05, "loss": 0.0936, "step": 85320 }, { "epoch": 23.99, "learning_rate": 5.7807765595226935e-05, "loss": 0.085, "step": 85350 }, { "epoch": 24.0, "eval_loss": 0.17761550843715668, "eval_runtime": 505.4452, "eval_samples_per_second": 31.721, "eval_steps_per_second": 0.993, "eval_wer": 0.1455515674259277, "step": 85368 }, { "epoch": 24.0, "learning_rate": 5.7789023209321216e-05, "loss": 0.0938, "step": 85380 }, { "epoch": 24.01, "learning_rate": 5.777028082341549e-05, "loss": 0.0848, "step": 85410 }, { "epoch": 24.02, "learning_rate": 5.7751538437509764e-05, "loss": 0.079, "step": 85440 }, { "epoch": 24.03, "learning_rate": 5.7732796051604045e-05, "loss": 0.0943, "step": 85470 }, { "epoch": 24.04, "learning_rate": 5.7714053665698306e-05, "loss": 0.0719, "step": 85500 }, { "epoch": 24.05, "learning_rate": 5.769531127979259e-05, "loss": 0.0914, "step": 85530 }, { "epoch": 24.05, "learning_rate": 5.767656889388686e-05, "loss": 0.0834, "step": 85560 }, { "epoch": 24.06, "learning_rate": 5.7657826507981135e-05, "loss": 0.0936, "step": 85590 }, { "epoch": 24.07, "learning_rate": 5.76390841220754e-05, "loss": 0.0898, "step": 85620 }, { "epoch": 24.08, "learning_rate": 5.7620341736169684e-05, "loss": 0.0802, "step": 85650 }, { "epoch": 24.09, "learning_rate": 5.760159935026396e-05, "loss": 0.0914, "step": 85680 }, { "epoch": 24.1, "learning_rate": 5.758285696435823e-05, "loss": 0.0822, "step": 85710 }, { "epoch": 24.1, "learning_rate": 5.756411457845251e-05, "loss": 0.086, "step": 85740 }, { "epoch": 24.11, "learning_rate": 5.7545372192546774e-05, "loss": 0.0894, "step": 85770 }, { "epoch": 24.12, "learning_rate": 5.7526629806641055e-05, "loss": 0.0769, "step": 85800 }, { "epoch": 24.13, "learning_rate": 5.750851216693218e-05, "loss": 0.0922, "step": 85830 }, { "epoch": 24.14, "learning_rate": 5.7489769781026456e-05, "loss": 0.0828, "step": 85860 }, { "epoch": 24.15, "learning_rate": 5.747102739512074e-05, "loss": 0.0821, "step": 85890 }, { "epoch": 24.16, "learning_rate": 5.745228500921501e-05, "loss": 0.0929, "step": 85920 }, { "epoch": 24.16, "learning_rate": 5.7433542623309286e-05, "loss": 0.0779, "step": 85950 }, { "epoch": 24.17, "learning_rate": 5.741480023740355e-05, "loss": 0.0938, "step": 85980 }, { "epoch": 24.18, "learning_rate": 5.7396057851497834e-05, "loss": 0.0811, "step": 86010 }, { "epoch": 24.19, "learning_rate": 5.737731546559211e-05, "loss": 0.0861, "step": 86040 }, { "epoch": 24.2, "learning_rate": 5.735857307968638e-05, "loss": 0.0949, "step": 86070 }, { "epoch": 24.21, "learning_rate": 5.733983069378065e-05, "loss": 0.0736, "step": 86100 }, { "epoch": 24.21, "learning_rate": 5.7321088307874924e-05, "loss": 0.092, "step": 86130 }, { "epoch": 24.22, "learning_rate": 5.7302345921969205e-05, "loss": 0.083, "step": 86160 }, { "epoch": 24.23, "learning_rate": 5.728360353606348e-05, "loss": 0.0861, "step": 86190 }, { "epoch": 24.24, "learning_rate": 5.726486115015775e-05, "loss": 0.0967, "step": 86220 }, { "epoch": 24.25, "learning_rate": 5.724611876425202e-05, "loss": 0.0779, "step": 86250 }, { "epoch": 24.26, "learning_rate": 5.7227376378346295e-05, "loss": 0.0899, "step": 86280 }, { "epoch": 24.26, "learning_rate": 5.7208633992440576e-05, "loss": 0.0845, "step": 86310 }, { "epoch": 24.27, "learning_rate": 5.718989160653485e-05, "loss": 0.0825, "step": 86340 }, { "epoch": 24.28, "learning_rate": 5.7171149220629124e-05, "loss": 0.0979, "step": 86370 }, { "epoch": 24.29, "learning_rate": 5.715240683472339e-05, "loss": 0.0793, "step": 86400 }, { "epoch": 24.3, "learning_rate": 5.713366444881767e-05, "loss": 0.0925, "step": 86430 }, { "epoch": 24.31, "learning_rate": 5.711492206291195e-05, "loss": 0.0805, "step": 86460 }, { "epoch": 24.32, "learning_rate": 5.709617967700622e-05, "loss": 0.0881, "step": 86490 }, { "epoch": 24.32, "learning_rate": 5.707743729110049e-05, "loss": 0.1005, "step": 86520 }, { "epoch": 24.33, "learning_rate": 5.705869490519476e-05, "loss": 0.0788, "step": 86550 }, { "epoch": 24.34, "learning_rate": 5.7039952519289044e-05, "loss": 0.0922, "step": 86580 }, { "epoch": 24.35, "learning_rate": 5.702121013338332e-05, "loss": 0.0865, "step": 86610 }, { "epoch": 24.36, "learning_rate": 5.700246774747759e-05, "loss": 0.0883, "step": 86640 }, { "epoch": 24.37, "learning_rate": 5.698372536157186e-05, "loss": 0.0973, "step": 86670 }, { "epoch": 24.37, "learning_rate": 5.6964982975666134e-05, "loss": 0.0847, "step": 86700 }, { "epoch": 24.38, "learning_rate": 5.6946240589760415e-05, "loss": 0.0917, "step": 86730 }, { "epoch": 24.39, "learning_rate": 5.692749820385469e-05, "loss": 0.0784, "step": 86760 }, { "epoch": 24.4, "learning_rate": 5.6908755817948956e-05, "loss": 0.0854, "step": 86790 }, { "epoch": 24.41, "learning_rate": 5.689001343204323e-05, "loss": 0.0945, "step": 86820 }, { "epoch": 24.42, "learning_rate": 5.687127104613751e-05, "loss": 0.0747, "step": 86850 }, { "epoch": 24.43, "learning_rate": 5.6852528660231786e-05, "loss": 0.0845, "step": 86880 }, { "epoch": 24.43, "learning_rate": 5.683378627432606e-05, "loss": 0.0821, "step": 86910 }, { "epoch": 24.44, "learning_rate": 5.681504388842033e-05, "loss": 0.0873, "step": 86940 }, { "epoch": 24.45, "learning_rate": 5.67963015025146e-05, "loss": 0.0975, "step": 86970 }, { "epoch": 24.46, "learning_rate": 5.677755911660888e-05, "loss": 0.0812, "step": 87000 }, { "epoch": 24.47, "learning_rate": 5.6758816730703157e-05, "loss": 0.0905, "step": 87030 }, { "epoch": 24.48, "learning_rate": 5.674007434479743e-05, "loss": 0.0812, "step": 87060 }, { "epoch": 24.48, "learning_rate": 5.67213319588917e-05, "loss": 0.0782, "step": 87090 }, { "epoch": 24.49, "learning_rate": 5.670258957298598e-05, "loss": 0.0969, "step": 87120 }, { "epoch": 24.5, "learning_rate": 5.668384718708025e-05, "loss": 0.079, "step": 87150 }, { "epoch": 24.51, "learning_rate": 5.666510480117453e-05, "loss": 0.0904, "step": 87180 }, { "epoch": 24.52, "learning_rate": 5.6646362415268795e-05, "loss": 0.0841, "step": 87210 }, { "epoch": 24.53, "learning_rate": 5.662762002936307e-05, "loss": 0.0867, "step": 87240 }, { "epoch": 24.53, "learning_rate": 5.660887764345735e-05, "loss": 0.0931, "step": 87270 }, { "epoch": 24.54, "learning_rate": 5.6590135257551624e-05, "loss": 0.0781, "step": 87300 }, { "epoch": 24.55, "learning_rate": 5.65713928716459e-05, "loss": 0.0932, "step": 87330 }, { "epoch": 24.56, "learning_rate": 5.6552650485740166e-05, "loss": 0.0797, "step": 87360 }, { "epoch": 24.57, "learning_rate": 5.653390809983444e-05, "loss": 0.0857, "step": 87390 }, { "epoch": 24.58, "learning_rate": 5.651516571392872e-05, "loss": 0.095, "step": 87420 }, { "epoch": 24.59, "learning_rate": 5.6496423328022995e-05, "loss": 0.0788, "step": 87450 }, { "epoch": 24.59, "learning_rate": 5.647768094211727e-05, "loss": 0.0921, "step": 87480 }, { "epoch": 24.6, "learning_rate": 5.645893855621154e-05, "loss": 0.0822, "step": 87510 }, { "epoch": 24.61, "learning_rate": 5.644019617030582e-05, "loss": 0.0886, "step": 87540 }, { "epoch": 24.62, "learning_rate": 5.642145378440009e-05, "loss": 0.0961, "step": 87570 }, { "epoch": 24.63, "learning_rate": 5.6402711398494366e-05, "loss": 0.0757, "step": 87600 }, { "epoch": 24.64, "learning_rate": 5.6383969012588634e-05, "loss": 0.0877, "step": 87630 }, { "epoch": 24.64, "learning_rate": 5.636522662668291e-05, "loss": 0.0839, "step": 87660 }, { "epoch": 24.65, "learning_rate": 5.634648424077719e-05, "loss": 0.0847, "step": 87690 }, { "epoch": 24.66, "learning_rate": 5.632774185487146e-05, "loss": 0.0956, "step": 87720 }, { "epoch": 24.67, "learning_rate": 5.630899946896574e-05, "loss": 0.0766, "step": 87750 }, { "epoch": 24.68, "learning_rate": 5.6290257083060005e-05, "loss": 0.0869, "step": 87780 }, { "epoch": 24.69, "learning_rate": 5.627151469715428e-05, "loss": 0.0878, "step": 87810 }, { "epoch": 24.69, "learning_rate": 5.625277231124856e-05, "loss": 0.0876, "step": 87840 }, { "epoch": 24.7, "learning_rate": 5.6234029925342834e-05, "loss": 0.0916, "step": 87870 }, { "epoch": 24.71, "learning_rate": 5.6215287539437115e-05, "loss": 0.0781, "step": 87900 }, { "epoch": 24.72, "learning_rate": 5.6196545153531375e-05, "loss": 0.0873, "step": 87930 }, { "epoch": 24.73, "learning_rate": 5.6177802767625656e-05, "loss": 0.0825, "step": 87960 }, { "epoch": 24.74, "learning_rate": 5.615906038171993e-05, "loss": 0.0903, "step": 87990 }, { "epoch": 24.75, "learning_rate": 5.6140317995814205e-05, "loss": 0.0974, "step": 88020 }, { "epoch": 24.75, "learning_rate": 5.612157560990847e-05, "loss": 0.0757, "step": 88050 }, { "epoch": 24.76, "learning_rate": 5.6102833224002746e-05, "loss": 0.0975, "step": 88080 }, { "epoch": 24.77, "learning_rate": 5.608409083809703e-05, "loss": 0.0821, "step": 88110 }, { "epoch": 24.78, "learning_rate": 5.60653484521913e-05, "loss": 0.0868, "step": 88140 }, { "epoch": 24.79, "learning_rate": 5.6046606066285576e-05, "loss": 0.0895, "step": 88170 }, { "epoch": 24.8, "learning_rate": 5.602786368037984e-05, "loss": 0.079, "step": 88200 }, { "epoch": 24.8, "learning_rate": 5.600912129447412e-05, "loss": 0.0896, "step": 88230 }, { "epoch": 24.81, "learning_rate": 5.59903789085684e-05, "loss": 0.0845, "step": 88260 }, { "epoch": 24.82, "learning_rate": 5.597163652266267e-05, "loss": 0.0872, "step": 88290 }, { "epoch": 24.83, "learning_rate": 5.5952894136756954e-05, "loss": 0.0924, "step": 88320 }, { "epoch": 24.84, "learning_rate": 5.5934151750851214e-05, "loss": 0.0772, "step": 88350 }, { "epoch": 24.85, "learning_rate": 5.5915409364945495e-05, "loss": 0.096, "step": 88380 }, { "epoch": 24.86, "learning_rate": 5.589666697903977e-05, "loss": 0.0867, "step": 88410 }, { "epoch": 24.86, "learning_rate": 5.5877924593134043e-05, "loss": 0.0925, "step": 88440 }, { "epoch": 24.87, "learning_rate": 5.585918220722831e-05, "loss": 0.098, "step": 88470 }, { "epoch": 24.88, "learning_rate": 5.5840439821322585e-05, "loss": 0.0773, "step": 88500 }, { "epoch": 24.89, "learning_rate": 5.5821697435416866e-05, "loss": 0.0894, "step": 88530 }, { "epoch": 24.9, "learning_rate": 5.580295504951114e-05, "loss": 0.0833, "step": 88560 }, { "epoch": 24.91, "learning_rate": 5.5784212663605414e-05, "loss": 0.0885, "step": 88590 }, { "epoch": 24.91, "learning_rate": 5.576547027769968e-05, "loss": 0.0983, "step": 88620 }, { "epoch": 24.92, "learning_rate": 5.574672789179396e-05, "loss": 0.0771, "step": 88650 }, { "epoch": 24.93, "learning_rate": 5.572798550588824e-05, "loss": 0.091, "step": 88680 }, { "epoch": 24.94, "learning_rate": 5.570924311998251e-05, "loss": 0.0824, "step": 88710 }, { "epoch": 24.95, "learning_rate": 5.569050073407679e-05, "loss": 0.082, "step": 88740 }, { "epoch": 24.96, "learning_rate": 5.567175834817105e-05, "loss": 0.0929, "step": 88770 }, { "epoch": 24.96, "learning_rate": 5.5653015962265334e-05, "loss": 0.0785, "step": 88800 }, { "epoch": 24.97, "learning_rate": 5.563427357635961e-05, "loss": 0.0907, "step": 88830 }, { "epoch": 24.98, "learning_rate": 5.561553119045388e-05, "loss": 0.0865, "step": 88860 }, { "epoch": 24.99, "learning_rate": 5.559678880454815e-05, "loss": 0.0906, "step": 88890 }, { "epoch": 25.0, "learning_rate": 5.5578046418642424e-05, "loss": 0.0945, "step": 88920 }, { "epoch": 25.0, "eval_loss": 0.17860166728496552, "eval_runtime": 503.6267, "eval_samples_per_second": 31.835, "eval_steps_per_second": 0.997, "eval_wer": 0.142815225253504, "step": 88925 }, { "epoch": 25.01, "learning_rate": 5.5559304032736705e-05, "loss": 0.0802, "step": 88950 }, { "epoch": 25.02, "learning_rate": 5.554056164683098e-05, "loss": 0.0906, "step": 88980 }, { "epoch": 25.02, "learning_rate": 5.552181926092525e-05, "loss": 0.076, "step": 89010 }, { "epoch": 25.03, "learning_rate": 5.550307687501952e-05, "loss": 0.0857, "step": 89040 }, { "epoch": 25.04, "learning_rate": 5.54843344891138e-05, "loss": 0.0802, "step": 89070 }, { "epoch": 25.05, "learning_rate": 5.5465592103208076e-05, "loss": 0.0799, "step": 89100 }, { "epoch": 25.06, "learning_rate": 5.544684971730235e-05, "loss": 0.0861, "step": 89130 }, { "epoch": 25.07, "learning_rate": 5.542810733139663e-05, "loss": 0.0751, "step": 89160 }, { "epoch": 25.07, "learning_rate": 5.540936494549089e-05, "loss": 0.0899, "step": 89190 }, { "epoch": 25.08, "learning_rate": 5.539062255958517e-05, "loss": 0.0826, "step": 89220 }, { "epoch": 25.09, "learning_rate": 5.537188017367945e-05, "loss": 0.0856, "step": 89250 }, { "epoch": 25.1, "learning_rate": 5.535313778777372e-05, "loss": 0.0859, "step": 89280 }, { "epoch": 25.11, "learning_rate": 5.533439540186799e-05, "loss": 0.0768, "step": 89310 }, { "epoch": 25.12, "learning_rate": 5.531565301596226e-05, "loss": 0.088, "step": 89340 }, { "epoch": 25.13, "learning_rate": 5.5296910630056543e-05, "loss": 0.0799, "step": 89370 }, { "epoch": 25.13, "learning_rate": 5.527816824415082e-05, "loss": 0.0803, "step": 89400 }, { "epoch": 25.14, "learning_rate": 5.52594258582451e-05, "loss": 0.0905, "step": 89430 }, { "epoch": 25.15, "learning_rate": 5.524068347233936e-05, "loss": 0.0751, "step": 89460 }, { "epoch": 25.16, "learning_rate": 5.522194108643364e-05, "loss": 0.0891, "step": 89490 }, { "epoch": 25.17, "learning_rate": 5.5203198700527914e-05, "loss": 0.0835, "step": 89520 }, { "epoch": 25.18, "learning_rate": 5.518445631462219e-05, "loss": 0.0835, "step": 89550 }, { "epoch": 25.18, "learning_rate": 5.516571392871647e-05, "loss": 0.0896, "step": 89580 }, { "epoch": 25.19, "learning_rate": 5.514697154281073e-05, "loss": 0.0741, "step": 89610 }, { "epoch": 25.2, "learning_rate": 5.512822915690501e-05, "loss": 0.0939, "step": 89640 }, { "epoch": 25.21, "learning_rate": 5.5109486770999285e-05, "loss": 0.0849, "step": 89670 }, { "epoch": 25.22, "learning_rate": 5.509074438509356e-05, "loss": 0.0864, "step": 89700 }, { "epoch": 25.23, "learning_rate": 5.507200199918783e-05, "loss": 0.089, "step": 89730 }, { "epoch": 25.23, "learning_rate": 5.50532596132821e-05, "loss": 0.0745, "step": 89760 }, { "epoch": 25.24, "learning_rate": 5.503451722737638e-05, "loss": 0.091, "step": 89790 }, { "epoch": 25.25, "learning_rate": 5.5015774841470656e-05, "loss": 0.0839, "step": 89820 }, { "epoch": 25.26, "learning_rate": 5.499703245556494e-05, "loss": 0.0847, "step": 89850 }, { "epoch": 25.27, "learning_rate": 5.49782900696592e-05, "loss": 0.0913, "step": 89880 }, { "epoch": 25.28, "learning_rate": 5.495954768375348e-05, "loss": 0.0784, "step": 89910 }, { "epoch": 25.29, "learning_rate": 5.494080529784775e-05, "loss": 0.0875, "step": 89940 }, { "epoch": 25.29, "learning_rate": 5.492206291194203e-05, "loss": 0.0846, "step": 89970 }, { "epoch": 25.3, "learning_rate": 5.4903320526036295e-05, "loss": 0.0829, "step": 90000 }, { "epoch": 25.31, "learning_rate": 5.488457814013057e-05, "loss": 0.0905, "step": 90030 }, { "epoch": 25.32, "learning_rate": 5.486583575422485e-05, "loss": 0.0742, "step": 90060 }, { "epoch": 25.33, "learning_rate": 5.4847093368319124e-05, "loss": 0.0862, "step": 90090 }, { "epoch": 25.34, "learning_rate": 5.48283509824134e-05, "loss": 0.0776, "step": 90120 }, { "epoch": 25.34, "learning_rate": 5.4809608596507666e-05, "loss": 0.0821, "step": 90150 }, { "epoch": 25.35, "learning_rate": 5.4790866210601947e-05, "loss": 0.0918, "step": 90180 }, { "epoch": 25.36, "learning_rate": 5.477212382469622e-05, "loss": 0.0777, "step": 90210 }, { "epoch": 25.37, "learning_rate": 5.4753381438790495e-05, "loss": 0.0873, "step": 90240 }, { "epoch": 25.38, "learning_rate": 5.4734639052884776e-05, "loss": 0.0833, "step": 90270 }, { "epoch": 25.39, "learning_rate": 5.4715896666979037e-05, "loss": 0.0772, "step": 90300 }, { "epoch": 25.39, "learning_rate": 5.469715428107332e-05, "loss": 0.0882, "step": 90330 }, { "epoch": 25.4, "learning_rate": 5.467841189516759e-05, "loss": 0.0788, "step": 90360 }, { "epoch": 25.41, "learning_rate": 5.4659669509261866e-05, "loss": 0.0884, "step": 90390 }, { "epoch": 25.42, "learning_rate": 5.464092712335613e-05, "loss": 0.085, "step": 90420 }, { "epoch": 25.43, "learning_rate": 5.462218473745041e-05, "loss": 0.0803, "step": 90450 }, { "epoch": 25.44, "learning_rate": 5.460344235154469e-05, "loss": 0.091, "step": 90480 }, { "epoch": 25.45, "learning_rate": 5.458469996563896e-05, "loss": 0.0763, "step": 90510 }, { "epoch": 25.45, "learning_rate": 5.456595757973324e-05, "loss": 0.0876, "step": 90540 }, { "epoch": 25.46, "learning_rate": 5.4547215193827504e-05, "loss": 0.0865, "step": 90570 }, { "epoch": 25.47, "learning_rate": 5.4528472807921785e-05, "loss": 0.0815, "step": 90600 }, { "epoch": 25.48, "learning_rate": 5.450973042201606e-05, "loss": 0.0901, "step": 90630 }, { "epoch": 25.49, "learning_rate": 5.4490988036110334e-05, "loss": 0.0757, "step": 90660 }, { "epoch": 25.5, "learning_rate": 5.4472245650204615e-05, "loss": 0.0904, "step": 90690 }, { "epoch": 25.5, "learning_rate": 5.4453503264298875e-05, "loss": 0.0849, "step": 90720 }, { "epoch": 25.51, "learning_rate": 5.4434760878393156e-05, "loss": 0.0843, "step": 90750 }, { "epoch": 25.52, "learning_rate": 5.4416643238684284e-05, "loss": 0.0941, "step": 90780 }, { "epoch": 25.53, "learning_rate": 5.439790085277856e-05, "loss": 0.0802, "step": 90810 }, { "epoch": 25.54, "learning_rate": 5.437915846687284e-05, "loss": 0.0852, "step": 90840 }, { "epoch": 25.55, "learning_rate": 5.436041608096711e-05, "loss": 0.0793, "step": 90870 }, { "epoch": 25.56, "learning_rate": 5.434167369506138e-05, "loss": 0.086, "step": 90900 }, { "epoch": 25.56, "learning_rate": 5.4322931309155655e-05, "loss": 0.0929, "step": 90930 }, { "epoch": 25.57, "learning_rate": 5.4304188923249936e-05, "loss": 0.0805, "step": 90960 }, { "epoch": 25.58, "learning_rate": 5.428544653734421e-05, "loss": 0.087, "step": 90990 }, { "epoch": 25.59, "learning_rate": 5.4266704151438484e-05, "loss": 0.0838, "step": 91020 }, { "epoch": 25.6, "learning_rate": 5.424796176553275e-05, "loss": 0.0808, "step": 91050 }, { "epoch": 25.61, "learning_rate": 5.4229219379627026e-05, "loss": 0.0901, "step": 91080 }, { "epoch": 25.61, "learning_rate": 5.4210476993721306e-05, "loss": 0.0757, "step": 91110 }, { "epoch": 25.62, "learning_rate": 5.419173460781558e-05, "loss": 0.0876, "step": 91140 }, { "epoch": 25.63, "learning_rate": 5.417299222190985e-05, "loss": 0.0828, "step": 91170 }, { "epoch": 25.64, "learning_rate": 5.415424983600412e-05, "loss": 0.0881, "step": 91200 }, { "epoch": 25.65, "learning_rate": 5.4135507450098396e-05, "loss": 0.0927, "step": 91230 }, { "epoch": 25.66, "learning_rate": 5.411676506419268e-05, "loss": 0.0833, "step": 91260 }, { "epoch": 25.66, "learning_rate": 5.409802267828695e-05, "loss": 0.0837, "step": 91290 }, { "epoch": 25.67, "learning_rate": 5.407928029238122e-05, "loss": 0.0846, "step": 91320 }, { "epoch": 25.68, "learning_rate": 5.406053790647549e-05, "loss": 0.0863, "step": 91350 }, { "epoch": 25.69, "learning_rate": 5.4041795520569774e-05, "loss": 0.0921, "step": 91380 }, { "epoch": 25.7, "learning_rate": 5.402305313466405e-05, "loss": 0.0763, "step": 91410 }, { "epoch": 25.71, "learning_rate": 5.400431074875832e-05, "loss": 0.0872, "step": 91440 }, { "epoch": 25.72, "learning_rate": 5.398556836285259e-05, "loss": 0.0823, "step": 91470 }, { "epoch": 25.72, "learning_rate": 5.3966825976946864e-05, "loss": 0.0841, "step": 91500 }, { "epoch": 25.73, "learning_rate": 5.3948083591041145e-05, "loss": 0.09, "step": 91530 }, { "epoch": 25.74, "learning_rate": 5.392934120513542e-05, "loss": 0.0763, "step": 91560 }, { "epoch": 25.75, "learning_rate": 5.391059881922969e-05, "loss": 0.094, "step": 91590 }, { "epoch": 25.76, "learning_rate": 5.389185643332396e-05, "loss": 0.0783, "step": 91620 }, { "epoch": 25.77, "learning_rate": 5.3873114047418235e-05, "loss": 0.0808, "step": 91650 }, { "epoch": 25.77, "learning_rate": 5.3854371661512516e-05, "loss": 0.0896, "step": 91680 }, { "epoch": 25.78, "learning_rate": 5.383562927560679e-05, "loss": 0.0768, "step": 91710 }, { "epoch": 25.79, "learning_rate": 5.381688688970106e-05, "loss": 0.0888, "step": 91740 }, { "epoch": 25.8, "learning_rate": 5.379814450379533e-05, "loss": 0.0829, "step": 91770 }, { "epoch": 25.81, "learning_rate": 5.377940211788961e-05, "loss": 0.0793, "step": 91800 }, { "epoch": 25.82, "learning_rate": 5.376065973198389e-05, "loss": 0.1, "step": 91830 }, { "epoch": 25.83, "learning_rate": 5.374191734607816e-05, "loss": 0.0743, "step": 91860 }, { "epoch": 25.83, "learning_rate": 5.372317496017243e-05, "loss": 0.0834, "step": 91890 }, { "epoch": 25.84, "learning_rate": 5.37044325742667e-05, "loss": 0.0844, "step": 91920 }, { "epoch": 25.85, "learning_rate": 5.3685690188360984e-05, "loss": 0.0853, "step": 91950 }, { "epoch": 25.86, "learning_rate": 5.366694780245526e-05, "loss": 0.0876, "step": 91980 }, { "epoch": 25.87, "learning_rate": 5.3648205416549525e-05, "loss": 0.0716, "step": 92010 }, { "epoch": 25.88, "learning_rate": 5.36294630306438e-05, "loss": 0.0894, "step": 92040 }, { "epoch": 25.88, "learning_rate": 5.361072064473808e-05, "loss": 0.0869, "step": 92070 }, { "epoch": 25.89, "learning_rate": 5.3591978258832355e-05, "loss": 0.0816, "step": 92100 }, { "epoch": 25.9, "learning_rate": 5.357323587292663e-05, "loss": 0.0904, "step": 92130 }, { "epoch": 25.91, "learning_rate": 5.3554493487020896e-05, "loss": 0.0765, "step": 92160 }, { "epoch": 25.92, "learning_rate": 5.353575110111517e-05, "loss": 0.086, "step": 92190 }, { "epoch": 25.93, "learning_rate": 5.351700871520945e-05, "loss": 0.0827, "step": 92220 }, { "epoch": 25.93, "learning_rate": 5.3498266329303726e-05, "loss": 0.0785, "step": 92250 }, { "epoch": 25.94, "learning_rate": 5.3479523943398e-05, "loss": 0.0921, "step": 92280 }, { "epoch": 25.95, "learning_rate": 5.346078155749227e-05, "loss": 0.0794, "step": 92310 }, { "epoch": 25.96, "learning_rate": 5.344203917158654e-05, "loss": 0.0864, "step": 92340 }, { "epoch": 25.97, "learning_rate": 5.342329678568082e-05, "loss": 0.083, "step": 92370 }, { "epoch": 25.98, "learning_rate": 5.34045543997751e-05, "loss": 0.0854, "step": 92400 }, { "epoch": 25.99, "learning_rate": 5.3385812013869364e-05, "loss": 0.0924, "step": 92430 }, { "epoch": 25.99, "learning_rate": 5.336706962796364e-05, "loss": 0.0804, "step": 92460 }, { "epoch": 26.0, "eval_loss": 0.17371097207069397, "eval_runtime": 507.5317, "eval_samples_per_second": 31.59, "eval_steps_per_second": 0.989, "eval_wer": 0.14286981562103368, "step": 92482 }, { "epoch": 26.0, "learning_rate": 5.334832724205792e-05, "loss": 0.0943, "step": 92490 }, { "epoch": 26.01, "learning_rate": 5.3329584856152193e-05, "loss": 0.0759, "step": 92520 }, { "epoch": 26.02, "learning_rate": 5.331084247024647e-05, "loss": 0.0836, "step": 92550 }, { "epoch": 26.03, "learning_rate": 5.3292100084340735e-05, "loss": 0.0859, "step": 92580 }, { "epoch": 26.04, "learning_rate": 5.327335769843501e-05, "loss": 0.0722, "step": 92610 }, { "epoch": 26.04, "learning_rate": 5.325461531252929e-05, "loss": 0.0867, "step": 92640 }, { "epoch": 26.05, "learning_rate": 5.3235872926623564e-05, "loss": 0.0756, "step": 92670 }, { "epoch": 26.06, "learning_rate": 5.321713054071784e-05, "loss": 0.0839, "step": 92700 }, { "epoch": 26.07, "learning_rate": 5.3198388154812106e-05, "loss": 0.0798, "step": 92730 }, { "epoch": 26.08, "learning_rate": 5.317964576890638e-05, "loss": 0.0787, "step": 92760 }, { "epoch": 26.09, "learning_rate": 5.316090338300066e-05, "loss": 0.0854, "step": 92790 }, { "epoch": 26.1, "learning_rate": 5.3142160997094935e-05, "loss": 0.0816, "step": 92820 }, { "epoch": 26.1, "learning_rate": 5.31234186111892e-05, "loss": 0.0817, "step": 92850 }, { "epoch": 26.11, "learning_rate": 5.310467622528348e-05, "loss": 0.0864, "step": 92880 }, { "epoch": 26.12, "learning_rate": 5.308593383937776e-05, "loss": 0.0767, "step": 92910 }, { "epoch": 26.13, "learning_rate": 5.306719145347203e-05, "loss": 0.0918, "step": 92940 }, { "epoch": 26.14, "learning_rate": 5.3048449067566306e-05, "loss": 0.0748, "step": 92970 }, { "epoch": 26.15, "learning_rate": 5.3029706681660574e-05, "loss": 0.0878, "step": 93000 }, { "epoch": 26.15, "learning_rate": 5.301096429575485e-05, "loss": 0.0877, "step": 93030 }, { "epoch": 26.16, "learning_rate": 5.299222190984913e-05, "loss": 0.0787, "step": 93060 }, { "epoch": 26.17, "learning_rate": 5.29734795239434e-05, "loss": 0.0941, "step": 93090 }, { "epoch": 26.18, "learning_rate": 5.295473713803768e-05, "loss": 0.078, "step": 93120 }, { "epoch": 26.19, "learning_rate": 5.2935994752131945e-05, "loss": 0.0847, "step": 93150 }, { "epoch": 26.2, "learning_rate": 5.291725236622622e-05, "loss": 0.0847, "step": 93180 }, { "epoch": 26.2, "learning_rate": 5.28985099803205e-05, "loss": 0.0773, "step": 93210 }, { "epoch": 26.21, "learning_rate": 5.2879767594414774e-05, "loss": 0.0865, "step": 93240 }, { "epoch": 26.22, "learning_rate": 5.286102520850904e-05, "loss": 0.0835, "step": 93270 }, { "epoch": 26.23, "learning_rate": 5.2842282822603316e-05, "loss": 0.082, "step": 93300 }, { "epoch": 26.24, "learning_rate": 5.2823540436697597e-05, "loss": 0.0851, "step": 93330 }, { "epoch": 26.25, "learning_rate": 5.280479805079187e-05, "loss": 0.0791, "step": 93360 }, { "epoch": 26.26, "learning_rate": 5.2786055664886145e-05, "loss": 0.0868, "step": 93390 }, { "epoch": 26.26, "learning_rate": 5.276731327898041e-05, "loss": 0.0789, "step": 93420 }, { "epoch": 26.27, "learning_rate": 5.2748570893074687e-05, "loss": 0.0805, "step": 93450 }, { "epoch": 26.28, "learning_rate": 5.272982850716897e-05, "loss": 0.0849, "step": 93480 }, { "epoch": 26.29, "learning_rate": 5.271108612126324e-05, "loss": 0.0753, "step": 93510 }, { "epoch": 26.3, "learning_rate": 5.269296848155437e-05, "loss": 0.086, "step": 93540 }, { "epoch": 26.31, "learning_rate": 5.267422609564865e-05, "loss": 0.0782, "step": 93570 }, { "epoch": 26.31, "learning_rate": 5.265548370974292e-05, "loss": 0.0837, "step": 93600 }, { "epoch": 26.32, "learning_rate": 5.263674132383719e-05, "loss": 0.0847, "step": 93630 }, { "epoch": 26.33, "learning_rate": 5.2617998937931466e-05, "loss": 0.0776, "step": 93660 }, { "epoch": 26.34, "learning_rate": 5.259925655202575e-05, "loss": 0.0878, "step": 93690 }, { "epoch": 26.35, "learning_rate": 5.258051416612002e-05, "loss": 0.0804, "step": 93720 }, { "epoch": 26.36, "learning_rate": 5.256177178021429e-05, "loss": 0.0843, "step": 93750 }, { "epoch": 26.36, "learning_rate": 5.254302939430856e-05, "loss": 0.0802, "step": 93780 }, { "epoch": 26.37, "learning_rate": 5.252428700840284e-05, "loss": 0.0787, "step": 93810 }, { "epoch": 26.38, "learning_rate": 5.250554462249712e-05, "loss": 0.0851, "step": 93840 }, { "epoch": 26.39, "learning_rate": 5.248680223659139e-05, "loss": 0.0785, "step": 93870 }, { "epoch": 26.4, "learning_rate": 5.246805985068566e-05, "loss": 0.0848, "step": 93900 }, { "epoch": 26.41, "learning_rate": 5.2449317464779934e-05, "loss": 0.0807, "step": 93930 }, { "epoch": 26.42, "learning_rate": 5.243057507887421e-05, "loss": 0.079, "step": 93960 }, { "epoch": 26.42, "learning_rate": 5.241183269296849e-05, "loss": 0.088, "step": 93990 }, { "epoch": 26.43, "learning_rate": 5.2393090307062756e-05, "loss": 0.0778, "step": 94020 }, { "epoch": 26.44, "learning_rate": 5.237434792115703e-05, "loss": 0.0871, "step": 94050 }, { "epoch": 26.45, "learning_rate": 5.2355605535251305e-05, "loss": 0.0805, "step": 94080 }, { "epoch": 26.46, "learning_rate": 5.2336863149345586e-05, "loss": 0.0832, "step": 94110 }, { "epoch": 26.47, "learning_rate": 5.231812076343986e-05, "loss": 0.0872, "step": 94140 }, { "epoch": 26.47, "learning_rate": 5.229937837753413e-05, "loss": 0.0773, "step": 94170 }, { "epoch": 26.48, "learning_rate": 5.22806359916284e-05, "loss": 0.0886, "step": 94200 }, { "epoch": 26.49, "learning_rate": 5.2261893605722676e-05, "loss": 0.0831, "step": 94230 }, { "epoch": 26.5, "learning_rate": 5.2243151219816957e-05, "loss": 0.0801, "step": 94260 }, { "epoch": 26.51, "learning_rate": 5.222440883391123e-05, "loss": 0.0872, "step": 94290 }, { "epoch": 26.52, "learning_rate": 5.22056664480055e-05, "loss": 0.0794, "step": 94320 }, { "epoch": 26.53, "learning_rate": 5.218692406209977e-05, "loss": 0.083, "step": 94350 }, { "epoch": 26.53, "learning_rate": 5.216818167619405e-05, "loss": 0.0816, "step": 94380 }, { "epoch": 26.54, "learning_rate": 5.214943929028833e-05, "loss": 0.0771, "step": 94410 }, { "epoch": 26.55, "learning_rate": 5.2130696904382595e-05, "loss": 0.0885, "step": 94440 }, { "epoch": 26.56, "learning_rate": 5.211195451847687e-05, "loss": 0.0748, "step": 94470 }, { "epoch": 26.57, "learning_rate": 5.209321213257114e-05, "loss": 0.0867, "step": 94500 }, { "epoch": 26.58, "learning_rate": 5.2074469746665424e-05, "loss": 0.0869, "step": 94530 }, { "epoch": 26.58, "learning_rate": 5.20557273607597e-05, "loss": 0.0754, "step": 94560 }, { "epoch": 26.59, "learning_rate": 5.2036984974853966e-05, "loss": 0.0903, "step": 94590 }, { "epoch": 26.6, "learning_rate": 5.201824258894824e-05, "loss": 0.0746, "step": 94620 }, { "epoch": 26.61, "learning_rate": 5.1999500203042514e-05, "loss": 0.0859, "step": 94650 }, { "epoch": 26.62, "learning_rate": 5.1980757817136795e-05, "loss": 0.0879, "step": 94680 }, { "epoch": 26.63, "learning_rate": 5.196201543123107e-05, "loss": 0.0744, "step": 94710 }, { "epoch": 26.63, "learning_rate": 5.194327304532534e-05, "loss": 0.0881, "step": 94740 }, { "epoch": 26.64, "learning_rate": 5.192453065941961e-05, "loss": 0.0761, "step": 94770 }, { "epoch": 26.65, "learning_rate": 5.190578827351389e-05, "loss": 0.0849, "step": 94800 }, { "epoch": 26.66, "learning_rate": 5.1887045887608166e-05, "loss": 0.0855, "step": 94830 }, { "epoch": 26.67, "learning_rate": 5.1868303501702434e-05, "loss": 0.076, "step": 94860 }, { "epoch": 26.68, "learning_rate": 5.184956111579671e-05, "loss": 0.0815, "step": 94890 }, { "epoch": 26.69, "learning_rate": 5.183081872989098e-05, "loss": 0.0818, "step": 94920 }, { "epoch": 26.69, "learning_rate": 5.181207634398526e-05, "loss": 0.0862, "step": 94950 }, { "epoch": 26.7, "learning_rate": 5.179333395807954e-05, "loss": 0.0882, "step": 94980 }, { "epoch": 26.71, "learning_rate": 5.1774591572173804e-05, "loss": 0.0773, "step": 95010 }, { "epoch": 26.72, "learning_rate": 5.175584918626808e-05, "loss": 0.0928, "step": 95040 }, { "epoch": 26.73, "learning_rate": 5.173710680036235e-05, "loss": 0.0805, "step": 95070 }, { "epoch": 26.74, "learning_rate": 5.1718364414456634e-05, "loss": 0.0857, "step": 95100 }, { "epoch": 26.74, "learning_rate": 5.169962202855091e-05, "loss": 0.0881, "step": 95130 }, { "epoch": 26.75, "learning_rate": 5.1680879642645175e-05, "loss": 0.0795, "step": 95160 }, { "epoch": 26.76, "learning_rate": 5.166213725673945e-05, "loss": 0.083, "step": 95190 }, { "epoch": 26.77, "learning_rate": 5.164339487083373e-05, "loss": 0.075, "step": 95220 }, { "epoch": 26.78, "learning_rate": 5.1624652484928005e-05, "loss": 0.082, "step": 95250 }, { "epoch": 26.79, "learning_rate": 5.160591009902227e-05, "loss": 0.0811, "step": 95280 }, { "epoch": 26.79, "learning_rate": 5.1587167713116546e-05, "loss": 0.0798, "step": 95310 }, { "epoch": 26.8, "learning_rate": 5.156842532721082e-05, "loss": 0.0893, "step": 95340 }, { "epoch": 26.81, "learning_rate": 5.15496829413051e-05, "loss": 0.0768, "step": 95370 }, { "epoch": 26.82, "learning_rate": 5.1530940555399376e-05, "loss": 0.0892, "step": 95400 }, { "epoch": 26.83, "learning_rate": 5.151219816949364e-05, "loss": 0.084, "step": 95430 }, { "epoch": 26.84, "learning_rate": 5.149345578358792e-05, "loss": 0.079, "step": 95460 }, { "epoch": 26.85, "learning_rate": 5.147471339768219e-05, "loss": 0.0995, "step": 95490 }, { "epoch": 26.85, "learning_rate": 5.145597101177647e-05, "loss": 0.0821, "step": 95520 }, { "epoch": 26.86, "learning_rate": 5.143722862587074e-05, "loss": 0.0874, "step": 95550 }, { "epoch": 26.87, "learning_rate": 5.1418486239965014e-05, "loss": 0.0838, "step": 95580 }, { "epoch": 26.88, "learning_rate": 5.139974385405929e-05, "loss": 0.0803, "step": 95610 }, { "epoch": 26.89, "learning_rate": 5.138100146815357e-05, "loss": 0.089, "step": 95640 }, { "epoch": 26.9, "learning_rate": 5.1362259082247843e-05, "loss": 0.0766, "step": 95670 }, { "epoch": 26.9, "learning_rate": 5.134351669634211e-05, "loss": 0.0893, "step": 95700 }, { "epoch": 26.91, "learning_rate": 5.1324774310436385e-05, "loss": 0.0878, "step": 95730 }, { "epoch": 26.92, "learning_rate": 5.130603192453066e-05, "loss": 0.0833, "step": 95760 }, { "epoch": 26.93, "learning_rate": 5.128728953862494e-05, "loss": 0.0942, "step": 95790 }, { "epoch": 26.94, "learning_rate": 5.1268547152719214e-05, "loss": 0.0756, "step": 95820 }, { "epoch": 26.95, "learning_rate": 5.124980476681348e-05, "loss": 0.0826, "step": 95850 }, { "epoch": 26.96, "learning_rate": 5.1231062380907756e-05, "loss": 0.0812, "step": 95880 }, { "epoch": 26.96, "learning_rate": 5.121231999500204e-05, "loss": 0.0837, "step": 95910 }, { "epoch": 26.97, "learning_rate": 5.1194202355293164e-05, "loss": 0.0896, "step": 95940 }, { "epoch": 26.98, "learning_rate": 5.117545996938744e-05, "loss": 0.0797, "step": 95970 }, { "epoch": 26.99, "learning_rate": 5.115671758348172e-05, "loss": 0.0854, "step": 96000 }, { "epoch": 27.0, "learning_rate": 5.113797519757598e-05, "loss": 0.0832, "step": 96030 }, { "epoch": 27.0, "eval_loss": 0.17894543707370758, "eval_runtime": 507.5418, "eval_samples_per_second": 31.59, "eval_steps_per_second": 0.989, "eval_wer": 0.13943062246666577, "step": 96039 }, { "epoch": 27.01, "learning_rate": 5.111923281167026e-05, "loss": 0.081, "step": 96060 }, { "epoch": 27.01, "learning_rate": 5.1100490425764535e-05, "loss": 0.0886, "step": 96090 }, { "epoch": 27.02, "learning_rate": 5.108174803985881e-05, "loss": 0.0685, "step": 96120 }, { "epoch": 27.03, "learning_rate": 5.106300565395309e-05, "loss": 0.0845, "step": 96150 }, { "epoch": 27.04, "learning_rate": 5.104488801424422e-05, "loss": 0.0777, "step": 96180 }, { "epoch": 27.05, "learning_rate": 5.102614562833849e-05, "loss": 0.0776, "step": 96210 }, { "epoch": 27.06, "learning_rate": 5.100740324243276e-05, "loss": 0.086, "step": 96240 }, { "epoch": 27.06, "learning_rate": 5.098866085652704e-05, "loss": 0.0698, "step": 96270 }, { "epoch": 27.07, "learning_rate": 5.0969918470621315e-05, "loss": 0.082, "step": 96300 }, { "epoch": 27.08, "learning_rate": 5.095117608471559e-05, "loss": 0.0777, "step": 96330 }, { "epoch": 27.09, "learning_rate": 5.0932433698809856e-05, "loss": 0.0844, "step": 96360 }, { "epoch": 27.1, "learning_rate": 5.091369131290413e-05, "loss": 0.0874, "step": 96390 }, { "epoch": 27.11, "learning_rate": 5.089494892699841e-05, "loss": 0.0745, "step": 96420 }, { "epoch": 27.12, "learning_rate": 5.0876206541092686e-05, "loss": 0.0863, "step": 96450 }, { "epoch": 27.12, "learning_rate": 5.085746415518696e-05, "loss": 0.0814, "step": 96480 }, { "epoch": 27.13, "learning_rate": 5.083872176928123e-05, "loss": 0.0806, "step": 96510 }, { "epoch": 27.14, "learning_rate": 5.08199793833755e-05, "loss": 0.0872, "step": 96540 }, { "epoch": 27.15, "learning_rate": 5.080123699746978e-05, "loss": 0.0735, "step": 96570 }, { "epoch": 27.16, "learning_rate": 5.078249461156406e-05, "loss": 0.0811, "step": 96600 }, { "epoch": 27.17, "learning_rate": 5.076375222565834e-05, "loss": 0.0789, "step": 96630 }, { "epoch": 27.17, "learning_rate": 5.07450098397526e-05, "loss": 0.0836, "step": 96660 }, { "epoch": 27.18, "learning_rate": 5.072626745384688e-05, "loss": 0.0919, "step": 96690 }, { "epoch": 27.19, "learning_rate": 5.0707525067941153e-05, "loss": 0.0715, "step": 96720 }, { "epoch": 27.2, "learning_rate": 5.068878268203543e-05, "loss": 0.0844, "step": 96750 }, { "epoch": 27.21, "learning_rate": 5.0670040296129695e-05, "loss": 0.0794, "step": 96780 }, { "epoch": 27.22, "learning_rate": 5.065129791022397e-05, "loss": 0.0876, "step": 96810 }, { "epoch": 27.23, "learning_rate": 5.063255552431825e-05, "loss": 0.0904, "step": 96840 }, { "epoch": 27.23, "learning_rate": 5.0613813138412524e-05, "loss": 0.0739, "step": 96870 }, { "epoch": 27.24, "learning_rate": 5.05950707525068e-05, "loss": 0.0841, "step": 96900 }, { "epoch": 27.25, "learning_rate": 5.0576328366601066e-05, "loss": 0.0775, "step": 96930 }, { "epoch": 27.26, "learning_rate": 5.055758598069534e-05, "loss": 0.0806, "step": 96960 }, { "epoch": 27.27, "learning_rate": 5.053884359478962e-05, "loss": 0.0901, "step": 96990 }, { "epoch": 27.28, "learning_rate": 5.0520101208883895e-05, "loss": 0.0717, "step": 97020 }, { "epoch": 27.28, "learning_rate": 5.050135882297816e-05, "loss": 0.0798, "step": 97050 }, { "epoch": 27.29, "learning_rate": 5.048261643707244e-05, "loss": 0.0796, "step": 97080 }, { "epoch": 27.3, "learning_rate": 5.046387405116672e-05, "loss": 0.0857, "step": 97110 }, { "epoch": 27.31, "learning_rate": 5.044513166526099e-05, "loss": 0.0905, "step": 97140 }, { "epoch": 27.32, "learning_rate": 5.0426389279355266e-05, "loss": 0.0728, "step": 97170 }, { "epoch": 27.33, "learning_rate": 5.0407646893449534e-05, "loss": 0.0853, "step": 97200 }, { "epoch": 27.33, "learning_rate": 5.038890450754381e-05, "loss": 0.0789, "step": 97230 }, { "epoch": 27.34, "learning_rate": 5.037016212163809e-05, "loss": 0.0774, "step": 97260 }, { "epoch": 27.35, "learning_rate": 5.035141973573236e-05, "loss": 0.0922, "step": 97290 }, { "epoch": 27.36, "learning_rate": 5.033267734982664e-05, "loss": 0.072, "step": 97320 }, { "epoch": 27.37, "learning_rate": 5.0313934963920905e-05, "loss": 0.0839, "step": 97350 }, { "epoch": 27.38, "learning_rate": 5.0295192578015186e-05, "loss": 0.0781, "step": 97380 }, { "epoch": 27.39, "learning_rate": 5.027645019210946e-05, "loss": 0.082, "step": 97410 }, { "epoch": 27.39, "learning_rate": 5.0257707806203734e-05, "loss": 0.0847, "step": 97440 }, { "epoch": 27.4, "learning_rate": 5.0238965420298e-05, "loss": 0.0744, "step": 97470 }, { "epoch": 27.41, "learning_rate": 5.0220223034392276e-05, "loss": 0.0853, "step": 97500 }, { "epoch": 27.42, "learning_rate": 5.0201480648486557e-05, "loss": 0.073, "step": 97530 }, { "epoch": 27.43, "learning_rate": 5.018273826258083e-05, "loss": 0.0738, "step": 97560 }, { "epoch": 27.44, "learning_rate": 5.0163995876675105e-05, "loss": 0.0832, "step": 97590 }, { "epoch": 27.44, "learning_rate": 5.014525349076937e-05, "loss": 0.0737, "step": 97620 }, { "epoch": 27.45, "learning_rate": 5.0126511104863647e-05, "loss": 0.0899, "step": 97650 }, { "epoch": 27.46, "learning_rate": 5.010776871895793e-05, "loss": 0.0724, "step": 97680 }, { "epoch": 27.47, "learning_rate": 5.00890263330522e-05, "loss": 0.0775, "step": 97710 }, { "epoch": 27.48, "learning_rate": 5.0070283947146476e-05, "loss": 0.0845, "step": 97740 }, { "epoch": 27.49, "learning_rate": 5.005154156124074e-05, "loss": 0.0731, "step": 97770 }, { "epoch": 27.5, "learning_rate": 5.0032799175335024e-05, "loss": 0.0887, "step": 97800 }, { "epoch": 27.5, "learning_rate": 5.00140567894293e-05, "loss": 0.0752, "step": 97830 }, { "epoch": 27.51, "learning_rate": 4.9995314403523566e-05, "loss": 0.0789, "step": 97860 }, { "epoch": 27.52, "learning_rate": 4.997657201761785e-05, "loss": 0.088, "step": 97890 }, { "epoch": 27.53, "learning_rate": 4.995782963171212e-05, "loss": 0.0717, "step": 97920 }, { "epoch": 27.54, "learning_rate": 4.9939711992003255e-05, "loss": 0.0812, "step": 97950 }, { "epoch": 27.55, "learning_rate": 4.992096960609752e-05, "loss": 0.0775, "step": 97980 }, { "epoch": 27.55, "learning_rate": 4.99022272201918e-05, "loss": 0.0838, "step": 98010 }, { "epoch": 27.56, "learning_rate": 4.988348483428608e-05, "loss": 0.0828, "step": 98040 }, { "epoch": 27.57, "learning_rate": 4.9864742448380345e-05, "loss": 0.0754, "step": 98070 }, { "epoch": 27.58, "learning_rate": 4.9846000062474626e-05, "loss": 0.0857, "step": 98100 }, { "epoch": 27.59, "learning_rate": 4.9827257676568894e-05, "loss": 0.0792, "step": 98130 }, { "epoch": 27.6, "learning_rate": 4.9808515290663175e-05, "loss": 0.081, "step": 98160 }, { "epoch": 27.6, "learning_rate": 4.978977290475744e-05, "loss": 0.0903, "step": 98190 }, { "epoch": 27.61, "learning_rate": 4.9771030518851716e-05, "loss": 0.0697, "step": 98220 }, { "epoch": 27.62, "learning_rate": 4.9752288132946e-05, "loss": 0.0831, "step": 98250 }, { "epoch": 27.63, "learning_rate": 4.9733545747040265e-05, "loss": 0.0775, "step": 98280 }, { "epoch": 27.64, "learning_rate": 4.9714803361134546e-05, "loss": 0.0806, "step": 98310 }, { "epoch": 27.65, "learning_rate": 4.969606097522881e-05, "loss": 0.0896, "step": 98340 }, { "epoch": 27.66, "learning_rate": 4.9677318589323094e-05, "loss": 0.0721, "step": 98370 }, { "epoch": 27.66, "learning_rate": 4.965857620341736e-05, "loss": 0.0842, "step": 98400 }, { "epoch": 27.67, "learning_rate": 4.9639833817511635e-05, "loss": 0.0806, "step": 98430 }, { "epoch": 27.68, "learning_rate": 4.9621091431605916e-05, "loss": 0.0837, "step": 98460 }, { "epoch": 27.69, "learning_rate": 4.9602349045700184e-05, "loss": 0.0857, "step": 98490 }, { "epoch": 27.7, "learning_rate": 4.9583606659794465e-05, "loss": 0.072, "step": 98520 }, { "epoch": 27.71, "learning_rate": 4.956486427388873e-05, "loss": 0.0852, "step": 98550 }, { "epoch": 27.71, "learning_rate": 4.954612188798301e-05, "loss": 0.0756, "step": 98580 }, { "epoch": 27.72, "learning_rate": 4.952737950207728e-05, "loss": 0.0751, "step": 98610 }, { "epoch": 27.73, "learning_rate": 4.9508637116171555e-05, "loss": 0.0875, "step": 98640 }, { "epoch": 27.74, "learning_rate": 4.9489894730265836e-05, "loss": 0.0756, "step": 98670 }, { "epoch": 27.75, "learning_rate": 4.94711523443601e-05, "loss": 0.0835, "step": 98700 }, { "epoch": 27.76, "learning_rate": 4.9452409958454384e-05, "loss": 0.0758, "step": 98730 }, { "epoch": 27.76, "learning_rate": 4.943366757254865e-05, "loss": 0.0805, "step": 98760 }, { "epoch": 27.77, "learning_rate": 4.941492518664293e-05, "loss": 0.0908, "step": 98790 }, { "epoch": 27.78, "learning_rate": 4.93961828007372e-05, "loss": 0.0686, "step": 98820 }, { "epoch": 27.79, "learning_rate": 4.9377440414831474e-05, "loss": 0.0823, "step": 98850 }, { "epoch": 27.8, "learning_rate": 4.9358698028925755e-05, "loss": 0.0782, "step": 98880 }, { "epoch": 27.81, "learning_rate": 4.933995564302002e-05, "loss": 0.0835, "step": 98910 }, { "epoch": 27.82, "learning_rate": 4.9321213257114304e-05, "loss": 0.0905, "step": 98940 }, { "epoch": 27.82, "learning_rate": 4.930247087120857e-05, "loss": 0.0749, "step": 98970 }, { "epoch": 27.83, "learning_rate": 4.928372848530285e-05, "loss": 0.0906, "step": 99000 }, { "epoch": 27.84, "learning_rate": 4.926498609939712e-05, "loss": 0.0759, "step": 99030 }, { "epoch": 27.85, "learning_rate": 4.9246243713491394e-05, "loss": 0.0774, "step": 99060 }, { "epoch": 27.86, "learning_rate": 4.9227501327585674e-05, "loss": 0.0854, "step": 99090 }, { "epoch": 27.87, "learning_rate": 4.920875894167994e-05, "loss": 0.0737, "step": 99120 }, { "epoch": 27.87, "learning_rate": 4.919001655577422e-05, "loss": 0.0804, "step": 99150 }, { "epoch": 27.88, "learning_rate": 4.917127416986849e-05, "loss": 0.0797, "step": 99180 }, { "epoch": 27.89, "learning_rate": 4.915253178396277e-05, "loss": 0.0857, "step": 99210 }, { "epoch": 27.9, "learning_rate": 4.913378939805704e-05, "loss": 0.0884, "step": 99240 }, { "epoch": 27.91, "learning_rate": 4.911504701215131e-05, "loss": 0.071, "step": 99270 }, { "epoch": 27.92, "learning_rate": 4.9096304626245594e-05, "loss": 0.0831, "step": 99300 }, { "epoch": 27.93, "learning_rate": 4.907756224033986e-05, "loss": 0.077, "step": 99330 }, { "epoch": 27.93, "learning_rate": 4.905881985443414e-05, "loss": 0.0806, "step": 99360 }, { "epoch": 27.94, "learning_rate": 4.904007746852841e-05, "loss": 0.0897, "step": 99390 }, { "epoch": 27.95, "learning_rate": 4.902133508262269e-05, "loss": 0.0747, "step": 99420 }, { "epoch": 27.96, "learning_rate": 4.900259269671696e-05, "loss": 0.0819, "step": 99450 }, { "epoch": 27.97, "learning_rate": 4.898385031081124e-05, "loss": 0.0781, "step": 99480 }, { "epoch": 27.98, "learning_rate": 4.896510792490551e-05, "loss": 0.0808, "step": 99510 }, { "epoch": 27.98, "learning_rate": 4.894636553899978e-05, "loss": 0.0893, "step": 99540 }, { "epoch": 27.99, "learning_rate": 4.892762315309406e-05, "loss": 0.0683, "step": 99570 }, { "epoch": 28.0, "eval_loss": 0.17405028641223907, "eval_runtime": 504.0127, "eval_samples_per_second": 31.811, "eval_steps_per_second": 0.996, "eval_wer": 0.1390484898939582, "step": 99596 }, { "epoch": 28.0, "learning_rate": 4.890888076718833e-05, "loss": 0.0901, "step": 99600 }, { "epoch": 28.01, "learning_rate": 4.889013838128261e-05, "loss": 0.0696, "step": 99630 }, { "epoch": 28.02, "learning_rate": 4.887139599537688e-05, "loss": 0.0792, "step": 99660 }, { "epoch": 28.03, "learning_rate": 4.885265360947116e-05, "loss": 0.0727, "step": 99690 }, { "epoch": 28.03, "learning_rate": 4.8833911223565426e-05, "loss": 0.0806, "step": 99720 }, { "epoch": 28.04, "learning_rate": 4.88151688376597e-05, "loss": 0.0846, "step": 99750 }, { "epoch": 28.05, "learning_rate": 4.879642645175398e-05, "loss": 0.0689, "step": 99780 }, { "epoch": 28.06, "learning_rate": 4.877768406584825e-05, "loss": 0.0813, "step": 99810 }, { "epoch": 28.07, "learning_rate": 4.875894167994253e-05, "loss": 0.0765, "step": 99840 }, { "epoch": 28.08, "learning_rate": 4.87401992940368e-05, "loss": 0.0702, "step": 99870 }, { "epoch": 28.09, "learning_rate": 4.872145690813108e-05, "loss": 0.084, "step": 99900 }, { "epoch": 28.09, "learning_rate": 4.8702714522225345e-05, "loss": 0.0721, "step": 99930 }, { "epoch": 28.1, "learning_rate": 4.868397213631962e-05, "loss": 0.0775, "step": 99960 }, { "epoch": 28.11, "learning_rate": 4.86652297504139e-05, "loss": 0.0758, "step": 99990 }, { "epoch": 28.12, "learning_rate": 4.864648736450817e-05, "loss": 0.0764, "step": 100020 }, { "epoch": 28.13, "learning_rate": 4.862774497860245e-05, "loss": 0.0849, "step": 100050 }, { "epoch": 28.14, "learning_rate": 4.8609002592696716e-05, "loss": 0.0691, "step": 100080 }, { "epoch": 28.14, "learning_rate": 4.8590260206791e-05, "loss": 0.079, "step": 100110 }, { "epoch": 28.15, "learning_rate": 4.8571517820885264e-05, "loss": 0.0777, "step": 100140 }, { "epoch": 28.16, "learning_rate": 4.855277543497954e-05, "loss": 0.0761, "step": 100170 }, { "epoch": 28.17, "learning_rate": 4.853403304907382e-05, "loss": 0.0843, "step": 100200 }, { "epoch": 28.18, "learning_rate": 4.851529066316809e-05, "loss": 0.071, "step": 100230 }, { "epoch": 28.19, "learning_rate": 4.849654827726237e-05, "loss": 0.0842, "step": 100260 }, { "epoch": 28.2, "learning_rate": 4.8477805891356635e-05, "loss": 0.0778, "step": 100290 }, { "epoch": 28.2, "learning_rate": 4.8459063505450916e-05, "loss": 0.0767, "step": 100320 }, { "epoch": 28.21, "learning_rate": 4.8440321119545184e-05, "loss": 0.0876, "step": 100350 }, { "epoch": 28.22, "learning_rate": 4.842157873363946e-05, "loss": 0.0721, "step": 100380 }, { "epoch": 28.23, "learning_rate": 4.840283634773374e-05, "loss": 0.0829, "step": 100410 }, { "epoch": 28.24, "learning_rate": 4.8384093961828006e-05, "loss": 0.0797, "step": 100440 }, { "epoch": 28.25, "learning_rate": 4.836535157592229e-05, "loss": 0.0775, "step": 100470 }, { "epoch": 28.25, "learning_rate": 4.8346609190016555e-05, "loss": 0.081, "step": 100500 }, { "epoch": 28.26, "learning_rate": 4.8327866804110836e-05, "loss": 0.0684, "step": 100530 }, { "epoch": 28.27, "learning_rate": 4.83091244182051e-05, "loss": 0.0847, "step": 100560 }, { "epoch": 28.28, "learning_rate": 4.829038203229938e-05, "loss": 0.0765, "step": 100590 }, { "epoch": 28.29, "learning_rate": 4.827163964639366e-05, "loss": 0.0819, "step": 100620 }, { "epoch": 28.3, "learning_rate": 4.8252897260487926e-05, "loss": 0.0865, "step": 100650 }, { "epoch": 28.3, "learning_rate": 4.8234154874582207e-05, "loss": 0.0685, "step": 100680 }, { "epoch": 28.31, "learning_rate": 4.8215412488676474e-05, "loss": 0.0824, "step": 100710 }, { "epoch": 28.32, "learning_rate": 4.8196670102770755e-05, "loss": 0.0759, "step": 100740 }, { "epoch": 28.33, "learning_rate": 4.817792771686502e-05, "loss": 0.076, "step": 100770 }, { "epoch": 28.34, "learning_rate": 4.81591853309593e-05, "loss": 0.0874, "step": 100800 }, { "epoch": 28.35, "learning_rate": 4.814044294505358e-05, "loss": 0.0693, "step": 100830 }, { "epoch": 28.36, "learning_rate": 4.8121700559147845e-05, "loss": 0.079, "step": 100860 }, { "epoch": 28.36, "learning_rate": 4.8102958173242126e-05, "loss": 0.0758, "step": 100890 }, { "epoch": 28.37, "learning_rate": 4.808421578733639e-05, "loss": 0.0777, "step": 100920 }, { "epoch": 28.38, "learning_rate": 4.8065473401430674e-05, "loss": 0.0839, "step": 100950 }, { "epoch": 28.39, "learning_rate": 4.804673101552494e-05, "loss": 0.0735, "step": 100980 }, { "epoch": 28.4, "learning_rate": 4.802798862961922e-05, "loss": 0.0807, "step": 101010 }, { "epoch": 28.41, "learning_rate": 4.80092462437135e-05, "loss": 0.0827, "step": 101040 }, { "epoch": 28.41, "learning_rate": 4.7990503857807764e-05, "loss": 0.0817, "step": 101070 }, { "epoch": 28.42, "learning_rate": 4.7971761471902045e-05, "loss": 0.083, "step": 101100 }, { "epoch": 28.43, "learning_rate": 4.795301908599631e-05, "loss": 0.0715, "step": 101130 }, { "epoch": 28.44, "learning_rate": 4.7934276700090594e-05, "loss": 0.0833, "step": 101160 }, { "epoch": 28.45, "learning_rate": 4.791553431418486e-05, "loss": 0.0769, "step": 101190 }, { "epoch": 28.46, "learning_rate": 4.789679192827914e-05, "loss": 0.0804, "step": 101220 }, { "epoch": 28.46, "learning_rate": 4.7878049542373416e-05, "loss": 0.0848, "step": 101250 }, { "epoch": 28.47, "learning_rate": 4.7859307156467684e-05, "loss": 0.066, "step": 101280 }, { "epoch": 28.48, "learning_rate": 4.7840564770561965e-05, "loss": 0.0854, "step": 101310 }, { "epoch": 28.49, "learning_rate": 4.782182238465623e-05, "loss": 0.0778, "step": 101340 }, { "epoch": 28.5, "learning_rate": 4.780307999875051e-05, "loss": 0.0797, "step": 101370 }, { "epoch": 28.51, "learning_rate": 4.778433761284478e-05, "loss": 0.0888, "step": 101400 }, { "epoch": 28.52, "learning_rate": 4.776559522693906e-05, "loss": 0.0721, "step": 101430 }, { "epoch": 28.52, "learning_rate": 4.7746852841033336e-05, "loss": 0.0865, "step": 101460 }, { "epoch": 28.53, "learning_rate": 4.77281104551276e-05, "loss": 0.0771, "step": 101490 }, { "epoch": 28.54, "learning_rate": 4.7709368069221884e-05, "loss": 0.0756, "step": 101520 }, { "epoch": 28.55, "learning_rate": 4.769062568331615e-05, "loss": 0.0855, "step": 101550 }, { "epoch": 28.56, "learning_rate": 4.767188329741043e-05, "loss": 0.0727, "step": 101580 }, { "epoch": 28.57, "learning_rate": 4.76531409115047e-05, "loss": 0.0831, "step": 101610 }, { "epoch": 28.57, "learning_rate": 4.763439852559898e-05, "loss": 0.08, "step": 101640 }, { "epoch": 28.58, "learning_rate": 4.7615656139693255e-05, "loss": 0.076, "step": 101670 }, { "epoch": 28.59, "learning_rate": 4.759691375378752e-05, "loss": 0.0856, "step": 101700 }, { "epoch": 28.6, "learning_rate": 4.75781713678818e-05, "loss": 0.0746, "step": 101730 }, { "epoch": 28.61, "learning_rate": 4.755942898197607e-05, "loss": 0.0843, "step": 101760 }, { "epoch": 28.62, "learning_rate": 4.754068659607035e-05, "loss": 0.0768, "step": 101790 }, { "epoch": 28.63, "learning_rate": 4.752194421016462e-05, "loss": 0.0799, "step": 101820 }, { "epoch": 28.63, "learning_rate": 4.75032018242589e-05, "loss": 0.0891, "step": 101850 }, { "epoch": 28.64, "learning_rate": 4.7484459438353174e-05, "loss": 0.0719, "step": 101880 }, { "epoch": 28.65, "learning_rate": 4.746571705244744e-05, "loss": 0.0836, "step": 101910 }, { "epoch": 28.66, "learning_rate": 4.744697466654172e-05, "loss": 0.0736, "step": 101940 }, { "epoch": 28.67, "learning_rate": 4.742823228063599e-05, "loss": 0.0755, "step": 101970 }, { "epoch": 28.68, "learning_rate": 4.740948989473027e-05, "loss": 0.0851, "step": 102000 }, { "epoch": 28.68, "learning_rate": 4.739074750882454e-05, "loss": 0.0715, "step": 102030 }, { "epoch": 28.69, "learning_rate": 4.737200512291882e-05, "loss": 0.0837, "step": 102060 }, { "epoch": 28.7, "learning_rate": 4.7353262737013094e-05, "loss": 0.079, "step": 102090 }, { "epoch": 28.71, "learning_rate": 4.733452035110736e-05, "loss": 0.0755, "step": 102120 }, { "epoch": 28.72, "learning_rate": 4.731577796520164e-05, "loss": 0.0904, "step": 102150 }, { "epoch": 28.73, "learning_rate": 4.729703557929591e-05, "loss": 0.0769, "step": 102180 }, { "epoch": 28.73, "learning_rate": 4.727829319339019e-05, "loss": 0.0791, "step": 102210 }, { "epoch": 28.74, "learning_rate": 4.725955080748446e-05, "loss": 0.0824, "step": 102240 }, { "epoch": 28.75, "learning_rate": 4.724080842157874e-05, "loss": 0.0743, "step": 102270 }, { "epoch": 28.76, "learning_rate": 4.722206603567301e-05, "loss": 0.0833, "step": 102300 }, { "epoch": 28.77, "learning_rate": 4.720332364976729e-05, "loss": 0.0729, "step": 102330 }, { "epoch": 28.78, "learning_rate": 4.718458126386156e-05, "loss": 0.0796, "step": 102360 }, { "epoch": 28.79, "learning_rate": 4.716583887795583e-05, "loss": 0.0812, "step": 102390 }, { "epoch": 28.79, "learning_rate": 4.714709649205011e-05, "loss": 0.0808, "step": 102420 }, { "epoch": 28.8, "learning_rate": 4.712835410614438e-05, "loss": 0.0863, "step": 102450 }, { "epoch": 28.81, "learning_rate": 4.710961172023866e-05, "loss": 0.072, "step": 102480 }, { "epoch": 28.82, "learning_rate": 4.709086933433293e-05, "loss": 0.0865, "step": 102510 }, { "epoch": 28.83, "learning_rate": 4.7072126948427206e-05, "loss": 0.077, "step": 102540 }, { "epoch": 28.84, "learning_rate": 4.705338456252148e-05, "loss": 0.0726, "step": 102570 }, { "epoch": 28.84, "learning_rate": 4.703464217661575e-05, "loss": 0.0873, "step": 102600 }, { "epoch": 28.85, "learning_rate": 4.701589979071003e-05, "loss": 0.0751, "step": 102630 }, { "epoch": 28.86, "learning_rate": 4.6997157404804296e-05, "loss": 0.0856, "step": 102660 }, { "epoch": 28.87, "learning_rate": 4.697841501889858e-05, "loss": 0.0805, "step": 102690 }, { "epoch": 28.88, "learning_rate": 4.695967263299285e-05, "loss": 0.0808, "step": 102720 }, { "epoch": 28.89, "learning_rate": 4.6940930247087126e-05, "loss": 0.0881, "step": 102750 }, { "epoch": 28.9, "learning_rate": 4.69221878611814e-05, "loss": 0.0678, "step": 102780 }, { "epoch": 28.9, "learning_rate": 4.690344547527567e-05, "loss": 0.0798, "step": 102810 }, { "epoch": 28.91, "learning_rate": 4.688470308936995e-05, "loss": 0.0816, "step": 102840 }, { "epoch": 28.92, "learning_rate": 4.6865960703464216e-05, "loss": 0.0761, "step": 102870 }, { "epoch": 28.93, "learning_rate": 4.68472183175585e-05, "loss": 0.081, "step": 102900 }, { "epoch": 28.94, "learning_rate": 4.682847593165277e-05, "loss": 0.0742, "step": 102930 }, { "epoch": 28.95, "learning_rate": 4.6809733545747045e-05, "loss": 0.0839, "step": 102960 }, { "epoch": 28.95, "learning_rate": 4.679099115984132e-05, "loss": 0.0795, "step": 102990 }, { "epoch": 28.96, "learning_rate": 4.677287352013245e-05, "loss": 0.0747, "step": 103020 }, { "epoch": 28.97, "learning_rate": 4.675413113422673e-05, "loss": 0.0859, "step": 103050 }, { "epoch": 28.98, "learning_rate": 4.6735388748320995e-05, "loss": 0.0709, "step": 103080 }, { "epoch": 28.99, "learning_rate": 4.6716646362415276e-05, "loss": 0.0851, "step": 103110 }, { "epoch": 29.0, "learning_rate": 4.6697903976509543e-05, "loss": 0.0761, "step": 103140 }, { "epoch": 29.0, "eval_loss": 0.16884161531925201, "eval_runtime": 504.2221, "eval_samples_per_second": 31.797, "eval_steps_per_second": 0.996, "eval_wer": 0.1379225635636592, "step": 103153 }, { "epoch": 29.0, "learning_rate": 4.667916159060382e-05, "loss": 0.0795, "step": 103170 }, { "epoch": 29.01, "learning_rate": 4.666041920469809e-05, "loss": 0.0801, "step": 103200 }, { "epoch": 29.02, "learning_rate": 4.6641676818792366e-05, "loss": 0.078, "step": 103230 }, { "epoch": 29.03, "learning_rate": 4.662293443288665e-05, "loss": 0.0773, "step": 103260 }, { "epoch": 29.04, "learning_rate": 4.6604192046980914e-05, "loss": 0.073, "step": 103290 }, { "epoch": 29.05, "learning_rate": 4.6585449661075195e-05, "loss": 0.0767, "step": 103320 }, { "epoch": 29.06, "learning_rate": 4.656670727516946e-05, "loss": 0.0747, "step": 103350 }, { "epoch": 29.06, "learning_rate": 4.654796488926374e-05, "loss": 0.0705, "step": 103380 }, { "epoch": 29.07, "learning_rate": 4.652922250335801e-05, "loss": 0.0811, "step": 103410 }, { "epoch": 29.08, "learning_rate": 4.6510480117452285e-05, "loss": 0.0723, "step": 103440 }, { "epoch": 29.09, "learning_rate": 4.6491737731546566e-05, "loss": 0.0787, "step": 103470 }, { "epoch": 29.1, "learning_rate": 4.6472995345640834e-05, "loss": 0.0768, "step": 103500 }, { "epoch": 29.11, "learning_rate": 4.6454252959735115e-05, "loss": 0.0724, "step": 103530 }, { "epoch": 29.11, "learning_rate": 4.643551057382938e-05, "loss": 0.0837, "step": 103560 }, { "epoch": 29.12, "learning_rate": 4.6416768187923656e-05, "loss": 0.0678, "step": 103590 }, { "epoch": 29.13, "learning_rate": 4.639802580201793e-05, "loss": 0.0787, "step": 103620 }, { "epoch": 29.14, "learning_rate": 4.6379283416112205e-05, "loss": 0.0766, "step": 103650 }, { "epoch": 29.15, "learning_rate": 4.6360541030206486e-05, "loss": 0.0735, "step": 103680 }, { "epoch": 29.16, "learning_rate": 4.634179864430075e-05, "loss": 0.0764, "step": 103710 }, { "epoch": 29.17, "learning_rate": 4.6323056258395034e-05, "loss": 0.0708, "step": 103740 }, { "epoch": 29.17, "learning_rate": 4.63043138724893e-05, "loss": 0.0829, "step": 103770 }, { "epoch": 29.18, "learning_rate": 4.6285571486583576e-05, "loss": 0.079, "step": 103800 }, { "epoch": 29.19, "learning_rate": 4.626682910067785e-05, "loss": 0.0735, "step": 103830 }, { "epoch": 29.2, "learning_rate": 4.6248086714772124e-05, "loss": 0.0796, "step": 103860 }, { "epoch": 29.21, "learning_rate": 4.6229344328866405e-05, "loss": 0.0697, "step": 103890 }, { "epoch": 29.22, "learning_rate": 4.621060194296067e-05, "loss": 0.0766, "step": 103920 }, { "epoch": 29.22, "learning_rate": 4.619185955705495e-05, "loss": 0.0761, "step": 103950 }, { "epoch": 29.23, "learning_rate": 4.617311717114922e-05, "loss": 0.0731, "step": 103980 }, { "epoch": 29.24, "learning_rate": 4.6154374785243495e-05, "loss": 0.0812, "step": 104010 }, { "epoch": 29.25, "learning_rate": 4.613563239933777e-05, "loss": 0.0717, "step": 104040 }, { "epoch": 29.26, "learning_rate": 4.611689001343204e-05, "loss": 0.0798, "step": 104070 }, { "epoch": 29.27, "learning_rate": 4.609814762752632e-05, "loss": 0.0769, "step": 104100 }, { "epoch": 29.27, "learning_rate": 4.607940524162059e-05, "loss": 0.0744, "step": 104130 }, { "epoch": 29.28, "learning_rate": 4.606066285571487e-05, "loss": 0.0809, "step": 104160 }, { "epoch": 29.29, "learning_rate": 4.604192046980914e-05, "loss": 0.0728, "step": 104190 }, { "epoch": 29.3, "learning_rate": 4.6023178083903414e-05, "loss": 0.0783, "step": 104220 }, { "epoch": 29.31, "learning_rate": 4.600443569799769e-05, "loss": 0.0741, "step": 104250 }, { "epoch": 29.32, "learning_rate": 4.598569331209196e-05, "loss": 0.0725, "step": 104280 }, { "epoch": 29.33, "learning_rate": 4.596695092618624e-05, "loss": 0.0855, "step": 104310 }, { "epoch": 29.33, "learning_rate": 4.594820854028051e-05, "loss": 0.0706, "step": 104340 }, { "epoch": 29.34, "learning_rate": 4.592946615437479e-05, "loss": 0.0829, "step": 104370 }, { "epoch": 29.35, "learning_rate": 4.591072376846906e-05, "loss": 0.0805, "step": 104400 }, { "epoch": 29.36, "learning_rate": 4.589198138256334e-05, "loss": 0.0733, "step": 104430 }, { "epoch": 29.37, "learning_rate": 4.587323899665761e-05, "loss": 0.0785, "step": 104460 }, { "epoch": 29.38, "learning_rate": 4.585449661075188e-05, "loss": 0.067, "step": 104490 }, { "epoch": 29.38, "learning_rate": 4.5835754224846156e-05, "loss": 0.0796, "step": 104520 }, { "epoch": 29.39, "learning_rate": 4.581701183894043e-05, "loss": 0.079, "step": 104550 }, { "epoch": 29.4, "learning_rate": 4.579826945303471e-05, "loss": 0.0743, "step": 104580 }, { "epoch": 29.41, "learning_rate": 4.577952706712898e-05, "loss": 0.0806, "step": 104610 }, { "epoch": 29.42, "learning_rate": 4.576078468122326e-05, "loss": 0.0676, "step": 104640 }, { "epoch": 29.43, "learning_rate": 4.574204229531753e-05, "loss": 0.0739, "step": 104670 }, { "epoch": 29.43, "learning_rate": 4.57232999094118e-05, "loss": 0.0772, "step": 104700 }, { "epoch": 29.44, "learning_rate": 4.5704557523506076e-05, "loss": 0.0772, "step": 104730 }, { "epoch": 29.45, "learning_rate": 4.568581513760035e-05, "loss": 0.0837, "step": 104760 }, { "epoch": 29.46, "learning_rate": 4.566707275169463e-05, "loss": 0.0748, "step": 104790 }, { "epoch": 29.47, "learning_rate": 4.56483303657889e-05, "loss": 0.0779, "step": 104820 }, { "epoch": 29.48, "learning_rate": 4.562958797988318e-05, "loss": 0.0797, "step": 104850 }, { "epoch": 29.49, "learning_rate": 4.5610845593977447e-05, "loss": 0.079, "step": 104880 }, { "epoch": 29.49, "learning_rate": 4.559210320807172e-05, "loss": 0.0863, "step": 104910 }, { "epoch": 29.5, "learning_rate": 4.5573360822165995e-05, "loss": 0.0685, "step": 104940 }, { "epoch": 29.51, "learning_rate": 4.555461843626027e-05, "loss": 0.0788, "step": 104970 }, { "epoch": 29.52, "learning_rate": 4.553587605035455e-05, "loss": 0.0795, "step": 105000 }, { "epoch": 29.53, "learning_rate": 4.551713366444882e-05, "loss": 0.0681, "step": 105030 }, { "epoch": 29.54, "learning_rate": 4.549901602473995e-05, "loss": 0.0824, "step": 105060 }, { "epoch": 29.54, "learning_rate": 4.5480273638834226e-05, "loss": 0.07, "step": 105090 }, { "epoch": 29.55, "learning_rate": 4.54615312529285e-05, "loss": 0.0744, "step": 105120 }, { "epoch": 29.56, "learning_rate": 4.5442788867022774e-05, "loss": 0.0818, "step": 105150 }, { "epoch": 29.57, "learning_rate": 4.542404648111705e-05, "loss": 0.0759, "step": 105180 }, { "epoch": 29.58, "learning_rate": 4.540530409521132e-05, "loss": 0.0817, "step": 105210 }, { "epoch": 29.59, "learning_rate": 4.53865617093056e-05, "loss": 0.0694, "step": 105240 }, { "epoch": 29.6, "learning_rate": 4.536781932339987e-05, "loss": 0.0796, "step": 105270 }, { "epoch": 29.6, "learning_rate": 4.5349076937494145e-05, "loss": 0.0778, "step": 105300 }, { "epoch": 29.61, "learning_rate": 4.533033455158842e-05, "loss": 0.0717, "step": 105330 }, { "epoch": 29.62, "learning_rate": 4.5311592165682694e-05, "loss": 0.0786, "step": 105360 }, { "epoch": 29.63, "learning_rate": 4.529284977977697e-05, "loss": 0.075, "step": 105390 }, { "epoch": 29.64, "learning_rate": 4.527410739387124e-05, "loss": 0.0798, "step": 105420 }, { "epoch": 29.65, "learning_rate": 4.5255365007965516e-05, "loss": 0.0775, "step": 105450 }, { "epoch": 29.65, "learning_rate": 4.523662262205979e-05, "loss": 0.0785, "step": 105480 }, { "epoch": 29.66, "learning_rate": 4.5217880236154065e-05, "loss": 0.0831, "step": 105510 }, { "epoch": 29.67, "learning_rate": 4.519913785024834e-05, "loss": 0.0715, "step": 105540 }, { "epoch": 29.68, "learning_rate": 4.518039546434261e-05, "loss": 0.0793, "step": 105570 }, { "epoch": 29.69, "learning_rate": 4.516165307843689e-05, "loss": 0.079, "step": 105600 }, { "epoch": 29.7, "learning_rate": 4.514291069253116e-05, "loss": 0.0714, "step": 105630 }, { "epoch": 29.7, "learning_rate": 4.5124168306625435e-05, "loss": 0.081, "step": 105660 }, { "epoch": 29.71, "learning_rate": 4.510542592071971e-05, "loss": 0.0654, "step": 105690 }, { "epoch": 29.72, "learning_rate": 4.5086683534813984e-05, "loss": 0.0782, "step": 105720 }, { "epoch": 29.73, "learning_rate": 4.506794114890826e-05, "loss": 0.0768, "step": 105750 }, { "epoch": 29.74, "learning_rate": 4.504919876300253e-05, "loss": 0.0735, "step": 105780 }, { "epoch": 29.75, "learning_rate": 4.5030456377096806e-05, "loss": 0.08, "step": 105810 }, { "epoch": 29.76, "learning_rate": 4.501171399119108e-05, "loss": 0.0737, "step": 105840 }, { "epoch": 29.76, "learning_rate": 4.4992971605285355e-05, "loss": 0.0811, "step": 105870 }, { "epoch": 29.77, "learning_rate": 4.497422921937963e-05, "loss": 0.0814, "step": 105900 }, { "epoch": 29.78, "learning_rate": 4.49554868334739e-05, "loss": 0.0803, "step": 105930 }, { "epoch": 29.79, "learning_rate": 4.493674444756818e-05, "loss": 0.0851, "step": 105960 }, { "epoch": 29.8, "learning_rate": 4.491800206166245e-05, "loss": 0.0689, "step": 105990 }, { "epoch": 29.81, "learning_rate": 4.4899259675756726e-05, "loss": 0.0775, "step": 106020 }, { "epoch": 29.81, "learning_rate": 4.4880517289851e-05, "loss": 0.0799, "step": 106050 }, { "epoch": 29.82, "learning_rate": 4.4861774903945274e-05, "loss": 0.0739, "step": 106080 }, { "epoch": 29.83, "learning_rate": 4.484303251803955e-05, "loss": 0.0798, "step": 106110 }, { "epoch": 29.84, "learning_rate": 4.482429013213382e-05, "loss": 0.0688, "step": 106140 }, { "epoch": 29.85, "learning_rate": 4.48055477462281e-05, "loss": 0.0817, "step": 106170 }, { "epoch": 29.86, "learning_rate": 4.478680536032237e-05, "loss": 0.0755, "step": 106200 }, { "epoch": 29.86, "learning_rate": 4.4768062974416645e-05, "loss": 0.0779, "step": 106230 }, { "epoch": 29.87, "learning_rate": 4.474932058851092e-05, "loss": 0.0822, "step": 106260 }, { "epoch": 29.88, "learning_rate": 4.4730578202605193e-05, "loss": 0.0724, "step": 106290 }, { "epoch": 29.89, "learning_rate": 4.471183581669947e-05, "loss": 0.0782, "step": 106320 }, { "epoch": 29.9, "learning_rate": 4.469309343079374e-05, "loss": 0.0734, "step": 106350 }, { "epoch": 29.91, "learning_rate": 4.4674351044888016e-05, "loss": 0.0763, "step": 106380 }, { "epoch": 29.92, "learning_rate": 4.465560865898229e-05, "loss": 0.0879, "step": 106410 }, { "epoch": 29.92, "learning_rate": 4.4636866273076564e-05, "loss": 0.0741, "step": 106440 }, { "epoch": 29.93, "learning_rate": 4.461812388717084e-05, "loss": 0.0808, "step": 106470 }, { "epoch": 29.94, "learning_rate": 4.459938150126511e-05, "loss": 0.0785, "step": 106500 }, { "epoch": 29.95, "learning_rate": 4.458063911535939e-05, "loss": 0.0715, "step": 106530 }, { "epoch": 29.96, "learning_rate": 4.456189672945366e-05, "loss": 0.0826, "step": 106560 }, { "epoch": 29.97, "learning_rate": 4.4543154343547935e-05, "loss": 0.0769, "step": 106590 }, { "epoch": 29.97, "learning_rate": 4.452441195764221e-05, "loss": 0.0789, "step": 106620 }, { "epoch": 29.98, "learning_rate": 4.4505669571736484e-05, "loss": 0.0756, "step": 106650 }, { "epoch": 29.99, "learning_rate": 4.448692718583076e-05, "loss": 0.0798, "step": 106680 }, { "epoch": 30.0, "learning_rate": 4.446818479992503e-05, "loss": 0.0833, "step": 106710 }, { "epoch": 30.0, "eval_loss": 0.17258290946483612, "eval_runtime": 506.0764, "eval_samples_per_second": 31.681, "eval_steps_per_second": 0.992, "eval_wer": 0.13696040833594914, "step": 106710 }, { "epoch": 30.01, "learning_rate": 4.4449442414019306e-05, "loss": 0.0671, "step": 106740 }, { "epoch": 30.02, "learning_rate": 4.443070002811358e-05, "loss": 0.0827, "step": 106770 }, { "epoch": 30.03, "learning_rate": 4.4411957642207855e-05, "loss": 0.0711, "step": 106800 }, { "epoch": 30.03, "learning_rate": 4.439321525630213e-05, "loss": 0.0783, "step": 106830 }, { "epoch": 30.04, "learning_rate": 4.43744728703964e-05, "loss": 0.0789, "step": 106860 }, { "epoch": 30.05, "learning_rate": 4.435573048449068e-05, "loss": 0.0674, "step": 106890 }, { "epoch": 30.06, "learning_rate": 4.433698809858495e-05, "loss": 0.0807, "step": 106920 }, { "epoch": 30.07, "learning_rate": 4.4318245712679226e-05, "loss": 0.069, "step": 106950 }, { "epoch": 30.08, "learning_rate": 4.42995033267735e-05, "loss": 0.0757, "step": 106980 }, { "epoch": 30.08, "learning_rate": 4.4280760940867774e-05, "loss": 0.0769, "step": 107010 }, { "epoch": 30.09, "learning_rate": 4.426201855496205e-05, "loss": 0.0683, "step": 107040 }, { "epoch": 30.1, "learning_rate": 4.424327616905632e-05, "loss": 0.0827, "step": 107070 }, { "epoch": 30.11, "learning_rate": 4.42245337831506e-05, "loss": 0.0689, "step": 107100 }, { "epoch": 30.12, "learning_rate": 4.420579139724487e-05, "loss": 0.075, "step": 107130 }, { "epoch": 30.13, "learning_rate": 4.4187049011339145e-05, "loss": 0.0843, "step": 107160 }, { "epoch": 30.13, "learning_rate": 4.416830662543342e-05, "loss": 0.0668, "step": 107190 }, { "epoch": 30.14, "learning_rate": 4.4149564239527693e-05, "loss": 0.0776, "step": 107220 }, { "epoch": 30.15, "learning_rate": 4.413082185362197e-05, "loss": 0.0678, "step": 107250 }, { "epoch": 30.16, "learning_rate": 4.411207946771624e-05, "loss": 0.0759, "step": 107280 }, { "epoch": 30.17, "learning_rate": 4.4093337081810516e-05, "loss": 0.0749, "step": 107310 }, { "epoch": 30.18, "learning_rate": 4.407459469590479e-05, "loss": 0.0633, "step": 107340 }, { "epoch": 30.19, "learning_rate": 4.4055852309999064e-05, "loss": 0.075, "step": 107370 }, { "epoch": 30.19, "learning_rate": 4.403710992409334e-05, "loss": 0.0706, "step": 107400 }, { "epoch": 30.2, "learning_rate": 4.401836753818761e-05, "loss": 0.0728, "step": 107430 }, { "epoch": 30.21, "learning_rate": 4.399962515228189e-05, "loss": 0.0838, "step": 107460 }, { "epoch": 30.22, "learning_rate": 4.398088276637616e-05, "loss": 0.0633, "step": 107490 }, { "epoch": 30.23, "learning_rate": 4.3962140380470435e-05, "loss": 0.0811, "step": 107520 }, { "epoch": 30.24, "learning_rate": 4.394339799456471e-05, "loss": 0.0734, "step": 107550 }, { "epoch": 30.24, "learning_rate": 4.3924655608658984e-05, "loss": 0.074, "step": 107580 }, { "epoch": 30.25, "learning_rate": 4.390591322275326e-05, "loss": 0.0857, "step": 107610 }, { "epoch": 30.26, "learning_rate": 4.388717083684753e-05, "loss": 0.067, "step": 107640 }, { "epoch": 30.27, "learning_rate": 4.3868428450941806e-05, "loss": 0.0819, "step": 107670 }, { "epoch": 30.28, "learning_rate": 4.384968606503608e-05, "loss": 0.0696, "step": 107700 }, { "epoch": 30.29, "learning_rate": 4.3830943679130355e-05, "loss": 0.0794, "step": 107730 }, { "epoch": 30.3, "learning_rate": 4.381220129322463e-05, "loss": 0.0793, "step": 107760 }, { "epoch": 30.3, "learning_rate": 4.37934589073189e-05, "loss": 0.0663, "step": 107790 }, { "epoch": 30.31, "learning_rate": 4.377471652141318e-05, "loss": 0.0837, "step": 107820 }, { "epoch": 30.32, "learning_rate": 4.375597413550746e-05, "loss": 0.0678, "step": 107850 }, { "epoch": 30.33, "learning_rate": 4.3737231749601726e-05, "loss": 0.0759, "step": 107880 }, { "epoch": 30.34, "learning_rate": 4.3718489363696e-05, "loss": 0.0829, "step": 107910 }, { "epoch": 30.35, "learning_rate": 4.3699746977790274e-05, "loss": 0.0726, "step": 107940 }, { "epoch": 30.35, "learning_rate": 4.368100459188455e-05, "loss": 0.0777, "step": 107970 }, { "epoch": 30.36, "learning_rate": 4.366226220597882e-05, "loss": 0.0726, "step": 108000 }, { "epoch": 30.37, "learning_rate": 4.3643519820073097e-05, "loss": 0.0811, "step": 108030 }, { "epoch": 30.38, "learning_rate": 4.362477743416738e-05, "loss": 0.082, "step": 108060 }, { "epoch": 30.39, "learning_rate": 4.3606035048261645e-05, "loss": 0.0697, "step": 108090 }, { "epoch": 30.4, "learning_rate": 4.358729266235592e-05, "loss": 0.0796, "step": 108120 }, { "epoch": 30.4, "learning_rate": 4.356855027645019e-05, "loss": 0.0698, "step": 108150 }, { "epoch": 30.41, "learning_rate": 4.354980789054447e-05, "loss": 0.079, "step": 108180 }, { "epoch": 30.42, "learning_rate": 4.353106550463874e-05, "loss": 0.0828, "step": 108210 }, { "epoch": 30.43, "learning_rate": 4.3512323118733016e-05, "loss": 0.0682, "step": 108240 }, { "epoch": 30.44, "learning_rate": 4.34935807328273e-05, "loss": 0.0858, "step": 108270 }, { "epoch": 30.45, "learning_rate": 4.3474838346921564e-05, "loss": 0.076, "step": 108300 }, { "epoch": 30.46, "learning_rate": 4.345609596101584e-05, "loss": 0.0731, "step": 108330 }, { "epoch": 30.46, "learning_rate": 4.343735357511011e-05, "loss": 0.0752, "step": 108360 }, { "epoch": 30.47, "learning_rate": 4.341861118920439e-05, "loss": 0.0666, "step": 108390 }, { "epoch": 30.48, "learning_rate": 4.339986880329866e-05, "loss": 0.0776, "step": 108420 }, { "epoch": 30.49, "learning_rate": 4.3381126417392935e-05, "loss": 0.0693, "step": 108450 }, { "epoch": 30.5, "learning_rate": 4.336238403148721e-05, "loss": 0.072, "step": 108480 }, { "epoch": 30.51, "learning_rate": 4.3343641645581484e-05, "loss": 0.0791, "step": 108510 }, { "epoch": 30.51, "learning_rate": 4.332489925967576e-05, "loss": 0.0724, "step": 108540 }, { "epoch": 30.52, "learning_rate": 4.330615687377003e-05, "loss": 0.0732, "step": 108570 }, { "epoch": 30.53, "learning_rate": 4.3287414487864306e-05, "loss": 0.0653, "step": 108600 }, { "epoch": 30.54, "learning_rate": 4.326867210195858e-05, "loss": 0.0739, "step": 108630 }, { "epoch": 30.55, "learning_rate": 4.3249929716052855e-05, "loss": 0.0801, "step": 108660 }, { "epoch": 30.56, "learning_rate": 4.323118733014713e-05, "loss": 0.0671, "step": 108690 }, { "epoch": 30.57, "learning_rate": 4.32124449442414e-05, "loss": 0.0822, "step": 108720 }, { "epoch": 30.57, "learning_rate": 4.319370255833568e-05, "loss": 0.071, "step": 108750 }, { "epoch": 30.58, "learning_rate": 4.317496017242995e-05, "loss": 0.0774, "step": 108780 }, { "epoch": 30.59, "learning_rate": 4.3156217786524225e-05, "loss": 0.082, "step": 108810 }, { "epoch": 30.6, "learning_rate": 4.31374754006185e-05, "loss": 0.0675, "step": 108840 }, { "epoch": 30.61, "learning_rate": 4.3118733014712774e-05, "loss": 0.0816, "step": 108870 }, { "epoch": 30.62, "learning_rate": 4.309999062880705e-05, "loss": 0.0709, "step": 108900 }, { "epoch": 30.62, "learning_rate": 4.308124824290132e-05, "loss": 0.0743, "step": 108930 }, { "epoch": 30.63, "learning_rate": 4.3062505856995596e-05, "loss": 0.0817, "step": 108960 }, { "epoch": 30.64, "learning_rate": 4.304376347108987e-05, "loss": 0.072, "step": 108990 }, { "epoch": 30.65, "learning_rate": 4.3025021085184145e-05, "loss": 0.0858, "step": 109020 }, { "epoch": 30.66, "learning_rate": 4.300627869927842e-05, "loss": 0.0747, "step": 109050 }, { "epoch": 30.67, "learning_rate": 4.298753631337269e-05, "loss": 0.076, "step": 109080 }, { "epoch": 30.67, "learning_rate": 4.296879392746697e-05, "loss": 0.0823, "step": 109110 }, { "epoch": 30.68, "learning_rate": 4.295005154156124e-05, "loss": 0.0695, "step": 109140 }, { "epoch": 30.69, "learning_rate": 4.2931933901852376e-05, "loss": 0.0779, "step": 109170 }, { "epoch": 30.7, "learning_rate": 4.291319151594665e-05, "loss": 0.0732, "step": 109200 }, { "epoch": 30.71, "learning_rate": 4.289507387623778e-05, "loss": 0.079, "step": 109230 }, { "epoch": 30.72, "learning_rate": 4.287633149033206e-05, "loss": 0.083, "step": 109260 }, { "epoch": 30.73, "learning_rate": 4.2857589104426326e-05, "loss": 0.0726, "step": 109290 }, { "epoch": 30.73, "learning_rate": 4.28388467185206e-05, "loss": 0.0793, "step": 109320 }, { "epoch": 30.74, "learning_rate": 4.282010433261488e-05, "loss": 0.0714, "step": 109350 }, { "epoch": 30.75, "learning_rate": 4.280136194670915e-05, "loss": 0.0753, "step": 109380 }, { "epoch": 30.76, "learning_rate": 4.278261956080343e-05, "loss": 0.0886, "step": 109410 }, { "epoch": 30.77, "learning_rate": 4.27638771748977e-05, "loss": 0.0705, "step": 109440 }, { "epoch": 30.78, "learning_rate": 4.274513478899198e-05, "loss": 0.0826, "step": 109470 }, { "epoch": 30.78, "learning_rate": 4.2726392403086245e-05, "loss": 0.0712, "step": 109500 }, { "epoch": 30.79, "learning_rate": 4.2707650017180526e-05, "loss": 0.0717, "step": 109530 }, { "epoch": 30.8, "learning_rate": 4.26889076312748e-05, "loss": 0.0787, "step": 109560 }, { "epoch": 30.81, "learning_rate": 4.267016524536907e-05, "loss": 0.0677, "step": 109590 }, { "epoch": 30.82, "learning_rate": 4.265142285946335e-05, "loss": 0.0852, "step": 109620 }, { "epoch": 30.83, "learning_rate": 4.2632680473557616e-05, "loss": 0.0714, "step": 109650 }, { "epoch": 30.83, "learning_rate": 4.26139380876519e-05, "loss": 0.0792, "step": 109680 }, { "epoch": 30.84, "learning_rate": 4.2595195701746164e-05, "loss": 0.0828, "step": 109710 }, { "epoch": 30.85, "learning_rate": 4.2576453315840445e-05, "loss": 0.0699, "step": 109740 }, { "epoch": 30.86, "learning_rate": 4.255771092993472e-05, "loss": 0.0783, "step": 109770 }, { "epoch": 30.87, "learning_rate": 4.253896854402899e-05, "loss": 0.076, "step": 109800 }, { "epoch": 30.88, "learning_rate": 4.252022615812327e-05, "loss": 0.079, "step": 109830 }, { "epoch": 30.89, "learning_rate": 4.2501483772217535e-05, "loss": 0.0754, "step": 109860 }, { "epoch": 30.89, "learning_rate": 4.2482741386311816e-05, "loss": 0.066, "step": 109890 }, { "epoch": 30.9, "learning_rate": 4.2463999000406084e-05, "loss": 0.0786, "step": 109920 }, { "epoch": 30.91, "learning_rate": 4.2445256614500365e-05, "loss": 0.0684, "step": 109950 }, { "epoch": 30.92, "learning_rate": 4.242651422859464e-05, "loss": 0.076, "step": 109980 }, { "epoch": 30.93, "learning_rate": 4.2407771842688906e-05, "loss": 0.0846, "step": 110010 }, { "epoch": 30.94, "learning_rate": 4.238902945678319e-05, "loss": 0.0667, "step": 110040 }, { "epoch": 30.94, "learning_rate": 4.2370287070877455e-05, "loss": 0.0792, "step": 110070 }, { "epoch": 30.95, "learning_rate": 4.2351544684971736e-05, "loss": 0.0701, "step": 110100 }, { "epoch": 30.96, "learning_rate": 4.2332802299066e-05, "loss": 0.076, "step": 110130 }, { "epoch": 30.97, "learning_rate": 4.2314059913160284e-05, "loss": 0.0851, "step": 110160 }, { "epoch": 30.98, "learning_rate": 4.229531752725455e-05, "loss": 0.069, "step": 110190 }, { "epoch": 30.99, "learning_rate": 4.2276575141348826e-05, "loss": 0.0819, "step": 110220 }, { "epoch": 31.0, "learning_rate": 4.225783275544311e-05, "loss": 0.0753, "step": 110250 }, { "epoch": 31.0, "eval_loss": 0.17743565142154694, "eval_runtime": 503.5026, "eval_samples_per_second": 31.843, "eval_steps_per_second": 0.997, "eval_wer": 0.13531587351411845, "step": 110267 }, { "epoch": 31.0, "learning_rate": 4.2239090369537374e-05, "loss": 0.0764, "step": 110280 }, { "epoch": 31.01, "learning_rate": 4.2220347983631655e-05, "loss": 0.0728, "step": 110310 }, { "epoch": 31.02, "learning_rate": 4.220160559772592e-05, "loss": 0.0717, "step": 110340 }, { "epoch": 31.03, "learning_rate": 4.2182863211820203e-05, "loss": 0.0774, "step": 110370 }, { "epoch": 31.04, "learning_rate": 4.216412082591447e-05, "loss": 0.0677, "step": 110400 }, { "epoch": 31.05, "learning_rate": 4.2145378440008745e-05, "loss": 0.0734, "step": 110430 }, { "epoch": 31.05, "learning_rate": 4.2126636054103026e-05, "loss": 0.0719, "step": 110460 }, { "epoch": 31.06, "learning_rate": 4.2107893668197293e-05, "loss": 0.0743, "step": 110490 }, { "epoch": 31.07, "learning_rate": 4.2089151282291574e-05, "loss": 0.0812, "step": 110520 }, { "epoch": 31.08, "learning_rate": 4.207040889638584e-05, "loss": 0.0674, "step": 110550 }, { "epoch": 31.09, "learning_rate": 4.205166651048012e-05, "loss": 0.0747, "step": 110580 }, { "epoch": 31.1, "learning_rate": 4.203292412457439e-05, "loss": 0.0694, "step": 110610 }, { "epoch": 31.1, "learning_rate": 4.2014181738668664e-05, "loss": 0.0727, "step": 110640 }, { "epoch": 31.11, "learning_rate": 4.1995439352762945e-05, "loss": 0.0805, "step": 110670 }, { "epoch": 31.12, "learning_rate": 4.197669696685721e-05, "loss": 0.0661, "step": 110700 }, { "epoch": 31.13, "learning_rate": 4.1957954580951494e-05, "loss": 0.0732, "step": 110730 }, { "epoch": 31.14, "learning_rate": 4.193921219504576e-05, "loss": 0.0737, "step": 110760 }, { "epoch": 31.15, "learning_rate": 4.192046980914004e-05, "loss": 0.0691, "step": 110790 }, { "epoch": 31.16, "learning_rate": 4.190172742323431e-05, "loss": 0.0802, "step": 110820 }, { "epoch": 31.16, "learning_rate": 4.1882985037328584e-05, "loss": 0.0687, "step": 110850 }, { "epoch": 31.17, "learning_rate": 4.1864242651422865e-05, "loss": 0.0741, "step": 110880 }, { "epoch": 31.18, "learning_rate": 4.184550026551713e-05, "loss": 0.0684, "step": 110910 }, { "epoch": 31.19, "learning_rate": 4.182675787961141e-05, "loss": 0.0706, "step": 110940 }, { "epoch": 31.2, "learning_rate": 4.180801549370568e-05, "loss": 0.0806, "step": 110970 }, { "epoch": 31.21, "learning_rate": 4.178927310779996e-05, "loss": 0.067, "step": 111000 }, { "epoch": 31.21, "learning_rate": 4.177053072189423e-05, "loss": 0.0762, "step": 111030 }, { "epoch": 31.22, "learning_rate": 4.175178833598851e-05, "loss": 0.0692, "step": 111060 }, { "epoch": 31.23, "learning_rate": 4.1733045950082784e-05, "loss": 0.0731, "step": 111090 }, { "epoch": 31.24, "learning_rate": 4.171430356417705e-05, "loss": 0.0766, "step": 111120 }, { "epoch": 31.25, "learning_rate": 4.169556117827133e-05, "loss": 0.0659, "step": 111150 }, { "epoch": 31.26, "learning_rate": 4.16768187923656e-05, "loss": 0.0748, "step": 111180 }, { "epoch": 31.27, "learning_rate": 4.165807640645988e-05, "loss": 0.0704, "step": 111210 }, { "epoch": 31.27, "learning_rate": 4.163933402055415e-05, "loss": 0.0729, "step": 111240 }, { "epoch": 31.28, "learning_rate": 4.162059163464843e-05, "loss": 0.0836, "step": 111270 }, { "epoch": 31.29, "learning_rate": 4.16018492487427e-05, "loss": 0.0654, "step": 111300 }, { "epoch": 31.3, "learning_rate": 4.158310686283697e-05, "loss": 0.0783, "step": 111330 }, { "epoch": 31.31, "learning_rate": 4.156436447693125e-05, "loss": 0.0718, "step": 111360 }, { "epoch": 31.32, "learning_rate": 4.154562209102552e-05, "loss": 0.0779, "step": 111390 }, { "epoch": 31.32, "learning_rate": 4.15268797051198e-05, "loss": 0.0802, "step": 111420 }, { "epoch": 31.33, "learning_rate": 4.150813731921407e-05, "loss": 0.0666, "step": 111450 }, { "epoch": 31.34, "learning_rate": 4.148939493330835e-05, "loss": 0.0749, "step": 111480 }, { "epoch": 31.35, "learning_rate": 4.147065254740262e-05, "loss": 0.0723, "step": 111510 }, { "epoch": 31.36, "learning_rate": 4.145191016149689e-05, "loss": 0.0714, "step": 111540 }, { "epoch": 31.37, "learning_rate": 4.143316777559117e-05, "loss": 0.0817, "step": 111570 }, { "epoch": 31.37, "learning_rate": 4.141442538968544e-05, "loss": 0.06, "step": 111600 }, { "epoch": 31.38, "learning_rate": 4.139568300377972e-05, "loss": 0.076, "step": 111630 }, { "epoch": 31.39, "learning_rate": 4.137694061787399e-05, "loss": 0.0739, "step": 111660 }, { "epoch": 31.4, "learning_rate": 4.135819823196827e-05, "loss": 0.0708, "step": 111690 }, { "epoch": 31.41, "learning_rate": 4.133945584606254e-05, "loss": 0.0807, "step": 111720 }, { "epoch": 31.42, "learning_rate": 4.132071346015681e-05, "loss": 0.065, "step": 111750 }, { "epoch": 31.43, "learning_rate": 4.130197107425109e-05, "loss": 0.0744, "step": 111780 }, { "epoch": 31.43, "learning_rate": 4.128322868834536e-05, "loss": 0.0714, "step": 111810 }, { "epoch": 31.44, "learning_rate": 4.126448630243964e-05, "loss": 0.0724, "step": 111840 }, { "epoch": 31.45, "learning_rate": 4.1245743916533906e-05, "loss": 0.0763, "step": 111870 }, { "epoch": 31.46, "learning_rate": 4.122700153062819e-05, "loss": 0.0647, "step": 111900 }, { "epoch": 31.47, "learning_rate": 4.120825914472246e-05, "loss": 0.0724, "step": 111930 }, { "epoch": 31.48, "learning_rate": 4.118951675881673e-05, "loss": 0.0729, "step": 111960 }, { "epoch": 31.48, "learning_rate": 4.117077437291101e-05, "loss": 0.0748, "step": 111990 }, { "epoch": 31.49, "learning_rate": 4.115203198700528e-05, "loss": 0.0776, "step": 112020 }, { "epoch": 31.5, "learning_rate": 4.113328960109956e-05, "loss": 0.0696, "step": 112050 }, { "epoch": 31.51, "learning_rate": 4.1114547215193826e-05, "loss": 0.0803, "step": 112080 }, { "epoch": 31.52, "learning_rate": 4.1095804829288106e-05, "loss": 0.0692, "step": 112110 }, { "epoch": 31.53, "learning_rate": 4.107706244338238e-05, "loss": 0.0719, "step": 112140 }, { "epoch": 31.53, "learning_rate": 4.105832005747665e-05, "loss": 0.0827, "step": 112170 }, { "epoch": 31.54, "learning_rate": 4.103957767157093e-05, "loss": 0.0664, "step": 112200 }, { "epoch": 31.55, "learning_rate": 4.1020835285665196e-05, "loss": 0.0749, "step": 112230 }, { "epoch": 31.56, "learning_rate": 4.100209289975948e-05, "loss": 0.0766, "step": 112260 }, { "epoch": 31.57, "learning_rate": 4.0983350513853745e-05, "loss": 0.0713, "step": 112290 }, { "epoch": 31.58, "learning_rate": 4.0964608127948026e-05, "loss": 0.0797, "step": 112320 }, { "epoch": 31.59, "learning_rate": 4.09458657420423e-05, "loss": 0.0632, "step": 112350 }, { "epoch": 31.59, "learning_rate": 4.092712335613657e-05, "loss": 0.0828, "step": 112380 }, { "epoch": 31.6, "learning_rate": 4.090838097023085e-05, "loss": 0.0671, "step": 112410 }, { "epoch": 31.61, "learning_rate": 4.0889638584325116e-05, "loss": 0.0722, "step": 112440 }, { "epoch": 31.62, "learning_rate": 4.08708961984194e-05, "loss": 0.0797, "step": 112470 }, { "epoch": 31.63, "learning_rate": 4.0852153812513664e-05, "loss": 0.0683, "step": 112500 }, { "epoch": 31.64, "learning_rate": 4.0833411426607945e-05, "loss": 0.0732, "step": 112530 }, { "epoch": 31.64, "learning_rate": 4.081466904070222e-05, "loss": 0.0758, "step": 112560 }, { "epoch": 31.65, "learning_rate": 4.0795926654796494e-05, "loss": 0.0727, "step": 112590 }, { "epoch": 31.66, "learning_rate": 4.077718426889077e-05, "loss": 0.0804, "step": 112620 }, { "epoch": 31.67, "learning_rate": 4.0758441882985035e-05, "loss": 0.0671, "step": 112650 }, { "epoch": 31.68, "learning_rate": 4.0739699497079316e-05, "loss": 0.078, "step": 112680 }, { "epoch": 31.69, "learning_rate": 4.0720957111173584e-05, "loss": 0.0729, "step": 112710 }, { "epoch": 31.7, "learning_rate": 4.0702214725267864e-05, "loss": 0.0754, "step": 112740 }, { "epoch": 31.7, "learning_rate": 4.068347233936214e-05, "loss": 0.0798, "step": 112770 }, { "epoch": 31.71, "learning_rate": 4.066472995345641e-05, "loss": 0.0683, "step": 112800 }, { "epoch": 31.72, "learning_rate": 4.064598756755069e-05, "loss": 0.0776, "step": 112830 }, { "epoch": 31.73, "learning_rate": 4.0627245181644954e-05, "loss": 0.0702, "step": 112860 }, { "epoch": 31.74, "learning_rate": 4.0608502795739235e-05, "loss": 0.0764, "step": 112890 }, { "epoch": 31.75, "learning_rate": 4.05897604098335e-05, "loss": 0.0824, "step": 112920 }, { "epoch": 31.75, "learning_rate": 4.0571018023927784e-05, "loss": 0.0669, "step": 112950 }, { "epoch": 31.76, "learning_rate": 4.055227563802206e-05, "loss": 0.0786, "step": 112980 }, { "epoch": 31.77, "learning_rate": 4.053353325211633e-05, "loss": 0.0693, "step": 113010 }, { "epoch": 31.78, "learning_rate": 4.0514790866210606e-05, "loss": 0.0786, "step": 113040 }, { "epoch": 31.79, "learning_rate": 4.0496048480304874e-05, "loss": 0.0769, "step": 113070 }, { "epoch": 31.8, "learning_rate": 4.0477306094399155e-05, "loss": 0.0667, "step": 113100 }, { "epoch": 31.8, "learning_rate": 4.045856370849342e-05, "loss": 0.0788, "step": 113130 }, { "epoch": 31.81, "learning_rate": 4.04398213225877e-05, "loss": 0.0712, "step": 113160 }, { "epoch": 31.82, "learning_rate": 4.042107893668198e-05, "loss": 0.0721, "step": 113190 }, { "epoch": 31.83, "learning_rate": 4.040233655077625e-05, "loss": 0.0794, "step": 113220 }, { "epoch": 31.84, "learning_rate": 4.0383594164870526e-05, "loss": 0.0639, "step": 113250 }, { "epoch": 31.85, "learning_rate": 4.036485177896479e-05, "loss": 0.081, "step": 113280 }, { "epoch": 31.86, "learning_rate": 4.0346109393059074e-05, "loss": 0.0683, "step": 113310 }, { "epoch": 31.86, "learning_rate": 4.032736700715334e-05, "loss": 0.0754, "step": 113340 }, { "epoch": 31.87, "learning_rate": 4.030862462124762e-05, "loss": 0.0803, "step": 113370 }, { "epoch": 31.88, "learning_rate": 4.02898822353419e-05, "loss": 0.0671, "step": 113400 }, { "epoch": 31.89, "learning_rate": 4.027113984943617e-05, "loss": 0.0778, "step": 113430 }, { "epoch": 31.9, "learning_rate": 4.0252397463530445e-05, "loss": 0.071, "step": 113460 }, { "epoch": 31.91, "learning_rate": 4.023365507762471e-05, "loss": 0.0723, "step": 113490 }, { "epoch": 31.91, "learning_rate": 4.0214912691718993e-05, "loss": 0.0788, "step": 113520 }, { "epoch": 31.92, "learning_rate": 4.019617030581326e-05, "loss": 0.0643, "step": 113550 }, { "epoch": 31.93, "learning_rate": 4.017742791990754e-05, "loss": 0.0819, "step": 113580 }, { "epoch": 31.94, "learning_rate": 4.0158685534001816e-05, "loss": 0.0708, "step": 113610 }, { "epoch": 31.95, "learning_rate": 4.013994314809609e-05, "loss": 0.0754, "step": 113640 }, { "epoch": 31.96, "learning_rate": 4.0121200762190364e-05, "loss": 0.0797, "step": 113670 }, { "epoch": 31.97, "learning_rate": 4.010245837628463e-05, "loss": 0.0661, "step": 113700 }, { "epoch": 31.97, "learning_rate": 4.008434073657577e-05, "loss": 0.0755, "step": 113730 }, { "epoch": 31.98, "learning_rate": 4.006559835067004e-05, "loss": 0.0708, "step": 113760 }, { "epoch": 31.99, "learning_rate": 4.004685596476432e-05, "loss": 0.07, "step": 113790 }, { "epoch": 32.0, "learning_rate": 4.002873832505545e-05, "loss": 0.08, "step": 113820 }, { "epoch": 32.0, "eval_loss": 0.17339888215065002, "eval_runtime": 504.4941, "eval_samples_per_second": 31.78, "eval_steps_per_second": 0.995, "eval_wer": 0.1343946610620556, "step": 113824 }, { "epoch": 32.01, "learning_rate": 4.000999593914972e-05, "loss": 0.0651, "step": 113850 }, { "epoch": 32.02, "learning_rate": 3.9991253553244e-05, "loss": 0.0778, "step": 113880 }, { "epoch": 32.02, "learning_rate": 3.997251116733827e-05, "loss": 0.0642, "step": 113910 }, { "epoch": 32.03, "learning_rate": 3.9953768781432545e-05, "loss": 0.0787, "step": 113940 }, { "epoch": 32.04, "learning_rate": 3.993502639552682e-05, "loss": 0.0719, "step": 113970 }, { "epoch": 32.05, "learning_rate": 3.9916284009621094e-05, "loss": 0.0725, "step": 114000 }, { "epoch": 32.06, "learning_rate": 3.989754162371537e-05, "loss": 0.0718, "step": 114030 }, { "epoch": 32.07, "learning_rate": 3.987879923780964e-05, "loss": 0.0685, "step": 114060 }, { "epoch": 32.07, "learning_rate": 3.9860056851903916e-05, "loss": 0.0722, "step": 114090 }, { "epoch": 32.08, "learning_rate": 3.984131446599819e-05, "loss": 0.0678, "step": 114120 }, { "epoch": 32.09, "learning_rate": 3.9822572080092465e-05, "loss": 0.0681, "step": 114150 }, { "epoch": 32.1, "learning_rate": 3.980382969418674e-05, "loss": 0.0781, "step": 114180 }, { "epoch": 32.11, "learning_rate": 3.978508730828101e-05, "loss": 0.0688, "step": 114210 }, { "epoch": 32.12, "learning_rate": 3.976634492237529e-05, "loss": 0.0761, "step": 114240 }, { "epoch": 32.13, "learning_rate": 3.974760253646956e-05, "loss": 0.07, "step": 114270 }, { "epoch": 32.13, "learning_rate": 3.9728860150563836e-05, "loss": 0.0743, "step": 114300 }, { "epoch": 32.14, "learning_rate": 3.971011776465811e-05, "loss": 0.0765, "step": 114330 }, { "epoch": 32.15, "learning_rate": 3.9691375378752384e-05, "loss": 0.062, "step": 114360 }, { "epoch": 32.16, "learning_rate": 3.967263299284666e-05, "loss": 0.0747, "step": 114390 }, { "epoch": 32.17, "learning_rate": 3.965389060694093e-05, "loss": 0.0753, "step": 114420 }, { "epoch": 32.18, "learning_rate": 3.963514822103521e-05, "loss": 0.0737, "step": 114450 }, { "epoch": 32.18, "learning_rate": 3.961640583512948e-05, "loss": 0.0771, "step": 114480 }, { "epoch": 32.19, "learning_rate": 3.9597663449223755e-05, "loss": 0.0675, "step": 114510 }, { "epoch": 32.2, "learning_rate": 3.957892106331803e-05, "loss": 0.0757, "step": 114540 }, { "epoch": 32.21, "learning_rate": 3.95601786774123e-05, "loss": 0.0698, "step": 114570 }, { "epoch": 32.22, "learning_rate": 3.954143629150658e-05, "loss": 0.0689, "step": 114600 }, { "epoch": 32.23, "learning_rate": 3.952269390560085e-05, "loss": 0.0773, "step": 114630 }, { "epoch": 32.23, "learning_rate": 3.9503951519695126e-05, "loss": 0.0695, "step": 114660 }, { "epoch": 32.24, "learning_rate": 3.94852091337894e-05, "loss": 0.0754, "step": 114690 }, { "epoch": 32.25, "learning_rate": 3.9466466747883674e-05, "loss": 0.0689, "step": 114720 }, { "epoch": 32.26, "learning_rate": 3.944772436197795e-05, "loss": 0.0677, "step": 114750 }, { "epoch": 32.27, "learning_rate": 3.942898197607222e-05, "loss": 0.0772, "step": 114780 }, { "epoch": 32.28, "learning_rate": 3.94102395901665e-05, "loss": 0.0616, "step": 114810 }, { "epoch": 32.29, "learning_rate": 3.939149720426077e-05, "loss": 0.068, "step": 114840 }, { "epoch": 32.29, "learning_rate": 3.9372754818355045e-05, "loss": 0.0726, "step": 114870 }, { "epoch": 32.3, "learning_rate": 3.935401243244932e-05, "loss": 0.0765, "step": 114900 }, { "epoch": 32.31, "learning_rate": 3.9335270046543594e-05, "loss": 0.076, "step": 114930 }, { "epoch": 32.32, "learning_rate": 3.931652766063787e-05, "loss": 0.0674, "step": 114960 }, { "epoch": 32.33, "learning_rate": 3.929778527473214e-05, "loss": 0.0703, "step": 114990 }, { "epoch": 32.34, "learning_rate": 3.9279042888826416e-05, "loss": 0.0698, "step": 115020 }, { "epoch": 32.34, "learning_rate": 3.926030050292069e-05, "loss": 0.0699, "step": 115050 }, { "epoch": 32.35, "learning_rate": 3.9241558117014965e-05, "loss": 0.0794, "step": 115080 }, { "epoch": 32.36, "learning_rate": 3.922281573110924e-05, "loss": 0.0702, "step": 115110 }, { "epoch": 32.37, "learning_rate": 3.920407334520351e-05, "loss": 0.0742, "step": 115140 }, { "epoch": 32.38, "learning_rate": 3.918533095929779e-05, "loss": 0.0728, "step": 115170 }, { "epoch": 32.39, "learning_rate": 3.916658857339206e-05, "loss": 0.0682, "step": 115200 }, { "epoch": 32.4, "learning_rate": 3.9147846187486336e-05, "loss": 0.0743, "step": 115230 }, { "epoch": 32.4, "learning_rate": 3.912910380158061e-05, "loss": 0.0833, "step": 115260 }, { "epoch": 32.41, "learning_rate": 3.9110361415674884e-05, "loss": 0.0739, "step": 115290 }, { "epoch": 32.42, "learning_rate": 3.909161902976916e-05, "loss": 0.0723, "step": 115320 }, { "epoch": 32.43, "learning_rate": 3.907287664386343e-05, "loss": 0.0676, "step": 115350 }, { "epoch": 32.44, "learning_rate": 3.9054134257957707e-05, "loss": 0.0776, "step": 115380 }, { "epoch": 32.45, "learning_rate": 3.903539187205198e-05, "loss": 0.0676, "step": 115410 }, { "epoch": 32.45, "learning_rate": 3.9016649486146255e-05, "loss": 0.0735, "step": 115440 }, { "epoch": 32.46, "learning_rate": 3.899790710024053e-05, "loss": 0.0732, "step": 115470 }, { "epoch": 32.47, "learning_rate": 3.89791647143348e-05, "loss": 0.0712, "step": 115500 }, { "epoch": 32.48, "learning_rate": 3.896042232842908e-05, "loss": 0.0762, "step": 115530 }, { "epoch": 32.49, "learning_rate": 3.894167994252335e-05, "loss": 0.0624, "step": 115560 }, { "epoch": 32.5, "learning_rate": 3.8922937556617626e-05, "loss": 0.0805, "step": 115590 }, { "epoch": 32.5, "learning_rate": 3.89041951707119e-05, "loss": 0.0696, "step": 115620 }, { "epoch": 32.51, "learning_rate": 3.8885452784806174e-05, "loss": 0.0691, "step": 115650 }, { "epoch": 32.52, "learning_rate": 3.886671039890045e-05, "loss": 0.0795, "step": 115680 }, { "epoch": 32.53, "learning_rate": 3.884796801299472e-05, "loss": 0.0689, "step": 115710 }, { "epoch": 32.54, "learning_rate": 3.8829225627089e-05, "loss": 0.0736, "step": 115740 }, { "epoch": 32.55, "learning_rate": 3.881048324118327e-05, "loss": 0.0689, "step": 115770 }, { "epoch": 32.56, "learning_rate": 3.8791740855277545e-05, "loss": 0.0721, "step": 115800 }, { "epoch": 32.56, "learning_rate": 3.877299846937182e-05, "loss": 0.0763, "step": 115830 }, { "epoch": 32.57, "learning_rate": 3.8754256083466094e-05, "loss": 0.0676, "step": 115860 }, { "epoch": 32.58, "learning_rate": 3.873551369756037e-05, "loss": 0.0779, "step": 115890 }, { "epoch": 32.59, "learning_rate": 3.871677131165464e-05, "loss": 0.0727, "step": 115920 }, { "epoch": 32.6, "learning_rate": 3.8698028925748916e-05, "loss": 0.0716, "step": 115950 }, { "epoch": 32.61, "learning_rate": 3.867928653984319e-05, "loss": 0.0728, "step": 115980 }, { "epoch": 32.61, "learning_rate": 3.8660544153937465e-05, "loss": 0.0667, "step": 116010 }, { "epoch": 32.62, "learning_rate": 3.864180176803174e-05, "loss": 0.0741, "step": 116040 }, { "epoch": 32.63, "learning_rate": 3.862305938212601e-05, "loss": 0.073, "step": 116070 }, { "epoch": 32.64, "learning_rate": 3.860431699622029e-05, "loss": 0.07, "step": 116100 }, { "epoch": 32.65, "learning_rate": 3.858557461031456e-05, "loss": 0.0731, "step": 116130 }, { "epoch": 32.66, "learning_rate": 3.8566832224408835e-05, "loss": 0.0615, "step": 116160 }, { "epoch": 32.67, "learning_rate": 3.854808983850311e-05, "loss": 0.0712, "step": 116190 }, { "epoch": 32.67, "learning_rate": 3.8529347452597384e-05, "loss": 0.0686, "step": 116220 }, { "epoch": 32.68, "learning_rate": 3.851060506669166e-05, "loss": 0.0717, "step": 116250 }, { "epoch": 32.69, "learning_rate": 3.849186268078593e-05, "loss": 0.0768, "step": 116280 }, { "epoch": 32.7, "learning_rate": 3.8473120294880206e-05, "loss": 0.069, "step": 116310 }, { "epoch": 32.71, "learning_rate": 3.845437790897448e-05, "loss": 0.0742, "step": 116340 }, { "epoch": 32.72, "learning_rate": 3.8435635523068755e-05, "loss": 0.0685, "step": 116370 }, { "epoch": 32.72, "learning_rate": 3.841689313716303e-05, "loss": 0.066, "step": 116400 }, { "epoch": 32.73, "learning_rate": 3.83981507512573e-05, "loss": 0.0743, "step": 116430 }, { "epoch": 32.74, "learning_rate": 3.837940836535158e-05, "loss": 0.0687, "step": 116460 }, { "epoch": 32.75, "learning_rate": 3.836066597944585e-05, "loss": 0.0778, "step": 116490 }, { "epoch": 32.76, "learning_rate": 3.8341923593540126e-05, "loss": 0.0695, "step": 116520 }, { "epoch": 32.77, "learning_rate": 3.83231812076344e-05, "loss": 0.071, "step": 116550 }, { "epoch": 32.77, "learning_rate": 3.8304438821728674e-05, "loss": 0.0755, "step": 116580 }, { "epoch": 32.78, "learning_rate": 3.828569643582295e-05, "loss": 0.0654, "step": 116610 }, { "epoch": 32.79, "learning_rate": 3.826695404991722e-05, "loss": 0.0739, "step": 116640 }, { "epoch": 32.8, "learning_rate": 3.82482116640115e-05, "loss": 0.0711, "step": 116670 }, { "epoch": 32.81, "learning_rate": 3.822946927810577e-05, "loss": 0.0727, "step": 116700 }, { "epoch": 32.82, "learning_rate": 3.8210726892200045e-05, "loss": 0.0772, "step": 116730 }, { "epoch": 32.83, "learning_rate": 3.819198450629432e-05, "loss": 0.0666, "step": 116760 }, { "epoch": 32.83, "learning_rate": 3.8173242120388593e-05, "loss": 0.0703, "step": 116790 }, { "epoch": 32.84, "learning_rate": 3.815449973448287e-05, "loss": 0.0709, "step": 116820 }, { "epoch": 32.85, "learning_rate": 3.813575734857714e-05, "loss": 0.0669, "step": 116850 }, { "epoch": 32.86, "learning_rate": 3.8117014962671416e-05, "loss": 0.0814, "step": 116880 }, { "epoch": 32.87, "learning_rate": 3.809827257676569e-05, "loss": 0.0667, "step": 116910 }, { "epoch": 32.88, "learning_rate": 3.8079530190859964e-05, "loss": 0.0762, "step": 116940 }, { "epoch": 32.88, "learning_rate": 3.806078780495424e-05, "loss": 0.0712, "step": 116970 }, { "epoch": 32.89, "learning_rate": 3.804204541904851e-05, "loss": 0.0705, "step": 117000 }, { "epoch": 32.9, "learning_rate": 3.802330303314279e-05, "loss": 0.0774, "step": 117030 }, { "epoch": 32.91, "learning_rate": 3.800456064723706e-05, "loss": 0.0662, "step": 117060 }, { "epoch": 32.92, "learning_rate": 3.7985818261331335e-05, "loss": 0.0753, "step": 117090 }, { "epoch": 32.93, "learning_rate": 3.796707587542561e-05, "loss": 0.0716, "step": 117120 }, { "epoch": 32.93, "learning_rate": 3.7948333489519884e-05, "loss": 0.0707, "step": 117150 }, { "epoch": 32.94, "learning_rate": 3.792959110361416e-05, "loss": 0.0788, "step": 117180 }, { "epoch": 32.95, "learning_rate": 3.791084871770843e-05, "loss": 0.0658, "step": 117210 }, { "epoch": 32.96, "learning_rate": 3.7892106331802706e-05, "loss": 0.0779, "step": 117240 }, { "epoch": 32.97, "learning_rate": 3.787336394589698e-05, "loss": 0.0709, "step": 117270 }, { "epoch": 32.98, "learning_rate": 3.7854621559991255e-05, "loss": 0.0752, "step": 117300 }, { "epoch": 32.99, "learning_rate": 3.783587917408553e-05, "loss": 0.083, "step": 117330 }, { "epoch": 32.99, "learning_rate": 3.78171367881798e-05, "loss": 0.0644, "step": 117360 }, { "epoch": 33.0, "eval_loss": 0.1736820936203003, "eval_runtime": 505.177, "eval_samples_per_second": 31.737, "eval_steps_per_second": 0.994, "eval_wer": 0.13342568203840433, "step": 117381 }, { "epoch": 33.0, "learning_rate": 3.779839440227408e-05, "loss": 0.0821, "step": 117390 }, { "epoch": 33.01, "learning_rate": 3.777965201636835e-05, "loss": 0.0647, "step": 117420 }, { "epoch": 33.02, "learning_rate": 3.7760909630462626e-05, "loss": 0.072, "step": 117450 }, { "epoch": 33.03, "learning_rate": 3.77421672445569e-05, "loss": 0.07, "step": 117480 }, { "epoch": 33.04, "learning_rate": 3.7723424858651174e-05, "loss": 0.0648, "step": 117510 }, { "epoch": 33.04, "learning_rate": 3.770468247274545e-05, "loss": 0.0759, "step": 117540 }, { "epoch": 33.05, "learning_rate": 3.768594008683972e-05, "loss": 0.0648, "step": 117570 }, { "epoch": 33.06, "learning_rate": 3.7667197700934e-05, "loss": 0.0713, "step": 117600 }, { "epoch": 33.07, "learning_rate": 3.764845531502827e-05, "loss": 0.0697, "step": 117630 }, { "epoch": 33.08, "learning_rate": 3.7629712929122545e-05, "loss": 0.0647, "step": 117660 }, { "epoch": 33.09, "learning_rate": 3.761097054321682e-05, "loss": 0.0765, "step": 117690 }, { "epoch": 33.1, "learning_rate": 3.7592228157311093e-05, "loss": 0.0637, "step": 117720 }, { "epoch": 33.1, "learning_rate": 3.757348577140537e-05, "loss": 0.0722, "step": 117750 }, { "epoch": 33.11, "learning_rate": 3.755474338549964e-05, "loss": 0.0717, "step": 117780 }, { "epoch": 33.12, "learning_rate": 3.7536000999593916e-05, "loss": 0.0668, "step": 117810 }, { "epoch": 33.13, "learning_rate": 3.751725861368819e-05, "loss": 0.0749, "step": 117840 }, { "epoch": 33.14, "learning_rate": 3.7498516227782464e-05, "loss": 0.0646, "step": 117870 }, { "epoch": 33.15, "learning_rate": 3.747977384187674e-05, "loss": 0.0745, "step": 117900 }, { "epoch": 33.15, "learning_rate": 3.746103145597101e-05, "loss": 0.0757, "step": 117930 }, { "epoch": 33.16, "learning_rate": 3.744228907006529e-05, "loss": 0.0638, "step": 117960 }, { "epoch": 33.17, "learning_rate": 3.742354668415956e-05, "loss": 0.0761, "step": 117990 }, { "epoch": 33.18, "learning_rate": 3.7404804298253835e-05, "loss": 0.0671, "step": 118020 }, { "epoch": 33.19, "learning_rate": 3.738606191234811e-05, "loss": 0.0693, "step": 118050 }, { "epoch": 33.2, "learning_rate": 3.7367319526442384e-05, "loss": 0.0707, "step": 118080 }, { "epoch": 33.2, "learning_rate": 3.734920188673352e-05, "loss": 0.0654, "step": 118110 }, { "epoch": 33.21, "learning_rate": 3.733108424702465e-05, "loss": 0.0924, "step": 118140 }, { "epoch": 33.22, "learning_rate": 3.731234186111892e-05, "loss": 0.0655, "step": 118170 }, { "epoch": 33.23, "learning_rate": 3.72935994752132e-05, "loss": 0.0746, "step": 118200 }, { "epoch": 33.24, "learning_rate": 3.727485708930747e-05, "loss": 0.0739, "step": 118230 }, { "epoch": 33.25, "learning_rate": 3.725611470340175e-05, "loss": 0.0618, "step": 118260 }, { "epoch": 33.26, "learning_rate": 3.7237372317496016e-05, "loss": 0.0719, "step": 118290 }, { "epoch": 33.26, "learning_rate": 3.721862993159029e-05, "loss": 0.0637, "step": 118320 }, { "epoch": 33.27, "learning_rate": 3.719988754568457e-05, "loss": 0.0712, "step": 118350 }, { "epoch": 33.28, "learning_rate": 3.718114515977884e-05, "loss": 0.0729, "step": 118380 }, { "epoch": 33.29, "learning_rate": 3.716240277387312e-05, "loss": 0.0642, "step": 118410 }, { "epoch": 33.3, "learning_rate": 3.714366038796739e-05, "loss": 0.0766, "step": 118440 }, { "epoch": 33.31, "learning_rate": 3.712491800206167e-05, "loss": 0.0649, "step": 118470 }, { "epoch": 33.31, "learning_rate": 3.7106175616155936e-05, "loss": 0.0727, "step": 118500 }, { "epoch": 33.32, "learning_rate": 3.708743323025021e-05, "loss": 0.0738, "step": 118530 }, { "epoch": 33.33, "learning_rate": 3.706869084434449e-05, "loss": 0.0699, "step": 118560 }, { "epoch": 33.34, "learning_rate": 3.704994845843876e-05, "loss": 0.0803, "step": 118590 }, { "epoch": 33.35, "learning_rate": 3.703120607253304e-05, "loss": 0.0693, "step": 118620 }, { "epoch": 33.36, "learning_rate": 3.7012463686627307e-05, "loss": 0.0686, "step": 118650 }, { "epoch": 33.37, "learning_rate": 3.699372130072159e-05, "loss": 0.072, "step": 118680 }, { "epoch": 33.37, "learning_rate": 3.6974978914815855e-05, "loss": 0.0638, "step": 118710 }, { "epoch": 33.38, "learning_rate": 3.695623652891013e-05, "loss": 0.0771, "step": 118740 }, { "epoch": 33.39, "learning_rate": 3.693749414300441e-05, "loss": 0.0655, "step": 118770 }, { "epoch": 33.4, "learning_rate": 3.691875175709868e-05, "loss": 0.0731, "step": 118800 }, { "epoch": 33.41, "learning_rate": 3.690000937119296e-05, "loss": 0.0711, "step": 118830 }, { "epoch": 33.42, "learning_rate": 3.6881266985287226e-05, "loss": 0.0667, "step": 118860 }, { "epoch": 33.42, "learning_rate": 3.686252459938151e-05, "loss": 0.0784, "step": 118890 }, { "epoch": 33.43, "learning_rate": 3.6843782213475774e-05, "loss": 0.07, "step": 118920 }, { "epoch": 33.44, "learning_rate": 3.682503982757005e-05, "loss": 0.0707, "step": 118950 }, { "epoch": 33.45, "learning_rate": 3.680629744166433e-05, "loss": 0.0738, "step": 118980 }, { "epoch": 33.46, "learning_rate": 3.67875550557586e-05, "loss": 0.0649, "step": 119010 }, { "epoch": 33.47, "learning_rate": 3.676881266985288e-05, "loss": 0.0812, "step": 119040 }, { "epoch": 33.47, "learning_rate": 3.6750070283947145e-05, "loss": 0.0659, "step": 119070 }, { "epoch": 33.48, "learning_rate": 3.6731327898041426e-05, "loss": 0.0679, "step": 119100 }, { "epoch": 33.49, "learning_rate": 3.6712585512135694e-05, "loss": 0.0721, "step": 119130 }, { "epoch": 33.5, "learning_rate": 3.669384312622997e-05, "loss": 0.0634, "step": 119160 }, { "epoch": 33.51, "learning_rate": 3.667510074032425e-05, "loss": 0.0753, "step": 119190 }, { "epoch": 33.52, "learning_rate": 3.6656358354418516e-05, "loss": 0.0668, "step": 119220 }, { "epoch": 33.53, "learning_rate": 3.66376159685128e-05, "loss": 0.0718, "step": 119250 }, { "epoch": 33.53, "learning_rate": 3.6618873582607065e-05, "loss": 0.0759, "step": 119280 }, { "epoch": 33.54, "learning_rate": 3.6600131196701346e-05, "loss": 0.0681, "step": 119310 }, { "epoch": 33.55, "learning_rate": 3.658138881079561e-05, "loss": 0.0753, "step": 119340 }, { "epoch": 33.56, "learning_rate": 3.656264642488989e-05, "loss": 0.0653, "step": 119370 }, { "epoch": 33.57, "learning_rate": 3.654390403898417e-05, "loss": 0.0715, "step": 119400 }, { "epoch": 33.58, "learning_rate": 3.6525161653078436e-05, "loss": 0.0702, "step": 119430 }, { "epoch": 33.58, "learning_rate": 3.6506419267172716e-05, "loss": 0.0669, "step": 119460 }, { "epoch": 33.59, "learning_rate": 3.6487676881266984e-05, "loss": 0.0732, "step": 119490 }, { "epoch": 33.6, "learning_rate": 3.6468934495361265e-05, "loss": 0.0674, "step": 119520 }, { "epoch": 33.61, "learning_rate": 3.645019210945553e-05, "loss": 0.0692, "step": 119550 }, { "epoch": 33.62, "learning_rate": 3.6431449723549806e-05, "loss": 0.0688, "step": 119580 }, { "epoch": 33.63, "learning_rate": 3.641270733764409e-05, "loss": 0.067, "step": 119610 }, { "epoch": 33.63, "learning_rate": 3.6393964951738355e-05, "loss": 0.0742, "step": 119640 }, { "epoch": 33.64, "learning_rate": 3.6375222565832636e-05, "loss": 0.0663, "step": 119670 }, { "epoch": 33.65, "learning_rate": 3.63564801799269e-05, "loss": 0.0678, "step": 119700 }, { "epoch": 33.66, "learning_rate": 3.6337737794021184e-05, "loss": 0.0758, "step": 119730 }, { "epoch": 33.67, "learning_rate": 3.631899540811545e-05, "loss": 0.067, "step": 119760 }, { "epoch": 33.68, "learning_rate": 3.630025302220973e-05, "loss": 0.0794, "step": 119790 }, { "epoch": 33.69, "learning_rate": 3.628151063630401e-05, "loss": 0.0641, "step": 119820 }, { "epoch": 33.69, "learning_rate": 3.6262768250398274e-05, "loss": 0.0699, "step": 119850 }, { "epoch": 33.7, "learning_rate": 3.6244025864492555e-05, "loss": 0.0687, "step": 119880 }, { "epoch": 33.71, "learning_rate": 3.622528347858682e-05, "loss": 0.0673, "step": 119910 }, { "epoch": 33.72, "learning_rate": 3.6206541092681104e-05, "loss": 0.0728, "step": 119940 }, { "epoch": 33.73, "learning_rate": 3.618779870677537e-05, "loss": 0.065, "step": 119970 }, { "epoch": 33.74, "learning_rate": 3.616905632086965e-05, "loss": 0.0722, "step": 120000 }, { "epoch": 33.74, "learning_rate": 3.6150313934963926e-05, "loss": 0.0713, "step": 120030 }, { "epoch": 33.75, "learning_rate": 3.6131571549058194e-05, "loss": 0.0648, "step": 120060 }, { "epoch": 33.76, "learning_rate": 3.6112829163152474e-05, "loss": 0.072, "step": 120090 }, { "epoch": 33.77, "learning_rate": 3.609408677724674e-05, "loss": 0.0638, "step": 120120 }, { "epoch": 33.78, "learning_rate": 3.607534439134102e-05, "loss": 0.07, "step": 120150 }, { "epoch": 33.79, "learning_rate": 3.605660200543529e-05, "loss": 0.074, "step": 120180 }, { "epoch": 33.8, "learning_rate": 3.603785961952957e-05, "loss": 0.0681, "step": 120210 }, { "epoch": 33.8, "learning_rate": 3.6019117233623845e-05, "loss": 0.0749, "step": 120240 }, { "epoch": 33.81, "learning_rate": 3.600037484771811e-05, "loss": 0.0671, "step": 120270 }, { "epoch": 33.82, "learning_rate": 3.5981632461812394e-05, "loss": 0.0671, "step": 120300 }, { "epoch": 33.83, "learning_rate": 3.596289007590666e-05, "loss": 0.0676, "step": 120330 }, { "epoch": 33.84, "learning_rate": 3.594414769000094e-05, "loss": 0.0637, "step": 120360 }, { "epoch": 33.85, "learning_rate": 3.592540530409521e-05, "loss": 0.0791, "step": 120390 }, { "epoch": 33.85, "learning_rate": 3.590666291818949e-05, "loss": 0.0633, "step": 120420 }, { "epoch": 33.86, "learning_rate": 3.5887920532283765e-05, "loss": 0.0718, "step": 120450 }, { "epoch": 33.87, "learning_rate": 3.586917814637803e-05, "loss": 0.0754, "step": 120480 }, { "epoch": 33.88, "learning_rate": 3.585043576047231e-05, "loss": 0.067, "step": 120510 }, { "epoch": 33.89, "learning_rate": 3.583169337456658e-05, "loss": 0.0729, "step": 120540 }, { "epoch": 33.9, "learning_rate": 3.581295098866086e-05, "loss": 0.0651, "step": 120570 }, { "epoch": 33.9, "learning_rate": 3.579420860275513e-05, "loss": 0.0733, "step": 120600 }, { "epoch": 33.91, "learning_rate": 3.577546621684941e-05, "loss": 0.0754, "step": 120630 }, { "epoch": 33.92, "learning_rate": 3.5756723830943684e-05, "loss": 0.0666, "step": 120660 }, { "epoch": 33.93, "learning_rate": 3.573798144503795e-05, "loss": 0.0755, "step": 120690 }, { "epoch": 33.94, "learning_rate": 3.571923905913223e-05, "loss": 0.0694, "step": 120720 }, { "epoch": 33.95, "learning_rate": 3.57004966732265e-05, "loss": 0.0732, "step": 120750 }, { "epoch": 33.96, "learning_rate": 3.568175428732078e-05, "loss": 0.0734, "step": 120780 }, { "epoch": 33.96, "learning_rate": 3.566301190141505e-05, "loss": 0.0657, "step": 120810 }, { "epoch": 33.97, "learning_rate": 3.564426951550933e-05, "loss": 0.0697, "step": 120840 }, { "epoch": 33.98, "learning_rate": 3.56255271296036e-05, "loss": 0.0639, "step": 120870 }, { "epoch": 33.99, "learning_rate": 3.560678474369787e-05, "loss": 0.0722, "step": 120900 }, { "epoch": 34.0, "learning_rate": 3.558804235779215e-05, "loss": 0.0745, "step": 120930 }, { "epoch": 34.0, "eval_loss": 0.17628006637096405, "eval_runtime": 505.7594, "eval_samples_per_second": 31.701, "eval_steps_per_second": 0.993, "eval_wer": 0.13345297722216914, "step": 120938 }, { "epoch": 34.01, "learning_rate": 3.556929997188642e-05, "loss": 0.0622, "step": 120960 }, { "epoch": 34.01, "learning_rate": 3.55505575859807e-05, "loss": 0.0761, "step": 120990 }, { "epoch": 34.02, "learning_rate": 3.553181520007497e-05, "loss": 0.0592, "step": 121020 }, { "epoch": 34.03, "learning_rate": 3.551307281416925e-05, "loss": 0.0716, "step": 121050 }, { "epoch": 34.04, "learning_rate": 3.5494330428263516e-05, "loss": 0.07, "step": 121080 }, { "epoch": 34.05, "learning_rate": 3.547558804235779e-05, "loss": 0.0654, "step": 121110 }, { "epoch": 34.06, "learning_rate": 3.545684565645207e-05, "loss": 0.0767, "step": 121140 }, { "epoch": 34.07, "learning_rate": 3.543810327054634e-05, "loss": 0.0632, "step": 121170 }, { "epoch": 34.07, "learning_rate": 3.541936088464062e-05, "loss": 0.0701, "step": 121200 }, { "epoch": 34.08, "learning_rate": 3.540061849873489e-05, "loss": 0.0663, "step": 121230 }, { "epoch": 34.09, "learning_rate": 3.538187611282917e-05, "loss": 0.0699, "step": 121260 }, { "epoch": 34.1, "learning_rate": 3.5363133726923435e-05, "loss": 0.0768, "step": 121290 }, { "epoch": 34.11, "learning_rate": 3.5344391341017716e-05, "loss": 0.0639, "step": 121320 }, { "epoch": 34.12, "learning_rate": 3.532564895511199e-05, "loss": 0.0739, "step": 121350 }, { "epoch": 34.12, "learning_rate": 3.530690656920626e-05, "loss": 0.0649, "step": 121380 }, { "epoch": 34.13, "learning_rate": 3.528816418330054e-05, "loss": 0.0691, "step": 121410 }, { "epoch": 34.14, "learning_rate": 3.5269421797394806e-05, "loss": 0.0708, "step": 121440 }, { "epoch": 34.15, "learning_rate": 3.525067941148909e-05, "loss": 0.0601, "step": 121470 }, { "epoch": 34.16, "learning_rate": 3.5231937025583355e-05, "loss": 0.0718, "step": 121500 }, { "epoch": 34.17, "learning_rate": 3.5213194639677636e-05, "loss": 0.072, "step": 121530 }, { "epoch": 34.17, "learning_rate": 3.519445225377191e-05, "loss": 0.063, "step": 121560 }, { "epoch": 34.18, "learning_rate": 3.517570986786618e-05, "loss": 0.078, "step": 121590 }, { "epoch": 34.19, "learning_rate": 3.515696748196046e-05, "loss": 0.0597, "step": 121620 }, { "epoch": 34.2, "learning_rate": 3.5138849842251586e-05, "loss": 0.0781, "step": 121650 }, { "epoch": 34.21, "learning_rate": 3.512010745634586e-05, "loss": 0.0674, "step": 121680 }, { "epoch": 34.22, "learning_rate": 3.5101365070440134e-05, "loss": 0.069, "step": 121710 }, { "epoch": 34.23, "learning_rate": 3.508262268453441e-05, "loss": 0.0778, "step": 121740 }, { "epoch": 34.23, "learning_rate": 3.506388029862868e-05, "loss": 0.0619, "step": 121770 }, { "epoch": 34.24, "learning_rate": 3.5045137912722957e-05, "loss": 0.0716, "step": 121800 }, { "epoch": 34.25, "learning_rate": 3.502639552681723e-05, "loss": 0.0629, "step": 121830 }, { "epoch": 34.26, "learning_rate": 3.5007653140911505e-05, "loss": 0.072, "step": 121860 }, { "epoch": 34.27, "learning_rate": 3.4988910755005786e-05, "loss": 0.0704, "step": 121890 }, { "epoch": 34.28, "learning_rate": 3.497016836910005e-05, "loss": 0.0623, "step": 121920 }, { "epoch": 34.28, "learning_rate": 3.495142598319433e-05, "loss": 0.079, "step": 121950 }, { "epoch": 34.29, "learning_rate": 3.49326835972886e-05, "loss": 0.0659, "step": 121980 }, { "epoch": 34.3, "learning_rate": 3.4913941211382876e-05, "loss": 0.0664, "step": 122010 }, { "epoch": 34.31, "learning_rate": 3.489519882547715e-05, "loss": 0.0731, "step": 122040 }, { "epoch": 34.32, "learning_rate": 3.4876456439571424e-05, "loss": 0.0645, "step": 122070 }, { "epoch": 34.33, "learning_rate": 3.4857714053665705e-05, "loss": 0.0716, "step": 122100 }, { "epoch": 34.34, "learning_rate": 3.483897166775997e-05, "loss": 0.0663, "step": 122130 }, { "epoch": 34.34, "learning_rate": 3.482022928185425e-05, "loss": 0.0694, "step": 122160 }, { "epoch": 34.35, "learning_rate": 3.480148689594852e-05, "loss": 0.0785, "step": 122190 }, { "epoch": 34.36, "learning_rate": 3.4782744510042795e-05, "loss": 0.0592, "step": 122220 }, { "epoch": 34.37, "learning_rate": 3.476400212413707e-05, "loss": 0.0727, "step": 122250 }, { "epoch": 34.38, "learning_rate": 3.4745259738231344e-05, "loss": 0.066, "step": 122280 }, { "epoch": 34.39, "learning_rate": 3.4726517352325625e-05, "loss": 0.0675, "step": 122310 }, { "epoch": 34.39, "learning_rate": 3.470777496641989e-05, "loss": 0.0738, "step": 122340 }, { "epoch": 34.4, "learning_rate": 3.4689032580514166e-05, "loss": 0.0627, "step": 122370 }, { "epoch": 34.41, "learning_rate": 3.467029019460844e-05, "loss": 0.0754, "step": 122400 }, { "epoch": 34.42, "learning_rate": 3.4651547808702715e-05, "loss": 0.0693, "step": 122430 }, { "epoch": 34.43, "learning_rate": 3.463280542279699e-05, "loss": 0.0647, "step": 122460 }, { "epoch": 34.44, "learning_rate": 3.461406303689126e-05, "loss": 0.077, "step": 122490 }, { "epoch": 34.44, "learning_rate": 3.4595320650985544e-05, "loss": 0.0636, "step": 122520 }, { "epoch": 34.45, "learning_rate": 3.457657826507981e-05, "loss": 0.0692, "step": 122550 }, { "epoch": 34.46, "learning_rate": 3.4557835879174086e-05, "loss": 0.0654, "step": 122580 }, { "epoch": 34.47, "learning_rate": 3.453909349326836e-05, "loss": 0.0719, "step": 122610 }, { "epoch": 34.48, "learning_rate": 3.4520351107362634e-05, "loss": 0.0772, "step": 122640 }, { "epoch": 34.49, "learning_rate": 3.450160872145691e-05, "loss": 0.0612, "step": 122670 }, { "epoch": 34.5, "learning_rate": 3.448286633555118e-05, "loss": 0.0712, "step": 122700 }, { "epoch": 34.5, "learning_rate": 3.446412394964546e-05, "loss": 0.0642, "step": 122730 }, { "epoch": 34.51, "learning_rate": 3.444538156373973e-05, "loss": 0.0673, "step": 122760 }, { "epoch": 34.52, "learning_rate": 3.4426639177834005e-05, "loss": 0.0801, "step": 122790 }, { "epoch": 34.53, "learning_rate": 3.440789679192828e-05, "loss": 0.0653, "step": 122820 }, { "epoch": 34.54, "learning_rate": 3.438915440602255e-05, "loss": 0.0733, "step": 122850 }, { "epoch": 34.55, "learning_rate": 3.437041202011683e-05, "loss": 0.0657, "step": 122880 }, { "epoch": 34.55, "learning_rate": 3.43516696342111e-05, "loss": 0.0713, "step": 122910 }, { "epoch": 34.56, "learning_rate": 3.433292724830538e-05, "loss": 0.0749, "step": 122940 }, { "epoch": 34.57, "learning_rate": 3.431418486239965e-05, "loss": 0.0617, "step": 122970 }, { "epoch": 34.58, "learning_rate": 3.4295442476493924e-05, "loss": 0.0714, "step": 123000 }, { "epoch": 34.59, "learning_rate": 3.42767000905882e-05, "loss": 0.0654, "step": 123030 }, { "epoch": 34.6, "learning_rate": 3.425795770468247e-05, "loss": 0.0703, "step": 123060 }, { "epoch": 34.6, "learning_rate": 3.423921531877675e-05, "loss": 0.0721, "step": 123090 }, { "epoch": 34.61, "learning_rate": 3.422047293287102e-05, "loss": 0.0595, "step": 123120 }, { "epoch": 34.62, "learning_rate": 3.42017305469653e-05, "loss": 0.07, "step": 123150 }, { "epoch": 34.63, "learning_rate": 3.418298816105957e-05, "loss": 0.0703, "step": 123180 }, { "epoch": 34.64, "learning_rate": 3.416424577515385e-05, "loss": 0.0674, "step": 123210 }, { "epoch": 34.65, "learning_rate": 3.414550338924812e-05, "loss": 0.0748, "step": 123240 }, { "epoch": 34.66, "learning_rate": 3.412676100334239e-05, "loss": 0.0611, "step": 123270 }, { "epoch": 34.66, "learning_rate": 3.4108018617436666e-05, "loss": 0.0697, "step": 123300 }, { "epoch": 34.67, "learning_rate": 3.408927623153094e-05, "loss": 0.0675, "step": 123330 }, { "epoch": 34.68, "learning_rate": 3.407053384562522e-05, "loss": 0.0681, "step": 123360 }, { "epoch": 34.69, "learning_rate": 3.405179145971949e-05, "loss": 0.0752, "step": 123390 }, { "epoch": 34.7, "learning_rate": 3.403304907381377e-05, "loss": 0.0615, "step": 123420 }, { "epoch": 34.71, "learning_rate": 3.401430668790804e-05, "loss": 0.0723, "step": 123450 }, { "epoch": 34.71, "learning_rate": 3.399618904819917e-05, "loss": 0.0674, "step": 123480 }, { "epoch": 34.72, "learning_rate": 3.3977446662293445e-05, "loss": 0.0747, "step": 123510 }, { "epoch": 34.73, "learning_rate": 3.395870427638772e-05, "loss": 0.0762, "step": 123540 }, { "epoch": 34.74, "learning_rate": 3.3939961890481994e-05, "loss": 0.0643, "step": 123570 }, { "epoch": 34.75, "learning_rate": 3.392121950457627e-05, "loss": 0.0757, "step": 123600 }, { "epoch": 34.76, "learning_rate": 3.390247711867054e-05, "loss": 0.0599, "step": 123630 }, { "epoch": 34.77, "learning_rate": 3.3883734732764816e-05, "loss": 0.0727, "step": 123660 }, { "epoch": 34.77, "learning_rate": 3.386499234685909e-05, "loss": 0.0705, "step": 123690 }, { "epoch": 34.78, "learning_rate": 3.3846249960953365e-05, "loss": 0.0598, "step": 123720 }, { "epoch": 34.79, "learning_rate": 3.382750757504764e-05, "loss": 0.0719, "step": 123750 }, { "epoch": 34.8, "learning_rate": 3.380876518914191e-05, "loss": 0.0674, "step": 123780 }, { "epoch": 34.81, "learning_rate": 3.379002280323619e-05, "loss": 0.0704, "step": 123810 }, { "epoch": 34.82, "learning_rate": 3.377128041733046e-05, "loss": 0.0741, "step": 123840 }, { "epoch": 34.82, "learning_rate": 3.3752538031424736e-05, "loss": 0.063, "step": 123870 }, { "epoch": 34.83, "learning_rate": 3.373379564551901e-05, "loss": 0.0703, "step": 123900 }, { "epoch": 34.84, "learning_rate": 3.3715053259613284e-05, "loss": 0.0686, "step": 123930 }, { "epoch": 34.85, "learning_rate": 3.369631087370756e-05, "loss": 0.0759, "step": 123960 }, { "epoch": 34.86, "learning_rate": 3.367756848780183e-05, "loss": 0.0726, "step": 123990 }, { "epoch": 34.87, "learning_rate": 3.365882610189611e-05, "loss": 0.0641, "step": 124020 }, { "epoch": 34.87, "learning_rate": 3.364008371599038e-05, "loss": 0.0711, "step": 124050 }, { "epoch": 34.88, "learning_rate": 3.3621341330084655e-05, "loss": 0.0667, "step": 124080 }, { "epoch": 34.89, "learning_rate": 3.360259894417893e-05, "loss": 0.0673, "step": 124110 }, { "epoch": 34.9, "learning_rate": 3.3583856558273203e-05, "loss": 0.0793, "step": 124140 }, { "epoch": 34.91, "learning_rate": 3.356511417236748e-05, "loss": 0.0624, "step": 124170 }, { "epoch": 34.92, "learning_rate": 3.354637178646175e-05, "loss": 0.0705, "step": 124200 }, { "epoch": 34.93, "learning_rate": 3.3527629400556026e-05, "loss": 0.0656, "step": 124230 }, { "epoch": 34.93, "learning_rate": 3.35088870146503e-05, "loss": 0.068, "step": 124260 }, { "epoch": 34.94, "learning_rate": 3.3490144628744574e-05, "loss": 0.0793, "step": 124290 }, { "epoch": 34.95, "learning_rate": 3.347140224283885e-05, "loss": 0.0624, "step": 124320 }, { "epoch": 34.96, "learning_rate": 3.345265985693312e-05, "loss": 0.0718, "step": 124350 }, { "epoch": 34.97, "learning_rate": 3.34339174710274e-05, "loss": 0.0681, "step": 124380 }, { "epoch": 34.98, "learning_rate": 3.341517508512167e-05, "loss": 0.067, "step": 124410 }, { "epoch": 34.98, "learning_rate": 3.3396432699215945e-05, "loss": 0.0727, "step": 124440 }, { "epoch": 34.99, "learning_rate": 3.337769031331022e-05, "loss": 0.0629, "step": 124470 }, { "epoch": 35.0, "eval_loss": 0.1761113852262497, "eval_runtime": 507.443, "eval_samples_per_second": 31.596, "eval_steps_per_second": 0.989, "eval_wer": 0.13112606280621783, "step": 124495 }, { "epoch": 35.0, "learning_rate": 3.3358947927404494e-05, "loss": 0.0739, "step": 124500 }, { "epoch": 35.01, "learning_rate": 3.334020554149877e-05, "loss": 0.0606, "step": 124530 }, { "epoch": 35.02, "learning_rate": 3.332146315559304e-05, "loss": 0.0696, "step": 124560 }, { "epoch": 35.03, "learning_rate": 3.3302720769687316e-05, "loss": 0.0621, "step": 124590 }, { "epoch": 35.04, "learning_rate": 3.328397838378159e-05, "loss": 0.0666, "step": 124620 }, { "epoch": 35.04, "learning_rate": 3.3265235997875865e-05, "loss": 0.0742, "step": 124650 }, { "epoch": 35.05, "learning_rate": 3.324649361197014e-05, "loss": 0.0615, "step": 124680 }, { "epoch": 35.06, "learning_rate": 3.322775122606441e-05, "loss": 0.0659, "step": 124710 }, { "epoch": 35.07, "learning_rate": 3.320900884015869e-05, "loss": 0.0686, "step": 124740 }, { "epoch": 35.08, "learning_rate": 3.319026645425296e-05, "loss": 0.0666, "step": 124770 }, { "epoch": 35.09, "learning_rate": 3.3171524068347236e-05, "loss": 0.0668, "step": 124800 }, { "epoch": 35.09, "learning_rate": 3.315278168244151e-05, "loss": 0.0635, "step": 124830 }, { "epoch": 35.1, "learning_rate": 3.3134039296535784e-05, "loss": 0.0668, "step": 124860 }, { "epoch": 35.11, "learning_rate": 3.311529691063006e-05, "loss": 0.0675, "step": 124890 }, { "epoch": 35.12, "learning_rate": 3.309655452472433e-05, "loss": 0.0698, "step": 124920 }, { "epoch": 35.13, "learning_rate": 3.307781213881861e-05, "loss": 0.0706, "step": 124950 }, { "epoch": 35.14, "learning_rate": 3.305906975291288e-05, "loss": 0.0669, "step": 124980 }, { "epoch": 35.14, "learning_rate": 3.3040327367007155e-05, "loss": 0.0731, "step": 125010 }, { "epoch": 35.15, "learning_rate": 3.302158498110143e-05, "loss": 0.0644, "step": 125040 }, { "epoch": 35.16, "learning_rate": 3.30028425951957e-05, "loss": 0.0603, "step": 125070 }, { "epoch": 35.17, "learning_rate": 3.298410020928998e-05, "loss": 0.0705, "step": 125100 }, { "epoch": 35.18, "learning_rate": 3.296535782338425e-05, "loss": 0.0666, "step": 125130 }, { "epoch": 35.19, "learning_rate": 3.2946615437478526e-05, "loss": 0.0695, "step": 125160 }, { "epoch": 35.2, "learning_rate": 3.29278730515728e-05, "loss": 0.0696, "step": 125190 }, { "epoch": 35.2, "learning_rate": 3.2909130665667074e-05, "loss": 0.0649, "step": 125220 }, { "epoch": 35.21, "learning_rate": 3.289038827976135e-05, "loss": 0.0723, "step": 125250 }, { "epoch": 35.22, "learning_rate": 3.287164589385562e-05, "loss": 0.06, "step": 125280 }, { "epoch": 35.23, "learning_rate": 3.28529035079499e-05, "loss": 0.0716, "step": 125310 }, { "epoch": 35.24, "learning_rate": 3.283416112204417e-05, "loss": 0.0679, "step": 125340 }, { "epoch": 35.25, "learning_rate": 3.2815418736138445e-05, "loss": 0.0639, "step": 125370 }, { "epoch": 35.25, "learning_rate": 3.279667635023272e-05, "loss": 0.0715, "step": 125400 }, { "epoch": 35.26, "learning_rate": 3.2777933964326994e-05, "loss": 0.0607, "step": 125430 }, { "epoch": 35.27, "learning_rate": 3.275919157842127e-05, "loss": 0.0664, "step": 125460 }, { "epoch": 35.28, "learning_rate": 3.274044919251554e-05, "loss": 0.066, "step": 125490 }, { "epoch": 35.29, "learning_rate": 3.2721706806609816e-05, "loss": 0.065, "step": 125520 }, { "epoch": 35.3, "learning_rate": 3.270296442070409e-05, "loss": 0.0746, "step": 125550 }, { "epoch": 35.3, "learning_rate": 3.2684222034798365e-05, "loss": 0.0616, "step": 125580 }, { "epoch": 35.31, "learning_rate": 3.266547964889264e-05, "loss": 0.0716, "step": 125610 }, { "epoch": 35.32, "learning_rate": 3.264673726298691e-05, "loss": 0.0714, "step": 125640 }, { "epoch": 35.33, "learning_rate": 3.262799487708119e-05, "loss": 0.0641, "step": 125670 }, { "epoch": 35.34, "learning_rate": 3.260925249117546e-05, "loss": 0.0735, "step": 125700 }, { "epoch": 35.35, "learning_rate": 3.2590510105269736e-05, "loss": 0.0591, "step": 125730 }, { "epoch": 35.36, "learning_rate": 3.257176771936401e-05, "loss": 0.0727, "step": 125760 }, { "epoch": 35.36, "learning_rate": 3.2553025333458284e-05, "loss": 0.0652, "step": 125790 }, { "epoch": 35.37, "learning_rate": 3.253428294755256e-05, "loss": 0.0671, "step": 125820 }, { "epoch": 35.38, "learning_rate": 3.251554056164683e-05, "loss": 0.0725, "step": 125850 }, { "epoch": 35.39, "learning_rate": 3.2496798175741107e-05, "loss": 0.0627, "step": 125880 }, { "epoch": 35.4, "learning_rate": 3.247805578983538e-05, "loss": 0.0703, "step": 125910 }, { "epoch": 35.41, "learning_rate": 3.2459313403929655e-05, "loss": 0.064, "step": 125940 }, { "epoch": 35.41, "learning_rate": 3.244057101802393e-05, "loss": 0.0622, "step": 125970 }, { "epoch": 35.42, "learning_rate": 3.24218286321182e-05, "loss": 0.0756, "step": 126000 }, { "epoch": 35.43, "learning_rate": 3.240308624621248e-05, "loss": 0.063, "step": 126030 }, { "epoch": 35.44, "learning_rate": 3.238434386030675e-05, "loss": 0.0776, "step": 126060 }, { "epoch": 35.45, "learning_rate": 3.2365601474401026e-05, "loss": 0.0668, "step": 126090 }, { "epoch": 35.46, "learning_rate": 3.23468590884953e-05, "loss": 0.0692, "step": 126120 }, { "epoch": 35.47, "learning_rate": 3.2328116702589574e-05, "loss": 0.0752, "step": 126150 }, { "epoch": 35.47, "learning_rate": 3.230937431668385e-05, "loss": 0.0594, "step": 126180 }, { "epoch": 35.48, "learning_rate": 3.229063193077812e-05, "loss": 0.0692, "step": 126210 }, { "epoch": 35.49, "learning_rate": 3.22718895448724e-05, "loss": 0.0669, "step": 126240 }, { "epoch": 35.5, "learning_rate": 3.225314715896667e-05, "loss": 0.0648, "step": 126270 }, { "epoch": 35.51, "learning_rate": 3.2234404773060945e-05, "loss": 0.072, "step": 126300 }, { "epoch": 35.52, "learning_rate": 3.221566238715522e-05, "loss": 0.0603, "step": 126330 }, { "epoch": 35.52, "learning_rate": 3.2196920001249494e-05, "loss": 0.0711, "step": 126360 }, { "epoch": 35.53, "learning_rate": 3.217817761534377e-05, "loss": 0.0703, "step": 126390 }, { "epoch": 35.54, "learning_rate": 3.215943522943804e-05, "loss": 0.0601, "step": 126420 }, { "epoch": 35.55, "learning_rate": 3.2140692843532316e-05, "loss": 0.074, "step": 126450 }, { "epoch": 35.56, "learning_rate": 3.212195045762659e-05, "loss": 0.0598, "step": 126480 }, { "epoch": 35.57, "learning_rate": 3.2103208071720865e-05, "loss": 0.0682, "step": 126510 }, { "epoch": 35.57, "learning_rate": 3.208446568581514e-05, "loss": 0.0702, "step": 126540 }, { "epoch": 35.58, "learning_rate": 3.206572329990941e-05, "loss": 0.0616, "step": 126570 }, { "epoch": 35.59, "learning_rate": 3.204698091400369e-05, "loss": 0.0727, "step": 126600 }, { "epoch": 35.6, "learning_rate": 3.202823852809796e-05, "loss": 0.0639, "step": 126630 }, { "epoch": 35.61, "learning_rate": 3.2009496142192235e-05, "loss": 0.0706, "step": 126660 }, { "epoch": 35.62, "learning_rate": 3.199075375628651e-05, "loss": 0.066, "step": 126690 }, { "epoch": 35.63, "learning_rate": 3.1972011370380784e-05, "loss": 0.0681, "step": 126720 }, { "epoch": 35.63, "learning_rate": 3.195326898447506e-05, "loss": 0.0735, "step": 126750 }, { "epoch": 35.64, "learning_rate": 3.193452659856933e-05, "loss": 0.0624, "step": 126780 }, { "epoch": 35.65, "learning_rate": 3.1915784212663606e-05, "loss": 0.067, "step": 126810 }, { "epoch": 35.66, "learning_rate": 3.189704182675788e-05, "loss": 0.07, "step": 126840 }, { "epoch": 35.67, "learning_rate": 3.1878299440852155e-05, "loss": 0.0624, "step": 126870 }, { "epoch": 35.68, "learning_rate": 3.185955705494643e-05, "loss": 0.0707, "step": 126900 }, { "epoch": 35.68, "learning_rate": 3.18408146690407e-05, "loss": 0.0582, "step": 126930 }, { "epoch": 35.69, "learning_rate": 3.182207228313498e-05, "loss": 0.0675, "step": 126960 }, { "epoch": 35.7, "learning_rate": 3.180332989722925e-05, "loss": 0.0676, "step": 126990 }, { "epoch": 35.71, "learning_rate": 3.1784587511323526e-05, "loss": 0.0668, "step": 127020 }, { "epoch": 35.72, "learning_rate": 3.17658451254178e-05, "loss": 0.0721, "step": 127050 }, { "epoch": 35.73, "learning_rate": 3.1747102739512074e-05, "loss": 0.06, "step": 127080 }, { "epoch": 35.74, "learning_rate": 3.172836035360635e-05, "loss": 0.0674, "step": 127110 }, { "epoch": 35.74, "learning_rate": 3.170961796770062e-05, "loss": 0.0684, "step": 127140 }, { "epoch": 35.75, "learning_rate": 3.16908755817949e-05, "loss": 0.0682, "step": 127170 }, { "epoch": 35.76, "learning_rate": 3.167213319588917e-05, "loss": 0.0729, "step": 127200 }, { "epoch": 35.77, "learning_rate": 3.1653390809983445e-05, "loss": 0.0629, "step": 127230 }, { "epoch": 35.78, "learning_rate": 3.163527317027458e-05, "loss": 0.0674, "step": 127260 }, { "epoch": 35.79, "learning_rate": 3.1616530784368854e-05, "loss": 0.0656, "step": 127290 }, { "epoch": 35.79, "learning_rate": 3.159778839846312e-05, "loss": 0.0672, "step": 127320 }, { "epoch": 35.8, "learning_rate": 3.15790460125574e-05, "loss": 0.073, "step": 127350 }, { "epoch": 35.81, "learning_rate": 3.156030362665167e-05, "loss": 0.063, "step": 127380 }, { "epoch": 35.82, "learning_rate": 3.154156124074595e-05, "loss": 0.0674, "step": 127410 }, { "epoch": 35.83, "learning_rate": 3.1522818854840224e-05, "loss": 0.0636, "step": 127440 }, { "epoch": 35.84, "learning_rate": 3.15040764689345e-05, "loss": 0.0635, "step": 127470 }, { "epoch": 35.84, "learning_rate": 3.148533408302877e-05, "loss": 0.0782, "step": 127500 }, { "epoch": 35.85, "learning_rate": 3.146659169712304e-05, "loss": 0.0609, "step": 127530 }, { "epoch": 35.86, "learning_rate": 3.144784931121732e-05, "loss": 0.0694, "step": 127560 }, { "epoch": 35.87, "learning_rate": 3.142910692531159e-05, "loss": 0.0665, "step": 127590 }, { "epoch": 35.88, "learning_rate": 3.141036453940587e-05, "loss": 0.0686, "step": 127620 }, { "epoch": 35.89, "learning_rate": 3.1391622153500144e-05, "loss": 0.0709, "step": 127650 }, { "epoch": 35.9, "learning_rate": 3.137287976759442e-05, "loss": 0.0598, "step": 127680 }, { "epoch": 35.9, "learning_rate": 3.135413738168869e-05, "loss": 0.0657, "step": 127710 }, { "epoch": 35.91, "learning_rate": 3.133539499578296e-05, "loss": 0.0662, "step": 127740 }, { "epoch": 35.92, "learning_rate": 3.131665260987724e-05, "loss": 0.0667, "step": 127770 }, { "epoch": 35.93, "learning_rate": 3.129791022397151e-05, "loss": 0.0715, "step": 127800 }, { "epoch": 35.94, "learning_rate": 3.127916783806579e-05, "loss": 0.0582, "step": 127830 }, { "epoch": 35.95, "learning_rate": 3.126042545216006e-05, "loss": 0.0724, "step": 127860 }, { "epoch": 35.95, "learning_rate": 3.124168306625434e-05, "loss": 0.0695, "step": 127890 }, { "epoch": 35.96, "learning_rate": 3.122294068034861e-05, "loss": 0.0652, "step": 127920 }, { "epoch": 35.97, "learning_rate": 3.1204198294442886e-05, "loss": 0.0737, "step": 127950 }, { "epoch": 35.98, "learning_rate": 3.118545590853716e-05, "loss": 0.062, "step": 127980 }, { "epoch": 35.99, "learning_rate": 3.116671352263143e-05, "loss": 0.0685, "step": 128010 }, { "epoch": 36.0, "learning_rate": 3.114797113672571e-05, "loss": 0.0654, "step": 128040 }, { "epoch": 36.0, "eval_loss": 0.17177008092403412, "eval_runtime": 506.5545, "eval_samples_per_second": 31.651, "eval_steps_per_second": 0.991, "eval_wer": 0.13024579312980225, "step": 128052 }, { "epoch": 36.01, "learning_rate": 3.112922875081998e-05, "loss": 0.0672, "step": 128070 }, { "epoch": 36.01, "learning_rate": 3.111048636491426e-05, "loss": 0.0701, "step": 128100 }, { "epoch": 36.02, "learning_rate": 3.109174397900853e-05, "loss": 0.0635, "step": 128130 }, { "epoch": 36.03, "learning_rate": 3.1073001593102805e-05, "loss": 0.0681, "step": 128160 }, { "epoch": 36.04, "learning_rate": 3.105425920719708e-05, "loss": 0.0589, "step": 128190 }, { "epoch": 36.05, "learning_rate": 3.103551682129135e-05, "loss": 0.0651, "step": 128220 }, { "epoch": 36.06, "learning_rate": 3.101677443538563e-05, "loss": 0.0698, "step": 128250 }, { "epoch": 36.06, "learning_rate": 3.09980320494799e-05, "loss": 0.0625, "step": 128280 }, { "epoch": 36.07, "learning_rate": 3.0979289663574176e-05, "loss": 0.0688, "step": 128310 }, { "epoch": 36.08, "learning_rate": 3.096054727766845e-05, "loss": 0.0597, "step": 128340 }, { "epoch": 36.09, "learning_rate": 3.0941804891762724e-05, "loss": 0.0728, "step": 128370 }, { "epoch": 36.1, "learning_rate": 3.0923062505857e-05, "loss": 0.0727, "step": 128400 }, { "epoch": 36.11, "learning_rate": 3.0904320119951266e-05, "loss": 0.0589, "step": 128430 }, { "epoch": 36.11, "learning_rate": 3.088557773404555e-05, "loss": 0.0677, "step": 128460 }, { "epoch": 36.12, "learning_rate": 3.086683534813982e-05, "loss": 0.063, "step": 128490 }, { "epoch": 36.13, "learning_rate": 3.0848092962234095e-05, "loss": 0.0649, "step": 128520 }, { "epoch": 36.14, "learning_rate": 3.082935057632837e-05, "loss": 0.0688, "step": 128550 }, { "epoch": 36.15, "learning_rate": 3.0810608190422644e-05, "loss": 0.0653, "step": 128580 }, { "epoch": 36.16, "learning_rate": 3.079186580451692e-05, "loss": 0.0697, "step": 128610 }, { "epoch": 36.17, "learning_rate": 3.0773123418611185e-05, "loss": 0.0592, "step": 128640 }, { "epoch": 36.17, "learning_rate": 3.0754381032705466e-05, "loss": 0.0658, "step": 128670 }, { "epoch": 36.18, "learning_rate": 3.073563864679974e-05, "loss": 0.0678, "step": 128700 }, { "epoch": 36.19, "learning_rate": 3.0716896260894015e-05, "loss": 0.0602, "step": 128730 }, { "epoch": 36.2, "learning_rate": 3.069815387498829e-05, "loss": 0.0697, "step": 128760 }, { "epoch": 36.21, "learning_rate": 3.067941148908256e-05, "loss": 0.0628, "step": 128790 }, { "epoch": 36.22, "learning_rate": 3.066066910317684e-05, "loss": 0.0679, "step": 128820 }, { "epoch": 36.22, "learning_rate": 3.0641926717271105e-05, "loss": 0.0663, "step": 128850 }, { "epoch": 36.23, "learning_rate": 3.0623184331365386e-05, "loss": 0.0629, "step": 128880 }, { "epoch": 36.24, "learning_rate": 3.060444194545966e-05, "loss": 0.0737, "step": 128910 }, { "epoch": 36.25, "learning_rate": 3.0585699559553934e-05, "loss": 0.0578, "step": 128940 }, { "epoch": 36.26, "learning_rate": 3.056695717364821e-05, "loss": 0.0681, "step": 128970 }, { "epoch": 36.27, "learning_rate": 3.054821478774248e-05, "loss": 0.0705, "step": 129000 }, { "epoch": 36.27, "learning_rate": 3.0529472401836757e-05, "loss": 0.063, "step": 129030 }, { "epoch": 36.28, "learning_rate": 3.0510730015931027e-05, "loss": 0.0745, "step": 129060 }, { "epoch": 36.29, "learning_rate": 3.0491987630025305e-05, "loss": 0.0611, "step": 129090 }, { "epoch": 36.3, "learning_rate": 3.047324524411958e-05, "loss": 0.0647, "step": 129120 }, { "epoch": 36.31, "learning_rate": 3.045450285821385e-05, "loss": 0.0706, "step": 129150 }, { "epoch": 36.32, "learning_rate": 3.0435760472308128e-05, "loss": 0.0584, "step": 129180 }, { "epoch": 36.33, "learning_rate": 3.04170180864024e-05, "loss": 0.076, "step": 129210 }, { "epoch": 36.33, "learning_rate": 3.0398275700496676e-05, "loss": 0.0613, "step": 129240 }, { "epoch": 36.34, "learning_rate": 3.0379533314590947e-05, "loss": 0.0734, "step": 129270 }, { "epoch": 36.35, "learning_rate": 3.0360790928685224e-05, "loss": 0.066, "step": 129300 }, { "epoch": 36.36, "learning_rate": 3.03420485427795e-05, "loss": 0.0603, "step": 129330 }, { "epoch": 36.37, "learning_rate": 3.032330615687377e-05, "loss": 0.0732, "step": 129360 }, { "epoch": 36.38, "learning_rate": 3.0304563770968047e-05, "loss": 0.0607, "step": 129390 }, { "epoch": 36.38, "learning_rate": 3.0285821385062318e-05, "loss": 0.068, "step": 129420 }, { "epoch": 36.39, "learning_rate": 3.0267078999156595e-05, "loss": 0.071, "step": 129450 }, { "epoch": 36.4, "learning_rate": 3.0248336613250866e-05, "loss": 0.0636, "step": 129480 }, { "epoch": 36.41, "learning_rate": 3.0229594227345144e-05, "loss": 0.0733, "step": 129510 }, { "epoch": 36.42, "learning_rate": 3.0210851841439418e-05, "loss": 0.0625, "step": 129540 }, { "epoch": 36.43, "learning_rate": 3.019210945553369e-05, "loss": 0.0689, "step": 129570 }, { "epoch": 36.44, "learning_rate": 3.0173367069627966e-05, "loss": 0.0715, "step": 129600 }, { "epoch": 36.44, "learning_rate": 3.0154624683722237e-05, "loss": 0.0599, "step": 129630 }, { "epoch": 36.45, "learning_rate": 3.0135882297816515e-05, "loss": 0.069, "step": 129660 }, { "epoch": 36.46, "learning_rate": 3.0117139911910785e-05, "loss": 0.0635, "step": 129690 }, { "epoch": 36.47, "learning_rate": 3.0098397526005063e-05, "loss": 0.0671, "step": 129720 }, { "epoch": 36.48, "learning_rate": 3.0079655140099337e-05, "loss": 0.0697, "step": 129750 }, { "epoch": 36.49, "learning_rate": 3.006091275419361e-05, "loss": 0.0637, "step": 129780 }, { "epoch": 36.49, "learning_rate": 3.0042170368287886e-05, "loss": 0.0708, "step": 129810 }, { "epoch": 36.5, "learning_rate": 3.0023427982382156e-05, "loss": 0.0637, "step": 129840 }, { "epoch": 36.51, "learning_rate": 3.0004685596476434e-05, "loss": 0.0671, "step": 129870 }, { "epoch": 36.52, "learning_rate": 2.9985943210570705e-05, "loss": 0.066, "step": 129900 }, { "epoch": 36.53, "learning_rate": 2.9967200824664982e-05, "loss": 0.0631, "step": 129930 }, { "epoch": 36.54, "learning_rate": 2.9948458438759256e-05, "loss": 0.0715, "step": 129960 }, { "epoch": 36.54, "learning_rate": 2.992971605285353e-05, "loss": 0.0615, "step": 129990 }, { "epoch": 36.55, "learning_rate": 2.9910973666947805e-05, "loss": 0.0705, "step": 130020 }, { "epoch": 36.56, "learning_rate": 2.9892231281042076e-05, "loss": 0.0685, "step": 130050 }, { "epoch": 36.57, "learning_rate": 2.9873488895136353e-05, "loss": 0.0622, "step": 130080 }, { "epoch": 36.58, "learning_rate": 2.9854746509230624e-05, "loss": 0.0738, "step": 130110 }, { "epoch": 36.59, "learning_rate": 2.98360041233249e-05, "loss": 0.0627, "step": 130140 }, { "epoch": 36.6, "learning_rate": 2.981726173741918e-05, "loss": 0.0689, "step": 130170 }, { "epoch": 36.6, "learning_rate": 2.979851935151345e-05, "loss": 0.0665, "step": 130200 }, { "epoch": 36.61, "learning_rate": 2.9779776965607724e-05, "loss": 0.0591, "step": 130230 }, { "epoch": 36.62, "learning_rate": 2.9761034579701995e-05, "loss": 0.071, "step": 130260 }, { "epoch": 36.63, "learning_rate": 2.9742292193796273e-05, "loss": 0.0637, "step": 130290 }, { "epoch": 36.64, "learning_rate": 2.9723549807890543e-05, "loss": 0.0668, "step": 130320 }, { "epoch": 36.65, "learning_rate": 2.970480742198482e-05, "loss": 0.073, "step": 130350 }, { "epoch": 36.65, "learning_rate": 2.96860650360791e-05, "loss": 0.0632, "step": 130380 }, { "epoch": 36.66, "learning_rate": 2.966732265017337e-05, "loss": 0.07, "step": 130410 }, { "epoch": 36.67, "learning_rate": 2.9648580264267644e-05, "loss": 0.0596, "step": 130440 }, { "epoch": 36.68, "learning_rate": 2.9629837878361914e-05, "loss": 0.0616, "step": 130470 }, { "epoch": 36.69, "learning_rate": 2.9611095492456192e-05, "loss": 0.0632, "step": 130500 }, { "epoch": 36.7, "learning_rate": 2.9592353106550463e-05, "loss": 0.0628, "step": 130530 }, { "epoch": 36.7, "learning_rate": 2.957361072064474e-05, "loss": 0.0701, "step": 130560 }, { "epoch": 36.71, "learning_rate": 2.955486833473901e-05, "loss": 0.0607, "step": 130590 }, { "epoch": 36.72, "learning_rate": 2.953612594883329e-05, "loss": 0.066, "step": 130620 }, { "epoch": 36.73, "learning_rate": 2.9517383562927563e-05, "loss": 0.068, "step": 130650 }, { "epoch": 36.74, "learning_rate": 2.9498641177021834e-05, "loss": 0.0609, "step": 130680 }, { "epoch": 36.75, "learning_rate": 2.947989879111611e-05, "loss": 0.0714, "step": 130710 }, { "epoch": 36.76, "learning_rate": 2.9461156405210382e-05, "loss": 0.0627, "step": 130740 }, { "epoch": 36.76, "learning_rate": 2.944241401930466e-05, "loss": 0.0624, "step": 130770 }, { "epoch": 36.77, "learning_rate": 2.942367163339893e-05, "loss": 0.071, "step": 130800 }, { "epoch": 36.78, "learning_rate": 2.9404929247493208e-05, "loss": 0.0633, "step": 130830 }, { "epoch": 36.79, "learning_rate": 2.9386186861587482e-05, "loss": 0.0703, "step": 130860 }, { "epoch": 36.8, "learning_rate": 2.9367444475681753e-05, "loss": 0.0596, "step": 130890 }, { "epoch": 36.81, "learning_rate": 2.934870208977603e-05, "loss": 0.0656, "step": 130920 }, { "epoch": 36.81, "learning_rate": 2.93299597038703e-05, "loss": 0.0622, "step": 130950 }, { "epoch": 36.82, "learning_rate": 2.931121731796458e-05, "loss": 0.0631, "step": 130980 }, { "epoch": 36.83, "learning_rate": 2.929247493205885e-05, "loss": 0.0717, "step": 131010 }, { "epoch": 36.84, "learning_rate": 2.9273732546153127e-05, "loss": 0.0582, "step": 131040 }, { "epoch": 36.85, "learning_rate": 2.92549901602474e-05, "loss": 0.0676, "step": 131070 }, { "epoch": 36.86, "learning_rate": 2.9236247774341676e-05, "loss": 0.0679, "step": 131100 }, { "epoch": 36.87, "learning_rate": 2.921750538843595e-05, "loss": 0.0596, "step": 131130 }, { "epoch": 36.87, "learning_rate": 2.919876300253022e-05, "loss": 0.0693, "step": 131160 }, { "epoch": 36.88, "learning_rate": 2.9180020616624498e-05, "loss": 0.0609, "step": 131190 }, { "epoch": 36.89, "learning_rate": 2.916127823071877e-05, "loss": 0.0664, "step": 131220 }, { "epoch": 36.9, "learning_rate": 2.9142535844813047e-05, "loss": 0.0642, "step": 131250 }, { "epoch": 36.91, "learning_rate": 2.912379345890732e-05, "loss": 0.0648, "step": 131280 }, { "epoch": 36.92, "learning_rate": 2.9105051073001595e-05, "loss": 0.0705, "step": 131310 }, { "epoch": 36.92, "learning_rate": 2.908630868709587e-05, "loss": 0.0584, "step": 131340 }, { "epoch": 36.93, "learning_rate": 2.906756630119014e-05, "loss": 0.0678, "step": 131370 }, { "epoch": 36.94, "learning_rate": 2.9048823915284418e-05, "loss": 0.073, "step": 131400 }, { "epoch": 36.95, "learning_rate": 2.903008152937869e-05, "loss": 0.0688, "step": 131430 }, { "epoch": 36.96, "learning_rate": 2.9011339143472966e-05, "loss": 0.0712, "step": 131460 }, { "epoch": 36.97, "learning_rate": 2.8992596757567244e-05, "loss": 0.0621, "step": 131490 }, { "epoch": 36.97, "learning_rate": 2.8973854371661514e-05, "loss": 0.066, "step": 131520 }, { "epoch": 36.98, "learning_rate": 2.895511198575579e-05, "loss": 0.0684, "step": 131550 }, { "epoch": 36.99, "learning_rate": 2.893636959985006e-05, "loss": 0.0656, "step": 131580 }, { "epoch": 37.0, "eval_loss": 0.16971024870872498, "eval_runtime": 512.0403, "eval_samples_per_second": 31.312, "eval_steps_per_second": 0.98, "eval_wer": 0.1300888458231545, "step": 131609 }, { "epoch": 37.0, "learning_rate": 2.8917627213944337e-05, "loss": 0.0744, "step": 131610 }, { "epoch": 37.01, "learning_rate": 2.8898884828038608e-05, "loss": 0.0581, "step": 131640 }, { "epoch": 37.02, "learning_rate": 2.8880142442132885e-05, "loss": 0.0647, "step": 131670 }, { "epoch": 37.03, "learning_rate": 2.8861400056227163e-05, "loss": 0.0616, "step": 131700 }, { "epoch": 37.03, "learning_rate": 2.8842657670321434e-05, "loss": 0.0666, "step": 131730 }, { "epoch": 37.04, "learning_rate": 2.8823915284415708e-05, "loss": 0.0673, "step": 131760 }, { "epoch": 37.05, "learning_rate": 2.880517289850998e-05, "loss": 0.0608, "step": 131790 }, { "epoch": 37.06, "learning_rate": 2.8786430512604256e-05, "loss": 0.0646, "step": 131820 }, { "epoch": 37.07, "learning_rate": 2.8767688126698527e-05, "loss": 0.0618, "step": 131850 }, { "epoch": 37.08, "learning_rate": 2.8749570486989665e-05, "loss": 0.0658, "step": 131880 }, { "epoch": 37.08, "learning_rate": 2.8730828101083935e-05, "loss": 0.0694, "step": 131910 }, { "epoch": 37.09, "learning_rate": 2.871208571517821e-05, "loss": 0.0546, "step": 131940 }, { "epoch": 37.1, "learning_rate": 2.869334332927248e-05, "loss": 0.069, "step": 131970 }, { "epoch": 37.11, "learning_rate": 2.8675225689563618e-05, "loss": 0.0626, "step": 132000 }, { "epoch": 37.12, "learning_rate": 2.865648330365789e-05, "loss": 0.0661, "step": 132030 }, { "epoch": 37.13, "learning_rate": 2.8637740917752166e-05, "loss": 0.0661, "step": 132060 }, { "epoch": 37.14, "learning_rate": 2.861899853184644e-05, "loss": 0.055, "step": 132090 }, { "epoch": 37.14, "learning_rate": 2.860025614594071e-05, "loss": 0.0661, "step": 132120 }, { "epoch": 37.15, "learning_rate": 2.858151376003499e-05, "loss": 0.0613, "step": 132150 }, { "epoch": 37.16, "learning_rate": 2.856277137412926e-05, "loss": 0.068, "step": 132180 }, { "epoch": 37.17, "learning_rate": 2.8544028988223537e-05, "loss": 0.0707, "step": 132210 }, { "epoch": 37.18, "learning_rate": 2.8525286602317808e-05, "loss": 0.0566, "step": 132240 }, { "epoch": 37.19, "learning_rate": 2.8506544216412086e-05, "loss": 0.0651, "step": 132270 }, { "epoch": 37.19, "learning_rate": 2.8487801830506357e-05, "loss": 0.0643, "step": 132300 }, { "epoch": 37.2, "learning_rate": 2.846905944460063e-05, "loss": 0.0626, "step": 132330 }, { "epoch": 37.21, "learning_rate": 2.845031705869491e-05, "loss": 0.0681, "step": 132360 }, { "epoch": 37.22, "learning_rate": 2.843157467278918e-05, "loss": 0.0581, "step": 132390 }, { "epoch": 37.23, "learning_rate": 2.8412832286883457e-05, "loss": 0.0708, "step": 132420 }, { "epoch": 37.24, "learning_rate": 2.8394089900977728e-05, "loss": 0.0591, "step": 132450 }, { "epoch": 37.24, "learning_rate": 2.8375347515072005e-05, "loss": 0.0672, "step": 132480 }, { "epoch": 37.25, "learning_rate": 2.8356605129166276e-05, "loss": 0.0694, "step": 132510 }, { "epoch": 37.26, "learning_rate": 2.833786274326055e-05, "loss": 0.0558, "step": 132540 }, { "epoch": 37.27, "learning_rate": 2.8319120357354828e-05, "loss": 0.0692, "step": 132570 }, { "epoch": 37.28, "learning_rate": 2.83003779714491e-05, "loss": 0.0627, "step": 132600 }, { "epoch": 37.29, "learning_rate": 2.8281635585543376e-05, "loss": 0.0657, "step": 132630 }, { "epoch": 37.3, "learning_rate": 2.8262893199637647e-05, "loss": 0.0702, "step": 132660 }, { "epoch": 37.3, "learning_rate": 2.8244150813731924e-05, "loss": 0.0574, "step": 132690 }, { "epoch": 37.31, "learning_rate": 2.8225408427826195e-05, "loss": 0.072, "step": 132720 }, { "epoch": 37.32, "learning_rate": 2.820666604192047e-05, "loss": 0.0657, "step": 132750 }, { "epoch": 37.33, "learning_rate": 2.8187923656014747e-05, "loss": 0.066, "step": 132780 }, { "epoch": 37.34, "learning_rate": 2.8169181270109018e-05, "loss": 0.0695, "step": 132810 }, { "epoch": 37.35, "learning_rate": 2.8150438884203295e-05, "loss": 0.0594, "step": 132840 }, { "epoch": 37.35, "learning_rate": 2.8131696498297566e-05, "loss": 0.0709, "step": 132870 }, { "epoch": 37.36, "learning_rate": 2.8112954112391844e-05, "loss": 0.0587, "step": 132900 }, { "epoch": 37.37, "learning_rate": 2.8094211726486115e-05, "loss": 0.0699, "step": 132930 }, { "epoch": 37.38, "learning_rate": 2.807546934058039e-05, "loss": 0.0726, "step": 132960 }, { "epoch": 37.39, "learning_rate": 2.8056726954674666e-05, "loss": 0.0552, "step": 132990 }, { "epoch": 37.4, "learning_rate": 2.8037984568768937e-05, "loss": 0.0686, "step": 133020 }, { "epoch": 37.41, "learning_rate": 2.8019242182863215e-05, "loss": 0.061, "step": 133050 }, { "epoch": 37.41, "learning_rate": 2.8000499796957486e-05, "loss": 0.0668, "step": 133080 }, { "epoch": 37.42, "learning_rate": 2.7981757411051763e-05, "loss": 0.0683, "step": 133110 }, { "epoch": 37.43, "learning_rate": 2.7963015025146034e-05, "loss": 0.0578, "step": 133140 }, { "epoch": 37.44, "learning_rate": 2.7944272639240308e-05, "loss": 0.0715, "step": 133170 }, { "epoch": 37.45, "learning_rate": 2.7925530253334586e-05, "loss": 0.0643, "step": 133200 }, { "epoch": 37.46, "learning_rate": 2.7906787867428857e-05, "loss": 0.0645, "step": 133230 }, { "epoch": 37.46, "learning_rate": 2.7888045481523134e-05, "loss": 0.0698, "step": 133260 }, { "epoch": 37.47, "learning_rate": 2.7869303095617405e-05, "loss": 0.0554, "step": 133290 }, { "epoch": 37.48, "learning_rate": 2.7850560709711682e-05, "loss": 0.0722, "step": 133320 }, { "epoch": 37.49, "learning_rate": 2.7831818323805953e-05, "loss": 0.0607, "step": 133350 }, { "epoch": 37.5, "learning_rate": 2.781307593790023e-05, "loss": 0.0681, "step": 133380 }, { "epoch": 37.51, "learning_rate": 2.7794333551994505e-05, "loss": 0.0677, "step": 133410 }, { "epoch": 37.51, "learning_rate": 2.7775591166088776e-05, "loss": 0.0576, "step": 133440 }, { "epoch": 37.52, "learning_rate": 2.7756848780183053e-05, "loss": 0.0652, "step": 133470 }, { "epoch": 37.53, "learning_rate": 2.7738106394277324e-05, "loss": 0.0607, "step": 133500 }, { "epoch": 37.54, "learning_rate": 2.7719364008371602e-05, "loss": 0.0645, "step": 133530 }, { "epoch": 37.55, "learning_rate": 2.7700621622465873e-05, "loss": 0.0672, "step": 133560 }, { "epoch": 37.56, "learning_rate": 2.768187923656015e-05, "loss": 0.0513, "step": 133590 }, { "epoch": 37.57, "learning_rate": 2.7663136850654424e-05, "loss": 0.0654, "step": 133620 }, { "epoch": 37.57, "learning_rate": 2.7644394464748695e-05, "loss": 0.0584, "step": 133650 }, { "epoch": 37.58, "learning_rate": 2.7625652078842973e-05, "loss": 0.0637, "step": 133680 }, { "epoch": 37.59, "learning_rate": 2.7606909692937244e-05, "loss": 0.071, "step": 133710 }, { "epoch": 37.6, "learning_rate": 2.758816730703152e-05, "loss": 0.0593, "step": 133740 }, { "epoch": 37.61, "learning_rate": 2.7569424921125792e-05, "loss": 0.0717, "step": 133770 }, { "epoch": 37.62, "learning_rate": 2.755068253522007e-05, "loss": 0.0621, "step": 133800 }, { "epoch": 37.62, "learning_rate": 2.7531940149314344e-05, "loss": 0.0652, "step": 133830 }, { "epoch": 37.63, "learning_rate": 2.7513197763408615e-05, "loss": 0.0706, "step": 133860 }, { "epoch": 37.64, "learning_rate": 2.7494455377502892e-05, "loss": 0.0557, "step": 133890 }, { "epoch": 37.65, "learning_rate": 2.7475712991597163e-05, "loss": 0.0712, "step": 133920 }, { "epoch": 37.66, "learning_rate": 2.745697060569144e-05, "loss": 0.0629, "step": 133950 }, { "epoch": 37.67, "learning_rate": 2.743822821978571e-05, "loss": 0.0655, "step": 133980 }, { "epoch": 37.67, "learning_rate": 2.741948583387999e-05, "loss": 0.0706, "step": 134010 }, { "epoch": 37.68, "learning_rate": 2.7400743447974263e-05, "loss": 0.06, "step": 134040 }, { "epoch": 37.69, "learning_rate": 2.7382001062068534e-05, "loss": 0.07, "step": 134070 }, { "epoch": 37.7, "learning_rate": 2.736325867616281e-05, "loss": 0.0618, "step": 134100 }, { "epoch": 37.71, "learning_rate": 2.7344516290257082e-05, "loss": 0.0618, "step": 134130 }, { "epoch": 37.72, "learning_rate": 2.732577390435136e-05, "loss": 0.0699, "step": 134160 }, { "epoch": 37.73, "learning_rate": 2.730703151844563e-05, "loss": 0.0592, "step": 134190 }, { "epoch": 37.73, "learning_rate": 2.7288289132539908e-05, "loss": 0.0712, "step": 134220 }, { "epoch": 37.74, "learning_rate": 2.7269546746634182e-05, "loss": 0.0622, "step": 134250 }, { "epoch": 37.75, "learning_rate": 2.7250804360728453e-05, "loss": 0.0662, "step": 134280 }, { "epoch": 37.76, "learning_rate": 2.723206197482273e-05, "loss": 0.0715, "step": 134310 }, { "epoch": 37.77, "learning_rate": 2.7213319588917e-05, "loss": 0.0597, "step": 134340 }, { "epoch": 37.78, "learning_rate": 2.719457720301128e-05, "loss": 0.0687, "step": 134370 }, { "epoch": 37.78, "learning_rate": 2.717583481710555e-05, "loss": 0.063, "step": 134400 }, { "epoch": 37.79, "learning_rate": 2.7157092431199828e-05, "loss": 0.0663, "step": 134430 }, { "epoch": 37.8, "learning_rate": 2.7138350045294102e-05, "loss": 0.0702, "step": 134460 }, { "epoch": 37.81, "learning_rate": 2.7119607659388373e-05, "loss": 0.0579, "step": 134490 }, { "epoch": 37.82, "learning_rate": 2.710086527348265e-05, "loss": 0.0695, "step": 134520 }, { "epoch": 37.83, "learning_rate": 2.708212288757692e-05, "loss": 0.0628, "step": 134550 }, { "epoch": 37.84, "learning_rate": 2.70633805016712e-05, "loss": 0.0642, "step": 134580 }, { "epoch": 37.84, "learning_rate": 2.704463811576547e-05, "loss": 0.0705, "step": 134610 }, { "epoch": 37.85, "learning_rate": 2.7025895729859747e-05, "loss": 0.0566, "step": 134640 }, { "epoch": 37.86, "learning_rate": 2.700715334395402e-05, "loss": 0.0691, "step": 134670 }, { "epoch": 37.87, "learning_rate": 2.6988410958048295e-05, "loss": 0.061, "step": 134700 }, { "epoch": 37.88, "learning_rate": 2.696966857214257e-05, "loss": 0.0641, "step": 134730 }, { "epoch": 37.89, "learning_rate": 2.695092618623684e-05, "loss": 0.0707, "step": 134760 }, { "epoch": 37.89, "learning_rate": 2.6932183800331118e-05, "loss": 0.0619, "step": 134790 }, { "epoch": 37.9, "learning_rate": 2.691344141442539e-05, "loss": 0.0681, "step": 134820 }, { "epoch": 37.91, "learning_rate": 2.6894699028519666e-05, "loss": 0.0629, "step": 134850 }, { "epoch": 37.92, "learning_rate": 2.687595664261394e-05, "loss": 0.0627, "step": 134880 }, { "epoch": 37.93, "learning_rate": 2.6857214256708215e-05, "loss": 0.0701, "step": 134910 }, { "epoch": 37.94, "learning_rate": 2.683847187080249e-05, "loss": 0.0587, "step": 134940 }, { "epoch": 37.94, "learning_rate": 2.681972948489676e-05, "loss": 0.0652, "step": 134970 }, { "epoch": 37.95, "learning_rate": 2.6800987098991037e-05, "loss": 0.0597, "step": 135000 }, { "epoch": 37.96, "learning_rate": 2.6782244713085308e-05, "loss": 0.0651, "step": 135030 }, { "epoch": 37.97, "learning_rate": 2.6763502327179586e-05, "loss": 0.0755, "step": 135060 }, { "epoch": 37.98, "learning_rate": 2.6744759941273863e-05, "loss": 0.0553, "step": 135090 }, { "epoch": 37.99, "learning_rate": 2.6726017555368134e-05, "loss": 0.0671, "step": 135120 }, { "epoch": 38.0, "learning_rate": 2.6707275169462408e-05, "loss": 0.0643, "step": 135150 }, { "epoch": 38.0, "eval_loss": 0.17159442603588104, "eval_runtime": 506.1667, "eval_samples_per_second": 31.675, "eval_steps_per_second": 0.992, "eval_wer": 0.1278642883463213, "step": 135166 }, { "epoch": 38.0, "learning_rate": 2.668853278355668e-05, "loss": 0.0666, "step": 135180 }, { "epoch": 38.01, "learning_rate": 2.6669790397650956e-05, "loss": 0.0625, "step": 135210 }, { "epoch": 38.02, "learning_rate": 2.6651048011745227e-05, "loss": 0.0608, "step": 135240 }, { "epoch": 38.03, "learning_rate": 2.6632305625839505e-05, "loss": 0.0697, "step": 135270 }, { "epoch": 38.04, "learning_rate": 2.6613563239933782e-05, "loss": 0.057, "step": 135300 }, { "epoch": 38.05, "learning_rate": 2.6594820854028053e-05, "loss": 0.066, "step": 135330 }, { "epoch": 38.05, "learning_rate": 2.6576078468122327e-05, "loss": 0.0618, "step": 135360 }, { "epoch": 38.06, "learning_rate": 2.6557336082216598e-05, "loss": 0.0627, "step": 135390 }, { "epoch": 38.07, "learning_rate": 2.6538593696310876e-05, "loss": 0.0692, "step": 135420 }, { "epoch": 38.08, "learning_rate": 2.6519851310405147e-05, "loss": 0.0555, "step": 135450 }, { "epoch": 38.09, "learning_rate": 2.6501108924499424e-05, "loss": 0.0611, "step": 135480 }, { "epoch": 38.1, "learning_rate": 2.6482366538593702e-05, "loss": 0.0603, "step": 135510 }, { "epoch": 38.11, "learning_rate": 2.6463624152687973e-05, "loss": 0.0618, "step": 135540 }, { "epoch": 38.11, "learning_rate": 2.6444881766782247e-05, "loss": 0.0688, "step": 135570 }, { "epoch": 38.12, "learning_rate": 2.6426139380876518e-05, "loss": 0.0591, "step": 135600 }, { "epoch": 38.13, "learning_rate": 2.6407396994970795e-05, "loss": 0.0661, "step": 135630 }, { "epoch": 38.14, "learning_rate": 2.6388654609065066e-05, "loss": 0.0619, "step": 135660 }, { "epoch": 38.15, "learning_rate": 2.6369912223159344e-05, "loss": 0.0609, "step": 135690 }, { "epoch": 38.16, "learning_rate": 2.6351169837253614e-05, "loss": 0.0686, "step": 135720 }, { "epoch": 38.16, "learning_rate": 2.6332427451347892e-05, "loss": 0.0557, "step": 135750 }, { "epoch": 38.17, "learning_rate": 2.6313685065442166e-05, "loss": 0.0644, "step": 135780 }, { "epoch": 38.18, "learning_rate": 2.6294942679536437e-05, "loss": 0.0611, "step": 135810 }, { "epoch": 38.19, "learning_rate": 2.6276200293630714e-05, "loss": 0.0602, "step": 135840 }, { "epoch": 38.2, "learning_rate": 2.6257457907724985e-05, "loss": 0.0695, "step": 135870 }, { "epoch": 38.21, "learning_rate": 2.6238715521819263e-05, "loss": 0.0559, "step": 135900 }, { "epoch": 38.21, "learning_rate": 2.6219973135913534e-05, "loss": 0.0652, "step": 135930 }, { "epoch": 38.22, "learning_rate": 2.620123075000781e-05, "loss": 0.0596, "step": 135960 }, { "epoch": 38.23, "learning_rate": 2.6182488364102085e-05, "loss": 0.0575, "step": 135990 }, { "epoch": 38.24, "learning_rate": 2.6163745978196356e-05, "loss": 0.07, "step": 136020 }, { "epoch": 38.25, "learning_rate": 2.6145003592290634e-05, "loss": 0.0574, "step": 136050 }, { "epoch": 38.26, "learning_rate": 2.6126261206384905e-05, "loss": 0.0678, "step": 136080 }, { "epoch": 38.27, "learning_rate": 2.6107518820479182e-05, "loss": 0.0615, "step": 136110 }, { "epoch": 38.27, "learning_rate": 2.6088776434573453e-05, "loss": 0.0627, "step": 136140 }, { "epoch": 38.28, "learning_rate": 2.607003404866773e-05, "loss": 0.068, "step": 136170 }, { "epoch": 38.29, "learning_rate": 2.6051291662762005e-05, "loss": 0.0536, "step": 136200 }, { "epoch": 38.3, "learning_rate": 2.603254927685628e-05, "loss": 0.0641, "step": 136230 }, { "epoch": 38.31, "learning_rate": 2.6013806890950553e-05, "loss": 0.0609, "step": 136260 }, { "epoch": 38.32, "learning_rate": 2.5995064505044824e-05, "loss": 0.0607, "step": 136290 }, { "epoch": 38.32, "learning_rate": 2.59763221191391e-05, "loss": 0.0664, "step": 136320 }, { "epoch": 38.33, "learning_rate": 2.5957579733233372e-05, "loss": 0.0577, "step": 136350 }, { "epoch": 38.34, "learning_rate": 2.593883734732765e-05, "loss": 0.0637, "step": 136380 }, { "epoch": 38.35, "learning_rate": 2.5920094961421924e-05, "loss": 0.0601, "step": 136410 }, { "epoch": 38.36, "learning_rate": 2.5901352575516198e-05, "loss": 0.0567, "step": 136440 }, { "epoch": 38.37, "learning_rate": 2.5882610189610472e-05, "loss": 0.0659, "step": 136470 }, { "epoch": 38.37, "learning_rate": 2.5863867803704743e-05, "loss": 0.0586, "step": 136500 }, { "epoch": 38.38, "learning_rate": 2.584512541779902e-05, "loss": 0.07, "step": 136530 }, { "epoch": 38.39, "learning_rate": 2.582638303189329e-05, "loss": 0.062, "step": 136560 }, { "epoch": 38.4, "learning_rate": 2.580764064598757e-05, "loss": 0.0627, "step": 136590 }, { "epoch": 38.41, "learning_rate": 2.5788898260081847e-05, "loss": 0.0653, "step": 136620 }, { "epoch": 38.42, "learning_rate": 2.5770155874176118e-05, "loss": 0.0578, "step": 136650 }, { "epoch": 38.43, "learning_rate": 2.5751413488270392e-05, "loss": 0.0665, "step": 136680 }, { "epoch": 38.43, "learning_rate": 2.5732671102364663e-05, "loss": 0.0635, "step": 136710 }, { "epoch": 38.44, "learning_rate": 2.571392871645894e-05, "loss": 0.0629, "step": 136740 }, { "epoch": 38.45, "learning_rate": 2.569518633055321e-05, "loss": 0.0676, "step": 136770 }, { "epoch": 38.46, "learning_rate": 2.567644394464749e-05, "loss": 0.0621, "step": 136800 }, { "epoch": 38.47, "learning_rate": 2.5657701558741766e-05, "loss": 0.0614, "step": 136830 }, { "epoch": 38.48, "learning_rate": 2.5638959172836037e-05, "loss": 0.0633, "step": 136860 }, { "epoch": 38.48, "learning_rate": 2.562021678693031e-05, "loss": 0.0576, "step": 136890 }, { "epoch": 38.49, "learning_rate": 2.5601474401024582e-05, "loss": 0.0681, "step": 136920 }, { "epoch": 38.5, "learning_rate": 2.558273201511886e-05, "loss": 0.0561, "step": 136950 }, { "epoch": 38.51, "learning_rate": 2.556398962921313e-05, "loss": 0.0658, "step": 136980 }, { "epoch": 38.52, "learning_rate": 2.5545247243307408e-05, "loss": 0.061, "step": 137010 }, { "epoch": 38.53, "learning_rate": 2.5526504857401686e-05, "loss": 0.0622, "step": 137040 }, { "epoch": 38.54, "learning_rate": 2.5507762471495956e-05, "loss": 0.0692, "step": 137070 }, { "epoch": 38.54, "learning_rate": 2.548902008559023e-05, "loss": 0.0578, "step": 137100 }, { "epoch": 38.55, "learning_rate": 2.54702776996845e-05, "loss": 0.0665, "step": 137130 }, { "epoch": 38.56, "learning_rate": 2.545153531377878e-05, "loss": 0.0652, "step": 137160 }, { "epoch": 38.57, "learning_rate": 2.543279292787305e-05, "loss": 0.0628, "step": 137190 }, { "epoch": 38.58, "learning_rate": 2.5414050541967327e-05, "loss": 0.0734, "step": 137220 }, { "epoch": 38.59, "learning_rate": 2.5395308156061605e-05, "loss": 0.0568, "step": 137250 }, { "epoch": 38.59, "learning_rate": 2.5376565770155876e-05, "loss": 0.0678, "step": 137280 }, { "epoch": 38.6, "learning_rate": 2.535782338425015e-05, "loss": 0.0592, "step": 137310 }, { "epoch": 38.61, "learning_rate": 2.533908099834442e-05, "loss": 0.0614, "step": 137340 }, { "epoch": 38.62, "learning_rate": 2.5320338612438698e-05, "loss": 0.0709, "step": 137370 }, { "epoch": 38.63, "learning_rate": 2.530159622653297e-05, "loss": 0.0609, "step": 137400 }, { "epoch": 38.64, "learning_rate": 2.5282853840627247e-05, "loss": 0.0657, "step": 137430 }, { "epoch": 38.64, "learning_rate": 2.5264111454721524e-05, "loss": 0.0652, "step": 137460 }, { "epoch": 38.65, "learning_rate": 2.5245369068815795e-05, "loss": 0.0643, "step": 137490 }, { "epoch": 38.66, "learning_rate": 2.522662668291007e-05, "loss": 0.0734, "step": 137520 }, { "epoch": 38.67, "learning_rate": 2.520788429700434e-05, "loss": 0.0602, "step": 137550 }, { "epoch": 38.68, "learning_rate": 2.5189141911098618e-05, "loss": 0.0645, "step": 137580 }, { "epoch": 38.69, "learning_rate": 2.517039952519289e-05, "loss": 0.0608, "step": 137610 }, { "epoch": 38.7, "learning_rate": 2.5151657139287166e-05, "loss": 0.0623, "step": 137640 }, { "epoch": 38.7, "learning_rate": 2.5132914753381444e-05, "loss": 0.0656, "step": 137670 }, { "epoch": 38.71, "learning_rate": 2.5114172367475714e-05, "loss": 0.0556, "step": 137700 }, { "epoch": 38.72, "learning_rate": 2.509542998156999e-05, "loss": 0.0627, "step": 137730 }, { "epoch": 38.73, "learning_rate": 2.5076687595664263e-05, "loss": 0.0622, "step": 137760 }, { "epoch": 38.74, "learning_rate": 2.5057945209758537e-05, "loss": 0.0634, "step": 137790 }, { "epoch": 38.75, "learning_rate": 2.5039202823852808e-05, "loss": 0.0677, "step": 137820 }, { "epoch": 38.75, "learning_rate": 2.5020460437947085e-05, "loss": 0.0546, "step": 137850 }, { "epoch": 38.76, "learning_rate": 2.5001718052041363e-05, "loss": 0.0666, "step": 137880 }, { "epoch": 38.77, "learning_rate": 2.4982975666135634e-05, "loss": 0.061, "step": 137910 }, { "epoch": 38.78, "learning_rate": 2.4964233280229908e-05, "loss": 0.0638, "step": 137940 }, { "epoch": 38.79, "learning_rate": 2.4945490894324182e-05, "loss": 0.0704, "step": 137970 }, { "epoch": 38.8, "learning_rate": 2.4926748508418456e-05, "loss": 0.0535, "step": 138000 }, { "epoch": 38.81, "learning_rate": 2.4908630868709587e-05, "loss": 0.0662, "step": 138030 }, { "epoch": 38.81, "learning_rate": 2.488988848280386e-05, "loss": 0.0658, "step": 138060 }, { "epoch": 38.82, "learning_rate": 2.487114609689814e-05, "loss": 0.0631, "step": 138090 }, { "epoch": 38.83, "learning_rate": 2.485240371099241e-05, "loss": 0.0691, "step": 138120 }, { "epoch": 38.84, "learning_rate": 2.4833661325086684e-05, "loss": 0.058, "step": 138150 }, { "epoch": 38.85, "learning_rate": 2.4814918939180958e-05, "loss": 0.07, "step": 138180 }, { "epoch": 38.86, "learning_rate": 2.4796176553275232e-05, "loss": 0.0663, "step": 138210 }, { "epoch": 38.86, "learning_rate": 2.4777434167369506e-05, "loss": 0.0623, "step": 138240 }, { "epoch": 38.87, "learning_rate": 2.475869178146378e-05, "loss": 0.0784, "step": 138270 }, { "epoch": 38.88, "learning_rate": 2.4739949395558058e-05, "loss": 0.0632, "step": 138300 }, { "epoch": 38.89, "learning_rate": 2.4721207009652332e-05, "loss": 0.0666, "step": 138330 }, { "epoch": 38.9, "learning_rate": 2.4702464623746603e-05, "loss": 0.0645, "step": 138360 }, { "epoch": 38.91, "learning_rate": 2.4683722237840877e-05, "loss": 0.0616, "step": 138390 }, { "epoch": 38.91, "learning_rate": 2.466497985193515e-05, "loss": 0.07, "step": 138420 }, { "epoch": 38.92, "learning_rate": 2.4646237466029426e-05, "loss": 0.0581, "step": 138450 }, { "epoch": 38.93, "learning_rate": 2.46274950801237e-05, "loss": 0.0619, "step": 138480 }, { "epoch": 38.94, "learning_rate": 2.4608752694217977e-05, "loss": 0.0605, "step": 138510 }, { "epoch": 38.95, "learning_rate": 2.459001030831225e-05, "loss": 0.0621, "step": 138540 }, { "epoch": 38.96, "learning_rate": 2.4571267922406522e-05, "loss": 0.068, "step": 138570 }, { "epoch": 38.97, "learning_rate": 2.4552525536500797e-05, "loss": 0.054, "step": 138600 }, { "epoch": 38.97, "learning_rate": 2.453378315059507e-05, "loss": 0.0649, "step": 138630 }, { "epoch": 38.98, "learning_rate": 2.4515040764689345e-05, "loss": 0.0632, "step": 138660 }, { "epoch": 38.99, "learning_rate": 2.449629837878362e-05, "loss": 0.0639, "step": 138690 }, { "epoch": 39.0, "learning_rate": 2.4477555992877897e-05, "loss": 0.0683, "step": 138720 }, { "epoch": 39.0, "eval_loss": 0.17769518494606018, "eval_runtime": 505.9269, "eval_samples_per_second": 31.69, "eval_steps_per_second": 0.992, "eval_wer": 0.12791205491790975, "step": 138723 }, { "epoch": 39.01, "learning_rate": 2.445881360697217e-05, "loss": 0.056, "step": 138750 }, { "epoch": 39.02, "learning_rate": 2.4440071221066442e-05, "loss": 0.0672, "step": 138780 }, { "epoch": 39.02, "learning_rate": 2.4421328835160716e-05, "loss": 0.0538, "step": 138810 }, { "epoch": 39.03, "learning_rate": 2.440258644925499e-05, "loss": 0.0613, "step": 138840 }, { "epoch": 39.04, "learning_rate": 2.4383844063349264e-05, "loss": 0.0664, "step": 138870 }, { "epoch": 39.05, "learning_rate": 2.436510167744354e-05, "loss": 0.0597, "step": 138900 }, { "epoch": 39.06, "learning_rate": 2.4346984037734673e-05, "loss": 0.0637, "step": 138930 }, { "epoch": 39.07, "learning_rate": 2.4328241651828944e-05, "loss": 0.0584, "step": 138960 }, { "epoch": 39.08, "learning_rate": 2.4309499265923218e-05, "loss": 0.0651, "step": 138990 }, { "epoch": 39.08, "learning_rate": 2.4290756880017492e-05, "loss": 0.0643, "step": 139020 }, { "epoch": 39.09, "learning_rate": 2.427201449411177e-05, "loss": 0.06, "step": 139050 }, { "epoch": 39.1, "learning_rate": 2.4253272108206044e-05, "loss": 0.0657, "step": 139080 }, { "epoch": 39.11, "learning_rate": 2.4234529722300318e-05, "loss": 0.0607, "step": 139110 }, { "epoch": 39.12, "learning_rate": 2.4215787336394592e-05, "loss": 0.0648, "step": 139140 }, { "epoch": 39.13, "learning_rate": 2.4197044950488866e-05, "loss": 0.0618, "step": 139170 }, { "epoch": 39.13, "learning_rate": 2.4178302564583137e-05, "loss": 0.0586, "step": 139200 }, { "epoch": 39.14, "learning_rate": 2.415956017867741e-05, "loss": 0.0662, "step": 139230 }, { "epoch": 39.15, "learning_rate": 2.414081779277169e-05, "loss": 0.0581, "step": 139260 }, { "epoch": 39.16, "learning_rate": 2.4122075406865963e-05, "loss": 0.0647, "step": 139290 }, { "epoch": 39.17, "learning_rate": 2.4103333020960237e-05, "loss": 0.0656, "step": 139320 }, { "epoch": 39.18, "learning_rate": 2.408459063505451e-05, "loss": 0.0591, "step": 139350 }, { "epoch": 39.18, "learning_rate": 2.4065848249148786e-05, "loss": 0.069, "step": 139380 }, { "epoch": 39.19, "learning_rate": 2.4047105863243056e-05, "loss": 0.0589, "step": 139410 }, { "epoch": 39.2, "learning_rate": 2.402836347733733e-05, "loss": 0.0607, "step": 139440 }, { "epoch": 39.21, "learning_rate": 2.4009621091431608e-05, "loss": 0.062, "step": 139470 }, { "epoch": 39.22, "learning_rate": 2.3990878705525882e-05, "loss": 0.0585, "step": 139500 }, { "epoch": 39.23, "learning_rate": 2.3972136319620157e-05, "loss": 0.0688, "step": 139530 }, { "epoch": 39.24, "learning_rate": 2.395339393371443e-05, "loss": 0.0581, "step": 139560 }, { "epoch": 39.24, "learning_rate": 2.3934651547808705e-05, "loss": 0.0714, "step": 139590 }, { "epoch": 39.25, "learning_rate": 2.3915909161902976e-05, "loss": 0.062, "step": 139620 }, { "epoch": 39.26, "learning_rate": 2.389716677599725e-05, "loss": 0.0565, "step": 139650 }, { "epoch": 39.27, "learning_rate": 2.3878424390091528e-05, "loss": 0.0726, "step": 139680 }, { "epoch": 39.28, "learning_rate": 2.3859682004185802e-05, "loss": 0.056, "step": 139710 }, { "epoch": 39.29, "learning_rate": 2.3840939618280076e-05, "loss": 0.0601, "step": 139740 }, { "epoch": 39.29, "learning_rate": 2.382219723237435e-05, "loss": 0.0627, "step": 139770 }, { "epoch": 39.3, "learning_rate": 2.3803454846468624e-05, "loss": 0.0603, "step": 139800 }, { "epoch": 39.31, "learning_rate": 2.37847124605629e-05, "loss": 0.0623, "step": 139830 }, { "epoch": 39.32, "learning_rate": 2.376597007465717e-05, "loss": 0.0577, "step": 139860 }, { "epoch": 39.33, "learning_rate": 2.3747227688751447e-05, "loss": 0.0633, "step": 139890 }, { "epoch": 39.34, "learning_rate": 2.372848530284572e-05, "loss": 0.0645, "step": 139920 }, { "epoch": 39.34, "learning_rate": 2.3709742916939995e-05, "loss": 0.0568, "step": 139950 }, { "epoch": 39.35, "learning_rate": 2.369100053103427e-05, "loss": 0.0637, "step": 139980 }, { "epoch": 39.36, "learning_rate": 2.3672258145128544e-05, "loss": 0.0589, "step": 140010 }, { "epoch": 39.37, "learning_rate": 2.3653515759222818e-05, "loss": 0.0617, "step": 140040 }, { "epoch": 39.38, "learning_rate": 2.363477337331709e-05, "loss": 0.0622, "step": 140070 }, { "epoch": 39.39, "learning_rate": 2.3616030987411363e-05, "loss": 0.0591, "step": 140100 }, { "epoch": 39.4, "learning_rate": 2.359728860150564e-05, "loss": 0.0652, "step": 140130 }, { "epoch": 39.4, "learning_rate": 2.3578546215599915e-05, "loss": 0.059, "step": 140160 }, { "epoch": 39.41, "learning_rate": 2.355980382969419e-05, "loss": 0.0647, "step": 140190 }, { "epoch": 39.42, "learning_rate": 2.3541061443788463e-05, "loss": 0.0638, "step": 140220 }, { "epoch": 39.43, "learning_rate": 2.3522319057882737e-05, "loss": 0.0575, "step": 140250 }, { "epoch": 39.44, "learning_rate": 2.3503576671977008e-05, "loss": 0.0632, "step": 140280 }, { "epoch": 39.45, "learning_rate": 2.3484834286071282e-05, "loss": 0.0602, "step": 140310 }, { "epoch": 39.45, "learning_rate": 2.346609190016556e-05, "loss": 0.0621, "step": 140340 }, { "epoch": 39.46, "learning_rate": 2.3447349514259834e-05, "loss": 0.0629, "step": 140370 }, { "epoch": 39.47, "learning_rate": 2.3428607128354108e-05, "loss": 0.0601, "step": 140400 }, { "epoch": 39.48, "learning_rate": 2.3409864742448382e-05, "loss": 0.0647, "step": 140430 }, { "epoch": 39.49, "learning_rate": 2.3391122356542656e-05, "loss": 0.058, "step": 140460 }, { "epoch": 39.5, "learning_rate": 2.3372379970636927e-05, "loss": 0.0641, "step": 140490 }, { "epoch": 39.51, "learning_rate": 2.33536375847312e-05, "loss": 0.0642, "step": 140520 }, { "epoch": 39.51, "learning_rate": 2.333489519882548e-05, "loss": 0.0573, "step": 140550 }, { "epoch": 39.52, "learning_rate": 2.3316152812919753e-05, "loss": 0.0669, "step": 140580 }, { "epoch": 39.53, "learning_rate": 2.3297410427014027e-05, "loss": 0.0584, "step": 140610 }, { "epoch": 39.54, "learning_rate": 2.32786680411083e-05, "loss": 0.0648, "step": 140640 }, { "epoch": 39.55, "learning_rate": 2.3259925655202576e-05, "loss": 0.0634, "step": 140670 }, { "epoch": 39.56, "learning_rate": 2.324118326929685e-05, "loss": 0.0604, "step": 140700 }, { "epoch": 39.56, "learning_rate": 2.322244088339112e-05, "loss": 0.07, "step": 140730 }, { "epoch": 39.57, "learning_rate": 2.32036984974854e-05, "loss": 0.0565, "step": 140760 }, { "epoch": 39.58, "learning_rate": 2.3184956111579673e-05, "loss": 0.0623, "step": 140790 }, { "epoch": 39.59, "learning_rate": 2.3166213725673947e-05, "loss": 0.0636, "step": 140820 }, { "epoch": 39.6, "learning_rate": 2.314747133976822e-05, "loss": 0.0595, "step": 140850 }, { "epoch": 39.61, "learning_rate": 2.3128728953862495e-05, "loss": 0.0674, "step": 140880 }, { "epoch": 39.61, "learning_rate": 2.310998656795677e-05, "loss": 0.0563, "step": 140910 }, { "epoch": 39.62, "learning_rate": 2.309124418205104e-05, "loss": 0.0668, "step": 140940 }, { "epoch": 39.63, "learning_rate": 2.3072501796145318e-05, "loss": 0.0648, "step": 140970 }, { "epoch": 39.64, "learning_rate": 2.3053759410239592e-05, "loss": 0.0583, "step": 141000 }, { "epoch": 39.65, "learning_rate": 2.3035017024333866e-05, "loss": 0.0655, "step": 141030 }, { "epoch": 39.66, "learning_rate": 2.301627463842814e-05, "loss": 0.0621, "step": 141060 }, { "epoch": 39.67, "learning_rate": 2.2997532252522414e-05, "loss": 0.0595, "step": 141090 }, { "epoch": 39.67, "learning_rate": 2.297878986661669e-05, "loss": 0.0634, "step": 141120 }, { "epoch": 39.68, "learning_rate": 2.296004748071096e-05, "loss": 0.0637, "step": 141150 }, { "epoch": 39.69, "learning_rate": 2.2941305094805237e-05, "loss": 0.0682, "step": 141180 }, { "epoch": 39.7, "learning_rate": 2.292256270889951e-05, "loss": 0.0651, "step": 141210 }, { "epoch": 39.71, "learning_rate": 2.2903820322993785e-05, "loss": 0.0655, "step": 141240 }, { "epoch": 39.72, "learning_rate": 2.288507793708806e-05, "loss": 0.064, "step": 141270 }, { "epoch": 39.72, "learning_rate": 2.2866335551182334e-05, "loss": 0.0611, "step": 141300 }, { "epoch": 39.73, "learning_rate": 2.2847593165276608e-05, "loss": 0.0695, "step": 141330 }, { "epoch": 39.74, "learning_rate": 2.2828850779370882e-05, "loss": 0.0575, "step": 141360 }, { "epoch": 39.75, "learning_rate": 2.2810108393465156e-05, "loss": 0.0654, "step": 141390 }, { "epoch": 39.76, "learning_rate": 2.279136600755943e-05, "loss": 0.0618, "step": 141420 }, { "epoch": 39.77, "learning_rate": 2.2772623621653705e-05, "loss": 0.0602, "step": 141450 }, { "epoch": 39.77, "learning_rate": 2.275388123574798e-05, "loss": 0.0654, "step": 141480 }, { "epoch": 39.78, "learning_rate": 2.2735138849842253e-05, "loss": 0.0563, "step": 141510 }, { "epoch": 39.79, "learning_rate": 2.2716396463936527e-05, "loss": 0.0671, "step": 141540 }, { "epoch": 39.8, "learning_rate": 2.26976540780308e-05, "loss": 0.0623, "step": 141570 }, { "epoch": 39.81, "learning_rate": 2.2678911692125076e-05, "loss": 0.0625, "step": 141600 }, { "epoch": 39.82, "learning_rate": 2.266016930621935e-05, "loss": 0.0687, "step": 141630 }, { "epoch": 39.83, "learning_rate": 2.2641426920313624e-05, "loss": 0.0564, "step": 141660 }, { "epoch": 39.83, "learning_rate": 2.2622684534407898e-05, "loss": 0.0636, "step": 141690 }, { "epoch": 39.84, "learning_rate": 2.2603942148502172e-05, "loss": 0.062, "step": 141720 }, { "epoch": 39.85, "learning_rate": 2.2585199762596447e-05, "loss": 0.0589, "step": 141750 }, { "epoch": 39.86, "learning_rate": 2.256645737669072e-05, "loss": 0.0629, "step": 141780 }, { "epoch": 39.87, "learning_rate": 2.2547714990784995e-05, "loss": 0.0558, "step": 141810 }, { "epoch": 39.88, "learning_rate": 2.252897260487927e-05, "loss": 0.0612, "step": 141840 }, { "epoch": 39.88, "learning_rate": 2.2510230218973543e-05, "loss": 0.0627, "step": 141870 }, { "epoch": 39.89, "learning_rate": 2.2491487833067818e-05, "loss": 0.0566, "step": 141900 }, { "epoch": 39.9, "learning_rate": 2.2472745447162092e-05, "loss": 0.0665, "step": 141930 }, { "epoch": 39.91, "learning_rate": 2.2454003061256366e-05, "loss": 0.0547, "step": 141960 }, { "epoch": 39.92, "learning_rate": 2.2435885421547497e-05, "loss": 0.0638, "step": 141990 }, { "epoch": 39.93, "learning_rate": 2.241714303564177e-05, "loss": 0.0575, "step": 142020 }, { "epoch": 39.94, "learning_rate": 2.2398400649736045e-05, "loss": 0.0584, "step": 142050 }, { "epoch": 39.94, "learning_rate": 2.237965826383032e-05, "loss": 0.0676, "step": 142080 }, { "epoch": 39.95, "learning_rate": 2.2360915877924594e-05, "loss": 0.0615, "step": 142110 }, { "epoch": 39.96, "learning_rate": 2.234217349201887e-05, "loss": 0.0631, "step": 142140 }, { "epoch": 39.97, "learning_rate": 2.2323431106113142e-05, "loss": 0.0652, "step": 142170 }, { "epoch": 39.98, "learning_rate": 2.2304688720207416e-05, "loss": 0.0623, "step": 142200 }, { "epoch": 39.99, "learning_rate": 2.228594633430169e-05, "loss": 0.0696, "step": 142230 }, { "epoch": 39.99, "learning_rate": 2.2267203948395965e-05, "loss": 0.0587, "step": 142260 }, { "epoch": 40.0, "eval_loss": 0.17351745069026947, "eval_runtime": 506.6702, "eval_samples_per_second": 31.644, "eval_steps_per_second": 0.991, "eval_wer": 0.1271068469968474, "step": 142280 }, { "epoch": 40.0, "learning_rate": 2.224846156249024e-05, "loss": 0.0646, "step": 142290 }, { "epoch": 40.01, "learning_rate": 2.2229719176584513e-05, "loss": 0.057, "step": 142320 }, { "epoch": 40.02, "learning_rate": 2.221097679067879e-05, "loss": 0.0635, "step": 142350 }, { "epoch": 40.03, "learning_rate": 2.219223440477306e-05, "loss": 0.0667, "step": 142380 }, { "epoch": 40.04, "learning_rate": 2.2173492018867336e-05, "loss": 0.0561, "step": 142410 }, { "epoch": 40.04, "learning_rate": 2.215474963296161e-05, "loss": 0.0643, "step": 142440 }, { "epoch": 40.05, "learning_rate": 2.2136007247055884e-05, "loss": 0.0562, "step": 142470 }, { "epoch": 40.06, "learning_rate": 2.2117264861150158e-05, "loss": 0.062, "step": 142500 }, { "epoch": 40.07, "learning_rate": 2.2098522475244432e-05, "loss": 0.0686, "step": 142530 }, { "epoch": 40.08, "learning_rate": 2.207978008933871e-05, "loss": 0.0547, "step": 142560 }, { "epoch": 40.09, "learning_rate": 2.2061037703432984e-05, "loss": 0.06, "step": 142590 }, { "epoch": 40.1, "learning_rate": 2.2042295317527255e-05, "loss": 0.0572, "step": 142620 }, { "epoch": 40.1, "learning_rate": 2.202355293162153e-05, "loss": 0.0626, "step": 142650 }, { "epoch": 40.11, "learning_rate": 2.2004810545715803e-05, "loss": 0.0668, "step": 142680 }, { "epoch": 40.12, "learning_rate": 2.1986068159810077e-05, "loss": 0.0525, "step": 142710 }, { "epoch": 40.13, "learning_rate": 2.196732577390435e-05, "loss": 0.0625, "step": 142740 }, { "epoch": 40.14, "learning_rate": 2.1948583387998626e-05, "loss": 0.0567, "step": 142770 }, { "epoch": 40.15, "learning_rate": 2.1929841002092903e-05, "loss": 0.0651, "step": 142800 }, { "epoch": 40.15, "learning_rate": 2.1911098616187174e-05, "loss": 0.0704, "step": 142830 }, { "epoch": 40.16, "learning_rate": 2.189235623028145e-05, "loss": 0.0512, "step": 142860 }, { "epoch": 40.17, "learning_rate": 2.1873613844375723e-05, "loss": 0.0663, "step": 142890 }, { "epoch": 40.18, "learning_rate": 2.1854871458469997e-05, "loss": 0.0588, "step": 142920 }, { "epoch": 40.19, "learning_rate": 2.183612907256427e-05, "loss": 0.0641, "step": 142950 }, { "epoch": 40.2, "learning_rate": 2.1817386686658545e-05, "loss": 0.0659, "step": 142980 }, { "epoch": 40.21, "learning_rate": 2.1798644300752823e-05, "loss": 0.0563, "step": 143010 }, { "epoch": 40.21, "learning_rate": 2.1779901914847094e-05, "loss": 0.0662, "step": 143040 }, { "epoch": 40.22, "learning_rate": 2.1761159528941368e-05, "loss": 0.0565, "step": 143070 }, { "epoch": 40.23, "learning_rate": 2.1742417143035642e-05, "loss": 0.0601, "step": 143100 }, { "epoch": 40.24, "learning_rate": 2.1723674757129916e-05, "loss": 0.0693, "step": 143130 }, { "epoch": 40.25, "learning_rate": 2.170493237122419e-05, "loss": 0.056, "step": 143160 }, { "epoch": 40.26, "learning_rate": 2.1686189985318464e-05, "loss": 0.0677, "step": 143190 }, { "epoch": 40.26, "learning_rate": 2.1667447599412742e-05, "loss": 0.0562, "step": 143220 }, { "epoch": 40.27, "learning_rate": 2.1648705213507013e-05, "loss": 0.0635, "step": 143250 }, { "epoch": 40.28, "learning_rate": 2.1629962827601287e-05, "loss": 0.0686, "step": 143280 }, { "epoch": 40.29, "learning_rate": 2.161122044169556e-05, "loss": 0.0511, "step": 143310 }, { "epoch": 40.3, "learning_rate": 2.1592478055789835e-05, "loss": 0.066, "step": 143340 }, { "epoch": 40.31, "learning_rate": 2.157373566988411e-05, "loss": 0.0583, "step": 143370 }, { "epoch": 40.31, "learning_rate": 2.1554993283978384e-05, "loss": 0.055, "step": 143400 }, { "epoch": 40.32, "learning_rate": 2.153625089807266e-05, "loss": 0.0644, "step": 143430 }, { "epoch": 40.33, "learning_rate": 2.1517508512166936e-05, "loss": 0.0525, "step": 143460 }, { "epoch": 40.34, "learning_rate": 2.1498766126261206e-05, "loss": 0.0653, "step": 143490 }, { "epoch": 40.35, "learning_rate": 2.148002374035548e-05, "loss": 0.0569, "step": 143520 }, { "epoch": 40.36, "learning_rate": 2.1461281354449755e-05, "loss": 0.0593, "step": 143550 }, { "epoch": 40.37, "learning_rate": 2.144253896854403e-05, "loss": 0.0691, "step": 143580 }, { "epoch": 40.37, "learning_rate": 2.1423796582638303e-05, "loss": 0.0546, "step": 143610 }, { "epoch": 40.38, "learning_rate": 2.140505419673258e-05, "loss": 0.06, "step": 143640 }, { "epoch": 40.39, "learning_rate": 2.1386311810826855e-05, "loss": 0.0573, "step": 143670 }, { "epoch": 40.4, "learning_rate": 2.1367569424921126e-05, "loss": 0.0635, "step": 143700 }, { "epoch": 40.41, "learning_rate": 2.13488270390154e-05, "loss": 0.0698, "step": 143730 }, { "epoch": 40.42, "learning_rate": 2.1330084653109674e-05, "loss": 0.0514, "step": 143760 }, { "epoch": 40.42, "learning_rate": 2.1311342267203948e-05, "loss": 0.0637, "step": 143790 }, { "epoch": 40.43, "learning_rate": 2.1292599881298222e-05, "loss": 0.0572, "step": 143820 }, { "epoch": 40.44, "learning_rate": 2.12738574953925e-05, "loss": 0.0603, "step": 143850 }, { "epoch": 40.45, "learning_rate": 2.1255115109486774e-05, "loss": 0.0636, "step": 143880 }, { "epoch": 40.46, "learning_rate": 2.1236372723581045e-05, "loss": 0.0547, "step": 143910 }, { "epoch": 40.47, "learning_rate": 2.121763033767532e-05, "loss": 0.0613, "step": 143940 }, { "epoch": 40.48, "learning_rate": 2.1198887951769593e-05, "loss": 0.0591, "step": 143970 }, { "epoch": 40.48, "learning_rate": 2.1180145565863868e-05, "loss": 0.0599, "step": 144000 }, { "epoch": 40.49, "learning_rate": 2.1161403179958142e-05, "loss": 0.064, "step": 144030 }, { "epoch": 40.5, "learning_rate": 2.114266079405242e-05, "loss": 0.0556, "step": 144060 }, { "epoch": 40.51, "learning_rate": 2.1123918408146694e-05, "loss": 0.0625, "step": 144090 }, { "epoch": 40.52, "learning_rate": 2.1105176022240968e-05, "loss": 0.0587, "step": 144120 }, { "epoch": 40.53, "learning_rate": 2.108643363633524e-05, "loss": 0.0641, "step": 144150 }, { "epoch": 40.53, "learning_rate": 2.1067691250429513e-05, "loss": 0.0702, "step": 144180 }, { "epoch": 40.54, "learning_rate": 2.1048948864523787e-05, "loss": 0.0522, "step": 144210 }, { "epoch": 40.55, "learning_rate": 2.103020647861806e-05, "loss": 0.0663, "step": 144240 }, { "epoch": 40.56, "learning_rate": 2.101146409271234e-05, "loss": 0.0607, "step": 144270 }, { "epoch": 40.57, "learning_rate": 2.0992721706806613e-05, "loss": 0.0607, "step": 144300 }, { "epoch": 40.58, "learning_rate": 2.0973979320900887e-05, "loss": 0.0684, "step": 144330 }, { "epoch": 40.58, "learning_rate": 2.0955236934995158e-05, "loss": 0.058, "step": 144360 }, { "epoch": 40.59, "learning_rate": 2.0936494549089432e-05, "loss": 0.0644, "step": 144390 }, { "epoch": 40.6, "learning_rate": 2.0917752163183706e-05, "loss": 0.0573, "step": 144420 }, { "epoch": 40.61, "learning_rate": 2.089900977727798e-05, "loss": 0.0609, "step": 144450 }, { "epoch": 40.62, "learning_rate": 2.0880267391372258e-05, "loss": 0.0652, "step": 144480 }, { "epoch": 40.63, "learning_rate": 2.0861525005466532e-05, "loss": 0.0529, "step": 144510 }, { "epoch": 40.64, "learning_rate": 2.0842782619560806e-05, "loss": 0.0618, "step": 144540 }, { "epoch": 40.64, "learning_rate": 2.0824040233655077e-05, "loss": 0.0558, "step": 144570 }, { "epoch": 40.65, "learning_rate": 2.080529784774935e-05, "loss": 0.0609, "step": 144600 }, { "epoch": 40.66, "learning_rate": 2.0786555461843626e-05, "loss": 0.066, "step": 144630 }, { "epoch": 40.67, "learning_rate": 2.07678130759379e-05, "loss": 0.055, "step": 144660 }, { "epoch": 40.68, "learning_rate": 2.0749070690032174e-05, "loss": 0.0647, "step": 144690 }, { "epoch": 40.69, "learning_rate": 2.073032830412645e-05, "loss": 0.0555, "step": 144720 }, { "epoch": 40.69, "learning_rate": 2.0711585918220726e-05, "loss": 0.0592, "step": 144750 }, { "epoch": 40.7, "learning_rate": 2.0692843532315e-05, "loss": 0.0675, "step": 144780 }, { "epoch": 40.71, "learning_rate": 2.067410114640927e-05, "loss": 0.0522, "step": 144810 }, { "epoch": 40.72, "learning_rate": 2.0655358760503545e-05, "loss": 0.0653, "step": 144840 }, { "epoch": 40.73, "learning_rate": 2.063661637459782e-05, "loss": 0.0554, "step": 144870 }, { "epoch": 40.74, "learning_rate": 2.0617873988692093e-05, "loss": 0.0629, "step": 144900 }, { "epoch": 40.74, "learning_rate": 2.059913160278637e-05, "loss": 0.0666, "step": 144930 }, { "epoch": 40.75, "learning_rate": 2.0580389216880645e-05, "loss": 0.0524, "step": 144960 }, { "epoch": 40.76, "learning_rate": 2.056164683097492e-05, "loss": 0.0612, "step": 144990 }, { "epoch": 40.77, "learning_rate": 2.054290444506919e-05, "loss": 0.0573, "step": 145020 }, { "epoch": 40.78, "learning_rate": 2.0524162059163464e-05, "loss": 0.0659, "step": 145050 }, { "epoch": 40.79, "learning_rate": 2.050541967325774e-05, "loss": 0.0641, "step": 145080 }, { "epoch": 40.8, "learning_rate": 2.0486677287352013e-05, "loss": 0.0565, "step": 145110 }, { "epoch": 40.8, "learning_rate": 2.046793490144629e-05, "loss": 0.0605, "step": 145140 }, { "epoch": 40.81, "learning_rate": 2.0449192515540564e-05, "loss": 0.0622, "step": 145170 }, { "epoch": 40.82, "learning_rate": 2.043045012963484e-05, "loss": 0.0639, "step": 145200 }, { "epoch": 40.83, "learning_rate": 2.041170774372911e-05, "loss": 0.0667, "step": 145230 }, { "epoch": 40.84, "learning_rate": 2.0392965357823384e-05, "loss": 0.056, "step": 145260 }, { "epoch": 40.85, "learning_rate": 2.0374222971917658e-05, "loss": 0.0647, "step": 145290 }, { "epoch": 40.85, "learning_rate": 2.0355480586011932e-05, "loss": 0.0572, "step": 145320 }, { "epoch": 40.86, "learning_rate": 2.033673820010621e-05, "loss": 0.0603, "step": 145350 }, { "epoch": 40.87, "learning_rate": 2.0317995814200484e-05, "loss": 0.0619, "step": 145380 }, { "epoch": 40.88, "learning_rate": 2.0299253428294758e-05, "loss": 0.0524, "step": 145410 }, { "epoch": 40.89, "learning_rate": 2.028051104238903e-05, "loss": 0.0642, "step": 145440 }, { "epoch": 40.9, "learning_rate": 2.0261768656483303e-05, "loss": 0.0577, "step": 145470 }, { "epoch": 40.91, "learning_rate": 2.0243026270577577e-05, "loss": 0.0584, "step": 145500 }, { "epoch": 40.91, "learning_rate": 2.022428388467185e-05, "loss": 0.0677, "step": 145530 }, { "epoch": 40.92, "learning_rate": 2.020554149876613e-05, "loss": 0.0515, "step": 145560 }, { "epoch": 40.93, "learning_rate": 2.0186799112860403e-05, "loss": 0.0625, "step": 145590 }, { "epoch": 40.94, "learning_rate": 2.0168056726954677e-05, "loss": 0.0558, "step": 145620 }, { "epoch": 40.95, "learning_rate": 2.014931434104895e-05, "loss": 0.0605, "step": 145650 }, { "epoch": 40.96, "learning_rate": 2.0130571955143222e-05, "loss": 0.0691, "step": 145680 }, { "epoch": 40.96, "learning_rate": 2.0111829569237496e-05, "loss": 0.0519, "step": 145710 }, { "epoch": 40.97, "learning_rate": 2.009308718333177e-05, "loss": 0.0686, "step": 145740 }, { "epoch": 40.98, "learning_rate": 2.0074344797426048e-05, "loss": 0.0576, "step": 145770 }, { "epoch": 40.99, "learning_rate": 2.0055602411520322e-05, "loss": 0.0631, "step": 145800 }, { "epoch": 41.0, "learning_rate": 2.0036860025614597e-05, "loss": 0.0693, "step": 145830 }, { "epoch": 41.0, "eval_loss": 0.1780107468366623, "eval_runtime": 506.6643, "eval_samples_per_second": 31.644, "eval_steps_per_second": 0.991, "eval_wer": 0.1259945682584308, "step": 145837 }, { "epoch": 41.01, "learning_rate": 2.001811763970887e-05, "loss": 0.0566, "step": 145860 }, { "epoch": 41.01, "learning_rate": 1.999937525380314e-05, "loss": 0.0635, "step": 145890 }, { "epoch": 41.02, "learning_rate": 1.9980632867897416e-05, "loss": 0.0551, "step": 145920 }, { "epoch": 41.03, "learning_rate": 1.996189048199169e-05, "loss": 0.0635, "step": 145950 }, { "epoch": 41.04, "learning_rate": 1.9943148096085968e-05, "loss": 0.0601, "step": 145980 }, { "epoch": 41.05, "learning_rate": 1.9924405710180242e-05, "loss": 0.0547, "step": 146010 }, { "epoch": 41.06, "learning_rate": 1.9905663324274516e-05, "loss": 0.0628, "step": 146040 }, { "epoch": 41.07, "learning_rate": 1.988692093836879e-05, "loss": 0.0534, "step": 146070 }, { "epoch": 41.07, "learning_rate": 1.986817855246306e-05, "loss": 0.0635, "step": 146100 }, { "epoch": 41.08, "learning_rate": 1.9849436166557335e-05, "loss": 0.0573, "step": 146130 }, { "epoch": 41.09, "learning_rate": 1.983069378065161e-05, "loss": 0.0627, "step": 146160 }, { "epoch": 41.1, "learning_rate": 1.9811951394745887e-05, "loss": 0.0647, "step": 146190 }, { "epoch": 41.11, "learning_rate": 1.979320900884016e-05, "loss": 0.0539, "step": 146220 }, { "epoch": 41.12, "learning_rate": 1.9774466622934435e-05, "loss": 0.062, "step": 146250 }, { "epoch": 41.12, "learning_rate": 1.975572423702871e-05, "loss": 0.057, "step": 146280 }, { "epoch": 41.13, "learning_rate": 1.9736981851122984e-05, "loss": 0.061, "step": 146310 }, { "epoch": 41.14, "learning_rate": 1.9718239465217254e-05, "loss": 0.0651, "step": 146340 }, { "epoch": 41.15, "learning_rate": 1.969949707931153e-05, "loss": 0.051, "step": 146370 }, { "epoch": 41.16, "learning_rate": 1.9680754693405803e-05, "loss": 0.0586, "step": 146400 }, { "epoch": 41.17, "learning_rate": 1.966201230750008e-05, "loss": 0.0554, "step": 146430 }, { "epoch": 41.18, "learning_rate": 1.9643269921594355e-05, "loss": 0.0632, "step": 146460 }, { "epoch": 41.18, "learning_rate": 1.962452753568863e-05, "loss": 0.0656, "step": 146490 }, { "epoch": 41.19, "learning_rate": 1.9605785149782903e-05, "loss": 0.0501, "step": 146520 }, { "epoch": 41.2, "learning_rate": 1.9587042763877174e-05, "loss": 0.0619, "step": 146550 }, { "epoch": 41.21, "learning_rate": 1.9568300377971448e-05, "loss": 0.0565, "step": 146580 }, { "epoch": 41.22, "learning_rate": 1.9549557992065722e-05, "loss": 0.0596, "step": 146610 }, { "epoch": 41.23, "learning_rate": 1.953081560616e-05, "loss": 0.0659, "step": 146640 }, { "epoch": 41.23, "learning_rate": 1.9512073220254274e-05, "loss": 0.0554, "step": 146670 }, { "epoch": 41.24, "learning_rate": 1.9493330834348548e-05, "loss": 0.0626, "step": 146700 }, { "epoch": 41.25, "learning_rate": 1.9474588448442822e-05, "loss": 0.0579, "step": 146730 }, { "epoch": 41.26, "learning_rate": 1.9455846062537093e-05, "loss": 0.0573, "step": 146760 }, { "epoch": 41.27, "learning_rate": 1.9437103676631367e-05, "loss": 0.0667, "step": 146790 }, { "epoch": 41.28, "learning_rate": 1.941836129072564e-05, "loss": 0.0567, "step": 146820 }, { "epoch": 41.28, "learning_rate": 1.939961890481992e-05, "loss": 0.0638, "step": 146850 }, { "epoch": 41.29, "learning_rate": 1.9380876518914193e-05, "loss": 0.0557, "step": 146880 }, { "epoch": 41.3, "learning_rate": 1.9362134133008467e-05, "loss": 0.0563, "step": 146910 }, { "epoch": 41.31, "learning_rate": 1.934339174710274e-05, "loss": 0.0658, "step": 146940 }, { "epoch": 41.32, "learning_rate": 1.9324649361197016e-05, "loss": 0.0549, "step": 146970 }, { "epoch": 41.33, "learning_rate": 1.9305906975291287e-05, "loss": 0.0648, "step": 147000 }, { "epoch": 41.34, "learning_rate": 1.928716458938556e-05, "loss": 0.0604, "step": 147030 }, { "epoch": 41.34, "learning_rate": 1.926842220347984e-05, "loss": 0.0551, "step": 147060 }, { "epoch": 41.35, "learning_rate": 1.9249679817574113e-05, "loss": 0.0669, "step": 147090 }, { "epoch": 41.36, "learning_rate": 1.9230937431668387e-05, "loss": 0.0539, "step": 147120 }, { "epoch": 41.37, "learning_rate": 1.921219504576266e-05, "loss": 0.063, "step": 147150 }, { "epoch": 41.38, "learning_rate": 1.9193452659856935e-05, "loss": 0.0593, "step": 147180 }, { "epoch": 41.39, "learning_rate": 1.9174710273951206e-05, "loss": 0.0571, "step": 147210 }, { "epoch": 41.39, "learning_rate": 1.915659263424234e-05, "loss": 0.0637, "step": 147240 }, { "epoch": 41.4, "learning_rate": 1.9137850248336614e-05, "loss": 0.0539, "step": 147270 }, { "epoch": 41.41, "learning_rate": 1.911910786243089e-05, "loss": 0.06, "step": 147300 }, { "epoch": 41.42, "learning_rate": 1.9100365476525163e-05, "loss": 0.0584, "step": 147330 }, { "epoch": 41.43, "learning_rate": 1.9081623090619437e-05, "loss": 0.0589, "step": 147360 }, { "epoch": 41.44, "learning_rate": 1.906288070471371e-05, "loss": 0.0638, "step": 147390 }, { "epoch": 41.44, "learning_rate": 1.9044138318807985e-05, "loss": 0.0534, "step": 147420 }, { "epoch": 41.45, "learning_rate": 1.902539593290226e-05, "loss": 0.0597, "step": 147450 }, { "epoch": 41.46, "learning_rate": 1.9006653546996534e-05, "loss": 0.0564, "step": 147480 }, { "epoch": 41.47, "learning_rate": 1.8987911161090808e-05, "loss": 0.0567, "step": 147510 }, { "epoch": 41.48, "learning_rate": 1.8969168775185082e-05, "loss": 0.0648, "step": 147540 }, { "epoch": 41.49, "learning_rate": 1.8950426389279356e-05, "loss": 0.0531, "step": 147570 }, { "epoch": 41.5, "learning_rate": 1.893168400337363e-05, "loss": 0.0667, "step": 147600 }, { "epoch": 41.5, "learning_rate": 1.8912941617467905e-05, "loss": 0.0603, "step": 147630 }, { "epoch": 41.51, "learning_rate": 1.889419923156218e-05, "loss": 0.0593, "step": 147660 }, { "epoch": 41.52, "learning_rate": 1.8875456845656453e-05, "loss": 0.0606, "step": 147690 }, { "epoch": 41.53, "learning_rate": 1.8856714459750727e-05, "loss": 0.0559, "step": 147720 }, { "epoch": 41.54, "learning_rate": 1.8837972073845e-05, "loss": 0.0642, "step": 147750 }, { "epoch": 41.55, "learning_rate": 1.8819229687939276e-05, "loss": 0.0586, "step": 147780 }, { "epoch": 41.55, "learning_rate": 1.880048730203355e-05, "loss": 0.0589, "step": 147810 }, { "epoch": 41.56, "learning_rate": 1.8781744916127824e-05, "loss": 0.0693, "step": 147840 }, { "epoch": 41.57, "learning_rate": 1.8763002530222098e-05, "loss": 0.0565, "step": 147870 }, { "epoch": 41.58, "learning_rate": 1.8744260144316372e-05, "loss": 0.061, "step": 147900 }, { "epoch": 41.59, "learning_rate": 1.8725517758410647e-05, "loss": 0.0595, "step": 147930 }, { "epoch": 41.6, "learning_rate": 1.870677537250492e-05, "loss": 0.0585, "step": 147960 }, { "epoch": 41.61, "learning_rate": 1.8688032986599195e-05, "loss": 0.0627, "step": 147990 }, { "epoch": 41.61, "learning_rate": 1.866929060069347e-05, "loss": 0.0516, "step": 148020 }, { "epoch": 41.62, "learning_rate": 1.8650548214787743e-05, "loss": 0.0617, "step": 148050 }, { "epoch": 41.63, "learning_rate": 1.8631805828882018e-05, "loss": 0.0587, "step": 148080 }, { "epoch": 41.64, "learning_rate": 1.8613063442976292e-05, "loss": 0.062, "step": 148110 }, { "epoch": 41.65, "learning_rate": 1.8594321057070566e-05, "loss": 0.0639, "step": 148140 }, { "epoch": 41.66, "learning_rate": 1.857557867116484e-05, "loss": 0.0527, "step": 148170 }, { "epoch": 41.66, "learning_rate": 1.8556836285259114e-05, "loss": 0.0596, "step": 148200 }, { "epoch": 41.67, "learning_rate": 1.853809389935339e-05, "loss": 0.065, "step": 148230 }, { "epoch": 41.68, "learning_rate": 1.8519351513447663e-05, "loss": 0.061, "step": 148260 }, { "epoch": 41.69, "learning_rate": 1.8500609127541937e-05, "loss": 0.0621, "step": 148290 }, { "epoch": 41.7, "learning_rate": 1.848186674163621e-05, "loss": 0.0533, "step": 148320 }, { "epoch": 41.71, "learning_rate": 1.8463124355730485e-05, "loss": 0.0678, "step": 148350 }, { "epoch": 41.71, "learning_rate": 1.844438196982476e-05, "loss": 0.059, "step": 148380 }, { "epoch": 41.72, "learning_rate": 1.8425639583919034e-05, "loss": 0.0575, "step": 148410 }, { "epoch": 41.73, "learning_rate": 1.8406897198013308e-05, "loss": 0.0686, "step": 148440 }, { "epoch": 41.74, "learning_rate": 1.8388154812107582e-05, "loss": 0.0525, "step": 148470 }, { "epoch": 41.75, "learning_rate": 1.8369412426201856e-05, "loss": 0.0626, "step": 148500 }, { "epoch": 41.76, "learning_rate": 1.835067004029613e-05, "loss": 0.0574, "step": 148530 }, { "epoch": 41.77, "learning_rate": 1.8331927654390405e-05, "loss": 0.058, "step": 148560 }, { "epoch": 41.77, "learning_rate": 1.831318526848468e-05, "loss": 0.0654, "step": 148590 }, { "epoch": 41.78, "learning_rate": 1.8294442882578953e-05, "loss": 0.051, "step": 148620 }, { "epoch": 41.79, "learning_rate": 1.8275700496673227e-05, "loss": 0.0614, "step": 148650 }, { "epoch": 41.8, "learning_rate": 1.82569581107675e-05, "loss": 0.06, "step": 148680 }, { "epoch": 41.81, "learning_rate": 1.8238215724861776e-05, "loss": 0.0604, "step": 148710 }, { "epoch": 41.82, "learning_rate": 1.821947333895605e-05, "loss": 0.0686, "step": 148740 }, { "epoch": 41.82, "learning_rate": 1.8200730953050324e-05, "loss": 0.0546, "step": 148770 }, { "epoch": 41.83, "learning_rate": 1.8181988567144598e-05, "loss": 0.0612, "step": 148800 }, { "epoch": 41.84, "learning_rate": 1.8163246181238872e-05, "loss": 0.0577, "step": 148830 }, { "epoch": 41.85, "learning_rate": 1.8144503795333147e-05, "loss": 0.0598, "step": 148860 }, { "epoch": 41.86, "learning_rate": 1.812576140942742e-05, "loss": 0.0654, "step": 148890 }, { "epoch": 41.87, "learning_rate": 1.8107019023521695e-05, "loss": 0.0494, "step": 148920 }, { "epoch": 41.88, "learning_rate": 1.808827663761597e-05, "loss": 0.062, "step": 148950 }, { "epoch": 41.88, "learning_rate": 1.8069534251710243e-05, "loss": 0.0607, "step": 148980 }, { "epoch": 41.89, "learning_rate": 1.8050791865804517e-05, "loss": 0.0595, "step": 149010 }, { "epoch": 41.9, "learning_rate": 1.803204947989879e-05, "loss": 0.0628, "step": 149040 }, { "epoch": 41.91, "learning_rate": 1.8013307093993066e-05, "loss": 0.0518, "step": 149070 }, { "epoch": 41.92, "learning_rate": 1.799456470808734e-05, "loss": 0.065, "step": 149100 }, { "epoch": 41.93, "learning_rate": 1.7975822322181614e-05, "loss": 0.0615, "step": 149130 }, { "epoch": 41.93, "learning_rate": 1.795707993627589e-05, "loss": 0.0552, "step": 149160 }, { "epoch": 41.94, "learning_rate": 1.7938337550370163e-05, "loss": 0.063, "step": 149190 }, { "epoch": 41.95, "learning_rate": 1.7919595164464437e-05, "loss": 0.056, "step": 149220 }, { "epoch": 41.96, "learning_rate": 1.790085277855871e-05, "loss": 0.0608, "step": 149250 }, { "epoch": 41.97, "learning_rate": 1.7882110392652985e-05, "loss": 0.059, "step": 149280 }, { "epoch": 41.98, "learning_rate": 1.786336800674726e-05, "loss": 0.0579, "step": 149310 }, { "epoch": 41.98, "learning_rate": 1.7844625620841534e-05, "loss": 0.0664, "step": 149340 }, { "epoch": 41.99, "learning_rate": 1.7825883234935808e-05, "loss": 0.0532, "step": 149370 }, { "epoch": 42.0, "eval_loss": 0.17243234813213348, "eval_runtime": 510.6741, "eval_samples_per_second": 31.396, "eval_steps_per_second": 0.983, "eval_wer": 0.12452062833513027, "step": 149394 }, { "epoch": 42.0, "learning_rate": 1.7807140849030082e-05, "loss": 0.065, "step": 149400 }, { "epoch": 42.01, "learning_rate": 1.7788398463124356e-05, "loss": 0.0509, "step": 149430 }, { "epoch": 42.02, "learning_rate": 1.776965607721863e-05, "loss": 0.0653, "step": 149460 }, { "epoch": 42.03, "learning_rate": 1.7750913691312905e-05, "loss": 0.0577, "step": 149490 }, { "epoch": 42.04, "learning_rate": 1.773217130540718e-05, "loss": 0.0545, "step": 149520 }, { "epoch": 42.04, "learning_rate": 1.7713428919501453e-05, "loss": 0.0632, "step": 149550 }, { "epoch": 42.05, "learning_rate": 1.7695311279792584e-05, "loss": 0.0741, "step": 149580 }, { "epoch": 42.06, "learning_rate": 1.767656889388686e-05, "loss": 0.0606, "step": 149610 }, { "epoch": 42.07, "learning_rate": 1.7658451254177992e-05, "loss": 0.0579, "step": 149640 }, { "epoch": 42.08, "learning_rate": 1.7639708868272263e-05, "loss": 0.0573, "step": 149670 }, { "epoch": 42.09, "learning_rate": 1.7620966482366537e-05, "loss": 0.0611, "step": 149700 }, { "epoch": 42.09, "learning_rate": 1.7602224096460815e-05, "loss": 0.0555, "step": 149730 }, { "epoch": 42.1, "learning_rate": 1.758348171055509e-05, "loss": 0.0646, "step": 149760 }, { "epoch": 42.11, "learning_rate": 1.7564739324649363e-05, "loss": 0.0568, "step": 149790 }, { "epoch": 42.12, "learning_rate": 1.7545996938743637e-05, "loss": 0.0569, "step": 149820 }, { "epoch": 42.13, "learning_rate": 1.752725455283791e-05, "loss": 0.0643, "step": 149850 }, { "epoch": 42.14, "learning_rate": 1.7508512166932182e-05, "loss": 0.0523, "step": 149880 }, { "epoch": 42.15, "learning_rate": 1.7489769781026456e-05, "loss": 0.0598, "step": 149910 }, { "epoch": 42.15, "learning_rate": 1.7471027395120734e-05, "loss": 0.0607, "step": 149940 }, { "epoch": 42.16, "learning_rate": 1.7452285009215008e-05, "loss": 0.0533, "step": 149970 }, { "epoch": 42.17, "learning_rate": 1.7433542623309282e-05, "loss": 0.061, "step": 150000 }, { "epoch": 42.18, "learning_rate": 1.7414800237403557e-05, "loss": 0.0495, "step": 150030 }, { "epoch": 42.19, "learning_rate": 1.739605785149783e-05, "loss": 0.0625, "step": 150060 }, { "epoch": 42.2, "learning_rate": 1.7377315465592105e-05, "loss": 0.0547, "step": 150090 }, { "epoch": 42.2, "learning_rate": 1.7358573079686376e-05, "loss": 0.0549, "step": 150120 }, { "epoch": 42.21, "learning_rate": 1.7339830693780653e-05, "loss": 0.0626, "step": 150150 }, { "epoch": 42.22, "learning_rate": 1.7321088307874928e-05, "loss": 0.0496, "step": 150180 }, { "epoch": 42.23, "learning_rate": 1.7302345921969202e-05, "loss": 0.0555, "step": 150210 }, { "epoch": 42.24, "learning_rate": 1.7283603536063476e-05, "loss": 0.0624, "step": 150240 }, { "epoch": 42.25, "learning_rate": 1.726486115015775e-05, "loss": 0.057, "step": 150270 }, { "epoch": 42.25, "learning_rate": 1.7246118764252024e-05, "loss": 0.065, "step": 150300 }, { "epoch": 42.26, "learning_rate": 1.7227376378346295e-05, "loss": 0.0516, "step": 150330 }, { "epoch": 42.27, "learning_rate": 1.7208633992440573e-05, "loss": 0.0626, "step": 150360 }, { "epoch": 42.28, "learning_rate": 1.7189891606534847e-05, "loss": 0.061, "step": 150390 }, { "epoch": 42.29, "learning_rate": 1.717114922062912e-05, "loss": 0.0561, "step": 150420 }, { "epoch": 42.3, "learning_rate": 1.7152406834723395e-05, "loss": 0.0657, "step": 150450 }, { "epoch": 42.31, "learning_rate": 1.713366444881767e-05, "loss": 0.0559, "step": 150480 }, { "epoch": 42.31, "learning_rate": 1.7114922062911944e-05, "loss": 0.06, "step": 150510 }, { "epoch": 42.32, "learning_rate": 1.7096179677006214e-05, "loss": 0.0657, "step": 150540 }, { "epoch": 42.33, "learning_rate": 1.7077437291100492e-05, "loss": 0.0559, "step": 150570 }, { "epoch": 42.34, "learning_rate": 1.7059319651391623e-05, "loss": 0.0602, "step": 150600 }, { "epoch": 42.35, "learning_rate": 1.7040577265485897e-05, "loss": 0.0482, "step": 150630 }, { "epoch": 42.36, "learning_rate": 1.702183487958017e-05, "loss": 0.06, "step": 150660 }, { "epoch": 42.36, "learning_rate": 1.7003092493674445e-05, "loss": 0.06, "step": 150690 }, { "epoch": 42.37, "learning_rate": 1.698435010776872e-05, "loss": 0.0608, "step": 150720 }, { "epoch": 42.38, "learning_rate": 1.6965607721862994e-05, "loss": 0.0606, "step": 150750 }, { "epoch": 42.39, "learning_rate": 1.6946865335957268e-05, "loss": 0.0522, "step": 150780 }, { "epoch": 42.4, "learning_rate": 1.6928122950051542e-05, "loss": 0.0573, "step": 150810 }, { "epoch": 42.41, "learning_rate": 1.6909380564145816e-05, "loss": 0.0575, "step": 150840 }, { "epoch": 42.41, "learning_rate": 1.689063817824009e-05, "loss": 0.0579, "step": 150870 }, { "epoch": 42.42, "learning_rate": 1.6871895792334365e-05, "loss": 0.0635, "step": 150900 }, { "epoch": 42.43, "learning_rate": 1.685315340642864e-05, "loss": 0.0533, "step": 150930 }, { "epoch": 42.44, "learning_rate": 1.6834411020522913e-05, "loss": 0.0555, "step": 150960 }, { "epoch": 42.45, "learning_rate": 1.6815668634617187e-05, "loss": 0.0541, "step": 150990 }, { "epoch": 42.46, "learning_rate": 1.679692624871146e-05, "loss": 0.0573, "step": 151020 }, { "epoch": 42.47, "learning_rate": 1.6778183862805736e-05, "loss": 0.0667, "step": 151050 }, { "epoch": 42.47, "learning_rate": 1.675944147690001e-05, "loss": 0.0522, "step": 151080 }, { "epoch": 42.48, "learning_rate": 1.6740699090994284e-05, "loss": 0.0646, "step": 151110 }, { "epoch": 42.49, "learning_rate": 1.6721956705088558e-05, "loss": 0.0604, "step": 151140 }, { "epoch": 42.5, "learning_rate": 1.6703214319182832e-05, "loss": 0.0561, "step": 151170 }, { "epoch": 42.51, "learning_rate": 1.6684471933277107e-05, "loss": 0.0636, "step": 151200 }, { "epoch": 42.52, "learning_rate": 1.666572954737138e-05, "loss": 0.0518, "step": 151230 }, { "epoch": 42.52, "learning_rate": 1.6646987161465655e-05, "loss": 0.0594, "step": 151260 }, { "epoch": 42.53, "learning_rate": 1.662824477555993e-05, "loss": 0.0559, "step": 151290 }, { "epoch": 42.54, "learning_rate": 1.6609502389654207e-05, "loss": 0.0547, "step": 151320 }, { "epoch": 42.55, "learning_rate": 1.6590760003748478e-05, "loss": 0.066, "step": 151350 }, { "epoch": 42.56, "learning_rate": 1.6572017617842752e-05, "loss": 0.0541, "step": 151380 }, { "epoch": 42.57, "learning_rate": 1.6553275231937026e-05, "loss": 0.0618, "step": 151410 }, { "epoch": 42.58, "learning_rate": 1.65345328460313e-05, "loss": 0.0605, "step": 151440 }, { "epoch": 42.58, "learning_rate": 1.6515790460125574e-05, "loss": 0.054, "step": 151470 }, { "epoch": 42.59, "learning_rate": 1.649704807421985e-05, "loss": 0.0649, "step": 151500 }, { "epoch": 42.6, "learning_rate": 1.6478305688314123e-05, "loss": 0.0532, "step": 151530 }, { "epoch": 42.61, "learning_rate": 1.6459563302408397e-05, "loss": 0.0598, "step": 151560 }, { "epoch": 42.62, "learning_rate": 1.644082091650267e-05, "loss": 0.0595, "step": 151590 }, { "epoch": 42.63, "learning_rate": 1.6422078530596945e-05, "loss": 0.0566, "step": 151620 }, { "epoch": 42.63, "learning_rate": 1.640333614469122e-05, "loss": 0.065, "step": 151650 }, { "epoch": 42.64, "learning_rate": 1.6384593758785494e-05, "loss": 0.0528, "step": 151680 }, { "epoch": 42.65, "learning_rate": 1.6365851372879768e-05, "loss": 0.0613, "step": 151710 }, { "epoch": 42.66, "learning_rate": 1.6347108986974042e-05, "loss": 0.0598, "step": 151740 }, { "epoch": 42.67, "learning_rate": 1.6328366601068316e-05, "loss": 0.0616, "step": 151770 }, { "epoch": 42.68, "learning_rate": 1.630962421516259e-05, "loss": 0.0597, "step": 151800 }, { "epoch": 42.68, "learning_rate": 1.6290881829256865e-05, "loss": 0.0538, "step": 151830 }, { "epoch": 42.69, "learning_rate": 1.627213944335114e-05, "loss": 0.0593, "step": 151860 }, { "epoch": 42.7, "learning_rate": 1.6253397057445413e-05, "loss": 0.059, "step": 151890 }, { "epoch": 42.71, "learning_rate": 1.6234654671539687e-05, "loss": 0.055, "step": 151920 }, { "epoch": 42.72, "learning_rate": 1.621591228563396e-05, "loss": 0.0632, "step": 151950 }, { "epoch": 42.73, "learning_rate": 1.6197169899728236e-05, "loss": 0.0557, "step": 151980 }, { "epoch": 42.74, "learning_rate": 1.617842751382251e-05, "loss": 0.0612, "step": 152010 }, { "epoch": 42.74, "learning_rate": 1.6159685127916784e-05, "loss": 0.0629, "step": 152040 }, { "epoch": 42.75, "learning_rate": 1.6140942742011058e-05, "loss": 0.0619, "step": 152070 }, { "epoch": 42.76, "learning_rate": 1.6122200356105332e-05, "loss": 0.0692, "step": 152100 }, { "epoch": 42.77, "learning_rate": 1.6103457970199607e-05, "loss": 0.0527, "step": 152130 }, { "epoch": 42.78, "learning_rate": 1.608471558429388e-05, "loss": 0.0573, "step": 152160 }, { "epoch": 42.79, "learning_rate": 1.606597319838816e-05, "loss": 0.0592, "step": 152190 }, { "epoch": 42.79, "learning_rate": 1.604723081248243e-05, "loss": 0.056, "step": 152220 }, { "epoch": 42.8, "learning_rate": 1.6028488426576703e-05, "loss": 0.0651, "step": 152250 }, { "epoch": 42.81, "learning_rate": 1.6009746040670978e-05, "loss": 0.0556, "step": 152280 }, { "epoch": 42.82, "learning_rate": 1.5991003654765252e-05, "loss": 0.0595, "step": 152310 }, { "epoch": 42.83, "learning_rate": 1.5972261268859526e-05, "loss": 0.0586, "step": 152340 }, { "epoch": 42.84, "learning_rate": 1.59535188829538e-05, "loss": 0.0548, "step": 152370 }, { "epoch": 42.84, "learning_rate": 1.5934776497048078e-05, "loss": 0.0653, "step": 152400 }, { "epoch": 42.85, "learning_rate": 1.591603411114235e-05, "loss": 0.0561, "step": 152430 }, { "epoch": 42.86, "learning_rate": 1.5897291725236623e-05, "loss": 0.0607, "step": 152460 }, { "epoch": 42.87, "learning_rate": 1.5878549339330897e-05, "loss": 0.0566, "step": 152490 }, { "epoch": 42.88, "learning_rate": 1.585980695342517e-05, "loss": 0.0568, "step": 152520 }, { "epoch": 42.89, "learning_rate": 1.5841064567519445e-05, "loss": 0.0603, "step": 152550 }, { "epoch": 42.9, "learning_rate": 1.582232218161372e-05, "loss": 0.0559, "step": 152580 }, { "epoch": 42.9, "learning_rate": 1.5803579795707997e-05, "loss": 0.0677, "step": 152610 }, { "epoch": 42.91, "learning_rate": 1.5784837409802268e-05, "loss": 0.0572, "step": 152640 }, { "epoch": 42.92, "learning_rate": 1.5766095023896542e-05, "loss": 0.0584, "step": 152670 }, { "epoch": 42.93, "learning_rate": 1.5747352637990816e-05, "loss": 0.062, "step": 152700 }, { "epoch": 42.94, "learning_rate": 1.572861025208509e-05, "loss": 0.0536, "step": 152730 }, { "epoch": 42.95, "learning_rate": 1.5709867866179365e-05, "loss": 0.0574, "step": 152760 }, { "epoch": 42.95, "learning_rate": 1.569112548027364e-05, "loss": 0.0591, "step": 152790 }, { "epoch": 42.96, "learning_rate": 1.5672383094367916e-05, "loss": 0.0591, "step": 152820 }, { "epoch": 42.97, "learning_rate": 1.565364070846219e-05, "loss": 0.0623, "step": 152850 }, { "epoch": 42.98, "learning_rate": 1.563489832255646e-05, "loss": 0.054, "step": 152880 }, { "epoch": 42.99, "learning_rate": 1.5616155936650736e-05, "loss": 0.0598, "step": 152910 }, { "epoch": 43.0, "learning_rate": 1.559741355074501e-05, "loss": 0.0594, "step": 152940 }, { "epoch": 43.0, "eval_loss": 0.1735638976097107, "eval_runtime": 506.7114, "eval_samples_per_second": 31.641, "eval_steps_per_second": 0.991, "eval_wer": 0.12498464645913229, "step": 152951 }, { "epoch": 43.01, "learning_rate": 1.5578671164839284e-05, "loss": 0.058, "step": 152970 }, { "epoch": 43.01, "learning_rate": 1.5559928778933558e-05, "loss": 0.0646, "step": 153000 }, { "epoch": 43.02, "learning_rate": 1.5541186393027836e-05, "loss": 0.0515, "step": 153030 }, { "epoch": 43.03, "learning_rate": 1.552244400712211e-05, "loss": 0.0589, "step": 153060 }, { "epoch": 43.04, "learning_rate": 1.550370162121638e-05, "loss": 0.0527, "step": 153090 }, { "epoch": 43.05, "learning_rate": 1.5484959235310655e-05, "loss": 0.0596, "step": 153120 }, { "epoch": 43.06, "learning_rate": 1.546621684940493e-05, "loss": 0.058, "step": 153150 }, { "epoch": 43.06, "learning_rate": 1.5447474463499203e-05, "loss": 0.0518, "step": 153180 }, { "epoch": 43.07, "learning_rate": 1.5428732077593477e-05, "loss": 0.0603, "step": 153210 }, { "epoch": 43.08, "learning_rate": 1.5409989691687755e-05, "loss": 0.0545, "step": 153240 }, { "epoch": 43.09, "learning_rate": 1.539124730578203e-05, "loss": 0.0763, "step": 153270 }, { "epoch": 43.1, "learning_rate": 1.53725049198763e-05, "loss": 0.0657, "step": 153300 }, { "epoch": 43.11, "learning_rate": 1.5353762533970574e-05, "loss": 0.0535, "step": 153330 }, { "epoch": 43.11, "learning_rate": 1.533502014806485e-05, "loss": 0.0641, "step": 153360 }, { "epoch": 43.12, "learning_rate": 1.5316277762159123e-05, "loss": 0.0534, "step": 153390 }, { "epoch": 43.13, "learning_rate": 1.5297535376253397e-05, "loss": 0.0562, "step": 153420 }, { "epoch": 43.14, "learning_rate": 1.527879299034767e-05, "loss": 0.0569, "step": 153450 }, { "epoch": 43.15, "learning_rate": 1.526005060444195e-05, "loss": 0.0514, "step": 153480 }, { "epoch": 43.16, "learning_rate": 1.5241308218536221e-05, "loss": 0.0619, "step": 153510 }, { "epoch": 43.17, "learning_rate": 1.5222565832630495e-05, "loss": 0.0569, "step": 153540 }, { "epoch": 43.17, "learning_rate": 1.520382344672477e-05, "loss": 0.0569, "step": 153570 }, { "epoch": 43.18, "learning_rate": 1.5185081060819042e-05, "loss": 0.0601, "step": 153600 }, { "epoch": 43.19, "learning_rate": 1.5166338674913316e-05, "loss": 0.0535, "step": 153630 }, { "epoch": 43.2, "learning_rate": 1.514759628900759e-05, "loss": 0.063, "step": 153660 }, { "epoch": 43.21, "learning_rate": 1.5128853903101866e-05, "loss": 0.0532, "step": 153690 }, { "epoch": 43.22, "learning_rate": 1.511011151719614e-05, "loss": 0.0586, "step": 153720 }, { "epoch": 43.22, "learning_rate": 1.5091369131290415e-05, "loss": 0.0607, "step": 153750 }, { "epoch": 43.23, "learning_rate": 1.5072626745384689e-05, "loss": 0.0506, "step": 153780 }, { "epoch": 43.24, "learning_rate": 1.5053884359478961e-05, "loss": 0.0633, "step": 153810 }, { "epoch": 43.25, "learning_rate": 1.5035141973573235e-05, "loss": 0.0569, "step": 153840 }, { "epoch": 43.26, "learning_rate": 1.501639958766751e-05, "loss": 0.0582, "step": 153870 }, { "epoch": 43.27, "learning_rate": 1.4997657201761786e-05, "loss": 0.0581, "step": 153900 }, { "epoch": 43.28, "learning_rate": 1.497891481585606e-05, "loss": 0.0496, "step": 153930 }, { "epoch": 43.28, "learning_rate": 1.4960172429950334e-05, "loss": 0.0606, "step": 153960 }, { "epoch": 43.29, "learning_rate": 1.4941430044044608e-05, "loss": 0.0549, "step": 153990 }, { "epoch": 43.3, "learning_rate": 1.492268765813888e-05, "loss": 0.0587, "step": 154020 }, { "epoch": 43.31, "learning_rate": 1.4903945272233155e-05, "loss": 0.065, "step": 154050 }, { "epoch": 43.32, "learning_rate": 1.4885202886327429e-05, "loss": 0.0527, "step": 154080 }, { "epoch": 43.33, "learning_rate": 1.4866460500421705e-05, "loss": 0.0596, "step": 154110 }, { "epoch": 43.33, "learning_rate": 1.4847718114515979e-05, "loss": 0.0544, "step": 154140 }, { "epoch": 43.34, "learning_rate": 1.4828975728610253e-05, "loss": 0.0581, "step": 154170 }, { "epoch": 43.35, "learning_rate": 1.4810233342704527e-05, "loss": 0.0574, "step": 154200 }, { "epoch": 43.36, "learning_rate": 1.4791490956798802e-05, "loss": 0.0519, "step": 154230 }, { "epoch": 43.37, "learning_rate": 1.4772748570893074e-05, "loss": 0.0609, "step": 154260 }, { "epoch": 43.38, "learning_rate": 1.4754006184987348e-05, "loss": 0.054, "step": 154290 }, { "epoch": 43.38, "learning_rate": 1.4735263799081626e-05, "loss": 0.0565, "step": 154320 }, { "epoch": 43.39, "learning_rate": 1.4716521413175898e-05, "loss": 0.06, "step": 154350 }, { "epoch": 43.4, "learning_rate": 1.4697779027270173e-05, "loss": 0.0529, "step": 154380 }, { "epoch": 43.41, "learning_rate": 1.4679036641364447e-05, "loss": 0.0611, "step": 154410 }, { "epoch": 43.42, "learning_rate": 1.4660294255458721e-05, "loss": 0.0519, "step": 154440 }, { "epoch": 43.43, "learning_rate": 1.4641551869552993e-05, "loss": 0.0566, "step": 154470 }, { "epoch": 43.44, "learning_rate": 1.4622809483647268e-05, "loss": 0.0599, "step": 154500 }, { "epoch": 43.44, "learning_rate": 1.4604067097741545e-05, "loss": 0.0513, "step": 154530 }, { "epoch": 43.45, "learning_rate": 1.4585324711835818e-05, "loss": 0.0621, "step": 154560 }, { "epoch": 43.46, "learning_rate": 1.4566582325930092e-05, "loss": 0.0563, "step": 154590 }, { "epoch": 43.47, "learning_rate": 1.4547839940024366e-05, "loss": 0.0609, "step": 154620 }, { "epoch": 43.48, "learning_rate": 1.452909755411864e-05, "loss": 0.0577, "step": 154650 }, { "epoch": 43.49, "learning_rate": 1.4510355168212913e-05, "loss": 0.0541, "step": 154680 }, { "epoch": 43.49, "learning_rate": 1.4491612782307187e-05, "loss": 0.0621, "step": 154710 }, { "epoch": 43.5, "learning_rate": 1.4472870396401465e-05, "loss": 0.0534, "step": 154740 }, { "epoch": 43.51, "learning_rate": 1.4454128010495737e-05, "loss": 0.0585, "step": 154770 }, { "epoch": 43.52, "learning_rate": 1.4435385624590011e-05, "loss": 0.0571, "step": 154800 }, { "epoch": 43.53, "learning_rate": 1.4416643238684285e-05, "loss": 0.0563, "step": 154830 }, { "epoch": 43.54, "learning_rate": 1.439790085277856e-05, "loss": 0.0591, "step": 154860 }, { "epoch": 43.55, "learning_rate": 1.4379158466872834e-05, "loss": 0.06, "step": 154890 }, { "epoch": 43.55, "learning_rate": 1.4360416080967106e-05, "loss": 0.0647, "step": 154920 }, { "epoch": 43.56, "learning_rate": 1.4341673695061384e-05, "loss": 0.0583, "step": 154950 }, { "epoch": 43.57, "learning_rate": 1.4322931309155656e-05, "loss": 0.0507, "step": 154980 }, { "epoch": 43.58, "learning_rate": 1.430418892324993e-05, "loss": 0.063, "step": 155010 }, { "epoch": 43.59, "learning_rate": 1.4285446537344205e-05, "loss": 0.0525, "step": 155040 }, { "epoch": 43.6, "learning_rate": 1.4266704151438479e-05, "loss": 0.0562, "step": 155070 }, { "epoch": 43.6, "learning_rate": 1.4247961765532753e-05, "loss": 0.0595, "step": 155100 }, { "epoch": 43.61, "learning_rate": 1.4229219379627026e-05, "loss": 0.0555, "step": 155130 }, { "epoch": 43.62, "learning_rate": 1.42104769937213e-05, "loss": 0.0622, "step": 155160 }, { "epoch": 43.63, "learning_rate": 1.4191734607815577e-05, "loss": 0.0581, "step": 155190 }, { "epoch": 43.64, "learning_rate": 1.417299222190985e-05, "loss": 0.0565, "step": 155220 }, { "epoch": 43.65, "learning_rate": 1.4154249836004124e-05, "loss": 0.0633, "step": 155250 }, { "epoch": 43.65, "learning_rate": 1.4135507450098398e-05, "loss": 0.053, "step": 155280 }, { "epoch": 43.66, "learning_rate": 1.4116765064192672e-05, "loss": 0.0616, "step": 155310 }, { "epoch": 43.67, "learning_rate": 1.4098022678286945e-05, "loss": 0.0551, "step": 155340 }, { "epoch": 43.68, "learning_rate": 1.4079280292381219e-05, "loss": 0.0575, "step": 155370 }, { "epoch": 43.69, "learning_rate": 1.4060537906475497e-05, "loss": 0.0622, "step": 155400 }, { "epoch": 43.7, "learning_rate": 1.404179552056977e-05, "loss": 0.0535, "step": 155430 }, { "epoch": 43.71, "learning_rate": 1.4023053134664043e-05, "loss": 0.0651, "step": 155460 }, { "epoch": 43.71, "learning_rate": 1.4004310748758318e-05, "loss": 0.0561, "step": 155490 }, { "epoch": 43.72, "learning_rate": 1.3985568362852592e-05, "loss": 0.056, "step": 155520 }, { "epoch": 43.73, "learning_rate": 1.3966825976946864e-05, "loss": 0.0572, "step": 155550 }, { "epoch": 43.74, "learning_rate": 1.3948083591041138e-05, "loss": 0.0556, "step": 155580 }, { "epoch": 43.75, "learning_rate": 1.3929341205135416e-05, "loss": 0.0617, "step": 155610 }, { "epoch": 43.76, "learning_rate": 1.3910598819229689e-05, "loss": 0.0533, "step": 155640 }, { "epoch": 43.76, "learning_rate": 1.3891856433323963e-05, "loss": 0.0672, "step": 155670 }, { "epoch": 43.77, "learning_rate": 1.3873114047418237e-05, "loss": 0.0613, "step": 155700 }, { "epoch": 43.78, "learning_rate": 1.3854371661512511e-05, "loss": 0.055, "step": 155730 }, { "epoch": 43.79, "learning_rate": 1.3835629275606785e-05, "loss": 0.0598, "step": 155760 }, { "epoch": 43.8, "learning_rate": 1.3816886889701058e-05, "loss": 0.0558, "step": 155790 }, { "epoch": 43.81, "learning_rate": 1.3798144503795335e-05, "loss": 0.0637, "step": 155820 }, { "epoch": 43.81, "learning_rate": 1.377940211788961e-05, "loss": 0.0619, "step": 155850 }, { "epoch": 43.82, "learning_rate": 1.3760659731983882e-05, "loss": 0.0494, "step": 155880 }, { "epoch": 43.83, "learning_rate": 1.3741917346078156e-05, "loss": 0.0653, "step": 155910 }, { "epoch": 43.84, "learning_rate": 1.372317496017243e-05, "loss": 0.0554, "step": 155940 }, { "epoch": 43.85, "learning_rate": 1.3704432574266705e-05, "loss": 0.0629, "step": 155970 }, { "epoch": 43.86, "learning_rate": 1.3685690188360977e-05, "loss": 0.0594, "step": 156000 }, { "epoch": 43.87, "learning_rate": 1.3666947802455255e-05, "loss": 0.0552, "step": 156030 }, { "epoch": 43.87, "learning_rate": 1.3648205416549529e-05, "loss": 0.0632, "step": 156060 }, { "epoch": 43.88, "learning_rate": 1.3629463030643801e-05, "loss": 0.0565, "step": 156090 }, { "epoch": 43.89, "learning_rate": 1.3610720644738076e-05, "loss": 0.0563, "step": 156120 }, { "epoch": 43.9, "learning_rate": 1.359197825883235e-05, "loss": 0.0622, "step": 156150 }, { "epoch": 43.91, "learning_rate": 1.3573235872926624e-05, "loss": 0.0528, "step": 156180 }, { "epoch": 43.92, "learning_rate": 1.3554493487020896e-05, "loss": 0.0609, "step": 156210 }, { "epoch": 43.92, "learning_rate": 1.353637584731203e-05, "loss": 0.0729, "step": 156240 }, { "epoch": 43.93, "learning_rate": 1.3517633461406303e-05, "loss": 0.0566, "step": 156270 }, { "epoch": 43.94, "learning_rate": 1.3498891075500577e-05, "loss": 0.0588, "step": 156300 }, { "epoch": 43.95, "learning_rate": 1.3480148689594852e-05, "loss": 0.052, "step": 156330 }, { "epoch": 43.96, "learning_rate": 1.3461406303689127e-05, "loss": 0.0612, "step": 156360 }, { "epoch": 43.97, "learning_rate": 1.3442663917783402e-05, "loss": 0.0516, "step": 156390 }, { "epoch": 43.98, "learning_rate": 1.3423921531877676e-05, "loss": 0.058, "step": 156420 }, { "epoch": 43.98, "learning_rate": 1.340517914597195e-05, "loss": 0.058, "step": 156450 }, { "epoch": 43.99, "learning_rate": 1.3386436760066223e-05, "loss": 0.0544, "step": 156480 }, { "epoch": 44.0, "eval_loss": 0.17437909543514252, "eval_runtime": 509.2768, "eval_samples_per_second": 31.482, "eval_steps_per_second": 0.986, "eval_wer": 0.1237768345775388, "step": 156508 }, { "epoch": 44.0, "learning_rate": 1.3367694374160497e-05, "loss": 0.0637, "step": 156510 }, { "epoch": 44.01, "learning_rate": 1.3348951988254771e-05, "loss": 0.049, "step": 156540 }, { "epoch": 44.02, "learning_rate": 1.3330209602349047e-05, "loss": 0.0665, "step": 156570 }, { "epoch": 44.03, "learning_rate": 1.3311467216443321e-05, "loss": 0.058, "step": 156600 }, { "epoch": 44.03, "learning_rate": 1.3292724830537595e-05, "loss": 0.0575, "step": 156630 }, { "epoch": 44.04, "learning_rate": 1.327398244463187e-05, "loss": 0.0585, "step": 156660 }, { "epoch": 44.05, "learning_rate": 1.3255240058726144e-05, "loss": 0.0499, "step": 156690 }, { "epoch": 44.06, "learning_rate": 1.3236497672820416e-05, "loss": 0.0607, "step": 156720 }, { "epoch": 44.07, "learning_rate": 1.321775528691469e-05, "loss": 0.0541, "step": 156750 }, { "epoch": 44.08, "learning_rate": 1.3199012901008966e-05, "loss": 0.0554, "step": 156780 }, { "epoch": 44.08, "learning_rate": 1.318027051510324e-05, "loss": 0.0599, "step": 156810 }, { "epoch": 44.09, "learning_rate": 1.3161528129197515e-05, "loss": 0.0511, "step": 156840 }, { "epoch": 44.1, "learning_rate": 1.3142785743291789e-05, "loss": 0.0618, "step": 156870 }, { "epoch": 44.11, "learning_rate": 1.3124043357386063e-05, "loss": 0.0551, "step": 156900 }, { "epoch": 44.12, "learning_rate": 1.3105300971480335e-05, "loss": 0.051, "step": 156930 }, { "epoch": 44.13, "learning_rate": 1.308655858557461e-05, "loss": 0.0605, "step": 156960 }, { "epoch": 44.14, "learning_rate": 1.3067816199668887e-05, "loss": 0.055, "step": 156990 }, { "epoch": 44.14, "learning_rate": 1.304907381376316e-05, "loss": 0.0584, "step": 157020 }, { "epoch": 44.15, "learning_rate": 1.3030331427857434e-05, "loss": 0.0567, "step": 157050 }, { "epoch": 44.16, "learning_rate": 1.3011589041951708e-05, "loss": 0.0541, "step": 157080 }, { "epoch": 44.17, "learning_rate": 1.2992846656045982e-05, "loss": 0.0606, "step": 157110 }, { "epoch": 44.18, "learning_rate": 1.2974104270140255e-05, "loss": 0.0478, "step": 157140 }, { "epoch": 44.19, "learning_rate": 1.2955361884234529e-05, "loss": 0.0612, "step": 157170 }, { "epoch": 44.19, "learning_rate": 1.2936619498328806e-05, "loss": 0.0552, "step": 157200 }, { "epoch": 44.2, "learning_rate": 1.2917877112423079e-05, "loss": 0.0547, "step": 157230 }, { "epoch": 44.21, "learning_rate": 1.2899134726517353e-05, "loss": 0.0606, "step": 157260 }, { "epoch": 44.22, "learning_rate": 1.2880392340611627e-05, "loss": 0.0454, "step": 157290 }, { "epoch": 44.23, "learning_rate": 1.2861649954705902e-05, "loss": 0.0611, "step": 157320 }, { "epoch": 44.24, "learning_rate": 1.2842907568800174e-05, "loss": 0.0572, "step": 157350 }, { "epoch": 44.25, "learning_rate": 1.2824165182894448e-05, "loss": 0.0582, "step": 157380 }, { "epoch": 44.25, "learning_rate": 1.2805422796988726e-05, "loss": 0.0657, "step": 157410 }, { "epoch": 44.26, "learning_rate": 1.2786680411082998e-05, "loss": 0.0498, "step": 157440 }, { "epoch": 44.27, "learning_rate": 1.2767938025177273e-05, "loss": 0.0617, "step": 157470 }, { "epoch": 44.28, "learning_rate": 1.2749195639271547e-05, "loss": 0.0553, "step": 157500 }, { "epoch": 44.29, "learning_rate": 1.2730453253365821e-05, "loss": 0.0577, "step": 157530 }, { "epoch": 44.3, "learning_rate": 1.2711710867460095e-05, "loss": 0.0607, "step": 157560 }, { "epoch": 44.3, "learning_rate": 1.2692968481554368e-05, "loss": 0.0551, "step": 157590 }, { "epoch": 44.31, "learning_rate": 1.2674226095648645e-05, "loss": 0.0598, "step": 157620 }, { "epoch": 44.32, "learning_rate": 1.265548370974292e-05, "loss": 0.0538, "step": 157650 }, { "epoch": 44.33, "learning_rate": 1.2636741323837192e-05, "loss": 0.0581, "step": 157680 }, { "epoch": 44.34, "learning_rate": 1.2617998937931466e-05, "loss": 0.0622, "step": 157710 }, { "epoch": 44.35, "learning_rate": 1.259925655202574e-05, "loss": 0.0542, "step": 157740 }, { "epoch": 44.35, "learning_rate": 1.2580514166120014e-05, "loss": 0.0617, "step": 157770 }, { "epoch": 44.36, "learning_rate": 1.2561771780214287e-05, "loss": 0.0519, "step": 157800 }, { "epoch": 44.37, "learning_rate": 1.2543029394308561e-05, "loss": 0.0595, "step": 157830 }, { "epoch": 44.38, "learning_rate": 1.2524287008402839e-05, "loss": 0.0653, "step": 157860 }, { "epoch": 44.39, "learning_rate": 1.2505544622497111e-05, "loss": 0.0531, "step": 157890 }, { "epoch": 44.4, "learning_rate": 1.2486802236591385e-05, "loss": 0.0593, "step": 157920 }, { "epoch": 44.41, "learning_rate": 1.246805985068566e-05, "loss": 0.0545, "step": 157950 }, { "epoch": 44.41, "learning_rate": 1.2449317464779934e-05, "loss": 0.0569, "step": 157980 }, { "epoch": 44.42, "learning_rate": 1.2430575078874208e-05, "loss": 0.0627, "step": 158010 }, { "epoch": 44.43, "learning_rate": 1.2411832692968482e-05, "loss": 0.054, "step": 158040 }, { "epoch": 44.44, "learning_rate": 1.2393090307062756e-05, "loss": 0.0552, "step": 158070 }, { "epoch": 44.45, "learning_rate": 1.237434792115703e-05, "loss": 0.0522, "step": 158100 }, { "epoch": 44.46, "learning_rate": 1.2355605535251305e-05, "loss": 0.0571, "step": 158130 }, { "epoch": 44.46, "learning_rate": 1.2336863149345579e-05, "loss": 0.0617, "step": 158160 }, { "epoch": 44.47, "learning_rate": 1.2318120763439853e-05, "loss": 0.054, "step": 158190 }, { "epoch": 44.48, "learning_rate": 1.2299378377534127e-05, "loss": 0.0623, "step": 158220 }, { "epoch": 44.49, "learning_rate": 1.2280635991628401e-05, "loss": 0.0538, "step": 158250 }, { "epoch": 44.5, "learning_rate": 1.2261893605722676e-05, "loss": 0.0541, "step": 158280 }, { "epoch": 44.51, "learning_rate": 1.224315121981695e-05, "loss": 0.0589, "step": 158310 }, { "epoch": 44.51, "learning_rate": 1.2224408833911224e-05, "loss": 0.0503, "step": 158340 }, { "epoch": 44.52, "learning_rate": 1.2205666448005498e-05, "loss": 0.0572, "step": 158370 }, { "epoch": 44.53, "learning_rate": 1.2186924062099772e-05, "loss": 0.0564, "step": 158400 }, { "epoch": 44.54, "learning_rate": 1.2168181676194047e-05, "loss": 0.0558, "step": 158430 }, { "epoch": 44.55, "learning_rate": 1.214943929028832e-05, "loss": 0.0608, "step": 158460 }, { "epoch": 44.56, "learning_rate": 1.2130696904382595e-05, "loss": 0.0498, "step": 158490 }, { "epoch": 44.57, "learning_rate": 1.211195451847687e-05, "loss": 0.0609, "step": 158520 }, { "epoch": 44.57, "learning_rate": 1.2093212132571143e-05, "loss": 0.0531, "step": 158550 }, { "epoch": 44.58, "learning_rate": 1.2074469746665418e-05, "loss": 0.0563, "step": 158580 }, { "epoch": 44.59, "learning_rate": 1.2055727360759692e-05, "loss": 0.0602, "step": 158610 }, { "epoch": 44.6, "learning_rate": 1.2036984974853966e-05, "loss": 0.0506, "step": 158640 }, { "epoch": 44.61, "learning_rate": 1.201824258894824e-05, "loss": 0.0606, "step": 158670 }, { "epoch": 44.62, "learning_rate": 1.1999500203042514e-05, "loss": 0.0543, "step": 158700 }, { "epoch": 44.62, "learning_rate": 1.1980757817136789e-05, "loss": 0.0563, "step": 158730 }, { "epoch": 44.63, "learning_rate": 1.1962015431231063e-05, "loss": 0.066, "step": 158760 }, { "epoch": 44.64, "learning_rate": 1.1943273045325337e-05, "loss": 0.0493, "step": 158790 }, { "epoch": 44.65, "learning_rate": 1.1924530659419611e-05, "loss": 0.0626, "step": 158820 }, { "epoch": 44.66, "learning_rate": 1.1905788273513887e-05, "loss": 0.0517, "step": 158850 }, { "epoch": 44.67, "learning_rate": 1.188704588760816e-05, "loss": 0.0547, "step": 158880 }, { "epoch": 44.68, "learning_rate": 1.1868303501702434e-05, "loss": 0.0585, "step": 158910 }, { "epoch": 44.68, "learning_rate": 1.1849561115796708e-05, "loss": 0.0493, "step": 158940 }, { "epoch": 44.69, "learning_rate": 1.1830818729890982e-05, "loss": 0.0568, "step": 158970 }, { "epoch": 44.7, "learning_rate": 1.1812076343985256e-05, "loss": 0.0549, "step": 159000 }, { "epoch": 44.71, "learning_rate": 1.179333395807953e-05, "loss": 0.0556, "step": 159030 }, { "epoch": 44.72, "learning_rate": 1.1774591572173805e-05, "loss": 0.0627, "step": 159060 }, { "epoch": 44.73, "learning_rate": 1.1755849186268079e-05, "loss": 0.0494, "step": 159090 }, { "epoch": 44.73, "learning_rate": 1.1737106800362353e-05, "loss": 0.0618, "step": 159120 }, { "epoch": 44.74, "learning_rate": 1.1718364414456627e-05, "loss": 0.0573, "step": 159150 }, { "epoch": 44.75, "learning_rate": 1.1699622028550903e-05, "loss": 0.0555, "step": 159180 }, { "epoch": 44.76, "learning_rate": 1.1680879642645176e-05, "loss": 0.0565, "step": 159210 }, { "epoch": 44.77, "learning_rate": 1.166213725673945e-05, "loss": 0.0532, "step": 159240 }, { "epoch": 44.78, "learning_rate": 1.1643394870833724e-05, "loss": 0.0633, "step": 159270 }, { "epoch": 44.78, "learning_rate": 1.1624652484927998e-05, "loss": 0.0493, "step": 159300 }, { "epoch": 44.79, "learning_rate": 1.1605910099022272e-05, "loss": 0.0591, "step": 159330 }, { "epoch": 44.8, "learning_rate": 1.1587167713116547e-05, "loss": 0.0632, "step": 159360 }, { "epoch": 44.81, "learning_rate": 1.1568425327210822e-05, "loss": 0.049, "step": 159390 }, { "epoch": 44.82, "learning_rate": 1.1549682941305095e-05, "loss": 0.0626, "step": 159420 }, { "epoch": 44.83, "learning_rate": 1.1530940555399369e-05, "loss": 0.0528, "step": 159450 }, { "epoch": 44.84, "learning_rate": 1.1512198169493643e-05, "loss": 0.0589, "step": 159480 }, { "epoch": 44.84, "learning_rate": 1.149345578358792e-05, "loss": 0.0589, "step": 159510 }, { "epoch": 44.85, "learning_rate": 1.1474713397682192e-05, "loss": 0.0497, "step": 159540 }, { "epoch": 44.86, "learning_rate": 1.1455971011776466e-05, "loss": 0.0609, "step": 159570 }, { "epoch": 44.87, "learning_rate": 1.1437228625870742e-05, "loss": 0.0542, "step": 159600 }, { "epoch": 44.88, "learning_rate": 1.1418486239965014e-05, "loss": 0.0564, "step": 159630 }, { "epoch": 44.89, "learning_rate": 1.1399743854059288e-05, "loss": 0.0622, "step": 159660 }, { "epoch": 44.89, "learning_rate": 1.1381001468153563e-05, "loss": 0.05, "step": 159690 }, { "epoch": 44.9, "learning_rate": 1.1362259082247839e-05, "loss": 0.059, "step": 159720 }, { "epoch": 44.91, "learning_rate": 1.1343516696342111e-05, "loss": 0.0544, "step": 159750 }, { "epoch": 44.92, "learning_rate": 1.1324774310436385e-05, "loss": 0.0565, "step": 159780 }, { "epoch": 44.93, "learning_rate": 1.1306031924530661e-05, "loss": 0.0603, "step": 159810 }, { "epoch": 44.94, "learning_rate": 1.1287289538624935e-05, "loss": 0.0492, "step": 159840 }, { "epoch": 44.95, "learning_rate": 1.1268547152719208e-05, "loss": 0.0571, "step": 159870 }, { "epoch": 44.95, "learning_rate": 1.1249804766813482e-05, "loss": 0.0561, "step": 159900 }, { "epoch": 44.96, "learning_rate": 1.1231062380907758e-05, "loss": 0.0554, "step": 159930 }, { "epoch": 44.97, "learning_rate": 1.121231999500203e-05, "loss": 0.0617, "step": 159960 }, { "epoch": 44.98, "learning_rate": 1.1193577609096305e-05, "loss": 0.0534, "step": 159990 }, { "epoch": 44.99, "learning_rate": 1.1174835223190579e-05, "loss": 0.0629, "step": 160020 }, { "epoch": 45.0, "learning_rate": 1.1156092837284855e-05, "loss": 0.0559, "step": 160050 }, { "epoch": 45.0, "eval_loss": 0.1769741326570511, "eval_runtime": 534.7373, "eval_samples_per_second": 29.983, "eval_steps_per_second": 0.939, "eval_wer": 0.1232309309022423, "step": 160065 }, { "epoch": 45.0, "learning_rate": 1.1137350451379127e-05, "loss": 0.058, "step": 160080 }, { "epoch": 45.01, "learning_rate": 1.1118608065473401e-05, "loss": 0.0529, "step": 160110 }, { "epoch": 45.02, "learning_rate": 1.1099865679567677e-05, "loss": 0.0541, "step": 160140 }, { "epoch": 45.03, "learning_rate": 1.108112329366195e-05, "loss": 0.0572, "step": 160170 }, { "epoch": 45.04, "learning_rate": 1.1062380907756224e-05, "loss": 0.0506, "step": 160200 }, { "epoch": 45.05, "learning_rate": 1.1043638521850498e-05, "loss": 0.057, "step": 160230 }, { "epoch": 45.05, "learning_rate": 1.1024896135944774e-05, "loss": 0.0572, "step": 160260 }, { "epoch": 45.06, "learning_rate": 1.1006153750039046e-05, "loss": 0.0508, "step": 160290 }, { "epoch": 45.07, "learning_rate": 1.098741136413332e-05, "loss": 0.0617, "step": 160320 }, { "epoch": 45.08, "learning_rate": 1.0968668978227597e-05, "loss": 0.0488, "step": 160350 }, { "epoch": 45.09, "learning_rate": 1.094992659232187e-05, "loss": 0.0569, "step": 160380 }, { "epoch": 45.1, "learning_rate": 1.0931184206416143e-05, "loss": 0.0547, "step": 160410 }, { "epoch": 45.11, "learning_rate": 1.0912441820510417e-05, "loss": 0.0544, "step": 160440 }, { "epoch": 45.11, "learning_rate": 1.0893699434604693e-05, "loss": 0.0601, "step": 160470 }, { "epoch": 45.12, "learning_rate": 1.0874957048698966e-05, "loss": 0.0528, "step": 160500 }, { "epoch": 45.13, "learning_rate": 1.085621466279324e-05, "loss": 0.0533, "step": 160530 }, { "epoch": 45.14, "learning_rate": 1.0838097023084372e-05, "loss": 0.0542, "step": 160560 }, { "epoch": 45.15, "learning_rate": 1.0819354637178647e-05, "loss": 0.0509, "step": 160590 }, { "epoch": 45.16, "learning_rate": 1.0800612251272921e-05, "loss": 0.0604, "step": 160620 }, { "epoch": 45.16, "learning_rate": 1.0781869865367195e-05, "loss": 0.0529, "step": 160650 }, { "epoch": 45.17, "learning_rate": 1.0763752225658328e-05, "loss": 0.0732, "step": 160680 }, { "epoch": 45.18, "learning_rate": 1.0745009839752602e-05, "loss": 0.0576, "step": 160710 }, { "epoch": 45.19, "learning_rate": 1.0726267453846874e-05, "loss": 0.0511, "step": 160740 }, { "epoch": 45.2, "learning_rate": 1.0707525067941148e-05, "loss": 0.0603, "step": 160770 }, { "epoch": 45.21, "learning_rate": 1.0688782682035424e-05, "loss": 0.0513, "step": 160800 }, { "epoch": 45.22, "learning_rate": 1.0670040296129699e-05, "loss": 0.0604, "step": 160830 }, { "epoch": 45.22, "learning_rate": 1.0651297910223971e-05, "loss": 0.0523, "step": 160860 }, { "epoch": 45.23, "learning_rate": 1.0632555524318247e-05, "loss": 0.0555, "step": 160890 }, { "epoch": 45.24, "learning_rate": 1.0613813138412521e-05, "loss": 0.0621, "step": 160920 }, { "epoch": 45.25, "learning_rate": 1.0595070752506794e-05, "loss": 0.0495, "step": 160950 }, { "epoch": 45.26, "learning_rate": 1.0576328366601068e-05, "loss": 0.0579, "step": 160980 }, { "epoch": 45.27, "learning_rate": 1.0557585980695344e-05, "loss": 0.0576, "step": 161010 }, { "epoch": 45.27, "learning_rate": 1.0538843594789618e-05, "loss": 0.054, "step": 161040 }, { "epoch": 45.28, "learning_rate": 1.052010120888389e-05, "loss": 0.0584, "step": 161070 }, { "epoch": 45.29, "learning_rate": 1.0501358822978166e-05, "loss": 0.0493, "step": 161100 }, { "epoch": 45.3, "learning_rate": 1.048261643707244e-05, "loss": 0.0602, "step": 161130 }, { "epoch": 45.31, "learning_rate": 1.0463874051166715e-05, "loss": 0.0564, "step": 161160 }, { "epoch": 45.32, "learning_rate": 1.0445131665260987e-05, "loss": 0.0517, "step": 161190 }, { "epoch": 45.32, "learning_rate": 1.0426389279355263e-05, "loss": 0.0614, "step": 161220 }, { "epoch": 45.33, "learning_rate": 1.0407646893449537e-05, "loss": 0.0488, "step": 161250 }, { "epoch": 45.34, "learning_rate": 1.038890450754381e-05, "loss": 0.0553, "step": 161280 }, { "epoch": 45.35, "learning_rate": 1.0370162121638086e-05, "loss": 0.058, "step": 161310 }, { "epoch": 45.36, "learning_rate": 1.035141973573236e-05, "loss": 0.0557, "step": 161340 }, { "epoch": 45.37, "learning_rate": 1.0332677349826634e-05, "loss": 0.061, "step": 161370 }, { "epoch": 45.38, "learning_rate": 1.0313934963920906e-05, "loss": 0.0514, "step": 161400 }, { "epoch": 45.38, "learning_rate": 1.029581732421204e-05, "loss": 0.0803, "step": 161430 }, { "epoch": 45.39, "learning_rate": 1.0277074938306313e-05, "loss": 0.0538, "step": 161460 }, { "epoch": 45.4, "learning_rate": 1.0258332552400587e-05, "loss": 0.0548, "step": 161490 }, { "epoch": 45.41, "learning_rate": 1.0239590166494863e-05, "loss": 0.0611, "step": 161520 }, { "epoch": 45.42, "learning_rate": 1.0220847780589136e-05, "loss": 0.0488, "step": 161550 }, { "epoch": 45.43, "learning_rate": 1.020210539468341e-05, "loss": 0.0586, "step": 161580 }, { "epoch": 45.43, "learning_rate": 1.0183363008777684e-05, "loss": 0.0536, "step": 161610 }, { "epoch": 45.44, "learning_rate": 1.016462062287196e-05, "loss": 0.0543, "step": 161640 }, { "epoch": 45.45, "learning_rate": 1.0145878236966232e-05, "loss": 0.0645, "step": 161670 }, { "epoch": 45.46, "learning_rate": 1.0127135851060507e-05, "loss": 0.0513, "step": 161700 }, { "epoch": 45.47, "learning_rate": 1.010839346515478e-05, "loss": 0.0576, "step": 161730 }, { "epoch": 45.48, "learning_rate": 1.0089651079249057e-05, "loss": 0.0545, "step": 161760 }, { "epoch": 45.48, "learning_rate": 1.007090869334333e-05, "loss": 0.0539, "step": 161790 }, { "epoch": 45.49, "learning_rate": 1.0052166307437603e-05, "loss": 0.0629, "step": 161820 }, { "epoch": 45.5, "learning_rate": 1.003342392153188e-05, "loss": 0.0551, "step": 161850 }, { "epoch": 45.51, "learning_rate": 1.0014681535626152e-05, "loss": 0.0568, "step": 161880 }, { "epoch": 45.52, "learning_rate": 9.995939149720426e-06, "loss": 0.0542, "step": 161910 }, { "epoch": 45.53, "learning_rate": 9.9771967638147e-06, "loss": 0.0511, "step": 161940 }, { "epoch": 45.54, "learning_rate": 9.958454377908976e-06, "loss": 0.0594, "step": 161970 }, { "epoch": 45.54, "learning_rate": 9.939711992003249e-06, "loss": 0.0499, "step": 162000 }, { "epoch": 45.55, "learning_rate": 9.920969606097523e-06, "loss": 0.0568, "step": 162030 }, { "epoch": 45.56, "learning_rate": 9.902227220191799e-06, "loss": 0.0549, "step": 162060 }, { "epoch": 45.57, "learning_rate": 9.883484834286071e-06, "loss": 0.0536, "step": 162090 }, { "epoch": 45.58, "learning_rate": 9.864742448380345e-06, "loss": 0.0638, "step": 162120 }, { "epoch": 45.59, "learning_rate": 9.84600006247462e-06, "loss": 0.0486, "step": 162150 }, { "epoch": 45.59, "learning_rate": 9.827257676568895e-06, "loss": 0.058, "step": 162180 }, { "epoch": 45.6, "learning_rate": 9.808515290663168e-06, "loss": 0.0561, "step": 162210 }, { "epoch": 45.61, "learning_rate": 9.789772904757442e-06, "loss": 0.0528, "step": 162240 }, { "epoch": 45.62, "learning_rate": 9.771030518851718e-06, "loss": 0.0583, "step": 162270 }, { "epoch": 45.63, "learning_rate": 9.752288132945992e-06, "loss": 0.0503, "step": 162300 }, { "epoch": 45.64, "learning_rate": 9.733545747040265e-06, "loss": 0.0634, "step": 162330 }, { "epoch": 45.65, "learning_rate": 9.714803361134539e-06, "loss": 0.0523, "step": 162360 }, { "epoch": 45.65, "learning_rate": 9.696060975228815e-06, "loss": 0.057, "step": 162390 }, { "epoch": 45.66, "learning_rate": 9.677318589323087e-06, "loss": 0.0641, "step": 162420 }, { "epoch": 45.67, "learning_rate": 9.658576203417361e-06, "loss": 0.0489, "step": 162450 }, { "epoch": 45.68, "learning_rate": 9.639833817511636e-06, "loss": 0.0546, "step": 162480 }, { "epoch": 45.69, "learning_rate": 9.621091431605911e-06, "loss": 0.0549, "step": 162510 }, { "epoch": 45.7, "learning_rate": 9.602349045700184e-06, "loss": 0.0508, "step": 162540 }, { "epoch": 45.7, "learning_rate": 9.583606659794458e-06, "loss": 0.0595, "step": 162570 }, { "epoch": 45.71, "learning_rate": 9.564864273888734e-06, "loss": 0.0511, "step": 162600 }, { "epoch": 45.72, "learning_rate": 9.546121887983008e-06, "loss": 0.0605, "step": 162630 }, { "epoch": 45.73, "learning_rate": 9.52737950207728e-06, "loss": 0.0532, "step": 162660 }, { "epoch": 45.74, "learning_rate": 9.508637116171555e-06, "loss": 0.0575, "step": 162690 }, { "epoch": 45.75, "learning_rate": 9.48989473026583e-06, "loss": 0.066, "step": 162720 }, { "epoch": 45.75, "learning_rate": 9.471152344360103e-06, "loss": 0.0477, "step": 162750 }, { "epoch": 45.76, "learning_rate": 9.452409958454378e-06, "loss": 0.0579, "step": 162780 }, { "epoch": 45.77, "learning_rate": 9.433667572548653e-06, "loss": 0.058, "step": 162810 }, { "epoch": 45.78, "learning_rate": 9.414925186642928e-06, "loss": 0.0591, "step": 162840 }, { "epoch": 45.79, "learning_rate": 9.3961828007372e-06, "loss": 0.0565, "step": 162870 }, { "epoch": 45.8, "learning_rate": 9.377440414831474e-06, "loss": 0.048, "step": 162900 }, { "epoch": 45.81, "learning_rate": 9.35869802892575e-06, "loss": 0.0537, "step": 162930 }, { "epoch": 45.81, "learning_rate": 9.339955643020024e-06, "loss": 0.0558, "step": 162960 }, { "epoch": 45.82, "learning_rate": 9.321213257114297e-06, "loss": 0.057, "step": 162990 }, { "epoch": 45.83, "learning_rate": 9.302470871208573e-06, "loss": 0.0584, "step": 163020 }, { "epoch": 45.84, "learning_rate": 9.283728485302847e-06, "loss": 0.0501, "step": 163050 }, { "epoch": 45.85, "learning_rate": 9.26498609939712e-06, "loss": 0.0561, "step": 163080 }, { "epoch": 45.86, "learning_rate": 9.246243713491394e-06, "loss": 0.0555, "step": 163110 }, { "epoch": 45.86, "learning_rate": 9.22750132758567e-06, "loss": 0.053, "step": 163140 }, { "epoch": 45.87, "learning_rate": 9.208758941679944e-06, "loss": 0.0616, "step": 163170 }, { "epoch": 45.88, "learning_rate": 9.190016555774216e-06, "loss": 0.0491, "step": 163200 }, { "epoch": 45.89, "learning_rate": 9.171274169868492e-06, "loss": 0.0592, "step": 163230 }, { "epoch": 45.9, "learning_rate": 9.152531783962766e-06, "loss": 0.0538, "step": 163260 }, { "epoch": 45.91, "learning_rate": 9.13378939805704e-06, "loss": 0.0526, "step": 163290 }, { "epoch": 45.91, "learning_rate": 9.115047012151313e-06, "loss": 0.0579, "step": 163320 }, { "epoch": 45.92, "learning_rate": 9.096304626245589e-06, "loss": 0.0513, "step": 163350 }, { "epoch": 45.93, "learning_rate": 9.077562240339863e-06, "loss": 0.0617, "step": 163380 }, { "epoch": 45.94, "learning_rate": 9.058819854434136e-06, "loss": 0.0545, "step": 163410 }, { "epoch": 45.95, "learning_rate": 9.04007746852841e-06, "loss": 0.0522, "step": 163440 }, { "epoch": 45.96, "learning_rate": 9.021335082622686e-06, "loss": 0.063, "step": 163470 }, { "epoch": 45.97, "learning_rate": 9.00259269671696e-06, "loss": 0.0515, "step": 163500 }, { "epoch": 45.97, "learning_rate": 8.983850310811232e-06, "loss": 0.0603, "step": 163530 }, { "epoch": 45.98, "learning_rate": 8.965107924905508e-06, "loss": 0.052, "step": 163560 }, { "epoch": 45.99, "learning_rate": 8.946365538999782e-06, "loss": 0.0519, "step": 163590 }, { "epoch": 46.0, "learning_rate": 8.927623153094057e-06, "loss": 0.0557, "step": 163620 }, { "epoch": 46.0, "eval_loss": 0.1765855848789215, "eval_runtime": 511.5794, "eval_samples_per_second": 31.34, "eval_steps_per_second": 0.981, "eval_wer": 0.12310127877935938, "step": 163622 }, { "epoch": 46.01, "learning_rate": 8.908880767188329e-06, "loss": 0.0524, "step": 163650 }, { "epoch": 46.02, "learning_rate": 8.890138381282605e-06, "loss": 0.0607, "step": 163680 }, { "epoch": 46.02, "learning_rate": 8.871395995376879e-06, "loss": 0.0514, "step": 163710 }, { "epoch": 46.03, "learning_rate": 8.852653609471152e-06, "loss": 0.0511, "step": 163740 }, { "epoch": 46.04, "learning_rate": 8.833911223565428e-06, "loss": 0.0576, "step": 163770 }, { "epoch": 46.05, "learning_rate": 8.815168837659702e-06, "loss": 0.0529, "step": 163800 }, { "epoch": 46.06, "learning_rate": 8.796426451753976e-06, "loss": 0.0597, "step": 163830 }, { "epoch": 46.07, "learning_rate": 8.777684065848248e-06, "loss": 0.0501, "step": 163860 }, { "epoch": 46.08, "learning_rate": 8.758941679942524e-06, "loss": 0.0592, "step": 163890 }, { "epoch": 46.08, "learning_rate": 8.740199294036798e-06, "loss": 0.0547, "step": 163920 }, { "epoch": 46.09, "learning_rate": 8.721456908131071e-06, "loss": 0.0494, "step": 163950 }, { "epoch": 46.1, "learning_rate": 8.702714522225347e-06, "loss": 0.0599, "step": 163980 }, { "epoch": 46.11, "learning_rate": 8.683972136319621e-06, "loss": 0.0494, "step": 164010 }, { "epoch": 46.12, "learning_rate": 8.665229750413895e-06, "loss": 0.0565, "step": 164040 }, { "epoch": 46.13, "learning_rate": 8.646487364508168e-06, "loss": 0.057, "step": 164070 }, { "epoch": 46.13, "learning_rate": 8.627744978602444e-06, "loss": 0.0481, "step": 164100 }, { "epoch": 46.14, "learning_rate": 8.609002592696718e-06, "loss": 0.0621, "step": 164130 }, { "epoch": 46.15, "learning_rate": 8.590260206790992e-06, "loss": 0.0558, "step": 164160 }, { "epoch": 46.16, "learning_rate": 8.571517820885266e-06, "loss": 0.0536, "step": 164190 }, { "epoch": 46.17, "learning_rate": 8.55277543497954e-06, "loss": 0.0584, "step": 164220 }, { "epoch": 46.18, "learning_rate": 8.534033049073815e-06, "loss": 0.0535, "step": 164250 }, { "epoch": 46.18, "learning_rate": 8.515290663168087e-06, "loss": 0.0599, "step": 164280 }, { "epoch": 46.19, "learning_rate": 8.496548277262363e-06, "loss": 0.0533, "step": 164310 }, { "epoch": 46.2, "learning_rate": 8.477805891356637e-06, "loss": 0.0561, "step": 164340 }, { "epoch": 46.21, "learning_rate": 8.459063505450911e-06, "loss": 0.0579, "step": 164370 }, { "epoch": 46.22, "learning_rate": 8.440321119545184e-06, "loss": 0.0515, "step": 164400 }, { "epoch": 46.23, "learning_rate": 8.42157873363946e-06, "loss": 0.0577, "step": 164430 }, { "epoch": 46.24, "learning_rate": 8.402836347733734e-06, "loss": 0.0515, "step": 164460 }, { "epoch": 46.24, "learning_rate": 8.384093961828008e-06, "loss": 0.0561, "step": 164490 }, { "epoch": 46.25, "learning_rate": 8.365351575922282e-06, "loss": 0.058, "step": 164520 }, { "epoch": 46.26, "learning_rate": 8.346609190016556e-06, "loss": 0.0565, "step": 164550 }, { "epoch": 46.27, "learning_rate": 8.32786680411083e-06, "loss": 0.0569, "step": 164580 }, { "epoch": 46.28, "learning_rate": 8.309124418205103e-06, "loss": 0.0501, "step": 164610 }, { "epoch": 46.29, "learning_rate": 8.290382032299379e-06, "loss": 0.0552, "step": 164640 }, { "epoch": 46.29, "learning_rate": 8.271639646393653e-06, "loss": 0.0579, "step": 164670 }, { "epoch": 46.3, "learning_rate": 8.252897260487927e-06, "loss": 0.053, "step": 164700 }, { "epoch": 46.31, "learning_rate": 8.234154874582202e-06, "loss": 0.0593, "step": 164730 }, { "epoch": 46.32, "learning_rate": 8.215412488676476e-06, "loss": 0.0569, "step": 164760 }, { "epoch": 46.33, "learning_rate": 8.19667010277075e-06, "loss": 0.0564, "step": 164790 }, { "epoch": 46.34, "learning_rate": 8.177927716865024e-06, "loss": 0.0555, "step": 164820 }, { "epoch": 46.35, "learning_rate": 8.159185330959298e-06, "loss": 0.0488, "step": 164850 }, { "epoch": 46.35, "learning_rate": 8.140442945053573e-06, "loss": 0.0574, "step": 164880 }, { "epoch": 46.36, "learning_rate": 8.121700559147847e-06, "loss": 0.0524, "step": 164910 }, { "epoch": 46.37, "learning_rate": 8.102958173242121e-06, "loss": 0.0555, "step": 164940 }, { "epoch": 46.38, "learning_rate": 8.084215787336395e-06, "loss": 0.057, "step": 164970 }, { "epoch": 46.39, "learning_rate": 8.06547340143067e-06, "loss": 0.0489, "step": 165000 }, { "epoch": 46.4, "learning_rate": 8.046731015524944e-06, "loss": 0.0597, "step": 165030 }, { "epoch": 46.4, "learning_rate": 8.027988629619218e-06, "loss": 0.0496, "step": 165060 }, { "epoch": 46.41, "learning_rate": 8.009246243713492e-06, "loss": 0.0549, "step": 165090 }, { "epoch": 46.42, "learning_rate": 7.990503857807766e-06, "loss": 0.0574, "step": 165120 }, { "epoch": 46.43, "learning_rate": 7.97176147190204e-06, "loss": 0.0487, "step": 165150 }, { "epoch": 46.44, "learning_rate": 7.953019085996314e-06, "loss": 0.0583, "step": 165180 }, { "epoch": 46.45, "learning_rate": 7.934276700090589e-06, "loss": 0.0495, "step": 165210 }, { "epoch": 46.45, "learning_rate": 7.915534314184863e-06, "loss": 0.0556, "step": 165240 }, { "epoch": 46.46, "learning_rate": 7.896791928279137e-06, "loss": 0.0554, "step": 165270 }, { "epoch": 46.47, "learning_rate": 7.878049542373411e-06, "loss": 0.0541, "step": 165300 }, { "epoch": 46.48, "learning_rate": 7.859307156467685e-06, "loss": 0.0556, "step": 165330 }, { "epoch": 46.49, "learning_rate": 7.84056477056196e-06, "loss": 0.055, "step": 165360 }, { "epoch": 46.5, "learning_rate": 7.821822384656234e-06, "loss": 0.058, "step": 165390 }, { "epoch": 46.51, "learning_rate": 7.803079998750508e-06, "loss": 0.055, "step": 165420 }, { "epoch": 46.51, "learning_rate": 7.784337612844782e-06, "loss": 0.0521, "step": 165450 }, { "epoch": 46.52, "learning_rate": 7.765595226939056e-06, "loss": 0.0582, "step": 165480 }, { "epoch": 46.53, "learning_rate": 7.74685284103333e-06, "loss": 0.0499, "step": 165510 }, { "epoch": 46.54, "learning_rate": 7.728110455127605e-06, "loss": 0.0502, "step": 165540 }, { "epoch": 46.55, "learning_rate": 7.709368069221879e-06, "loss": 0.0574, "step": 165570 }, { "epoch": 46.56, "learning_rate": 7.690625683316153e-06, "loss": 0.0521, "step": 165600 }, { "epoch": 46.56, "learning_rate": 7.671883297410427e-06, "loss": 0.0585, "step": 165630 }, { "epoch": 46.57, "learning_rate": 7.653140911504702e-06, "loss": 0.0479, "step": 165660 }, { "epoch": 46.58, "learning_rate": 7.634398525598976e-06, "loss": 0.0542, "step": 165690 }, { "epoch": 46.59, "learning_rate": 7.61565613969325e-06, "loss": 0.0586, "step": 165720 }, { "epoch": 46.6, "learning_rate": 7.596913753787524e-06, "loss": 0.0526, "step": 165750 }, { "epoch": 46.61, "learning_rate": 7.5781713678817974e-06, "loss": 0.0595, "step": 165780 }, { "epoch": 46.62, "learning_rate": 7.559428981976073e-06, "loss": 0.0525, "step": 165810 }, { "epoch": 46.62, "learning_rate": 7.540686596070347e-06, "loss": 0.0523, "step": 165840 }, { "epoch": 46.63, "learning_rate": 7.521944210164621e-06, "loss": 0.0541, "step": 165870 }, { "epoch": 46.64, "learning_rate": 7.503201824258896e-06, "loss": 0.0512, "step": 165900 }, { "epoch": 46.65, "learning_rate": 7.484459438353169e-06, "loss": 0.0587, "step": 165930 }, { "epoch": 46.66, "learning_rate": 7.4657170524474434e-06, "loss": 0.0512, "step": 165960 }, { "epoch": 46.67, "learning_rate": 7.446974666541718e-06, "loss": 0.0546, "step": 165990 }, { "epoch": 46.67, "learning_rate": 7.428232280635993e-06, "loss": 0.0558, "step": 166020 }, { "epoch": 46.68, "learning_rate": 7.409489894730266e-06, "loss": 0.0516, "step": 166050 }, { "epoch": 46.69, "learning_rate": 7.39074750882454e-06, "loss": 0.0595, "step": 166080 }, { "epoch": 46.7, "learning_rate": 7.3720051229188135e-06, "loss": 0.0517, "step": 166110 }, { "epoch": 46.71, "learning_rate": 7.353262737013089e-06, "loss": 0.0557, "step": 166140 }, { "epoch": 46.72, "learning_rate": 7.334520351107363e-06, "loss": 0.0584, "step": 166170 }, { "epoch": 46.72, "learning_rate": 7.315777965201637e-06, "loss": 0.0535, "step": 166200 }, { "epoch": 46.73, "learning_rate": 7.297035579295912e-06, "loss": 0.0629, "step": 166230 }, { "epoch": 46.74, "learning_rate": 7.278293193390185e-06, "loss": 0.0497, "step": 166260 }, { "epoch": 46.75, "learning_rate": 7.2595508074844595e-06, "loss": 0.0563, "step": 166290 }, { "epoch": 46.76, "learning_rate": 7.240808421578734e-06, "loss": 0.059, "step": 166320 }, { "epoch": 46.77, "learning_rate": 7.222066035673009e-06, "loss": 0.0484, "step": 166350 }, { "epoch": 46.78, "learning_rate": 7.203323649767282e-06, "loss": 0.0602, "step": 166380 }, { "epoch": 46.78, "learning_rate": 7.184581263861556e-06, "loss": 0.0503, "step": 166410 }, { "epoch": 46.79, "learning_rate": 7.165838877955831e-06, "loss": 0.0563, "step": 166440 }, { "epoch": 46.8, "learning_rate": 7.1470964920501055e-06, "loss": 0.0559, "step": 166470 }, { "epoch": 46.81, "learning_rate": 7.128354106144379e-06, "loss": 0.0509, "step": 166500 }, { "epoch": 46.82, "learning_rate": 7.109611720238653e-06, "loss": 0.0609, "step": 166530 }, { "epoch": 46.83, "learning_rate": 7.090869334332928e-06, "loss": 0.0539, "step": 166560 }, { "epoch": 46.83, "learning_rate": 7.0721269484272014e-06, "loss": 0.0547, "step": 166590 }, { "epoch": 46.84, "learning_rate": 7.053384562521476e-06, "loss": 0.0566, "step": 166620 }, { "epoch": 46.85, "learning_rate": 7.034642176615751e-06, "loss": 0.0474, "step": 166650 }, { "epoch": 46.86, "learning_rate": 7.015899790710025e-06, "loss": 0.0596, "step": 166680 }, { "epoch": 46.87, "learning_rate": 6.997157404804298e-06, "loss": 0.0503, "step": 166710 }, { "epoch": 46.88, "learning_rate": 6.978415018898572e-06, "loss": 0.0583, "step": 166740 }, { "epoch": 46.88, "learning_rate": 6.959672632992847e-06, "loss": 0.0577, "step": 166770 }, { "epoch": 46.89, "learning_rate": 6.940930247087122e-06, "loss": 0.0511, "step": 166800 }, { "epoch": 46.9, "learning_rate": 6.922187861181395e-06, "loss": 0.0559, "step": 166830 }, { "epoch": 46.91, "learning_rate": 6.90344547527567e-06, "loss": 0.0507, "step": 166860 }, { "epoch": 46.92, "learning_rate": 6.884703089369944e-06, "loss": 0.0565, "step": 166890 }, { "epoch": 46.93, "learning_rate": 6.8659607034642175e-06, "loss": 0.0549, "step": 166920 }, { "epoch": 46.94, "learning_rate": 6.847218317558492e-06, "loss": 0.0536, "step": 166950 }, { "epoch": 46.94, "learning_rate": 6.828475931652767e-06, "loss": 0.0589, "step": 166980 }, { "epoch": 46.95, "learning_rate": 6.809733545747041e-06, "loss": 0.0529, "step": 167010 }, { "epoch": 46.96, "learning_rate": 6.790991159841314e-06, "loss": 0.055, "step": 167040 }, { "epoch": 46.97, "learning_rate": 6.7722487739355885e-06, "loss": 0.0593, "step": 167070 }, { "epoch": 46.98, "learning_rate": 6.7535063880298635e-06, "loss": 0.0528, "step": 167100 }, { "epoch": 46.99, "learning_rate": 6.734764002124138e-06, "loss": 0.0577, "step": 167130 }, { "epoch": 46.99, "learning_rate": 6.716021616218411e-06, "loss": 0.0521, "step": 167160 }, { "epoch": 47.0, "eval_loss": 0.17507979273796082, "eval_runtime": 537.6874, "eval_samples_per_second": 29.818, "eval_steps_per_second": 0.934, "eval_wer": 0.12198900004094278, "step": 167179 }, { "epoch": 47.0, "learning_rate": 6.697279230312686e-06, "loss": 0.0557, "step": 167190 }, { "epoch": 47.01, "learning_rate": 6.67853684440696e-06, "loss": 0.0514, "step": 167220 }, { "epoch": 47.02, "learning_rate": 6.659794458501234e-06, "loss": 0.0556, "step": 167250 }, { "epoch": 47.03, "learning_rate": 6.641052072595508e-06, "loss": 0.0593, "step": 167280 }, { "epoch": 47.04, "learning_rate": 6.622309686689783e-06, "loss": 0.0473, "step": 167310 }, { "epoch": 47.05, "learning_rate": 6.603567300784057e-06, "loss": 0.0545, "step": 167340 }, { "epoch": 47.05, "learning_rate": 6.58482491487833e-06, "loss": 0.0525, "step": 167370 }, { "epoch": 47.06, "learning_rate": 6.5660825289726054e-06, "loss": 0.0552, "step": 167400 }, { "epoch": 47.07, "learning_rate": 6.54734014306688e-06, "loss": 0.0604, "step": 167430 }, { "epoch": 47.08, "learning_rate": 6.528597757161154e-06, "loss": 0.0467, "step": 167460 }, { "epoch": 47.09, "learning_rate": 6.509855371255427e-06, "loss": 0.0604, "step": 167490 }, { "epoch": 47.1, "learning_rate": 6.491112985349702e-06, "loss": 0.0526, "step": 167520 }, { "epoch": 47.1, "learning_rate": 6.472995345640834e-06, "loss": 0.0562, "step": 167550 }, { "epoch": 47.11, "learning_rate": 6.454252959735107e-06, "loss": 0.0605, "step": 167580 }, { "epoch": 47.12, "learning_rate": 6.435510573829383e-06, "loss": 0.049, "step": 167610 }, { "epoch": 47.13, "learning_rate": 6.416768187923656e-06, "loss": 0.0584, "step": 167640 }, { "epoch": 47.14, "learning_rate": 6.398025802017931e-06, "loss": 0.0491, "step": 167670 }, { "epoch": 47.15, "learning_rate": 6.379283416112204e-06, "loss": 0.058, "step": 167700 }, { "epoch": 47.15, "learning_rate": 6.360541030206479e-06, "loss": 0.0603, "step": 167730 }, { "epoch": 47.16, "learning_rate": 6.341798644300753e-06, "loss": 0.0488, "step": 167760 }, { "epoch": 47.17, "learning_rate": 6.323056258395027e-06, "loss": 0.0544, "step": 167790 }, { "epoch": 47.18, "learning_rate": 6.304313872489301e-06, "loss": 0.0517, "step": 167820 }, { "epoch": 47.19, "learning_rate": 6.285571486583576e-06, "loss": 0.0545, "step": 167850 }, { "epoch": 47.2, "learning_rate": 6.267453846874707e-06, "loss": 0.0571, "step": 167880 }, { "epoch": 47.21, "learning_rate": 6.248711460968982e-06, "loss": 0.0485, "step": 167910 }, { "epoch": 47.21, "learning_rate": 6.229969075063256e-06, "loss": 0.0601, "step": 167940 }, { "epoch": 47.22, "learning_rate": 6.21122668915753e-06, "loss": 0.052, "step": 167970 }, { "epoch": 47.23, "learning_rate": 6.192484303251804e-06, "loss": 0.0539, "step": 168000 }, { "epoch": 47.24, "learning_rate": 6.173741917346078e-06, "loss": 0.0597, "step": 168030 }, { "epoch": 47.25, "learning_rate": 6.1549995314403526e-06, "loss": 0.0451, "step": 168060 }, { "epoch": 47.26, "learning_rate": 6.136257145534627e-06, "loss": 0.0548, "step": 168090 }, { "epoch": 47.26, "learning_rate": 6.117514759628901e-06, "loss": 0.0492, "step": 168120 }, { "epoch": 47.27, "learning_rate": 6.098772373723175e-06, "loss": 0.0506, "step": 168150 }, { "epoch": 47.28, "learning_rate": 6.080029987817449e-06, "loss": 0.0577, "step": 168180 }, { "epoch": 47.29, "learning_rate": 6.0612876019117235e-06, "loss": 0.0476, "step": 168210 }, { "epoch": 47.3, "learning_rate": 6.042545216005998e-06, "loss": 0.0573, "step": 168240 }, { "epoch": 47.31, "learning_rate": 6.023802830100272e-06, "loss": 0.05, "step": 168270 }, { "epoch": 47.32, "learning_rate": 6.005060444194546e-06, "loss": 0.0559, "step": 168300 }, { "epoch": 47.32, "learning_rate": 5.986318058288821e-06, "loss": 0.058, "step": 168330 }, { "epoch": 47.33, "learning_rate": 5.9675756723830945e-06, "loss": 0.0469, "step": 168360 }, { "epoch": 47.34, "learning_rate": 5.9488332864773695e-06, "loss": 0.0583, "step": 168390 }, { "epoch": 47.35, "learning_rate": 5.930090900571643e-06, "loss": 0.0507, "step": 168420 }, { "epoch": 47.36, "learning_rate": 5.911348514665917e-06, "loss": 0.0551, "step": 168450 }, { "epoch": 47.37, "learning_rate": 5.892606128760191e-06, "loss": 0.0633, "step": 168480 }, { "epoch": 47.37, "learning_rate": 5.873863742854465e-06, "loss": 0.0474, "step": 168510 }, { "epoch": 47.38, "learning_rate": 5.85512135694874e-06, "loss": 0.0554, "step": 168540 }, { "epoch": 47.39, "learning_rate": 5.836378971043014e-06, "loss": 0.0541, "step": 168570 }, { "epoch": 47.4, "learning_rate": 5.817636585137289e-06, "loss": 0.0513, "step": 168600 }, { "epoch": 47.41, "learning_rate": 5.798894199231562e-06, "loss": 0.0595, "step": 168630 }, { "epoch": 47.42, "learning_rate": 5.780151813325837e-06, "loss": 0.0474, "step": 168660 }, { "epoch": 47.42, "learning_rate": 5.7614094274201106e-06, "loss": 0.0535, "step": 168690 }, { "epoch": 47.43, "learning_rate": 5.742667041514385e-06, "loss": 0.052, "step": 168720 }, { "epoch": 47.44, "learning_rate": 5.723924655608659e-06, "loss": 0.0532, "step": 168750 }, { "epoch": 47.45, "learning_rate": 5.705182269702933e-06, "loss": 0.0568, "step": 168780 }, { "epoch": 47.46, "learning_rate": 5.686439883797208e-06, "loss": 0.0495, "step": 168810 }, { "epoch": 47.47, "learning_rate": 5.6676974978914815e-06, "loss": 0.0593, "step": 168840 }, { "epoch": 47.48, "learning_rate": 5.6489551119857566e-06, "loss": 0.0527, "step": 168870 }, { "epoch": 47.48, "learning_rate": 5.63021272608003e-06, "loss": 0.0544, "step": 168900 }, { "epoch": 47.49, "learning_rate": 5.611470340174305e-06, "loss": 0.061, "step": 168930 }, { "epoch": 47.5, "learning_rate": 5.592727954268578e-06, "loss": 0.0474, "step": 168960 }, { "epoch": 47.51, "learning_rate": 5.573985568362853e-06, "loss": 0.0632, "step": 168990 }, { "epoch": 47.52, "learning_rate": 5.555243182457127e-06, "loss": 0.0534, "step": 169020 }, { "epoch": 47.53, "learning_rate": 5.536500796551401e-06, "loss": 0.0547, "step": 169050 }, { "epoch": 47.53, "learning_rate": 5.517758410645676e-06, "loss": 0.0556, "step": 169080 }, { "epoch": 47.54, "learning_rate": 5.499016024739949e-06, "loss": 0.0489, "step": 169110 }, { "epoch": 47.55, "learning_rate": 5.480273638834224e-06, "loss": 0.0583, "step": 169140 }, { "epoch": 47.56, "learning_rate": 5.461531252928498e-06, "loss": 0.0521, "step": 169170 }, { "epoch": 47.57, "learning_rate": 5.442788867022773e-06, "loss": 0.0528, "step": 169200 }, { "epoch": 47.58, "learning_rate": 5.424046481117046e-06, "loss": 0.0625, "step": 169230 }, { "epoch": 47.58, "learning_rate": 5.405304095211321e-06, "loss": 0.0453, "step": 169260 }, { "epoch": 47.59, "learning_rate": 5.386561709305595e-06, "loss": 0.0594, "step": 169290 }, { "epoch": 47.6, "learning_rate": 5.367819323399869e-06, "loss": 0.0507, "step": 169320 }, { "epoch": 47.61, "learning_rate": 5.349076937494144e-06, "loss": 0.0533, "step": 169350 }, { "epoch": 47.62, "learning_rate": 5.330334551588417e-06, "loss": 0.0618, "step": 169380 }, { "epoch": 47.63, "learning_rate": 5.311592165682692e-06, "loss": 0.0491, "step": 169410 }, { "epoch": 47.64, "learning_rate": 5.292849779776965e-06, "loss": 0.0605, "step": 169440 }, { "epoch": 47.64, "learning_rate": 5.27410739387124e-06, "loss": 0.0532, "step": 169470 }, { "epoch": 47.65, "learning_rate": 5.255365007965514e-06, "loss": 0.0561, "step": 169500 }, { "epoch": 47.66, "learning_rate": 5.236622622059789e-06, "loss": 0.0609, "step": 169530 }, { "epoch": 47.67, "learning_rate": 5.217880236154063e-06, "loss": 0.0497, "step": 169560 }, { "epoch": 47.68, "learning_rate": 5.199137850248337e-06, "loss": 0.0589, "step": 169590 }, { "epoch": 47.69, "learning_rate": 5.180395464342611e-06, "loss": 0.0533, "step": 169620 }, { "epoch": 47.69, "learning_rate": 5.161653078436885e-06, "loss": 0.0546, "step": 169650 }, { "epoch": 47.7, "learning_rate": 5.14291069253116e-06, "loss": 0.0598, "step": 169680 }, { "epoch": 47.71, "learning_rate": 5.124168306625433e-06, "loss": 0.0486, "step": 169710 }, { "epoch": 47.72, "learning_rate": 5.105425920719708e-06, "loss": 0.0598, "step": 169740 }, { "epoch": 47.73, "learning_rate": 5.086683534813982e-06, "loss": 0.0545, "step": 169770 }, { "epoch": 47.74, "learning_rate": 5.0679411489082565e-06, "loss": 0.0564, "step": 169800 }, { "epoch": 47.75, "learning_rate": 5.049198763002531e-06, "loss": 0.0578, "step": 169830 }, { "epoch": 47.75, "learning_rate": 5.030456377096805e-06, "loss": 0.0471, "step": 169860 }, { "epoch": 47.76, "learning_rate": 5.011713991191079e-06, "loss": 0.0535, "step": 169890 }, { "epoch": 47.77, "learning_rate": 4.992971605285353e-06, "loss": 0.0474, "step": 169920 }, { "epoch": 47.78, "learning_rate": 4.974229219379627e-06, "loss": 0.0525, "step": 169950 }, { "epoch": 47.79, "learning_rate": 4.955486833473901e-06, "loss": 0.0583, "step": 169980 }, { "epoch": 47.8, "learning_rate": 4.936744447568176e-06, "loss": 0.0493, "step": 170010 }, { "epoch": 47.8, "learning_rate": 4.91800206166245e-06, "loss": 0.0604, "step": 170040 }, { "epoch": 47.81, "learning_rate": 4.899259675756724e-06, "loss": 0.0514, "step": 170070 }, { "epoch": 47.82, "learning_rate": 4.880517289850998e-06, "loss": 0.0532, "step": 170100 }, { "epoch": 47.83, "learning_rate": 4.8617749039452726e-06, "loss": 0.0637, "step": 170130 }, { "epoch": 47.84, "learning_rate": 4.843032518039547e-06, "loss": 0.0481, "step": 170160 }, { "epoch": 47.85, "learning_rate": 4.824290132133821e-06, "loss": 0.0545, "step": 170190 }, { "epoch": 47.85, "learning_rate": 4.805547746228095e-06, "loss": 0.0503, "step": 170220 }, { "epoch": 47.86, "learning_rate": 4.786805360322369e-06, "loss": 0.0542, "step": 170250 }, { "epoch": 47.87, "learning_rate": 4.7680629744166435e-06, "loss": 0.0575, "step": 170280 }, { "epoch": 47.88, "learning_rate": 4.749320588510918e-06, "loss": 0.0445, "step": 170310 }, { "epoch": 47.89, "learning_rate": 4.730578202605192e-06, "loss": 0.0553, "step": 170340 }, { "epoch": 47.9, "learning_rate": 4.711835816699466e-06, "loss": 0.0514, "step": 170370 }, { "epoch": 47.91, "learning_rate": 4.69309343079374e-06, "loss": 0.0547, "step": 170400 }, { "epoch": 47.91, "learning_rate": 4.6743510448880145e-06, "loss": 0.057, "step": 170430 }, { "epoch": 47.92, "learning_rate": 4.655608658982289e-06, "loss": 0.0547, "step": 170460 }, { "epoch": 47.93, "learning_rate": 4.636866273076563e-06, "loss": 0.0579, "step": 170490 }, { "epoch": 47.94, "learning_rate": 4.618123887170837e-06, "loss": 0.0515, "step": 170520 }, { "epoch": 47.95, "learning_rate": 4.599381501265111e-06, "loss": 0.0546, "step": 170550 }, { "epoch": 47.96, "learning_rate": 4.5806391153593854e-06, "loss": 0.059, "step": 170580 }, { "epoch": 47.96, "learning_rate": 4.56189672945366e-06, "loss": 0.0451, "step": 170610 }, { "epoch": 47.97, "learning_rate": 4.543154343547934e-06, "loss": 0.0563, "step": 170640 }, { "epoch": 47.98, "learning_rate": 4.524411957642208e-06, "loss": 0.0526, "step": 170670 }, { "epoch": 47.99, "learning_rate": 4.505669571736482e-06, "loss": 0.0515, "step": 170700 }, { "epoch": 48.0, "learning_rate": 4.486927185830756e-06, "loss": 0.0591, "step": 170730 }, { "epoch": 48.0, "eval_loss": 0.17236961424350739, "eval_runtime": 503.3181, "eval_samples_per_second": 31.855, "eval_steps_per_second": 0.997, "eval_wer": 0.12165463403982367, "step": 170736 }, { "epoch": 48.01, "learning_rate": 4.4681847999250306e-06, "loss": 0.0496, "step": 170760 }, { "epoch": 48.02, "learning_rate": 4.449442414019305e-06, "loss": 0.0607, "step": 170790 }, { "epoch": 48.02, "learning_rate": 4.430700028113579e-06, "loss": 0.0494, "step": 170820 }, { "epoch": 48.03, "learning_rate": 4.411957642207853e-06, "loss": 0.0559, "step": 170850 }, { "epoch": 48.04, "learning_rate": 4.393215256302127e-06, "loss": 0.0481, "step": 170880 }, { "epoch": 48.05, "learning_rate": 4.3744728703964015e-06, "loss": 0.0554, "step": 170910 }, { "epoch": 48.06, "learning_rate": 4.355730484490676e-06, "loss": 0.0554, "step": 170940 }, { "epoch": 48.07, "learning_rate": 4.33698809858495e-06, "loss": 0.0499, "step": 170970 }, { "epoch": 48.07, "learning_rate": 4.318245712679225e-06, "loss": 0.0571, "step": 171000 }, { "epoch": 48.08, "learning_rate": 4.299503326773498e-06, "loss": 0.0554, "step": 171030 }, { "epoch": 48.09, "learning_rate": 4.280760940867773e-06, "loss": 0.0551, "step": 171060 }, { "epoch": 48.1, "learning_rate": 4.262018554962047e-06, "loss": 0.0568, "step": 171090 }, { "epoch": 48.11, "learning_rate": 4.243276169056321e-06, "loss": 0.0496, "step": 171120 }, { "epoch": 48.12, "learning_rate": 4.224533783150595e-06, "loss": 0.0542, "step": 171150 }, { "epoch": 48.12, "learning_rate": 4.205791397244869e-06, "loss": 0.0545, "step": 171180 }, { "epoch": 48.13, "learning_rate": 4.1870490113391434e-06, "loss": 0.0484, "step": 171210 }, { "epoch": 48.14, "learning_rate": 4.168306625433418e-06, "loss": 0.0591, "step": 171240 }, { "epoch": 48.15, "learning_rate": 4.149564239527693e-06, "loss": 0.0471, "step": 171270 }, { "epoch": 48.16, "learning_rate": 4.130821853621966e-06, "loss": 0.0557, "step": 171300 }, { "epoch": 48.17, "learning_rate": 4.112079467716241e-06, "loss": 0.0512, "step": 171330 }, { "epoch": 48.18, "learning_rate": 4.093337081810514e-06, "loss": 0.0523, "step": 171360 }, { "epoch": 48.18, "learning_rate": 4.0745946959047886e-06, "loss": 0.0574, "step": 171390 }, { "epoch": 48.19, "learning_rate": 4.055852309999063e-06, "loss": 0.0466, "step": 171420 }, { "epoch": 48.2, "learning_rate": 4.037109924093337e-06, "loss": 0.0569, "step": 171450 }, { "epoch": 48.21, "learning_rate": 4.018367538187612e-06, "loss": 0.0528, "step": 171480 }, { "epoch": 48.22, "learning_rate": 3.999625152281885e-06, "loss": 0.0541, "step": 171510 }, { "epoch": 48.23, "learning_rate": 3.98088276637616e-06, "loss": 0.0615, "step": 171540 }, { "epoch": 48.23, "learning_rate": 3.962140380470434e-06, "loss": 0.0504, "step": 171570 }, { "epoch": 48.24, "learning_rate": 3.943397994564709e-06, "loss": 0.0546, "step": 171600 }, { "epoch": 48.25, "learning_rate": 3.924655608658982e-06, "loss": 0.054, "step": 171630 }, { "epoch": 48.26, "learning_rate": 3.905913222753257e-06, "loss": 0.0488, "step": 171660 }, { "epoch": 48.27, "learning_rate": 3.8871708368475305e-06, "loss": 0.0552, "step": 171690 }, { "epoch": 48.28, "learning_rate": 3.868428450941805e-06, "loss": 0.0496, "step": 171720 }, { "epoch": 48.29, "learning_rate": 3.84968606503608e-06, "loss": 0.059, "step": 171750 }, { "epoch": 48.29, "learning_rate": 3.830943679130353e-06, "loss": 0.0544, "step": 171780 }, { "epoch": 48.3, "learning_rate": 3.812201293224628e-06, "loss": 0.0524, "step": 171810 }, { "epoch": 48.31, "learning_rate": 3.793458907318902e-06, "loss": 0.0593, "step": 171840 }, { "epoch": 48.32, "learning_rate": 3.774716521413176e-06, "loss": 0.0489, "step": 171870 }, { "epoch": 48.33, "learning_rate": 3.7565988817043077e-06, "loss": 0.0531, "step": 171900 }, { "epoch": 48.34, "learning_rate": 3.737856495798582e-06, "loss": 0.0596, "step": 171930 }, { "epoch": 48.34, "learning_rate": 3.7191141098928565e-06, "loss": 0.0526, "step": 171960 }, { "epoch": 48.35, "learning_rate": 3.7009964701839878e-06, "loss": 0.0604, "step": 171990 }, { "epoch": 48.36, "learning_rate": 3.6822540842782624e-06, "loss": 0.0494, "step": 172020 }, { "epoch": 48.37, "learning_rate": 3.663511698372536e-06, "loss": 0.0575, "step": 172050 }, { "epoch": 48.38, "learning_rate": 3.6447693124668107e-06, "loss": 0.052, "step": 172080 }, { "epoch": 48.39, "learning_rate": 3.6260269265610845e-06, "loss": 0.0528, "step": 172110 }, { "epoch": 48.39, "learning_rate": 3.607284540655359e-06, "loss": 0.0599, "step": 172140 }, { "epoch": 48.4, "learning_rate": 3.588542154749633e-06, "loss": 0.0498, "step": 172170 }, { "epoch": 48.41, "learning_rate": 3.5697997688439075e-06, "loss": 0.0517, "step": 172200 }, { "epoch": 48.42, "learning_rate": 3.5510573829381817e-06, "loss": 0.05, "step": 172230 }, { "epoch": 48.43, "learning_rate": 3.5323149970324555e-06, "loss": 0.0558, "step": 172260 }, { "epoch": 48.44, "learning_rate": 3.51357261112673e-06, "loss": 0.0572, "step": 172290 }, { "epoch": 48.45, "learning_rate": 3.494830225221004e-06, "loss": 0.0478, "step": 172320 }, { "epoch": 48.45, "learning_rate": 3.4760878393152785e-06, "loss": 0.0563, "step": 172350 }, { "epoch": 48.46, "learning_rate": 3.4573454534095522e-06, "loss": 0.053, "step": 172380 }, { "epoch": 48.47, "learning_rate": 3.438603067503827e-06, "loss": 0.0552, "step": 172410 }, { "epoch": 48.48, "learning_rate": 3.4198606815981006e-06, "loss": 0.0563, "step": 172440 }, { "epoch": 48.49, "learning_rate": 3.4011182956923752e-06, "loss": 0.046, "step": 172470 }, { "epoch": 48.5, "learning_rate": 3.3823759097866494e-06, "loss": 0.0548, "step": 172500 }, { "epoch": 48.5, "learning_rate": 3.3636335238809236e-06, "loss": 0.052, "step": 172530 }, { "epoch": 48.51, "learning_rate": 3.344891137975198e-06, "loss": 0.0545, "step": 172560 }, { "epoch": 48.52, "learning_rate": 3.3261487520694716e-06, "loss": 0.0577, "step": 172590 }, { "epoch": 48.53, "learning_rate": 3.307406366163746e-06, "loss": 0.0479, "step": 172620 }, { "epoch": 48.54, "learning_rate": 3.28866398025802e-06, "loss": 0.0529, "step": 172650 }, { "epoch": 48.55, "learning_rate": 3.2699215943522946e-06, "loss": 0.0545, "step": 172680 }, { "epoch": 48.55, "learning_rate": 3.251179208446569e-06, "loss": 0.0522, "step": 172710 }, { "epoch": 48.56, "learning_rate": 3.232436822540843e-06, "loss": 0.0598, "step": 172740 }, { "epoch": 48.57, "learning_rate": 3.2136944366351176e-06, "loss": 0.0462, "step": 172770 }, { "epoch": 48.58, "learning_rate": 3.1949520507293913e-06, "loss": 0.0521, "step": 172800 }, { "epoch": 48.59, "learning_rate": 3.1762096648236655e-06, "loss": 0.0532, "step": 172830 }, { "epoch": 48.6, "learning_rate": 3.1574672789179397e-06, "loss": 0.0518, "step": 172860 }, { "epoch": 48.61, "learning_rate": 3.138724893012214e-06, "loss": 0.0619, "step": 172890 }, { "epoch": 48.61, "learning_rate": 3.119982507106488e-06, "loss": 0.0485, "step": 172920 }, { "epoch": 48.62, "learning_rate": 3.1012401212007623e-06, "loss": 0.0556, "step": 172950 }, { "epoch": 48.63, "learning_rate": 3.0824977352950365e-06, "loss": 0.0496, "step": 172980 }, { "epoch": 48.64, "learning_rate": 3.0637553493893107e-06, "loss": 0.0494, "step": 173010 }, { "epoch": 48.65, "learning_rate": 3.045012963483585e-06, "loss": 0.0602, "step": 173040 }, { "epoch": 48.66, "learning_rate": 3.0262705775778595e-06, "loss": 0.0502, "step": 173070 }, { "epoch": 48.66, "learning_rate": 3.0075281916721337e-06, "loss": 0.0546, "step": 173100 }, { "epoch": 48.67, "learning_rate": 2.9887858057664074e-06, "loss": 0.0525, "step": 173130 }, { "epoch": 48.68, "learning_rate": 2.9700434198606816e-06, "loss": 0.0543, "step": 173160 }, { "epoch": 48.69, "learning_rate": 2.951301033954956e-06, "loss": 0.0594, "step": 173190 }, { "epoch": 48.7, "learning_rate": 2.93255864804923e-06, "loss": 0.0473, "step": 173220 }, { "epoch": 48.71, "learning_rate": 2.913816262143504e-06, "loss": 0.0531, "step": 173250 }, { "epoch": 48.72, "learning_rate": 2.8950738762377784e-06, "loss": 0.0539, "step": 173280 }, { "epoch": 48.72, "learning_rate": 2.876331490332053e-06, "loss": 0.0522, "step": 173310 }, { "epoch": 48.73, "learning_rate": 2.857589104426327e-06, "loss": 0.0575, "step": 173340 }, { "epoch": 48.74, "learning_rate": 2.8388467185206014e-06, "loss": 0.0487, "step": 173370 }, { "epoch": 48.75, "learning_rate": 2.8201043326148756e-06, "loss": 0.0583, "step": 173400 }, { "epoch": 48.76, "learning_rate": 2.8013619467091493e-06, "loss": 0.0527, "step": 173430 }, { "epoch": 48.77, "learning_rate": 2.7826195608034235e-06, "loss": 0.0557, "step": 173460 }, { "epoch": 48.77, "learning_rate": 2.7638771748976977e-06, "loss": 0.059, "step": 173490 }, { "epoch": 48.78, "learning_rate": 2.745134788991972e-06, "loss": 0.0476, "step": 173520 }, { "epoch": 48.79, "learning_rate": 2.7263924030862465e-06, "loss": 0.0529, "step": 173550 }, { "epoch": 48.8, "learning_rate": 2.7076500171805207e-06, "loss": 0.0501, "step": 173580 }, { "epoch": 48.81, "learning_rate": 2.688907631274795e-06, "loss": 0.0546, "step": 173610 }, { "epoch": 48.82, "learning_rate": 2.670165245369069e-06, "loss": 0.059, "step": 173640 }, { "epoch": 48.82, "learning_rate": 2.6514228594633433e-06, "loss": 0.0502, "step": 173670 }, { "epoch": 48.83, "learning_rate": 2.6326804735576175e-06, "loss": 0.0598, "step": 173700 }, { "epoch": 48.84, "learning_rate": 2.6139380876518917e-06, "loss": 0.0528, "step": 173730 }, { "epoch": 48.85, "learning_rate": 2.5951957017461654e-06, "loss": 0.0519, "step": 173760 }, { "epoch": 48.86, "learning_rate": 2.57645331584044e-06, "loss": 0.057, "step": 173790 }, { "epoch": 48.87, "learning_rate": 2.5577109299347142e-06, "loss": 0.0445, "step": 173820 }, { "epoch": 48.88, "learning_rate": 2.5389685440289884e-06, "loss": 0.0532, "step": 173850 }, { "epoch": 48.88, "learning_rate": 2.5202261581232626e-06, "loss": 0.0501, "step": 173880 }, { "epoch": 48.89, "learning_rate": 2.501483772217537e-06, "loss": 0.0557, "step": 173910 }, { "epoch": 48.9, "learning_rate": 2.482741386311811e-06, "loss": 0.0579, "step": 173940 }, { "epoch": 48.91, "learning_rate": 2.463999000406085e-06, "loss": 0.0465, "step": 173970 }, { "epoch": 48.92, "learning_rate": 2.4452566145003594e-06, "loss": 0.055, "step": 174000 }, { "epoch": 48.93, "learning_rate": 2.4265142285946336e-06, "loss": 0.0534, "step": 174030 }, { "epoch": 48.93, "learning_rate": 2.4077718426889078e-06, "loss": 0.0498, "step": 174060 }, { "epoch": 48.94, "learning_rate": 2.389029456783182e-06, "loss": 0.0587, "step": 174090 }, { "epoch": 48.95, "learning_rate": 2.370287070877456e-06, "loss": 0.0475, "step": 174120 }, { "epoch": 48.96, "learning_rate": 2.3515446849717303e-06, "loss": 0.0592, "step": 174150 }, { "epoch": 48.97, "learning_rate": 2.3328022990660045e-06, "loss": 0.0507, "step": 174180 }, { "epoch": 48.98, "learning_rate": 2.3140599131602787e-06, "loss": 0.0554, "step": 174210 }, { "epoch": 48.98, "learning_rate": 2.295317527254553e-06, "loss": 0.0582, "step": 174240 }, { "epoch": 48.99, "learning_rate": 2.276575141348827e-06, "loss": 0.0507, "step": 174270 }, { "epoch": 49.0, "eval_loss": 0.1752515286207199, "eval_runtime": 501.7816, "eval_samples_per_second": 31.952, "eval_steps_per_second": 1.0, "eval_wer": 0.12116332073205682, "step": 174293 }, { "epoch": 49.0, "learning_rate": 2.2578327554431013e-06, "loss": 0.0557, "step": 174300 }, { "epoch": 49.01, "learning_rate": 2.2390903695373755e-06, "loss": 0.047, "step": 174330 }, { "epoch": 49.02, "learning_rate": 2.2203479836316497e-06, "loss": 0.0596, "step": 174360 }, { "epoch": 49.03, "learning_rate": 2.201605597725924e-06, "loss": 0.0517, "step": 174390 }, { "epoch": 49.04, "learning_rate": 2.182863211820198e-06, "loss": 0.049, "step": 174420 }, { "epoch": 49.04, "learning_rate": 2.1641208259144722e-06, "loss": 0.0616, "step": 174450 }, { "epoch": 49.05, "learning_rate": 2.1453784400087464e-06, "loss": 0.0516, "step": 174480 }, { "epoch": 49.06, "learning_rate": 2.127260800299878e-06, "loss": 0.0727, "step": 174510 }, { "epoch": 49.07, "learning_rate": 2.1085184143941527e-06, "loss": 0.0534, "step": 174540 }, { "epoch": 49.08, "learning_rate": 2.089776028488427e-06, "loss": 0.0548, "step": 174570 }, { "epoch": 49.09, "learning_rate": 2.071033642582701e-06, "loss": 0.0605, "step": 174600 }, { "epoch": 49.09, "learning_rate": 2.0522912566769753e-06, "loss": 0.0444, "step": 174630 }, { "epoch": 49.1, "learning_rate": 2.0335488707712495e-06, "loss": 0.0542, "step": 174660 }, { "epoch": 49.11, "learning_rate": 2.0148064848655232e-06, "loss": 0.0583, "step": 174690 }, { "epoch": 49.12, "learning_rate": 1.9960640989597974e-06, "loss": 0.0491, "step": 174720 }, { "epoch": 49.13, "learning_rate": 1.9773217130540716e-06, "loss": 0.0561, "step": 174750 }, { "epoch": 49.14, "learning_rate": 1.9585793271483462e-06, "loss": 0.0487, "step": 174780 }, { "epoch": 49.15, "learning_rate": 1.9398369412426204e-06, "loss": 0.0557, "step": 174810 }, { "epoch": 49.15, "learning_rate": 1.9210945553368946e-06, "loss": 0.0518, "step": 174840 }, { "epoch": 49.16, "learning_rate": 1.9023521694311688e-06, "loss": 0.0501, "step": 174870 }, { "epoch": 49.17, "learning_rate": 1.8836097835254428e-06, "loss": 0.0557, "step": 174900 }, { "epoch": 49.18, "learning_rate": 1.864867397619717e-06, "loss": 0.0483, "step": 174930 }, { "epoch": 49.19, "learning_rate": 1.8461250117139912e-06, "loss": 0.0521, "step": 174960 }, { "epoch": 49.2, "learning_rate": 1.8273826258082653e-06, "loss": 0.0543, "step": 174990 }, { "epoch": 49.2, "learning_rate": 1.8086402399025398e-06, "loss": 0.0483, "step": 175020 }, { "epoch": 49.21, "learning_rate": 1.789897853996814e-06, "loss": 0.0589, "step": 175050 }, { "epoch": 49.22, "learning_rate": 1.7711554680910881e-06, "loss": 0.0513, "step": 175080 }, { "epoch": 49.23, "learning_rate": 1.7524130821853623e-06, "loss": 0.052, "step": 175110 }, { "epoch": 49.24, "learning_rate": 1.7336706962796365e-06, "loss": 0.0544, "step": 175140 }, { "epoch": 49.25, "learning_rate": 1.7149283103739107e-06, "loss": 0.0525, "step": 175170 }, { "epoch": 49.25, "learning_rate": 1.6961859244681847e-06, "loss": 0.0579, "step": 175200 }, { "epoch": 49.26, "learning_rate": 1.6774435385624589e-06, "loss": 0.0489, "step": 175230 }, { "epoch": 49.27, "learning_rate": 1.6587011526567335e-06, "loss": 0.0567, "step": 175260 }, { "epoch": 49.28, "learning_rate": 1.6399587667510077e-06, "loss": 0.0503, "step": 175290 }, { "epoch": 49.29, "learning_rate": 1.6212163808452817e-06, "loss": 0.0498, "step": 175320 }, { "epoch": 49.3, "learning_rate": 1.6024739949395558e-06, "loss": 0.0578, "step": 175350 }, { "epoch": 49.31, "learning_rate": 1.58373160903383e-06, "loss": 0.0477, "step": 175380 }, { "epoch": 49.31, "learning_rate": 1.5649892231281042e-06, "loss": 0.0539, "step": 175410 }, { "epoch": 49.32, "learning_rate": 1.5462468372223786e-06, "loss": 0.059, "step": 175440 }, { "epoch": 49.33, "learning_rate": 1.5275044513166526e-06, "loss": 0.055, "step": 175470 }, { "epoch": 49.34, "learning_rate": 1.5087620654109268e-06, "loss": 0.0548, "step": 175500 }, { "epoch": 49.35, "learning_rate": 1.490019679505201e-06, "loss": 0.0494, "step": 175530 }, { "epoch": 49.36, "learning_rate": 1.4712772935994754e-06, "loss": 0.0526, "step": 175560 }, { "epoch": 49.36, "learning_rate": 1.4525349076937496e-06, "loss": 0.0554, "step": 175590 }, { "epoch": 49.37, "learning_rate": 1.4337925217880238e-06, "loss": 0.048, "step": 175620 }, { "epoch": 49.38, "learning_rate": 1.4150501358822978e-06, "loss": 0.057, "step": 175650 }, { "epoch": 49.39, "learning_rate": 1.3963077499765722e-06, "loss": 0.0498, "step": 175680 }, { "epoch": 49.4, "learning_rate": 1.3775653640708463e-06, "loss": 0.0549, "step": 175710 }, { "epoch": 49.41, "learning_rate": 1.3588229781651205e-06, "loss": 0.0579, "step": 175740 }, { "epoch": 49.42, "learning_rate": 1.3400805922593947e-06, "loss": 0.0468, "step": 175770 }, { "epoch": 49.42, "learning_rate": 1.321338206353669e-06, "loss": 0.0585, "step": 175800 }, { "epoch": 49.43, "learning_rate": 1.3025958204479431e-06, "loss": 0.0475, "step": 175830 }, { "epoch": 49.44, "learning_rate": 1.2838534345422173e-06, "loss": 0.0553, "step": 175860 }, { "epoch": 49.45, "learning_rate": 1.2651110486364915e-06, "loss": 0.053, "step": 175890 }, { "epoch": 49.46, "learning_rate": 1.2463686627307657e-06, "loss": 0.0531, "step": 175920 }, { "epoch": 49.47, "learning_rate": 1.2276262768250399e-06, "loss": 0.0588, "step": 175950 }, { "epoch": 49.47, "learning_rate": 1.208883890919314e-06, "loss": 0.0482, "step": 175980 }, { "epoch": 49.48, "learning_rate": 1.1901415050135883e-06, "loss": 0.0512, "step": 176010 }, { "epoch": 49.49, "learning_rate": 1.1713991191078627e-06, "loss": 0.0531, "step": 176040 }, { "epoch": 49.5, "learning_rate": 1.1526567332021366e-06, "loss": 0.0494, "step": 176070 }, { "epoch": 49.51, "learning_rate": 1.1339143472964108e-06, "loss": 0.059, "step": 176100 }, { "epoch": 49.52, "learning_rate": 1.115171961390685e-06, "loss": 0.0451, "step": 176130 }, { "epoch": 49.52, "learning_rate": 1.0964295754849594e-06, "loss": 0.0564, "step": 176160 }, { "epoch": 49.53, "learning_rate": 1.0776871895792336e-06, "loss": 0.0512, "step": 176190 }, { "epoch": 49.54, "learning_rate": 1.0589448036735076e-06, "loss": 0.0482, "step": 176220 }, { "epoch": 49.55, "learning_rate": 1.0402024177677818e-06, "loss": 0.0549, "step": 176250 }, { "epoch": 49.56, "learning_rate": 1.0214600318620562e-06, "loss": 0.0501, "step": 176280 }, { "epoch": 49.57, "learning_rate": 1.0027176459563304e-06, "loss": 0.0544, "step": 176310 }, { "epoch": 49.58, "learning_rate": 9.839752600506046e-07, "loss": 0.0524, "step": 176340 }, { "epoch": 49.58, "learning_rate": 9.652328741448785e-07, "loss": 0.047, "step": 176370 }, { "epoch": 49.59, "learning_rate": 9.464904882391528e-07, "loss": 0.0544, "step": 176400 }, { "epoch": 49.6, "learning_rate": 9.277481023334271e-07, "loss": 0.048, "step": 176430 }, { "epoch": 49.61, "learning_rate": 9.090057164277013e-07, "loss": 0.0566, "step": 176460 }, { "epoch": 49.62, "learning_rate": 8.902633305219754e-07, "loss": 0.053, "step": 176490 }, { "epoch": 49.63, "learning_rate": 8.715209446162496e-07, "loss": 0.049, "step": 176520 }, { "epoch": 49.63, "learning_rate": 8.527785587105239e-07, "loss": 0.058, "step": 176550 }, { "epoch": 49.64, "learning_rate": 8.340361728047981e-07, "loss": 0.0511, "step": 176580 }, { "epoch": 49.65, "learning_rate": 8.152937868990723e-07, "loss": 0.0571, "step": 176610 }, { "epoch": 49.66, "learning_rate": 7.965514009933464e-07, "loss": 0.0534, "step": 176640 }, { "epoch": 49.67, "learning_rate": 7.778090150876207e-07, "loss": 0.0514, "step": 176670 }, { "epoch": 49.68, "learning_rate": 7.590666291818949e-07, "loss": 0.0587, "step": 176700 }, { "epoch": 49.69, "learning_rate": 7.40324243276169e-07, "loss": 0.0506, "step": 176730 }, { "epoch": 49.69, "learning_rate": 7.215818573704433e-07, "loss": 0.0516, "step": 176760 }, { "epoch": 49.7, "learning_rate": 7.028394714647174e-07, "loss": 0.0537, "step": 176790 }, { "epoch": 49.71, "learning_rate": 6.847218317558492e-07, "loss": 0.0545, "step": 176820 }, { "epoch": 49.72, "learning_rate": 6.659794458501234e-07, "loss": 0.0559, "step": 176850 }, { "epoch": 49.73, "learning_rate": 6.472370599443977e-07, "loss": 0.0464, "step": 176880 }, { "epoch": 49.74, "learning_rate": 6.284946740386718e-07, "loss": 0.0533, "step": 176910 }, { "epoch": 49.74, "learning_rate": 6.097522881329461e-07, "loss": 0.0526, "step": 176940 }, { "epoch": 49.75, "learning_rate": 5.910099022272201e-07, "loss": 0.0481, "step": 176970 }, { "epoch": 49.76, "learning_rate": 5.722675163214944e-07, "loss": 0.06, "step": 177000 }, { "epoch": 49.77, "learning_rate": 5.535251304157686e-07, "loss": 0.0481, "step": 177030 }, { "epoch": 49.78, "learning_rate": 5.347827445100428e-07, "loss": 0.0515, "step": 177060 }, { "epoch": 49.79, "learning_rate": 5.16040358604317e-07, "loss": 0.0556, "step": 177090 }, { "epoch": 49.79, "learning_rate": 4.972979726985912e-07, "loss": 0.049, "step": 177120 }, { "epoch": 49.8, "learning_rate": 4.785555867928654e-07, "loss": 0.0578, "step": 177150 }, { "epoch": 49.81, "learning_rate": 4.5981320088713964e-07, "loss": 0.0505, "step": 177180 }, { "epoch": 49.82, "learning_rate": 4.410708149814138e-07, "loss": 0.0534, "step": 177210 }, { "epoch": 49.83, "learning_rate": 4.22328429075688e-07, "loss": 0.0532, "step": 177240 }, { "epoch": 49.84, "learning_rate": 4.035860431699622e-07, "loss": 0.0508, "step": 177270 }, { "epoch": 49.85, "learning_rate": 3.848436572642364e-07, "loss": 0.0569, "step": 177300 }, { "epoch": 49.85, "learning_rate": 3.661012713585106e-07, "loss": 0.0508, "step": 177330 }, { "epoch": 49.86, "learning_rate": 3.473588854527848e-07, "loss": 0.0516, "step": 177360 }, { "epoch": 49.87, "learning_rate": 3.2861649954705903e-07, "loss": 0.0528, "step": 177390 }, { "epoch": 49.88, "learning_rate": 3.098741136413332e-07, "loss": 0.0497, "step": 177420 }, { "epoch": 49.89, "learning_rate": 2.911317277356074e-07, "loss": 0.0543, "step": 177450 }, { "epoch": 49.9, "learning_rate": 2.723893418298816e-07, "loss": 0.0496, "step": 177480 }, { "epoch": 49.9, "learning_rate": 2.536469559241558e-07, "loss": 0.0525, "step": 177510 }, { "epoch": 49.91, "learning_rate": 2.3490457001843e-07, "loss": 0.0556, "step": 177540 }, { "epoch": 49.92, "learning_rate": 2.161621841127042e-07, "loss": 0.0506, "step": 177570 }, { "epoch": 49.93, "learning_rate": 1.9741979820697842e-07, "loss": 0.0552, "step": 177600 }, { "epoch": 49.94, "learning_rate": 1.7867741230125263e-07, "loss": 0.0478, "step": 177630 }, { "epoch": 49.95, "learning_rate": 1.5993502639552682e-07, "loss": 0.0597, "step": 177660 }, { "epoch": 49.95, "learning_rate": 1.4119264048980104e-07, "loss": 0.0508, "step": 177690 }, { "epoch": 49.96, "learning_rate": 1.2245025458407523e-07, "loss": 0.0461, "step": 177720 }, { "epoch": 49.97, "learning_rate": 1.0370786867834943e-07, "loss": 0.0566, "step": 177750 }, { "epoch": 49.98, "learning_rate": 8.496548277262363e-08, "loss": 0.0489, "step": 177780 }, { "epoch": 49.99, "learning_rate": 6.622309686689783e-08, "loss": 0.0531, "step": 177810 }, { "epoch": 50.0, "learning_rate": 4.748071096117203e-08, "loss": 0.0577, "step": 177840 }, { "epoch": 50.0, "eval_loss": 0.1741643100976944, "eval_runtime": 533.0988, "eval_samples_per_second": 30.075, "eval_steps_per_second": 0.942, "eval_wer": 0.12089719269034979, "step": 177850 }, { "epoch": 50.0, "step": 177850, "total_flos": 1.1784689236730266e+21, "train_loss": 0.042193543246732794, "train_runtime": 659833.0285, "train_samples_per_second": 34.505, "train_steps_per_second": 0.27 } ], "max_steps": 177850, "num_train_epochs": 50, "total_flos": 1.1784689236730266e+21, "trial_name": null, "trial_params": null }