{ "best_metric": 0.09092025712063107, "best_model_checkpoint": "./wav2vec2-large-xlsr-53-german-cv9/checkpoint-160065", "epoch": 49.999859451862264, "global_step": 177850, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.01, "learning_rate": 1.686814731515322e-07, "loss": 12.2823, "step": 30 }, { "epoch": 0.02, "learning_rate": 3.3174023053134664e-07, "loss": 12.8864, "step": 60 }, { "epoch": 0.03, "learning_rate": 5.004217036828789e-07, "loss": 11.7331, "step": 90 }, { "epoch": 0.03, "learning_rate": 6.691031768344111e-07, "loss": 12.8009, "step": 120 }, { "epoch": 0.04, "learning_rate": 8.377846499859433e-07, "loss": 12.1084, "step": 150 }, { "epoch": 0.05, "learning_rate": 1.0064661231374754e-06, "loss": 12.08, "step": 180 }, { "epoch": 0.06, "learning_rate": 1.1751475962890077e-06, "loss": 12.5185, "step": 210 }, { "epoch": 0.07, "learning_rate": 1.3382063536688221e-06, "loss": 11.5036, "step": 240 }, { "epoch": 0.08, "learning_rate": 1.5068878268203542e-06, "loss": 12.2999, "step": 270 }, { "epoch": 0.08, "learning_rate": 1.6699465842001688e-06, "loss": 11.3572, "step": 300 }, { "epoch": 0.09, "learning_rate": 1.838628057351701e-06, "loss": 10.856, "step": 330 }, { "epoch": 0.1, "learning_rate": 2.007309530503233e-06, "loss": 10.7287, "step": 360 }, { "epoch": 0.11, "learning_rate": 2.1759910036547654e-06, "loss": 9.3588, "step": 390 }, { "epoch": 0.12, "learning_rate": 2.3446724768062973e-06, "loss": 9.3074, "step": 420 }, { "epoch": 0.13, "learning_rate": 2.5133539499578296e-06, "loss": 8.1078, "step": 450 }, { "epoch": 0.13, "learning_rate": 2.682035423109362e-06, "loss": 7.0939, "step": 480 }, { "epoch": 0.14, "learning_rate": 2.850716896260894e-06, "loss": 6.2733, "step": 510 }, { "epoch": 0.15, "learning_rate": 3.0193983694124264e-06, "loss": 5.3202, "step": 540 }, { "epoch": 0.16, "learning_rate": 3.1880798425639583e-06, "loss": 5.0092, "step": 570 }, { "epoch": 0.17, "learning_rate": 3.3567613157154906e-06, "loss": 4.4977, "step": 600 }, { "epoch": 0.18, "learning_rate": 3.525442788867023e-06, "loss": 4.201, "step": 630 }, { "epoch": 0.19, "learning_rate": 3.694124262018555e-06, "loss": 4.019, "step": 660 }, { "epoch": 0.19, "learning_rate": 3.8628057351700874e-06, "loss": 3.7649, "step": 690 }, { "epoch": 0.2, "learning_rate": 4.03148720832162e-06, "loss": 3.7088, "step": 720 }, { "epoch": 0.21, "learning_rate": 4.200168681473152e-06, "loss": 3.5882, "step": 750 }, { "epoch": 0.22, "learning_rate": 4.368850154624684e-06, "loss": 3.4896, "step": 780 }, { "epoch": 0.23, "learning_rate": 4.5375316277762166e-06, "loss": 3.4466, "step": 810 }, { "epoch": 0.24, "learning_rate": 4.706213100927748e-06, "loss": 3.3378, "step": 840 }, { "epoch": 0.24, "learning_rate": 4.87489457407928e-06, "loss": 3.3351, "step": 870 }, { "epoch": 0.25, "learning_rate": 5.043576047230813e-06, "loss": 3.2781, "step": 900 }, { "epoch": 0.26, "learning_rate": 5.212257520382345e-06, "loss": 3.2183, "step": 930 }, { "epoch": 0.27, "learning_rate": 5.380938993533877e-06, "loss": 3.2128, "step": 960 }, { "epoch": 0.28, "learning_rate": 5.5496204666854094e-06, "loss": 3.1512, "step": 990 }, { "epoch": 0.29, "learning_rate": 5.718301939836942e-06, "loss": 3.1617, "step": 1020 }, { "epoch": 0.3, "learning_rate": 5.886983412988474e-06, "loss": 3.1274, "step": 1050 }, { "epoch": 0.3, "learning_rate": 6.0556648861400054e-06, "loss": 3.0881, "step": 1080 }, { "epoch": 0.31, "learning_rate": 6.224346359291538e-06, "loss": 3.098, "step": 1110 }, { "epoch": 0.32, "learning_rate": 6.39302783244307e-06, "loss": 3.0544, "step": 1140 }, { "epoch": 0.33, "learning_rate": 6.561709305594603e-06, "loss": 3.0735, "step": 1170 }, { "epoch": 0.34, "learning_rate": 6.7303907787461346e-06, "loss": 3.0573, "step": 1200 }, { "epoch": 0.35, "learning_rate": 6.899072251897668e-06, "loss": 3.0233, "step": 1230 }, { "epoch": 0.35, "learning_rate": 7.067753725049199e-06, "loss": 3.0445, "step": 1260 }, { "epoch": 0.36, "learning_rate": 7.236435198200732e-06, "loss": 3.0156, "step": 1290 }, { "epoch": 0.37, "learning_rate": 7.405116671352264e-06, "loss": 3.0256, "step": 1320 }, { "epoch": 0.38, "learning_rate": 7.573798144503795e-06, "loss": 3.0266, "step": 1350 }, { "epoch": 0.39, "learning_rate": 7.742479617655327e-06, "loss": 2.9992, "step": 1380 }, { "epoch": 0.4, "learning_rate": 7.91116109080686e-06, "loss": 3.0169, "step": 1410 }, { "epoch": 0.4, "learning_rate": 8.079842563958392e-06, "loss": 2.9879, "step": 1440 }, { "epoch": 0.41, "learning_rate": 8.248524037109924e-06, "loss": 3.0014, "step": 1470 }, { "epoch": 0.42, "learning_rate": 8.417205510261457e-06, "loss": 3.0054, "step": 1500 }, { "epoch": 0.43, "learning_rate": 8.585886983412989e-06, "loss": 2.9833, "step": 1530 }, { "epoch": 0.44, "learning_rate": 8.754568456564521e-06, "loss": 3.0009, "step": 1560 }, { "epoch": 0.45, "learning_rate": 8.923249929716053e-06, "loss": 2.9731, "step": 1590 }, { "epoch": 0.46, "learning_rate": 9.091931402867586e-06, "loss": 2.9975, "step": 1620 }, { "epoch": 0.46, "learning_rate": 9.260612876019118e-06, "loss": 2.997, "step": 1650 }, { "epoch": 0.47, "learning_rate": 9.42929434917065e-06, "loss": 2.9667, "step": 1680 }, { "epoch": 0.48, "learning_rate": 9.597975822322183e-06, "loss": 2.9925, "step": 1710 }, { "epoch": 0.49, "learning_rate": 9.766657295473715e-06, "loss": 2.9607, "step": 1740 }, { "epoch": 0.5, "learning_rate": 9.935338768625247e-06, "loss": 2.9754, "step": 1770 }, { "epoch": 0.51, "learning_rate": 1.010402024177678e-05, "loss": 2.9615, "step": 1800 }, { "epoch": 0.51, "learning_rate": 1.0272701714928312e-05, "loss": 2.9534, "step": 1830 }, { "epoch": 0.52, "learning_rate": 1.0441383188079842e-05, "loss": 2.9674, "step": 1860 }, { "epoch": 0.53, "learning_rate": 1.0610064661231375e-05, "loss": 2.9443, "step": 1890 }, { "epoch": 0.54, "learning_rate": 1.0778746134382907e-05, "loss": 2.9559, "step": 1920 }, { "epoch": 0.55, "learning_rate": 1.0947427607534439e-05, "loss": 2.9475, "step": 1950 }, { "epoch": 0.56, "learning_rate": 1.1116109080685971e-05, "loss": 2.94, "step": 1980 }, { "epoch": 0.57, "learning_rate": 1.1284790553837504e-05, "loss": 2.9509, "step": 2010 }, { "epoch": 0.57, "learning_rate": 1.1453472026989036e-05, "loss": 2.9327, "step": 2040 }, { "epoch": 0.58, "learning_rate": 1.1622153500140568e-05, "loss": 2.9454, "step": 2070 }, { "epoch": 0.59, "learning_rate": 1.17908349732921e-05, "loss": 2.9409, "step": 2100 }, { "epoch": 0.6, "learning_rate": 1.1959516446443633e-05, "loss": 2.9342, "step": 2130 }, { "epoch": 0.61, "learning_rate": 1.2128197919595165e-05, "loss": 2.9434, "step": 2160 }, { "epoch": 0.62, "learning_rate": 1.2296879392746697e-05, "loss": 2.9311, "step": 2190 }, { "epoch": 0.62, "learning_rate": 1.246556086589823e-05, "loss": 2.939, "step": 2220 }, { "epoch": 0.63, "learning_rate": 1.2634242339049762e-05, "loss": 2.9328, "step": 2250 }, { "epoch": 0.64, "learning_rate": 1.2802923812201296e-05, "loss": 2.929, "step": 2280 }, { "epoch": 0.65, "learning_rate": 1.2971605285352825e-05, "loss": 2.9352, "step": 2310 }, { "epoch": 0.66, "learning_rate": 1.3140286758504359e-05, "loss": 2.9237, "step": 2340 }, { "epoch": 0.67, "learning_rate": 1.3308968231655891e-05, "loss": 2.9313, "step": 2370 }, { "epoch": 0.67, "learning_rate": 1.3477649704807422e-05, "loss": 2.9168, "step": 2400 }, { "epoch": 0.68, "learning_rate": 1.3646331177958954e-05, "loss": 2.9164, "step": 2430 }, { "epoch": 0.69, "learning_rate": 1.3815012651110488e-05, "loss": 2.9112, "step": 2460 }, { "epoch": 0.7, "learning_rate": 1.398369412426202e-05, "loss": 2.8939, "step": 2490 }, { "epoch": 0.71, "learning_rate": 1.415237559741355e-05, "loss": 2.893, "step": 2520 }, { "epoch": 0.72, "learning_rate": 1.4321057070565083e-05, "loss": 2.8611, "step": 2550 }, { "epoch": 0.73, "learning_rate": 1.4489738543716615e-05, "loss": 2.8146, "step": 2580 }, { "epoch": 0.73, "learning_rate": 1.465842001686815e-05, "loss": 2.7328, "step": 2610 }, { "epoch": 0.74, "learning_rate": 1.482710149001968e-05, "loss": 2.5982, "step": 2640 }, { "epoch": 0.75, "learning_rate": 1.4995782963171212e-05, "loss": 2.4667, "step": 2670 }, { "epoch": 0.76, "learning_rate": 1.5164464436322745e-05, "loss": 2.237, "step": 2700 }, { "epoch": 0.77, "learning_rate": 1.533314590947428e-05, "loss": 2.0234, "step": 2730 }, { "epoch": 0.78, "learning_rate": 1.5501827382625807e-05, "loss": 1.7856, "step": 2760 }, { "epoch": 0.78, "learning_rate": 1.567050885577734e-05, "loss": 1.4936, "step": 2790 }, { "epoch": 0.79, "learning_rate": 1.5839190328928875e-05, "loss": 1.3168, "step": 2820 }, { "epoch": 0.8, "learning_rate": 1.6007871802080408e-05, "loss": 1.1575, "step": 2850 }, { "epoch": 0.81, "learning_rate": 1.6176553275231937e-05, "loss": 1.0244, "step": 2880 }, { "epoch": 0.82, "learning_rate": 1.634523474838347e-05, "loss": 0.9434, "step": 2910 }, { "epoch": 0.83, "learning_rate": 1.6513916221535004e-05, "loss": 0.8609, "step": 2940 }, { "epoch": 0.83, "learning_rate": 1.6682597694686533e-05, "loss": 0.8089, "step": 2970 }, { "epoch": 0.84, "learning_rate": 1.6851279167838066e-05, "loss": 0.7682, "step": 3000 }, { "epoch": 0.85, "learning_rate": 1.7019960640989598e-05, "loss": 0.7005, "step": 3030 }, { "epoch": 0.86, "learning_rate": 1.718864211414113e-05, "loss": 0.691, "step": 3060 }, { "epoch": 0.87, "learning_rate": 1.7357323587292663e-05, "loss": 0.6244, "step": 3090 }, { "epoch": 0.88, "learning_rate": 1.7526005060444195e-05, "loss": 0.6426, "step": 3120 }, { "epoch": 0.89, "learning_rate": 1.7694686533595727e-05, "loss": 0.6254, "step": 3150 }, { "epoch": 0.89, "learning_rate": 1.786336800674726e-05, "loss": 0.5489, "step": 3180 }, { "epoch": 0.9, "learning_rate": 1.803204947989879e-05, "loss": 0.5744, "step": 3210 }, { "epoch": 0.91, "learning_rate": 1.8200730953050324e-05, "loss": 0.5247, "step": 3240 }, { "epoch": 0.92, "learning_rate": 1.8369412426201856e-05, "loss": 0.5261, "step": 3270 }, { "epoch": 0.93, "learning_rate": 1.853809389935339e-05, "loss": 0.5122, "step": 3300 }, { "epoch": 0.94, "learning_rate": 1.870677537250492e-05, "loss": 0.4845, "step": 3330 }, { "epoch": 0.94, "learning_rate": 1.8875456845656453e-05, "loss": 0.5051, "step": 3360 }, { "epoch": 0.95, "learning_rate": 1.9044138318807985e-05, "loss": 0.4715, "step": 3390 }, { "epoch": 0.96, "learning_rate": 1.9212819791959518e-05, "loss": 0.484, "step": 3420 }, { "epoch": 0.97, "learning_rate": 1.938150126511105e-05, "loss": 0.4563, "step": 3450 }, { "epoch": 0.98, "learning_rate": 1.9550182738262582e-05, "loss": 0.4204, "step": 3480 }, { "epoch": 0.99, "learning_rate": 1.9718864211414114e-05, "loss": 0.4372, "step": 3510 }, { "epoch": 1.0, "learning_rate": 1.9887545684565643e-05, "loss": 0.4129, "step": 3540 }, { "epoch": 1.0, "eval_loss": 0.30152174830436707, "eval_runtime": 623.0811, "eval_samples_per_second": 25.732, "eval_steps_per_second": 0.806, "eval_wer": 0.24989423116291132, "step": 3557 }, { "epoch": 1.0, "learning_rate": 2.005622715771718e-05, "loss": 0.4449, "step": 3570 }, { "epoch": 1.01, "learning_rate": 2.022490863086871e-05, "loss": 0.4039, "step": 3600 }, { "epoch": 1.02, "learning_rate": 2.0393590104020244e-05, "loss": 0.418, "step": 3630 }, { "epoch": 1.03, "learning_rate": 2.0562271577171773e-05, "loss": 0.4121, "step": 3660 }, { "epoch": 1.04, "learning_rate": 2.0730953050323308e-05, "loss": 0.3687, "step": 3690 }, { "epoch": 1.05, "learning_rate": 2.089963452347484e-05, "loss": 0.383, "step": 3720 }, { "epoch": 1.05, "learning_rate": 2.1068315996626373e-05, "loss": 0.3786, "step": 3750 }, { "epoch": 1.06, "learning_rate": 2.12369974697779e-05, "loss": 0.3714, "step": 3780 }, { "epoch": 1.07, "learning_rate": 2.1405678942929437e-05, "loss": 0.3948, "step": 3810 }, { "epoch": 1.08, "learning_rate": 2.157436041608097e-05, "loss": 0.334, "step": 3840 }, { "epoch": 1.09, "learning_rate": 2.1743041889232502e-05, "loss": 0.3746, "step": 3870 }, { "epoch": 1.1, "learning_rate": 2.191172336238403e-05, "loss": 0.3451, "step": 3900 }, { "epoch": 1.1, "learning_rate": 2.2080404835535563e-05, "loss": 0.3487, "step": 3930 }, { "epoch": 1.11, "learning_rate": 2.22490863086871e-05, "loss": 0.3646, "step": 3960 }, { "epoch": 1.12, "learning_rate": 2.2417767781838628e-05, "loss": 0.3259, "step": 3990 }, { "epoch": 1.13, "learning_rate": 2.258644925499016e-05, "loss": 0.3539, "step": 4020 }, { "epoch": 1.14, "learning_rate": 2.2755130728141692e-05, "loss": 0.3308, "step": 4050 }, { "epoch": 1.15, "learning_rate": 2.2923812201293228e-05, "loss": 0.3477, "step": 4080 }, { "epoch": 1.16, "learning_rate": 2.3092493674444757e-05, "loss": 0.3484, "step": 4110 }, { "epoch": 1.16, "learning_rate": 2.326117514759629e-05, "loss": 0.3045, "step": 4140 }, { "epoch": 1.17, "learning_rate": 2.342985662074782e-05, "loss": 0.3454, "step": 4170 }, { "epoch": 1.18, "learning_rate": 2.3598538093899357e-05, "loss": 0.3136, "step": 4200 }, { "epoch": 1.19, "learning_rate": 2.3767219567050886e-05, "loss": 0.3281, "step": 4230 }, { "epoch": 1.2, "learning_rate": 2.3935901040202418e-05, "loss": 0.3355, "step": 4260 }, { "epoch": 1.21, "learning_rate": 2.410458251335395e-05, "loss": 0.2986, "step": 4290 }, { "epoch": 1.21, "learning_rate": 2.4273263986505486e-05, "loss": 0.3142, "step": 4320 }, { "epoch": 1.22, "learning_rate": 2.4441945459657015e-05, "loss": 0.2982, "step": 4350 }, { "epoch": 1.23, "learning_rate": 2.4610626932808547e-05, "loss": 0.3141, "step": 4380 }, { "epoch": 1.24, "learning_rate": 2.477930840596008e-05, "loss": 0.315, "step": 4410 }, { "epoch": 1.25, "learning_rate": 2.4947989879111612e-05, "loss": 0.2788, "step": 4440 }, { "epoch": 1.26, "learning_rate": 2.5116671352263144e-05, "loss": 0.315, "step": 4470 }, { "epoch": 1.27, "learning_rate": 2.5285352825414676e-05, "loss": 0.2849, "step": 4500 }, { "epoch": 1.27, "learning_rate": 2.545403429856621e-05, "loss": 0.2895, "step": 4530 }, { "epoch": 1.28, "learning_rate": 2.562271577171774e-05, "loss": 0.3063, "step": 4560 }, { "epoch": 1.29, "learning_rate": 2.5791397244869277e-05, "loss": 0.2696, "step": 4590 }, { "epoch": 1.3, "learning_rate": 2.5960078718020802e-05, "loss": 0.2898, "step": 4620 }, { "epoch": 1.31, "learning_rate": 2.6128760191172335e-05, "loss": 0.2863, "step": 4650 }, { "epoch": 1.32, "learning_rate": 2.629744166432387e-05, "loss": 0.2812, "step": 4680 }, { "epoch": 1.32, "learning_rate": 2.6466123137475402e-05, "loss": 0.3064, "step": 4710 }, { "epoch": 1.33, "learning_rate": 2.6634804610626935e-05, "loss": 0.2684, "step": 4740 }, { "epoch": 1.34, "learning_rate": 2.6803486083778467e-05, "loss": 0.2983, "step": 4770 }, { "epoch": 1.35, "learning_rate": 2.697216755693e-05, "loss": 0.2669, "step": 4800 }, { "epoch": 1.36, "learning_rate": 2.714084903008153e-05, "loss": 0.2748, "step": 4830 }, { "epoch": 1.37, "learning_rate": 2.730953050323306e-05, "loss": 0.295, "step": 4860 }, { "epoch": 1.37, "learning_rate": 2.7478211976384593e-05, "loss": 0.2643, "step": 4890 }, { "epoch": 1.38, "learning_rate": 2.7646893449536125e-05, "loss": 0.2695, "step": 4920 }, { "epoch": 1.39, "learning_rate": 2.781557492268766e-05, "loss": 0.2522, "step": 4950 }, { "epoch": 1.4, "learning_rate": 2.7984256395839193e-05, "loss": 0.2639, "step": 4980 }, { "epoch": 1.41, "learning_rate": 2.8152937868990725e-05, "loss": 0.2784, "step": 5010 }, { "epoch": 1.42, "learning_rate": 2.8321619342142258e-05, "loss": 0.2378, "step": 5040 }, { "epoch": 1.43, "learning_rate": 2.8490300815293786e-05, "loss": 0.2685, "step": 5070 }, { "epoch": 1.43, "learning_rate": 2.865898228844532e-05, "loss": 0.2423, "step": 5100 }, { "epoch": 1.44, "learning_rate": 2.882766376159685e-05, "loss": 0.2529, "step": 5130 }, { "epoch": 1.45, "learning_rate": 2.8996345234748383e-05, "loss": 0.2808, "step": 5160 }, { "epoch": 1.46, "learning_rate": 2.916502670789992e-05, "loss": 0.2333, "step": 5190 }, { "epoch": 1.47, "learning_rate": 2.933370818105145e-05, "loss": 0.2647, "step": 5220 }, { "epoch": 1.48, "learning_rate": 2.9502389654202984e-05, "loss": 0.2424, "step": 5250 }, { "epoch": 1.48, "learning_rate": 2.9671071127354516e-05, "loss": 0.2479, "step": 5280 }, { "epoch": 1.49, "learning_rate": 2.9839752600506045e-05, "loss": 0.2717, "step": 5310 }, { "epoch": 1.5, "learning_rate": 3.0008434073657577e-05, "loss": 0.2188, "step": 5340 }, { "epoch": 1.51, "learning_rate": 3.017711554680911e-05, "loss": 0.258, "step": 5370 }, { "epoch": 1.52, "learning_rate": 3.034579701996064e-05, "loss": 0.2504, "step": 5400 }, { "epoch": 1.53, "learning_rate": 3.0514478493112174e-05, "loss": 0.2478, "step": 5430 }, { "epoch": 1.53, "learning_rate": 3.068315996626371e-05, "loss": 0.2725, "step": 5460 }, { "epoch": 1.54, "learning_rate": 3.085184143941524e-05, "loss": 0.2233, "step": 5490 }, { "epoch": 1.55, "learning_rate": 3.1020522912566774e-05, "loss": 0.2592, "step": 5520 }, { "epoch": 1.56, "learning_rate": 3.11892043857183e-05, "loss": 0.231, "step": 5550 }, { "epoch": 1.57, "learning_rate": 3.135788585886983e-05, "loss": 0.2413, "step": 5580 }, { "epoch": 1.58, "learning_rate": 3.1526567332021364e-05, "loss": 0.2557, "step": 5610 }, { "epoch": 1.59, "learning_rate": 3.16952488051729e-05, "loss": 0.2252, "step": 5640 }, { "epoch": 1.59, "learning_rate": 3.1863930278324436e-05, "loss": 0.2532, "step": 5670 }, { "epoch": 1.6, "learning_rate": 3.203261175147597e-05, "loss": 0.2228, "step": 5700 }, { "epoch": 1.61, "learning_rate": 3.22012932246275e-05, "loss": 0.2448, "step": 5730 }, { "epoch": 1.62, "learning_rate": 3.2369974697779026e-05, "loss": 0.2447, "step": 5760 }, { "epoch": 1.63, "learning_rate": 3.253865617093056e-05, "loss": 0.212, "step": 5790 }, { "epoch": 1.64, "learning_rate": 3.270733764408209e-05, "loss": 0.2454, "step": 5820 }, { "epoch": 1.64, "learning_rate": 3.287601911723362e-05, "loss": 0.2195, "step": 5850 }, { "epoch": 1.65, "learning_rate": 3.3044700590385155e-05, "loss": 0.2381, "step": 5880 }, { "epoch": 1.66, "learning_rate": 3.3213382063536694e-05, "loss": 0.2493, "step": 5910 }, { "epoch": 1.67, "learning_rate": 3.3382063536688226e-05, "loss": 0.2076, "step": 5940 }, { "epoch": 1.68, "learning_rate": 3.355074500983976e-05, "loss": 0.2393, "step": 5970 }, { "epoch": 1.69, "learning_rate": 3.3719426482991284e-05, "loss": 0.2199, "step": 6000 }, { "epoch": 1.7, "learning_rate": 3.3888107956142816e-05, "loss": 0.222, "step": 6030 }, { "epoch": 1.7, "learning_rate": 3.405678942929435e-05, "loss": 0.2496, "step": 6060 }, { "epoch": 1.71, "learning_rate": 3.422547090244588e-05, "loss": 0.2088, "step": 6090 }, { "epoch": 1.72, "learning_rate": 3.439415237559741e-05, "loss": 0.2253, "step": 6120 }, { "epoch": 1.73, "learning_rate": 3.456283384874895e-05, "loss": 0.2095, "step": 6150 }, { "epoch": 1.74, "learning_rate": 3.4731515321900484e-05, "loss": 0.213, "step": 6180 }, { "epoch": 1.75, "learning_rate": 3.490019679505201e-05, "loss": 0.2355, "step": 6210 }, { "epoch": 1.75, "learning_rate": 3.506887826820354e-05, "loss": 0.2123, "step": 6240 }, { "epoch": 1.76, "learning_rate": 3.5237559741355074e-05, "loss": 0.2308, "step": 6270 }, { "epoch": 1.77, "learning_rate": 3.540624121450661e-05, "loss": 0.2101, "step": 6300 }, { "epoch": 1.78, "learning_rate": 3.557492268765814e-05, "loss": 0.2167, "step": 6330 }, { "epoch": 1.79, "learning_rate": 3.574360416080967e-05, "loss": 0.2397, "step": 6360 }, { "epoch": 1.8, "learning_rate": 3.5912285633961204e-05, "loss": 0.1999, "step": 6390 }, { "epoch": 1.8, "learning_rate": 3.608096710711274e-05, "loss": 0.2222, "step": 6420 }, { "epoch": 1.81, "learning_rate": 3.624964858026427e-05, "loss": 0.2063, "step": 6450 }, { "epoch": 1.82, "learning_rate": 3.64183300534158e-05, "loss": 0.2067, "step": 6480 }, { "epoch": 1.83, "learning_rate": 3.658701152656733e-05, "loss": 0.2246, "step": 6510 }, { "epoch": 1.84, "learning_rate": 3.6755692999718865e-05, "loss": 0.1943, "step": 6540 }, { "epoch": 1.85, "learning_rate": 3.69243744728704e-05, "loss": 0.2244, "step": 6570 }, { "epoch": 1.86, "learning_rate": 3.709305594602193e-05, "loss": 0.2056, "step": 6600 }, { "epoch": 1.86, "learning_rate": 3.726173741917346e-05, "loss": 0.2057, "step": 6630 }, { "epoch": 1.87, "learning_rate": 3.7430418892324994e-05, "loss": 0.2234, "step": 6660 }, { "epoch": 1.88, "learning_rate": 3.7599100365476526e-05, "loss": 0.1853, "step": 6690 }, { "epoch": 1.89, "learning_rate": 3.776778183862806e-05, "loss": 0.2223, "step": 6720 }, { "epoch": 1.9, "learning_rate": 3.793646331177959e-05, "loss": 0.2018, "step": 6750 }, { "epoch": 1.91, "learning_rate": 3.810514478493112e-05, "loss": 0.2041, "step": 6780 }, { "epoch": 1.91, "learning_rate": 3.8273826258082656e-05, "loss": 0.2263, "step": 6810 }, { "epoch": 1.92, "learning_rate": 3.844250773123419e-05, "loss": 0.1908, "step": 6840 }, { "epoch": 1.93, "learning_rate": 3.861118920438572e-05, "loss": 0.218, "step": 6870 }, { "epoch": 1.94, "learning_rate": 3.877987067753725e-05, "loss": 0.1993, "step": 6900 }, { "epoch": 1.95, "learning_rate": 3.8948552150688785e-05, "loss": 0.2047, "step": 6930 }, { "epoch": 1.96, "learning_rate": 3.911723362384032e-05, "loss": 0.2235, "step": 6960 }, { "epoch": 1.97, "learning_rate": 3.928591509699185e-05, "loss": 0.1838, "step": 6990 }, { "epoch": 1.97, "learning_rate": 3.945459657014338e-05, "loss": 0.2098, "step": 7020 }, { "epoch": 1.98, "learning_rate": 3.9623278043294914e-05, "loss": 0.1947, "step": 7050 }, { "epoch": 1.99, "learning_rate": 3.9791959516446446e-05, "loss": 0.203, "step": 7080 }, { "epoch": 2.0, "learning_rate": 3.996064098959797e-05, "loss": 0.2121, "step": 7110 }, { "epoch": 2.0, "eval_loss": 0.15964379906654358, "eval_runtime": 627.5077, "eval_samples_per_second": 25.55, "eval_steps_per_second": 0.8, "eval_wer": 0.15666753101415254, "step": 7114 }, { "epoch": 2.01, "learning_rate": 4.012932246274951e-05, "loss": 0.1881, "step": 7140 }, { "epoch": 2.02, "learning_rate": 4.029800393590104e-05, "loss": 0.2157, "step": 7170 }, { "epoch": 2.02, "learning_rate": 4.0466685409052575e-05, "loss": 0.1762, "step": 7200 }, { "epoch": 2.03, "learning_rate": 4.063536688220411e-05, "loss": 0.193, "step": 7230 }, { "epoch": 2.04, "learning_rate": 4.080404835535564e-05, "loss": 0.1967, "step": 7260 }, { "epoch": 2.05, "learning_rate": 4.097272982850717e-05, "loss": 0.1824, "step": 7290 }, { "epoch": 2.06, "learning_rate": 4.1141411301658704e-05, "loss": 0.2006, "step": 7320 }, { "epoch": 2.07, "learning_rate": 4.131009277481023e-05, "loss": 0.1734, "step": 7350 }, { "epoch": 2.07, "learning_rate": 4.147877424796177e-05, "loss": 0.2023, "step": 7380 }, { "epoch": 2.08, "learning_rate": 4.16474557211133e-05, "loss": 0.1827, "step": 7410 }, { "epoch": 2.09, "learning_rate": 4.1816137194264834e-05, "loss": 0.1903, "step": 7440 }, { "epoch": 2.1, "learning_rate": 4.1984818667416366e-05, "loss": 0.2175, "step": 7470 }, { "epoch": 2.11, "learning_rate": 4.21535001405679e-05, "loss": 0.1789, "step": 7500 }, { "epoch": 2.12, "learning_rate": 4.232218161371943e-05, "loss": 0.2071, "step": 7530 }, { "epoch": 2.13, "learning_rate": 4.249086308687096e-05, "loss": 0.1964, "step": 7560 }, { "epoch": 2.13, "learning_rate": 4.265954456002249e-05, "loss": 0.1821, "step": 7590 }, { "epoch": 2.14, "learning_rate": 4.282822603317402e-05, "loss": 0.2075, "step": 7620 }, { "epoch": 2.15, "learning_rate": 4.299690750632556e-05, "loss": 0.1699, "step": 7650 }, { "epoch": 2.16, "learning_rate": 4.316558897947709e-05, "loss": 0.1778, "step": 7680 }, { "epoch": 2.17, "learning_rate": 4.3334270452628624e-05, "loss": 0.191, "step": 7710 }, { "epoch": 2.18, "learning_rate": 4.3502951925780156e-05, "loss": 0.1773, "step": 7740 }, { "epoch": 2.18, "learning_rate": 4.367163339893169e-05, "loss": 0.202, "step": 7770 }, { "epoch": 2.19, "learning_rate": 4.3840314872083214e-05, "loss": 0.1645, "step": 7800 }, { "epoch": 2.2, "learning_rate": 4.4008996345234746e-05, "loss": 0.1896, "step": 7830 }, { "epoch": 2.21, "learning_rate": 4.417767781838628e-05, "loss": 0.1864, "step": 7860 }, { "epoch": 2.22, "learning_rate": 4.434635929153782e-05, "loss": 0.1854, "step": 7890 }, { "epoch": 2.23, "learning_rate": 4.451504076468935e-05, "loss": 0.1959, "step": 7920 }, { "epoch": 2.23, "learning_rate": 4.468372223784088e-05, "loss": 0.1658, "step": 7950 }, { "epoch": 2.24, "learning_rate": 4.4852403710992415e-05, "loss": 0.1884, "step": 7980 }, { "epoch": 2.25, "learning_rate": 4.502108518414395e-05, "loss": 0.1841, "step": 8010 }, { "epoch": 2.26, "learning_rate": 4.518976665729547e-05, "loss": 0.1774, "step": 8040 }, { "epoch": 2.27, "learning_rate": 4.5358448130447005e-05, "loss": 0.1997, "step": 8070 }, { "epoch": 2.28, "learning_rate": 4.552712960359854e-05, "loss": 0.1656, "step": 8100 }, { "epoch": 2.29, "learning_rate": 4.569581107675007e-05, "loss": 0.1964, "step": 8130 }, { "epoch": 2.29, "learning_rate": 4.586449254990161e-05, "loss": 0.1807, "step": 8160 }, { "epoch": 2.3, "learning_rate": 4.603317402305314e-05, "loss": 0.1777, "step": 8190 }, { "epoch": 2.31, "learning_rate": 4.620185549620467e-05, "loss": 0.1921, "step": 8220 }, { "epoch": 2.32, "learning_rate": 4.63705369693562e-05, "loss": 0.1708, "step": 8250 }, { "epoch": 2.33, "learning_rate": 4.653921844250773e-05, "loss": 0.1743, "step": 8280 }, { "epoch": 2.34, "learning_rate": 4.670789991565926e-05, "loss": 0.1758, "step": 8310 }, { "epoch": 2.34, "learning_rate": 4.6876581388810795e-05, "loss": 0.1789, "step": 8340 }, { "epoch": 2.35, "learning_rate": 4.704526286196233e-05, "loss": 0.1953, "step": 8370 }, { "epoch": 2.36, "learning_rate": 4.7213944335113867e-05, "loss": 0.1648, "step": 8400 }, { "epoch": 2.37, "learning_rate": 4.73826258082654e-05, "loss": 0.1803, "step": 8430 }, { "epoch": 2.38, "learning_rate": 4.755130728141693e-05, "loss": 0.1767, "step": 8460 }, { "epoch": 2.39, "learning_rate": 4.771998875456846e-05, "loss": 0.1703, "step": 8490 }, { "epoch": 2.4, "learning_rate": 4.788867022771999e-05, "loss": 0.1928, "step": 8520 }, { "epoch": 2.4, "learning_rate": 4.805735170087152e-05, "loss": 0.1645, "step": 8550 }, { "epoch": 2.41, "learning_rate": 4.8226033174023054e-05, "loss": 0.1894, "step": 8580 }, { "epoch": 2.42, "learning_rate": 4.8394714647174586e-05, "loss": 0.1749, "step": 8610 }, { "epoch": 2.43, "learning_rate": 4.856339612032612e-05, "loss": 0.1707, "step": 8640 }, { "epoch": 2.44, "learning_rate": 4.873207759347766e-05, "loss": 0.1834, "step": 8670 }, { "epoch": 2.45, "learning_rate": 4.890075906662918e-05, "loss": 0.1675, "step": 8700 }, { "epoch": 2.45, "learning_rate": 4.9069440539780715e-05, "loss": 0.1894, "step": 8730 }, { "epoch": 2.46, "learning_rate": 4.923812201293225e-05, "loss": 0.1742, "step": 8760 }, { "epoch": 2.47, "learning_rate": 4.940680348608378e-05, "loss": 0.1704, "step": 8790 }, { "epoch": 2.48, "learning_rate": 4.957548495923531e-05, "loss": 0.1758, "step": 8820 }, { "epoch": 2.49, "learning_rate": 4.9744166432386844e-05, "loss": 0.1603, "step": 8850 }, { "epoch": 2.5, "learning_rate": 4.9912847905538376e-05, "loss": 0.18, "step": 8880 }, { "epoch": 2.5, "learning_rate": 5.008152937868991e-05, "loss": 0.1695, "step": 8910 }, { "epoch": 2.51, "learning_rate": 5.025021085184144e-05, "loss": 0.1637, "step": 8940 }, { "epoch": 2.52, "learning_rate": 5.041889232499297e-05, "loss": 0.1739, "step": 8970 }, { "epoch": 2.53, "learning_rate": 5.0587573798144506e-05, "loss": 0.1587, "step": 9000 }, { "epoch": 2.54, "learning_rate": 5.075625527129604e-05, "loss": 0.1834, "step": 9030 }, { "epoch": 2.55, "learning_rate": 5.092493674444757e-05, "loss": 0.1678, "step": 9060 }, { "epoch": 2.56, "learning_rate": 5.10936182175991e-05, "loss": 0.166, "step": 9090 }, { "epoch": 2.56, "learning_rate": 5.1262299690750635e-05, "loss": 0.1821, "step": 9120 }, { "epoch": 2.57, "learning_rate": 5.143098116390217e-05, "loss": 0.1633, "step": 9150 }, { "epoch": 2.58, "learning_rate": 5.1599662637053706e-05, "loss": 0.1758, "step": 9180 }, { "epoch": 2.59, "learning_rate": 5.176834411020524e-05, "loss": 0.1663, "step": 9210 }, { "epoch": 2.6, "learning_rate": 5.193702558335677e-05, "loss": 0.1625, "step": 9240 }, { "epoch": 2.61, "learning_rate": 5.210570705650829e-05, "loss": 0.1889, "step": 9270 }, { "epoch": 2.61, "learning_rate": 5.227438852965982e-05, "loss": 0.1523, "step": 9300 }, { "epoch": 2.62, "learning_rate": 5.2443070002811354e-05, "loss": 0.1687, "step": 9330 }, { "epoch": 2.63, "learning_rate": 5.2611751475962886e-05, "loss": 0.1646, "step": 9360 }, { "epoch": 2.64, "learning_rate": 5.2780432949114425e-05, "loss": 0.1666, "step": 9390 }, { "epoch": 2.65, "learning_rate": 5.294911442226596e-05, "loss": 0.1743, "step": 9420 }, { "epoch": 2.66, "learning_rate": 5.311779589541749e-05, "loss": 0.1561, "step": 9450 }, { "epoch": 2.67, "learning_rate": 5.328647736856902e-05, "loss": 0.1784, "step": 9480 }, { "epoch": 2.67, "learning_rate": 5.3455158841720554e-05, "loss": 0.1673, "step": 9510 }, { "epoch": 2.68, "learning_rate": 5.3623840314872087e-05, "loss": 0.1732, "step": 9540 }, { "epoch": 2.69, "learning_rate": 5.379252178802362e-05, "loss": 0.1679, "step": 9570 }, { "epoch": 2.7, "learning_rate": 5.396120326117515e-05, "loss": 0.1542, "step": 9600 }, { "epoch": 2.71, "learning_rate": 5.4129884734326683e-05, "loss": 0.1692, "step": 9630 }, { "epoch": 2.72, "learning_rate": 5.4298566207478216e-05, "loss": 0.1589, "step": 9660 }, { "epoch": 2.72, "learning_rate": 5.4467247680629755e-05, "loss": 0.1563, "step": 9690 }, { "epoch": 2.73, "learning_rate": 5.463592915378129e-05, "loss": 0.1766, "step": 9720 }, { "epoch": 2.74, "learning_rate": 5.4804610626932806e-05, "loss": 0.1475, "step": 9750 }, { "epoch": 2.75, "learning_rate": 5.497329210008434e-05, "loss": 0.1816, "step": 9780 }, { "epoch": 2.76, "learning_rate": 5.514197357323587e-05, "loss": 0.1729, "step": 9810 }, { "epoch": 2.77, "learning_rate": 5.53106550463874e-05, "loss": 0.1575, "step": 9840 }, { "epoch": 2.77, "learning_rate": 5.5479336519538935e-05, "loss": 0.1817, "step": 9870 }, { "epoch": 2.78, "learning_rate": 5.5648017992690474e-05, "loss": 0.1444, "step": 9900 }, { "epoch": 2.79, "learning_rate": 5.5816699465842006e-05, "loss": 0.1692, "step": 9930 }, { "epoch": 2.8, "learning_rate": 5.598538093899354e-05, "loss": 0.1668, "step": 9960 }, { "epoch": 2.81, "learning_rate": 5.615406241214507e-05, "loss": 0.1577, "step": 9990 }, { "epoch": 2.82, "learning_rate": 5.63227438852966e-05, "loss": 0.1751, "step": 10020 }, { "epoch": 2.83, "learning_rate": 5.6491425358448135e-05, "loss": 0.1488, "step": 10050 }, { "epoch": 2.83, "learning_rate": 5.666010683159967e-05, "loss": 0.1676, "step": 10080 }, { "epoch": 2.84, "learning_rate": 5.68287883047512e-05, "loss": 0.1643, "step": 10110 }, { "epoch": 2.85, "learning_rate": 5.699746977790273e-05, "loss": 0.1543, "step": 10140 }, { "epoch": 2.86, "learning_rate": 5.7166151251054265e-05, "loss": 0.1774, "step": 10170 }, { "epoch": 2.87, "learning_rate": 5.733483272420579e-05, "loss": 0.1443, "step": 10200 }, { "epoch": 2.88, "learning_rate": 5.750351419735732e-05, "loss": 0.1646, "step": 10230 }, { "epoch": 2.88, "learning_rate": 5.7672195670508855e-05, "loss": 0.1643, "step": 10260 }, { "epoch": 2.89, "learning_rate": 5.784087714366039e-05, "loss": 0.155, "step": 10290 }, { "epoch": 2.9, "learning_rate": 5.800955861681192e-05, "loss": 0.1762, "step": 10320 }, { "epoch": 2.91, "learning_rate": 5.817824008996345e-05, "loss": 0.1512, "step": 10350 }, { "epoch": 2.92, "learning_rate": 5.8346921563114984e-05, "loss": 0.1664, "step": 10380 }, { "epoch": 2.93, "learning_rate": 5.851560303626652e-05, "loss": 0.1529, "step": 10410 }, { "epoch": 2.93, "learning_rate": 5.8684284509418055e-05, "loss": 0.1604, "step": 10440 }, { "epoch": 2.94, "learning_rate": 5.885296598256959e-05, "loss": 0.1697, "step": 10470 }, { "epoch": 2.95, "learning_rate": 5.902164745572112e-05, "loss": 0.1388, "step": 10500 }, { "epoch": 2.96, "learning_rate": 5.919032892887265e-05, "loss": 0.1636, "step": 10530 }, { "epoch": 2.97, "learning_rate": 5.9359010402024184e-05, "loss": 0.1558, "step": 10560 }, { "epoch": 2.98, "learning_rate": 5.9527691875175717e-05, "loss": 0.1585, "step": 10590 }, { "epoch": 2.99, "learning_rate": 5.969637334832725e-05, "loss": 0.1678, "step": 10620 }, { "epoch": 2.99, "learning_rate": 5.9865054821478774e-05, "loss": 0.1455, "step": 10650 }, { "epoch": 3.0, "eval_loss": 0.13774625957012177, "eval_runtime": 628.643, "eval_samples_per_second": 25.504, "eval_steps_per_second": 0.799, "eval_wer": 0.1353977590654129, "step": 10671 }, { "epoch": 3.0, "learning_rate": 6.003373629463031e-05, "loss": 0.1738, "step": 10680 }, { "epoch": 3.01, "learning_rate": 6.020241776778184e-05, "loss": 0.1472, "step": 10710 }, { "epoch": 3.02, "learning_rate": 6.037109924093337e-05, "loss": 0.1587, "step": 10740 }, { "epoch": 3.03, "learning_rate": 6.0539780714084903e-05, "loss": 0.1587, "step": 10770 }, { "epoch": 3.04, "learning_rate": 6.0708462187236436e-05, "loss": 0.1487, "step": 10800 }, { "epoch": 3.04, "learning_rate": 6.087714366038797e-05, "loss": 0.1543, "step": 10830 }, { "epoch": 3.05, "learning_rate": 6.104582513353951e-05, "loss": 0.1412, "step": 10860 }, { "epoch": 3.06, "learning_rate": 6.121450660669103e-05, "loss": 0.1551, "step": 10890 }, { "epoch": 3.07, "learning_rate": 6.138318807984257e-05, "loss": 0.1595, "step": 10920 }, { "epoch": 3.08, "learning_rate": 6.15518695529941e-05, "loss": 0.1491, "step": 10950 }, { "epoch": 3.09, "learning_rate": 6.172055102614564e-05, "loss": 0.1575, "step": 10980 }, { "epoch": 3.1, "learning_rate": 6.188923249929716e-05, "loss": 0.1436, "step": 11010 }, { "epoch": 3.1, "learning_rate": 6.20579139724487e-05, "loss": 0.1531, "step": 11040 }, { "epoch": 3.11, "learning_rate": 6.222659544560024e-05, "loss": 0.1581, "step": 11070 }, { "epoch": 3.12, "learning_rate": 6.239527691875175e-05, "loss": 0.1305, "step": 11100 }, { "epoch": 3.13, "learning_rate": 6.256395839190329e-05, "loss": 0.1692, "step": 11130 }, { "epoch": 3.14, "learning_rate": 6.273263986505482e-05, "loss": 0.1425, "step": 11160 }, { "epoch": 3.15, "learning_rate": 6.290132133820636e-05, "loss": 0.1494, "step": 11190 }, { "epoch": 3.15, "learning_rate": 6.307000281135788e-05, "loss": 0.1584, "step": 11220 }, { "epoch": 3.16, "learning_rate": 6.323868428450942e-05, "loss": 0.1428, "step": 11250 }, { "epoch": 3.17, "learning_rate": 6.340736575766096e-05, "loss": 0.163, "step": 11280 }, { "epoch": 3.18, "learning_rate": 6.357604723081248e-05, "loss": 0.1385, "step": 11310 }, { "epoch": 3.19, "learning_rate": 6.374472870396402e-05, "loss": 0.147, "step": 11340 }, { "epoch": 3.2, "learning_rate": 6.391341017711555e-05, "loss": 0.1579, "step": 11370 }, { "epoch": 3.2, "learning_rate": 6.408209165026709e-05, "loss": 0.1411, "step": 11400 }, { "epoch": 3.21, "learning_rate": 6.425077312341861e-05, "loss": 0.1604, "step": 11430 }, { "epoch": 3.22, "learning_rate": 6.441945459657015e-05, "loss": 0.1443, "step": 11460 }, { "epoch": 3.23, "learning_rate": 6.458813606972168e-05, "loss": 0.1461, "step": 11490 }, { "epoch": 3.24, "learning_rate": 6.475681754287322e-05, "loss": 0.1501, "step": 11520 }, { "epoch": 3.25, "learning_rate": 6.492549901602474e-05, "loss": 0.1332, "step": 11550 }, { "epoch": 3.26, "learning_rate": 6.509418048917627e-05, "loss": 0.1569, "step": 11580 }, { "epoch": 3.26, "learning_rate": 6.526286196232781e-05, "loss": 0.1349, "step": 11610 }, { "epoch": 3.27, "learning_rate": 6.543154343547933e-05, "loss": 0.1458, "step": 11640 }, { "epoch": 3.28, "learning_rate": 6.560022490863087e-05, "loss": 0.1578, "step": 11670 }, { "epoch": 3.29, "learning_rate": 6.57689063817824e-05, "loss": 0.1379, "step": 11700 }, { "epoch": 3.3, "learning_rate": 6.593758785493394e-05, "loss": 0.1585, "step": 11730 }, { "epoch": 3.31, "learning_rate": 6.610626932808546e-05, "loss": 0.138, "step": 11760 }, { "epoch": 3.31, "learning_rate": 6.6274950801237e-05, "loss": 0.1526, "step": 11790 }, { "epoch": 3.32, "learning_rate": 6.644363227438854e-05, "loss": 0.157, "step": 11820 }, { "epoch": 3.33, "learning_rate": 6.661231374754007e-05, "loss": 0.1379, "step": 11850 }, { "epoch": 3.34, "learning_rate": 6.67809952206916e-05, "loss": 0.1561, "step": 11880 }, { "epoch": 3.35, "learning_rate": 6.694967669384313e-05, "loss": 0.1351, "step": 11910 }, { "epoch": 3.36, "learning_rate": 6.711835816699467e-05, "loss": 0.1455, "step": 11940 }, { "epoch": 3.37, "learning_rate": 6.72870396401462e-05, "loss": 0.1473, "step": 11970 }, { "epoch": 3.37, "learning_rate": 6.745572111329772e-05, "loss": 0.1342, "step": 12000 }, { "epoch": 3.38, "learning_rate": 6.762440258644926e-05, "loss": 0.1529, "step": 12030 }, { "epoch": 3.39, "learning_rate": 6.779308405960078e-05, "loss": 0.138, "step": 12060 }, { "epoch": 3.4, "learning_rate": 6.796176553275232e-05, "loss": 0.1462, "step": 12090 }, { "epoch": 3.41, "learning_rate": 6.813044700590385e-05, "loss": 0.1569, "step": 12120 }, { "epoch": 3.42, "learning_rate": 6.829912847905539e-05, "loss": 0.1276, "step": 12150 }, { "epoch": 3.42, "learning_rate": 6.846780995220691e-05, "loss": 0.1538, "step": 12180 }, { "epoch": 3.43, "learning_rate": 6.863649142535845e-05, "loss": 0.1323, "step": 12210 }, { "epoch": 3.44, "learning_rate": 6.880517289850998e-05, "loss": 0.1457, "step": 12240 }, { "epoch": 3.45, "learning_rate": 6.897385437166152e-05, "loss": 0.1473, "step": 12270 }, { "epoch": 3.46, "learning_rate": 6.914253584481306e-05, "loss": 0.14, "step": 12300 }, { "epoch": 3.47, "learning_rate": 6.931121731796458e-05, "loss": 0.1591, "step": 12330 }, { "epoch": 3.47, "learning_rate": 6.947989879111612e-05, "loss": 0.1314, "step": 12360 }, { "epoch": 3.48, "learning_rate": 6.964858026426765e-05, "loss": 0.1424, "step": 12390 }, { "epoch": 3.49, "learning_rate": 6.981726173741919e-05, "loss": 0.1491, "step": 12420 }, { "epoch": 3.5, "learning_rate": 6.99859432105707e-05, "loss": 0.1307, "step": 12450 }, { "epoch": 3.51, "learning_rate": 7.015462468372224e-05, "loss": 0.1511, "step": 12480 }, { "epoch": 3.52, "learning_rate": 7.032330615687378e-05, "loss": 0.1432, "step": 12510 }, { "epoch": 3.53, "learning_rate": 7.04919876300253e-05, "loss": 0.152, "step": 12540 }, { "epoch": 3.53, "learning_rate": 7.066066910317684e-05, "loss": 0.1535, "step": 12570 }, { "epoch": 3.54, "learning_rate": 7.082935057632837e-05, "loss": 0.1311, "step": 12600 }, { "epoch": 3.55, "learning_rate": 7.09980320494799e-05, "loss": 0.1493, "step": 12630 }, { "epoch": 3.56, "learning_rate": 7.116671352263143e-05, "loss": 0.1343, "step": 12660 }, { "epoch": 3.57, "learning_rate": 7.133539499578297e-05, "loss": 0.1404, "step": 12690 }, { "epoch": 3.58, "learning_rate": 7.15040764689345e-05, "loss": 0.1464, "step": 12720 }, { "epoch": 3.58, "learning_rate": 7.167275794208603e-05, "loss": 0.1255, "step": 12750 }, { "epoch": 3.59, "learning_rate": 7.184143941523756e-05, "loss": 0.1548, "step": 12780 }, { "epoch": 3.6, "learning_rate": 7.20101208883891e-05, "loss": 0.1306, "step": 12810 }, { "epoch": 3.61, "learning_rate": 7.217880236154064e-05, "loss": 0.144, "step": 12840 }, { "epoch": 3.62, "learning_rate": 7.234748383469216e-05, "loss": 0.1428, "step": 12870 }, { "epoch": 3.63, "learning_rate": 7.251616530784369e-05, "loss": 0.132, "step": 12900 }, { "epoch": 3.63, "learning_rate": 7.268484678099521e-05, "loss": 0.146, "step": 12930 }, { "epoch": 3.64, "learning_rate": 7.285352825414675e-05, "loss": 0.135, "step": 12960 }, { "epoch": 3.65, "learning_rate": 7.302220972729828e-05, "loss": 0.1459, "step": 12990 }, { "epoch": 3.66, "learning_rate": 7.319089120044982e-05, "loss": 0.1482, "step": 13020 }, { "epoch": 3.67, "learning_rate": 7.335957267360136e-05, "loss": 0.1349, "step": 13050 }, { "epoch": 3.68, "learning_rate": 7.352825414675288e-05, "loss": 0.1419, "step": 13080 }, { "epoch": 3.69, "learning_rate": 7.369693561990442e-05, "loss": 0.137, "step": 13110 }, { "epoch": 3.69, "learning_rate": 7.386561709305595e-05, "loss": 0.1477, "step": 13140 }, { "epoch": 3.7, "learning_rate": 7.403429856620749e-05, "loss": 0.1484, "step": 13170 }, { "epoch": 3.71, "learning_rate": 7.419735732358729e-05, "loss": 0.1337, "step": 13200 }, { "epoch": 3.72, "learning_rate": 7.436603879673882e-05, "loss": 0.1481, "step": 13230 }, { "epoch": 3.73, "learning_rate": 7.453472026989036e-05, "loss": 0.1271, "step": 13260 }, { "epoch": 3.74, "learning_rate": 7.470340174304189e-05, "loss": 0.1405, "step": 13290 }, { "epoch": 3.74, "learning_rate": 7.487208321619343e-05, "loss": 0.1385, "step": 13320 }, { "epoch": 3.75, "learning_rate": 7.504076468934495e-05, "loss": 0.1286, "step": 13350 }, { "epoch": 3.76, "learning_rate": 7.520944616249649e-05, "loss": 0.1471, "step": 13380 }, { "epoch": 3.77, "learning_rate": 7.537812763564802e-05, "loss": 0.1327, "step": 13410 }, { "epoch": 3.78, "learning_rate": 7.554680910879956e-05, "loss": 0.1433, "step": 13440 }, { "epoch": 3.79, "learning_rate": 7.571549058195108e-05, "loss": 0.1452, "step": 13470 }, { "epoch": 3.8, "learning_rate": 7.588417205510262e-05, "loss": 0.1322, "step": 13500 }, { "epoch": 3.8, "learning_rate": 7.605285352825415e-05, "loss": 0.1502, "step": 13530 }, { "epoch": 3.81, "learning_rate": 7.622153500140569e-05, "loss": 0.1287, "step": 13560 }, { "epoch": 3.82, "learning_rate": 7.639021647455723e-05, "loss": 0.1398, "step": 13590 }, { "epoch": 3.83, "learning_rate": 7.655889794770875e-05, "loss": 0.151, "step": 13620 }, { "epoch": 3.84, "learning_rate": 7.672757942086028e-05, "loss": 0.1299, "step": 13650 }, { "epoch": 3.85, "learning_rate": 7.68962608940118e-05, "loss": 0.1452, "step": 13680 }, { "epoch": 3.85, "learning_rate": 7.706494236716334e-05, "loss": 0.1324, "step": 13710 }, { "epoch": 3.86, "learning_rate": 7.723362384031487e-05, "loss": 0.1426, "step": 13740 }, { "epoch": 3.87, "learning_rate": 7.74023053134664e-05, "loss": 0.1505, "step": 13770 }, { "epoch": 3.88, "learning_rate": 7.757098678661794e-05, "loss": 0.1359, "step": 13800 }, { "epoch": 3.89, "learning_rate": 7.773966825976947e-05, "loss": 0.1563, "step": 13830 }, { "epoch": 3.9, "learning_rate": 7.790834973292101e-05, "loss": 0.1286, "step": 13860 }, { "epoch": 3.9, "learning_rate": 7.807703120607253e-05, "loss": 0.1375, "step": 13890 }, { "epoch": 3.91, "learning_rate": 7.824571267922407e-05, "loss": 0.1508, "step": 13920 }, { "epoch": 3.92, "learning_rate": 7.84143941523756e-05, "loss": 0.1322, "step": 13950 }, { "epoch": 3.93, "learning_rate": 7.858307562552714e-05, "loss": 0.1438, "step": 13980 }, { "epoch": 3.94, "learning_rate": 7.875175709867866e-05, "loss": 0.1308, "step": 14010 }, { "epoch": 3.95, "learning_rate": 7.89204385718302e-05, "loss": 0.1372, "step": 14040 }, { "epoch": 3.96, "learning_rate": 7.908912004498173e-05, "loss": 0.1504, "step": 14070 }, { "epoch": 3.96, "learning_rate": 7.925780151813325e-05, "loss": 0.1307, "step": 14100 }, { "epoch": 3.97, "learning_rate": 7.942648299128479e-05, "loss": 0.141, "step": 14130 }, { "epoch": 3.98, "learning_rate": 7.959516446443632e-05, "loss": 0.1327, "step": 14160 }, { "epoch": 3.99, "learning_rate": 7.976384593758786e-05, "loss": 0.1374, "step": 14190 }, { "epoch": 4.0, "learning_rate": 7.993252741073938e-05, "loss": 0.1436, "step": 14220 }, { "epoch": 4.0, "eval_loss": 0.13012589514255524, "eval_runtime": 625.1324, "eval_samples_per_second": 25.647, "eval_steps_per_second": 0.803, "eval_wer": 0.12817818295961678, "step": 14228 }, { "epoch": 4.01, "learning_rate": 8.010120888389092e-05, "loss": 0.1245, "step": 14250 }, { "epoch": 4.01, "learning_rate": 8.026989035704246e-05, "loss": 0.1439, "step": 14280 }, { "epoch": 4.02, "learning_rate": 8.043857183019399e-05, "loss": 0.1188, "step": 14310 }, { "epoch": 4.03, "learning_rate": 8.060725330334553e-05, "loss": 0.1393, "step": 14340 }, { "epoch": 4.04, "learning_rate": 8.077593477649705e-05, "loss": 0.1295, "step": 14370 }, { "epoch": 4.05, "learning_rate": 8.094461624964859e-05, "loss": 0.1367, "step": 14400 }, { "epoch": 4.06, "learning_rate": 8.111329772280012e-05, "loss": 0.1476, "step": 14430 }, { "epoch": 4.07, "learning_rate": 8.128197919595165e-05, "loss": 0.1218, "step": 14460 }, { "epoch": 4.07, "learning_rate": 8.145066066910318e-05, "loss": 0.1414, "step": 14490 }, { "epoch": 4.08, "learning_rate": 8.161934214225472e-05, "loss": 0.1294, "step": 14520 }, { "epoch": 4.09, "learning_rate": 8.178802361540624e-05, "loss": 0.1356, "step": 14550 }, { "epoch": 4.1, "learning_rate": 8.195670508855777e-05, "loss": 0.1385, "step": 14580 }, { "epoch": 4.11, "learning_rate": 8.212538656170931e-05, "loss": 0.1148, "step": 14610 }, { "epoch": 4.12, "learning_rate": 8.229406803486083e-05, "loss": 0.143, "step": 14640 }, { "epoch": 4.12, "learning_rate": 8.246274950801237e-05, "loss": 0.1218, "step": 14670 }, { "epoch": 4.13, "learning_rate": 8.26314309811639e-05, "loss": 0.1396, "step": 14700 }, { "epoch": 4.14, "learning_rate": 8.280011245431544e-05, "loss": 0.1485, "step": 14730 }, { "epoch": 4.15, "learning_rate": 8.296879392746696e-05, "loss": 0.1223, "step": 14760 }, { "epoch": 4.16, "learning_rate": 8.31374754006185e-05, "loss": 0.1386, "step": 14790 }, { "epoch": 4.17, "learning_rate": 8.330615687377004e-05, "loss": 0.1233, "step": 14820 }, { "epoch": 4.17, "learning_rate": 8.347483834692157e-05, "loss": 0.1244, "step": 14850 }, { "epoch": 4.18, "learning_rate": 8.36435198200731e-05, "loss": 0.1429, "step": 14880 }, { "epoch": 4.19, "learning_rate": 8.381220129322463e-05, "loss": 0.1153, "step": 14910 }, { "epoch": 4.2, "learning_rate": 8.398088276637617e-05, "loss": 0.1345, "step": 14940 }, { "epoch": 4.21, "learning_rate": 8.41495642395277e-05, "loss": 0.1261, "step": 14970 }, { "epoch": 4.22, "learning_rate": 8.431824571267924e-05, "loss": 0.1281, "step": 15000 }, { "epoch": 4.23, "learning_rate": 8.448692718583076e-05, "loss": 0.1434, "step": 15030 }, { "epoch": 4.23, "learning_rate": 8.465560865898229e-05, "loss": 0.1189, "step": 15060 }, { "epoch": 4.24, "learning_rate": 8.482429013213383e-05, "loss": 0.1377, "step": 15090 }, { "epoch": 4.25, "learning_rate": 8.499297160528535e-05, "loss": 0.1259, "step": 15120 }, { "epoch": 4.26, "learning_rate": 8.516165307843689e-05, "loss": 0.1236, "step": 15150 }, { "epoch": 4.27, "learning_rate": 8.533033455158842e-05, "loss": 0.1369, "step": 15180 }, { "epoch": 4.28, "learning_rate": 8.549901602473995e-05, "loss": 0.1149, "step": 15210 }, { "epoch": 4.28, "learning_rate": 8.566769749789148e-05, "loss": 0.1368, "step": 15240 }, { "epoch": 4.29, "learning_rate": 8.583637897104302e-05, "loss": 0.1288, "step": 15270 }, { "epoch": 4.3, "learning_rate": 8.600506044419455e-05, "loss": 0.1219, "step": 15300 }, { "epoch": 4.31, "learning_rate": 8.617374191734608e-05, "loss": 0.139, "step": 15330 }, { "epoch": 4.32, "learning_rate": 8.634242339049762e-05, "loss": 0.116, "step": 15360 }, { "epoch": 4.33, "learning_rate": 8.651110486364915e-05, "loss": 0.1371, "step": 15390 }, { "epoch": 4.34, "learning_rate": 8.667978633680069e-05, "loss": 0.1161, "step": 15420 }, { "epoch": 4.34, "learning_rate": 8.684846780995221e-05, "loss": 0.1289, "step": 15450 }, { "epoch": 4.35, "learning_rate": 8.701714928310374e-05, "loss": 0.1379, "step": 15480 }, { "epoch": 4.36, "learning_rate": 8.718583075625528e-05, "loss": 0.1205, "step": 15510 }, { "epoch": 4.37, "learning_rate": 8.73545122294068e-05, "loss": 0.1332, "step": 15540 }, { "epoch": 4.38, "learning_rate": 8.752319370255834e-05, "loss": 0.1217, "step": 15570 }, { "epoch": 4.39, "learning_rate": 8.769187517570987e-05, "loss": 0.1257, "step": 15600 }, { "epoch": 4.39, "learning_rate": 8.786055664886141e-05, "loss": 0.1427, "step": 15630 }, { "epoch": 4.4, "learning_rate": 8.802923812201293e-05, "loss": 0.1179, "step": 15660 }, { "epoch": 4.41, "learning_rate": 8.819791959516447e-05, "loss": 0.1446, "step": 15690 }, { "epoch": 4.42, "learning_rate": 8.8366601068316e-05, "loss": 0.1253, "step": 15720 }, { "epoch": 4.43, "learning_rate": 8.853528254146754e-05, "loss": 0.1275, "step": 15750 }, { "epoch": 4.44, "learning_rate": 8.870396401461906e-05, "loss": 0.145, "step": 15780 }, { "epoch": 4.44, "learning_rate": 8.88726454877706e-05, "loss": 0.115, "step": 15810 }, { "epoch": 4.45, "learning_rate": 8.904132696092214e-05, "loss": 0.1337, "step": 15840 }, { "epoch": 4.46, "learning_rate": 8.921000843407367e-05, "loss": 0.1186, "step": 15870 }, { "epoch": 4.47, "learning_rate": 8.93786899072252e-05, "loss": 0.1335, "step": 15900 }, { "epoch": 4.48, "learning_rate": 8.954737138037672e-05, "loss": 0.1424, "step": 15930 }, { "epoch": 4.49, "learning_rate": 8.971605285352826e-05, "loss": 0.1137, "step": 15960 }, { "epoch": 4.5, "learning_rate": 8.988473432667978e-05, "loss": 0.1335, "step": 15990 }, { "epoch": 4.5, "learning_rate": 9.005341579983132e-05, "loss": 0.1251, "step": 16020 }, { "epoch": 4.51, "learning_rate": 9.022209727298286e-05, "loss": 0.1289, "step": 16050 }, { "epoch": 4.52, "learning_rate": 9.039077874613438e-05, "loss": 0.1452, "step": 16080 }, { "epoch": 4.53, "learning_rate": 9.055946021928592e-05, "loss": 0.1185, "step": 16110 }, { "epoch": 4.54, "learning_rate": 9.072814169243745e-05, "loss": 0.1337, "step": 16140 }, { "epoch": 4.55, "learning_rate": 9.089682316558899e-05, "loss": 0.1189, "step": 16170 }, { "epoch": 4.55, "learning_rate": 9.10598819229688e-05, "loss": 0.1336, "step": 16200 }, { "epoch": 4.56, "learning_rate": 9.122856339612033e-05, "loss": 0.1361, "step": 16230 }, { "epoch": 4.57, "learning_rate": 9.139724486927187e-05, "loss": 0.1131, "step": 16260 }, { "epoch": 4.58, "learning_rate": 9.156592634242339e-05, "loss": 0.1351, "step": 16290 }, { "epoch": 4.59, "learning_rate": 9.173460781557493e-05, "loss": 0.1209, "step": 16320 }, { "epoch": 4.6, "learning_rate": 9.190328928872646e-05, "loss": 0.1382, "step": 16350 }, { "epoch": 4.6, "learning_rate": 9.2071970761878e-05, "loss": 0.1471, "step": 16380 }, { "epoch": 4.61, "learning_rate": 9.224065223502952e-05, "loss": 0.1148, "step": 16410 }, { "epoch": 4.62, "learning_rate": 9.240933370818106e-05, "loss": 0.1442, "step": 16440 }, { "epoch": 4.63, "learning_rate": 9.257801518133258e-05, "loss": 0.1244, "step": 16470 }, { "epoch": 4.64, "learning_rate": 9.274669665448412e-05, "loss": 0.1324, "step": 16500 }, { "epoch": 4.65, "learning_rate": 9.291537812763565e-05, "loss": 0.1369, "step": 16530 }, { "epoch": 4.66, "learning_rate": 9.308405960078719e-05, "loss": 0.1125, "step": 16560 }, { "epoch": 4.66, "learning_rate": 9.325274107393873e-05, "loss": 0.1342, "step": 16590 }, { "epoch": 4.67, "learning_rate": 9.342142254709025e-05, "loss": 0.1169, "step": 16620 }, { "epoch": 4.68, "learning_rate": 9.359010402024179e-05, "loss": 0.131, "step": 16650 }, { "epoch": 4.69, "learning_rate": 9.37587854933933e-05, "loss": 0.1433, "step": 16680 }, { "epoch": 4.7, "learning_rate": 9.392746696654484e-05, "loss": 0.1083, "step": 16710 }, { "epoch": 4.71, "learning_rate": 9.409614843969637e-05, "loss": 0.141, "step": 16740 }, { "epoch": 4.71, "learning_rate": 9.426482991284791e-05, "loss": 0.1252, "step": 16770 }, { "epoch": 4.72, "learning_rate": 9.443351138599945e-05, "loss": 0.1307, "step": 16800 }, { "epoch": 4.73, "learning_rate": 9.460219285915097e-05, "loss": 0.1423, "step": 16830 }, { "epoch": 4.74, "learning_rate": 9.477087433230251e-05, "loss": 0.1153, "step": 16860 }, { "epoch": 4.75, "learning_rate": 9.493955580545404e-05, "loss": 0.1344, "step": 16890 }, { "epoch": 4.76, "learning_rate": 9.510823727860558e-05, "loss": 0.1187, "step": 16920 }, { "epoch": 4.77, "learning_rate": 9.52769187517571e-05, "loss": 0.1296, "step": 16950 }, { "epoch": 4.77, "learning_rate": 9.544560022490864e-05, "loss": 0.1412, "step": 16980 }, { "epoch": 4.78, "learning_rate": 9.561428169806017e-05, "loss": 0.117, "step": 17010 }, { "epoch": 4.79, "learning_rate": 9.57829631712117e-05, "loss": 0.1399, "step": 17040 }, { "epoch": 4.8, "learning_rate": 9.595164464436323e-05, "loss": 0.1281, "step": 17070 }, { "epoch": 4.81, "learning_rate": 9.612032611751477e-05, "loss": 0.1314, "step": 17100 }, { "epoch": 4.82, "learning_rate": 9.62890075906663e-05, "loss": 0.1426, "step": 17130 }, { "epoch": 4.82, "learning_rate": 9.645768906381782e-05, "loss": 0.1215, "step": 17160 }, { "epoch": 4.83, "learning_rate": 9.662637053696936e-05, "loss": 0.1377, "step": 17190 }, { "epoch": 4.84, "learning_rate": 9.679505201012088e-05, "loss": 0.1169, "step": 17220 }, { "epoch": 4.85, "learning_rate": 9.696373348327242e-05, "loss": 0.1264, "step": 17250 }, { "epoch": 4.86, "learning_rate": 9.713241495642396e-05, "loss": 0.1354, "step": 17280 }, { "epoch": 4.87, "learning_rate": 9.730109642957549e-05, "loss": 0.1142, "step": 17310 }, { "epoch": 4.87, "learning_rate": 9.746977790272703e-05, "loss": 0.1394, "step": 17340 }, { "epoch": 4.88, "learning_rate": 9.763845937587855e-05, "loss": 0.1206, "step": 17370 }, { "epoch": 4.89, "learning_rate": 9.780714084903009e-05, "loss": 0.1298, "step": 17400 }, { "epoch": 4.9, "learning_rate": 9.797582232218162e-05, "loss": 0.1363, "step": 17430 }, { "epoch": 4.91, "learning_rate": 9.814450379533316e-05, "loss": 0.1116, "step": 17460 }, { "epoch": 4.92, "learning_rate": 9.831318526848468e-05, "loss": 0.1366, "step": 17490 }, { "epoch": 4.93, "learning_rate": 9.848186674163622e-05, "loss": 0.1215, "step": 17520 }, { "epoch": 4.93, "learning_rate": 9.865054821478775e-05, "loss": 0.1261, "step": 17550 }, { "epoch": 4.94, "learning_rate": 9.881922968793927e-05, "loss": 0.1375, "step": 17580 }, { "epoch": 4.95, "learning_rate": 9.898791116109081e-05, "loss": 0.117, "step": 17610 }, { "epoch": 4.96, "learning_rate": 9.915096991847062e-05, "loss": 0.1364, "step": 17640 }, { "epoch": 4.97, "learning_rate": 9.931965139162216e-05, "loss": 0.122, "step": 17670 }, { "epoch": 4.98, "learning_rate": 9.948833286477369e-05, "loss": 0.1229, "step": 17700 }, { "epoch": 4.98, "learning_rate": 9.965701433792523e-05, "loss": 0.1445, "step": 17730 }, { "epoch": 4.99, "learning_rate": 9.982569581107675e-05, "loss": 0.1144, "step": 17760 }, { "epoch": 5.0, "eval_loss": 0.12248270958662033, "eval_runtime": 627.1117, "eval_samples_per_second": 25.566, "eval_steps_per_second": 0.8, "eval_wer": 0.12450015694730665, "step": 17785 }, { "epoch": 5.0, "learning_rate": 9.999437728422829e-05, "loss": 0.1411, "step": 17790 }, { "epoch": 5.01, "learning_rate": 9.998188236029113e-05, "loss": 0.1146, "step": 17820 }, { "epoch": 5.02, "learning_rate": 9.996313997438541e-05, "loss": 0.1221, "step": 17850 }, { "epoch": 5.03, "learning_rate": 9.99443975884797e-05, "loss": 0.1168, "step": 17880 }, { "epoch": 5.04, "learning_rate": 9.992565520257396e-05, "loss": 0.1176, "step": 17910 }, { "epoch": 5.04, "learning_rate": 9.990691281666823e-05, "loss": 0.1309, "step": 17940 }, { "epoch": 5.05, "learning_rate": 9.988817043076251e-05, "loss": 0.1072, "step": 17970 }, { "epoch": 5.06, "learning_rate": 9.986942804485678e-05, "loss": 0.1279, "step": 18000 }, { "epoch": 5.07, "learning_rate": 9.985068565895106e-05, "loss": 0.1234, "step": 18030 }, { "epoch": 5.08, "learning_rate": 9.983194327304533e-05, "loss": 0.121, "step": 18060 }, { "epoch": 5.09, "learning_rate": 9.98132008871396e-05, "loss": 0.1344, "step": 18090 }, { "epoch": 5.09, "learning_rate": 9.979445850123387e-05, "loss": 0.1082, "step": 18120 }, { "epoch": 5.1, "learning_rate": 9.977571611532816e-05, "loss": 0.1277, "step": 18150 }, { "epoch": 5.11, "learning_rate": 9.975697372942244e-05, "loss": 0.1176, "step": 18180 }, { "epoch": 5.12, "learning_rate": 9.97382313435167e-05, "loss": 0.1147, "step": 18210 }, { "epoch": 5.13, "learning_rate": 9.971948895761097e-05, "loss": 0.1317, "step": 18240 }, { "epoch": 5.14, "learning_rate": 9.970074657170525e-05, "loss": 0.1043, "step": 18270 }, { "epoch": 5.14, "learning_rate": 9.968200418579953e-05, "loss": 0.1252, "step": 18300 }, { "epoch": 5.15, "learning_rate": 9.96632617998938e-05, "loss": 0.1184, "step": 18330 }, { "epoch": 5.16, "learning_rate": 9.964451941398807e-05, "loss": 0.1156, "step": 18360 }, { "epoch": 5.17, "learning_rate": 9.962577702808235e-05, "loss": 0.1261, "step": 18390 }, { "epoch": 5.18, "learning_rate": 9.960703464217662e-05, "loss": 0.1075, "step": 18420 }, { "epoch": 5.19, "learning_rate": 9.95882922562709e-05, "loss": 0.1218, "step": 18450 }, { "epoch": 5.2, "learning_rate": 9.956954987036516e-05, "loss": 0.1193, "step": 18480 }, { "epoch": 5.2, "learning_rate": 9.955080748445945e-05, "loss": 0.1216, "step": 18510 }, { "epoch": 5.21, "learning_rate": 9.953206509855371e-05, "loss": 0.1381, "step": 18540 }, { "epoch": 5.22, "learning_rate": 9.9513322712648e-05, "loss": 0.1051, "step": 18570 }, { "epoch": 5.23, "learning_rate": 9.949458032674227e-05, "loss": 0.1266, "step": 18600 }, { "epoch": 5.24, "learning_rate": 9.947583794083654e-05, "loss": 0.1243, "step": 18630 }, { "epoch": 5.25, "learning_rate": 9.945709555493081e-05, "loss": 0.1207, "step": 18660 }, { "epoch": 5.25, "learning_rate": 9.943835316902509e-05, "loss": 0.1342, "step": 18690 }, { "epoch": 5.26, "learning_rate": 9.941961078311937e-05, "loss": 0.1095, "step": 18720 }, { "epoch": 5.27, "learning_rate": 9.940086839721363e-05, "loss": 0.1304, "step": 18750 }, { "epoch": 5.28, "learning_rate": 9.93821260113079e-05, "loss": 0.1147, "step": 18780 }, { "epoch": 5.29, "learning_rate": 9.936338362540219e-05, "loss": 0.1176, "step": 18810 }, { "epoch": 5.3, "learning_rate": 9.934464123949645e-05, "loss": 0.129, "step": 18840 }, { "epoch": 5.3, "learning_rate": 9.932589885359074e-05, "loss": 0.103, "step": 18870 }, { "epoch": 5.31, "learning_rate": 9.9307156467685e-05, "loss": 0.1184, "step": 18900 }, { "epoch": 5.32, "learning_rate": 9.928841408177928e-05, "loss": 0.1172, "step": 18930 }, { "epoch": 5.33, "learning_rate": 9.926967169587355e-05, "loss": 0.1195, "step": 18960 }, { "epoch": 5.34, "learning_rate": 9.925092930996783e-05, "loss": 0.126, "step": 18990 }, { "epoch": 5.35, "learning_rate": 9.923218692406211e-05, "loss": 0.1127, "step": 19020 }, { "epoch": 5.36, "learning_rate": 9.921344453815638e-05, "loss": 0.1259, "step": 19050 }, { "epoch": 5.36, "learning_rate": 9.919470215225065e-05, "loss": 0.1195, "step": 19080 }, { "epoch": 5.37, "learning_rate": 9.917595976634493e-05, "loss": 0.1089, "step": 19110 }, { "epoch": 5.38, "learning_rate": 9.915721738043921e-05, "loss": 0.1389, "step": 19140 }, { "epoch": 5.39, "learning_rate": 9.913847499453346e-05, "loss": 0.1102, "step": 19170 }, { "epoch": 5.4, "learning_rate": 9.911973260862774e-05, "loss": 0.1206, "step": 19200 }, { "epoch": 5.41, "learning_rate": 9.910099022272203e-05, "loss": 0.1193, "step": 19230 }, { "epoch": 5.41, "learning_rate": 9.90822478368163e-05, "loss": 0.1218, "step": 19260 }, { "epoch": 5.42, "learning_rate": 9.906350545091057e-05, "loss": 0.1265, "step": 19290 }, { "epoch": 5.43, "learning_rate": 9.904476306500484e-05, "loss": 0.1105, "step": 19320 }, { "epoch": 5.44, "learning_rate": 9.902602067909912e-05, "loss": 0.1318, "step": 19350 }, { "epoch": 5.45, "learning_rate": 9.900727829319339e-05, "loss": 0.121, "step": 19380 }, { "epoch": 5.46, "learning_rate": 9.898853590728767e-05, "loss": 0.1148, "step": 19410 }, { "epoch": 5.47, "learning_rate": 9.896979352138195e-05, "loss": 0.1305, "step": 19440 }, { "epoch": 5.47, "learning_rate": 9.895105113547622e-05, "loss": 0.1039, "step": 19470 }, { "epoch": 5.48, "learning_rate": 9.893230874957049e-05, "loss": 0.1283, "step": 19500 }, { "epoch": 5.49, "learning_rate": 9.891356636366477e-05, "loss": 0.1151, "step": 19530 }, { "epoch": 5.5, "learning_rate": 9.889482397775905e-05, "loss": 0.121, "step": 19560 }, { "epoch": 5.51, "learning_rate": 9.88760815918533e-05, "loss": 0.1295, "step": 19590 }, { "epoch": 5.52, "learning_rate": 9.885733920594758e-05, "loss": 0.1097, "step": 19620 }, { "epoch": 5.52, "learning_rate": 9.883922156623871e-05, "loss": 0.1259, "step": 19650 }, { "epoch": 5.53, "learning_rate": 9.882047918033299e-05, "loss": 0.1212, "step": 19680 }, { "epoch": 5.54, "learning_rate": 9.880173679442727e-05, "loss": 0.1193, "step": 19710 }, { "epoch": 5.55, "learning_rate": 9.878299440852154e-05, "loss": 0.1309, "step": 19740 }, { "epoch": 5.56, "learning_rate": 9.876425202261582e-05, "loss": 0.1048, "step": 19770 }, { "epoch": 5.57, "learning_rate": 9.874550963671009e-05, "loss": 0.1282, "step": 19800 }, { "epoch": 5.57, "learning_rate": 9.872676725080437e-05, "loss": 0.1152, "step": 19830 }, { "epoch": 5.58, "learning_rate": 9.870802486489864e-05, "loss": 0.1177, "step": 19860 }, { "epoch": 5.59, "learning_rate": 9.868928247899292e-05, "loss": 0.1279, "step": 19890 }, { "epoch": 5.6, "learning_rate": 9.867054009308719e-05, "loss": 0.1092, "step": 19920 }, { "epoch": 5.61, "learning_rate": 9.865179770718145e-05, "loss": 0.1178, "step": 19950 }, { "epoch": 5.62, "learning_rate": 9.863305532127573e-05, "loss": 0.1149, "step": 19980 }, { "epoch": 5.63, "learning_rate": 9.861431293537001e-05, "loss": 0.1173, "step": 20010 }, { "epoch": 5.63, "learning_rate": 9.859557054946428e-05, "loss": 0.1246, "step": 20040 }, { "epoch": 5.64, "learning_rate": 9.857682816355855e-05, "loss": 0.1084, "step": 20070 }, { "epoch": 5.65, "learning_rate": 9.855808577765283e-05, "loss": 0.125, "step": 20100 }, { "epoch": 5.66, "learning_rate": 9.853934339174711e-05, "loss": 0.1209, "step": 20130 }, { "epoch": 5.67, "learning_rate": 9.852060100584138e-05, "loss": 0.1118, "step": 20160 }, { "epoch": 5.68, "learning_rate": 9.850185861993566e-05, "loss": 0.1235, "step": 20190 }, { "epoch": 5.68, "learning_rate": 9.848311623402993e-05, "loss": 0.1085, "step": 20220 }, { "epoch": 5.69, "learning_rate": 9.846437384812421e-05, "loss": 0.1163, "step": 20250 }, { "epoch": 5.7, "learning_rate": 9.844563146221848e-05, "loss": 0.1152, "step": 20280 }, { "epoch": 5.71, "learning_rate": 9.842688907631276e-05, "loss": 0.1136, "step": 20310 }, { "epoch": 5.72, "learning_rate": 9.840814669040702e-05, "loss": 0.1284, "step": 20340 }, { "epoch": 5.73, "learning_rate": 9.838940430450129e-05, "loss": 0.1105, "step": 20370 }, { "epoch": 5.74, "learning_rate": 9.837066191859557e-05, "loss": 0.1203, "step": 20400 }, { "epoch": 5.74, "learning_rate": 9.835191953268985e-05, "loss": 0.1209, "step": 20430 }, { "epoch": 5.75, "learning_rate": 9.833317714678413e-05, "loss": 0.1164, "step": 20460 }, { "epoch": 5.76, "learning_rate": 9.831443476087839e-05, "loss": 0.1279, "step": 20490 }, { "epoch": 5.77, "learning_rate": 9.829569237497267e-05, "loss": 0.1042, "step": 20520 }, { "epoch": 5.78, "learning_rate": 9.827694998906695e-05, "loss": 0.1151, "step": 20550 }, { "epoch": 5.79, "learning_rate": 9.825820760316122e-05, "loss": 0.1168, "step": 20580 }, { "epoch": 5.79, "learning_rate": 9.82394652172555e-05, "loss": 0.1163, "step": 20610 }, { "epoch": 5.8, "learning_rate": 9.822072283134977e-05, "loss": 0.1276, "step": 20640 }, { "epoch": 5.81, "learning_rate": 9.820198044544405e-05, "loss": 0.1113, "step": 20670 }, { "epoch": 5.82, "learning_rate": 9.818323805953831e-05, "loss": 0.1254, "step": 20700 }, { "epoch": 5.83, "learning_rate": 9.81644956736326e-05, "loss": 0.1181, "step": 20730 }, { "epoch": 5.84, "learning_rate": 9.814575328772686e-05, "loss": 0.1087, "step": 20760 }, { "epoch": 5.84, "learning_rate": 9.812701090182113e-05, "loss": 0.128, "step": 20790 }, { "epoch": 5.85, "learning_rate": 9.810826851591541e-05, "loss": 0.1078, "step": 20820 }, { "epoch": 5.86, "learning_rate": 9.808952613000969e-05, "loss": 0.1185, "step": 20850 }, { "epoch": 5.87, "learning_rate": 9.807078374410397e-05, "loss": 0.1132, "step": 20880 }, { "epoch": 5.88, "learning_rate": 9.805204135819823e-05, "loss": 0.1106, "step": 20910 }, { "epoch": 5.89, "learning_rate": 9.803329897229251e-05, "loss": 0.133, "step": 20940 }, { "epoch": 5.9, "learning_rate": 9.801455658638679e-05, "loss": 0.1055, "step": 20970 }, { "epoch": 5.9, "learning_rate": 9.799581420048106e-05, "loss": 0.1229, "step": 21000 }, { "epoch": 5.91, "learning_rate": 9.797707181457534e-05, "loss": 0.1156, "step": 21030 }, { "epoch": 5.92, "learning_rate": 9.79583294286696e-05, "loss": 0.1154, "step": 21060 }, { "epoch": 5.93, "learning_rate": 9.793958704276389e-05, "loss": 0.1361, "step": 21090 }, { "epoch": 5.94, "learning_rate": 9.792084465685815e-05, "loss": 0.1038, "step": 21120 }, { "epoch": 5.95, "learning_rate": 9.790210227095243e-05, "loss": 0.1232, "step": 21150 }, { "epoch": 5.95, "learning_rate": 9.78833598850467e-05, "loss": 0.1156, "step": 21180 }, { "epoch": 5.96, "learning_rate": 9.786461749914098e-05, "loss": 0.1133, "step": 21210 }, { "epoch": 5.97, "learning_rate": 9.784587511323525e-05, "loss": 0.1224, "step": 21240 }, { "epoch": 5.98, "learning_rate": 9.782713272732953e-05, "loss": 0.1007, "step": 21270 }, { "epoch": 5.99, "learning_rate": 9.780839034142381e-05, "loss": 0.1266, "step": 21300 }, { "epoch": 6.0, "learning_rate": 9.778964795551807e-05, "loss": 0.1219, "step": 21330 }, { "epoch": 6.0, "eval_loss": 0.125444233417511, "eval_runtime": 626.7572, "eval_samples_per_second": 25.581, "eval_steps_per_second": 0.801, "eval_wer": 0.12082895473093773, "step": 21342 }, { "epoch": 6.01, "learning_rate": 9.777090556961235e-05, "loss": 0.1218, "step": 21360 }, { "epoch": 6.01, "learning_rate": 9.775216318370663e-05, "loss": 0.1176, "step": 21390 }, { "epoch": 6.02, "learning_rate": 9.77334207978009e-05, "loss": 0.1088, "step": 21420 }, { "epoch": 6.03, "learning_rate": 9.771467841189518e-05, "loss": 0.1211, "step": 21450 }, { "epoch": 6.04, "learning_rate": 9.769593602598944e-05, "loss": 0.103, "step": 21480 }, { "epoch": 6.05, "learning_rate": 9.767719364008372e-05, "loss": 0.1174, "step": 21510 }, { "epoch": 6.06, "learning_rate": 9.765845125417799e-05, "loss": 0.1166, "step": 21540 }, { "epoch": 6.06, "learning_rate": 9.763970886827227e-05, "loss": 0.1097, "step": 21570 }, { "epoch": 6.07, "learning_rate": 9.762096648236654e-05, "loss": 0.1197, "step": 21600 }, { "epoch": 6.08, "learning_rate": 9.760222409646082e-05, "loss": 0.101, "step": 21630 }, { "epoch": 6.09, "learning_rate": 9.758348171055509e-05, "loss": 0.1148, "step": 21660 }, { "epoch": 6.1, "learning_rate": 9.756473932464937e-05, "loss": 0.1132, "step": 21690 }, { "epoch": 6.11, "learning_rate": 9.754599693874365e-05, "loss": 0.1092, "step": 21720 }, { "epoch": 6.11, "learning_rate": 9.75272545528379e-05, "loss": 0.1224, "step": 21750 }, { "epoch": 6.12, "learning_rate": 9.750851216693219e-05, "loss": 0.1093, "step": 21780 }, { "epoch": 6.13, "learning_rate": 9.748976978102647e-05, "loss": 0.1147, "step": 21810 }, { "epoch": 6.14, "learning_rate": 9.747102739512073e-05, "loss": 0.1112, "step": 21840 }, { "epoch": 6.15, "learning_rate": 9.745228500921501e-05, "loss": 0.1098, "step": 21870 }, { "epoch": 6.16, "learning_rate": 9.743354262330928e-05, "loss": 0.1251, "step": 21900 }, { "epoch": 6.17, "learning_rate": 9.741480023740356e-05, "loss": 0.1047, "step": 21930 }, { "epoch": 6.17, "learning_rate": 9.739605785149783e-05, "loss": 0.1153, "step": 21960 }, { "epoch": 6.18, "learning_rate": 9.737731546559211e-05, "loss": 0.1176, "step": 21990 }, { "epoch": 6.19, "learning_rate": 9.735857307968638e-05, "loss": 0.1144, "step": 22020 }, { "epoch": 6.2, "learning_rate": 9.733983069378066e-05, "loss": 0.1197, "step": 22050 }, { "epoch": 6.21, "learning_rate": 9.732108830787493e-05, "loss": 0.1081, "step": 22080 }, { "epoch": 6.22, "learning_rate": 9.730234592196921e-05, "loss": 0.1182, "step": 22110 }, { "epoch": 6.22, "learning_rate": 9.728360353606349e-05, "loss": 0.1163, "step": 22140 }, { "epoch": 6.23, "learning_rate": 9.726486115015774e-05, "loss": 0.1116, "step": 22170 }, { "epoch": 6.24, "learning_rate": 9.724611876425202e-05, "loss": 0.128, "step": 22200 }, { "epoch": 6.25, "learning_rate": 9.72273763783463e-05, "loss": 0.1085, "step": 22230 }, { "epoch": 6.26, "learning_rate": 9.720863399244057e-05, "loss": 0.1119, "step": 22260 }, { "epoch": 6.27, "learning_rate": 9.718989160653485e-05, "loss": 0.1225, "step": 22290 }, { "epoch": 6.27, "learning_rate": 9.717114922062912e-05, "loss": 0.1034, "step": 22320 }, { "epoch": 6.28, "learning_rate": 9.71524068347234e-05, "loss": 0.1188, "step": 22350 }, { "epoch": 6.29, "learning_rate": 9.713366444881767e-05, "loss": 0.104, "step": 22380 }, { "epoch": 6.3, "learning_rate": 9.711492206291195e-05, "loss": 0.1139, "step": 22410 }, { "epoch": 6.31, "learning_rate": 9.709617967700622e-05, "loss": 0.1144, "step": 22440 }, { "epoch": 6.32, "learning_rate": 9.70774372911005e-05, "loss": 0.106, "step": 22470 }, { "epoch": 6.33, "learning_rate": 9.705869490519477e-05, "loss": 0.1213, "step": 22500 }, { "epoch": 6.33, "learning_rate": 9.703995251928905e-05, "loss": 0.1006, "step": 22530 }, { "epoch": 6.34, "learning_rate": 9.702121013338333e-05, "loss": 0.1111, "step": 22560 }, { "epoch": 6.35, "learning_rate": 9.700246774747758e-05, "loss": 0.1114, "step": 22590 }, { "epoch": 6.36, "learning_rate": 9.698372536157186e-05, "loss": 0.1058, "step": 22620 }, { "epoch": 6.37, "learning_rate": 9.696498297566614e-05, "loss": 0.1228, "step": 22650 }, { "epoch": 6.38, "learning_rate": 9.694624058976041e-05, "loss": 0.1041, "step": 22680 }, { "epoch": 6.38, "learning_rate": 9.692749820385469e-05, "loss": 0.1129, "step": 22710 }, { "epoch": 6.39, "learning_rate": 9.690875581794896e-05, "loss": 0.1166, "step": 22740 }, { "epoch": 6.4, "learning_rate": 9.689001343204324e-05, "loss": 0.1027, "step": 22770 }, { "epoch": 6.41, "learning_rate": 9.687127104613751e-05, "loss": 0.1201, "step": 22800 }, { "epoch": 6.42, "learning_rate": 9.685252866023179e-05, "loss": 0.1033, "step": 22830 }, { "epoch": 6.43, "learning_rate": 9.683378627432606e-05, "loss": 0.1159, "step": 22860 }, { "epoch": 6.44, "learning_rate": 9.681504388842034e-05, "loss": 0.1184, "step": 22890 }, { "epoch": 6.44, "learning_rate": 9.67963015025146e-05, "loss": 0.1047, "step": 22920 }, { "epoch": 6.45, "learning_rate": 9.677755911660889e-05, "loss": 0.1189, "step": 22950 }, { "epoch": 6.46, "learning_rate": 9.675881673070317e-05, "loss": 0.1022, "step": 22980 }, { "epoch": 6.47, "learning_rate": 9.674007434479742e-05, "loss": 0.1202, "step": 23010 }, { "epoch": 6.48, "learning_rate": 9.67213319588917e-05, "loss": 0.12, "step": 23040 }, { "epoch": 6.49, "learning_rate": 9.670258957298598e-05, "loss": 0.1041, "step": 23070 }, { "epoch": 6.49, "learning_rate": 9.668384718708025e-05, "loss": 0.1231, "step": 23100 }, { "epoch": 6.5, "learning_rate": 9.666510480117452e-05, "loss": 0.103, "step": 23130 }, { "epoch": 6.51, "learning_rate": 9.66463624152688e-05, "loss": 0.1197, "step": 23160 }, { "epoch": 6.52, "learning_rate": 9.662762002936308e-05, "loss": 0.1136, "step": 23190 }, { "epoch": 6.53, "learning_rate": 9.660887764345735e-05, "loss": 0.105, "step": 23220 }, { "epoch": 6.54, "learning_rate": 9.659013525755163e-05, "loss": 0.1207, "step": 23250 }, { "epoch": 6.54, "learning_rate": 9.65713928716459e-05, "loss": 0.1041, "step": 23280 }, { "epoch": 6.55, "learning_rate": 9.655265048574018e-05, "loss": 0.1146, "step": 23310 }, { "epoch": 6.56, "learning_rate": 9.653390809983444e-05, "loss": 0.1191, "step": 23340 }, { "epoch": 6.57, "learning_rate": 9.651516571392872e-05, "loss": 0.1014, "step": 23370 }, { "epoch": 6.58, "learning_rate": 9.6496423328023e-05, "loss": 0.1168, "step": 23400 }, { "epoch": 6.59, "learning_rate": 9.647768094211726e-05, "loss": 0.1076, "step": 23430 }, { "epoch": 6.6, "learning_rate": 9.645893855621154e-05, "loss": 0.1125, "step": 23460 }, { "epoch": 6.6, "learning_rate": 9.644019617030582e-05, "loss": 0.1171, "step": 23490 }, { "epoch": 6.61, "learning_rate": 9.64214537844001e-05, "loss": 0.1105, "step": 23520 }, { "epoch": 6.62, "learning_rate": 9.640271139849436e-05, "loss": 0.1239, "step": 23550 }, { "epoch": 6.63, "learning_rate": 9.638396901258864e-05, "loss": 0.1027, "step": 23580 }, { "epoch": 6.64, "learning_rate": 9.636522662668292e-05, "loss": 0.117, "step": 23610 }, { "epoch": 6.65, "learning_rate": 9.634648424077719e-05, "loss": 0.1105, "step": 23640 }, { "epoch": 6.65, "learning_rate": 9.632774185487147e-05, "loss": 0.1073, "step": 23670 }, { "epoch": 6.66, "learning_rate": 9.630899946896573e-05, "loss": 0.1228, "step": 23700 }, { "epoch": 6.67, "learning_rate": 9.629025708306001e-05, "loss": 0.1066, "step": 23730 }, { "epoch": 6.68, "learning_rate": 9.627213944335114e-05, "loss": 0.1145, "step": 23760 }, { "epoch": 6.69, "learning_rate": 9.625339705744541e-05, "loss": 0.1163, "step": 23790 }, { "epoch": 6.7, "learning_rate": 9.623527941773655e-05, "loss": 0.1052, "step": 23820 }, { "epoch": 6.7, "learning_rate": 9.621653703183082e-05, "loss": 0.1171, "step": 23850 }, { "epoch": 6.71, "learning_rate": 9.61977946459251e-05, "loss": 0.1045, "step": 23880 }, { "epoch": 6.72, "learning_rate": 9.617905226001938e-05, "loss": 0.1056, "step": 23910 }, { "epoch": 6.73, "learning_rate": 9.616030987411365e-05, "loss": 0.115, "step": 23940 }, { "epoch": 6.74, "learning_rate": 9.614156748820791e-05, "loss": 0.1036, "step": 23970 }, { "epoch": 6.75, "learning_rate": 9.61228251023022e-05, "loss": 0.1216, "step": 24000 }, { "epoch": 6.76, "learning_rate": 9.610408271639648e-05, "loss": 0.1045, "step": 24030 }, { "epoch": 6.76, "learning_rate": 9.608534033049074e-05, "loss": 0.1125, "step": 24060 }, { "epoch": 6.77, "learning_rate": 9.606659794458501e-05, "loss": 0.1166, "step": 24090 }, { "epoch": 6.78, "learning_rate": 9.604785555867929e-05, "loss": 0.1079, "step": 24120 }, { "epoch": 6.79, "learning_rate": 9.602911317277356e-05, "loss": 0.123, "step": 24150 }, { "epoch": 6.8, "learning_rate": 9.601037078686784e-05, "loss": 0.104, "step": 24180 }, { "epoch": 6.81, "learning_rate": 9.599162840096212e-05, "loss": 0.1192, "step": 24210 }, { "epoch": 6.81, "learning_rate": 9.597288601505639e-05, "loss": 0.1106, "step": 24240 }, { "epoch": 6.82, "learning_rate": 9.595414362915066e-05, "loss": 0.11, "step": 24270 }, { "epoch": 6.83, "learning_rate": 9.593540124324494e-05, "loss": 0.1188, "step": 24300 }, { "epoch": 6.84, "learning_rate": 9.591665885733922e-05, "loss": 0.1059, "step": 24330 }, { "epoch": 6.85, "learning_rate": 9.589791647143349e-05, "loss": 0.1184, "step": 24360 }, { "epoch": 6.86, "learning_rate": 9.587917408552775e-05, "loss": 0.1098, "step": 24390 }, { "epoch": 6.87, "learning_rate": 9.586043169962203e-05, "loss": 0.1039, "step": 24420 }, { "epoch": 6.87, "learning_rate": 9.584168931371632e-05, "loss": 0.1155, "step": 24450 }, { "epoch": 6.88, "learning_rate": 9.582294692781058e-05, "loss": 0.1036, "step": 24480 }, { "epoch": 6.89, "learning_rate": 9.580420454190485e-05, "loss": 0.1124, "step": 24510 }, { "epoch": 6.9, "learning_rate": 9.578546215599913e-05, "loss": 0.1142, "step": 24540 }, { "epoch": 6.91, "learning_rate": 9.57667197700934e-05, "loss": 0.1034, "step": 24570 }, { "epoch": 6.92, "learning_rate": 9.574797738418768e-05, "loss": 0.1178, "step": 24600 }, { "epoch": 6.92, "learning_rate": 9.572923499828196e-05, "loss": 0.105, "step": 24630 }, { "epoch": 6.93, "learning_rate": 9.571049261237623e-05, "loss": 0.1113, "step": 24660 }, { "epoch": 6.94, "learning_rate": 9.56917502264705e-05, "loss": 0.1224, "step": 24690 }, { "epoch": 6.95, "learning_rate": 9.567300784056478e-05, "loss": 0.1039, "step": 24720 }, { "epoch": 6.96, "learning_rate": 9.565426545465906e-05, "loss": 0.1194, "step": 24750 }, { "epoch": 6.97, "learning_rate": 9.563552306875332e-05, "loss": 0.104, "step": 24780 }, { "epoch": 6.97, "learning_rate": 9.561678068284759e-05, "loss": 0.1157, "step": 24810 }, { "epoch": 6.98, "learning_rate": 9.559803829694187e-05, "loss": 0.1143, "step": 24840 }, { "epoch": 6.99, "learning_rate": 9.557929591103615e-05, "loss": 0.104, "step": 24870 }, { "epoch": 7.0, "eval_loss": 0.11984840035438538, "eval_runtime": 626.0548, "eval_samples_per_second": 25.61, "eval_steps_per_second": 0.802, "eval_wer": 0.1232309309022423, "step": 24899 }, { "epoch": 7.0, "learning_rate": 9.556055352513042e-05, "loss": 0.1258, "step": 24900 }, { "epoch": 7.01, "learning_rate": 9.554181113922469e-05, "loss": 0.0959, "step": 24930 }, { "epoch": 7.02, "learning_rate": 9.552306875331897e-05, "loss": 0.1123, "step": 24960 }, { "epoch": 7.03, "learning_rate": 9.550432636741324e-05, "loss": 0.1, "step": 24990 }, { "epoch": 7.03, "learning_rate": 9.548558398150752e-05, "loss": 0.1059, "step": 25020 }, { "epoch": 7.04, "learning_rate": 9.546684159560179e-05, "loss": 0.1174, "step": 25050 }, { "epoch": 7.05, "learning_rate": 9.544809920969607e-05, "loss": 0.0959, "step": 25080 }, { "epoch": 7.06, "learning_rate": 9.542935682379033e-05, "loss": 0.1112, "step": 25110 }, { "epoch": 7.07, "learning_rate": 9.541061443788461e-05, "loss": 0.1046, "step": 25140 }, { "epoch": 7.08, "learning_rate": 9.53918720519789e-05, "loss": 0.11, "step": 25170 }, { "epoch": 7.08, "learning_rate": 9.537312966607316e-05, "loss": 0.117, "step": 25200 }, { "epoch": 7.09, "learning_rate": 9.535438728016743e-05, "loss": 0.0927, "step": 25230 }, { "epoch": 7.1, "learning_rate": 9.533564489426171e-05, "loss": 0.1123, "step": 25260 }, { "epoch": 7.11, "learning_rate": 9.531690250835599e-05, "loss": 0.0996, "step": 25290 }, { "epoch": 7.12, "learning_rate": 9.529816012245026e-05, "loss": 0.1092, "step": 25320 }, { "epoch": 7.13, "learning_rate": 9.527941773654453e-05, "loss": 0.1121, "step": 25350 }, { "epoch": 7.14, "learning_rate": 9.526067535063881e-05, "loss": 0.0937, "step": 25380 }, { "epoch": 7.14, "learning_rate": 9.524193296473309e-05, "loss": 0.1096, "step": 25410 }, { "epoch": 7.15, "learning_rate": 9.522319057882736e-05, "loss": 0.1018, "step": 25440 }, { "epoch": 7.16, "learning_rate": 9.520444819292162e-05, "loss": 0.1078, "step": 25470 }, { "epoch": 7.17, "learning_rate": 9.51857058070159e-05, "loss": 0.115, "step": 25500 }, { "epoch": 7.18, "learning_rate": 9.516696342111017e-05, "loss": 0.0936, "step": 25530 }, { "epoch": 7.19, "learning_rate": 9.514822103520445e-05, "loss": 0.1174, "step": 25560 }, { "epoch": 7.19, "learning_rate": 9.512947864929873e-05, "loss": 0.1086, "step": 25590 }, { "epoch": 7.2, "learning_rate": 9.5110736263393e-05, "loss": 0.1098, "step": 25620 }, { "epoch": 7.21, "learning_rate": 9.509199387748727e-05, "loss": 0.1126, "step": 25650 }, { "epoch": 7.22, "learning_rate": 9.507325149158155e-05, "loss": 0.0935, "step": 25680 }, { "epoch": 7.23, "learning_rate": 9.505450910567583e-05, "loss": 0.1122, "step": 25710 }, { "epoch": 7.24, "learning_rate": 9.50357667197701e-05, "loss": 0.1018, "step": 25740 }, { "epoch": 7.24, "learning_rate": 9.501702433386437e-05, "loss": 0.1102, "step": 25770 }, { "epoch": 7.25, "learning_rate": 9.499828194795865e-05, "loss": 0.1164, "step": 25800 }, { "epoch": 7.26, "learning_rate": 9.497953956205293e-05, "loss": 0.092, "step": 25830 }, { "epoch": 7.27, "learning_rate": 9.49607971761472e-05, "loss": 0.1108, "step": 25860 }, { "epoch": 7.28, "learning_rate": 9.494205479024146e-05, "loss": 0.0969, "step": 25890 }, { "epoch": 7.29, "learning_rate": 9.492331240433574e-05, "loss": 0.1029, "step": 25920 }, { "epoch": 7.3, "learning_rate": 9.490457001843001e-05, "loss": 0.1139, "step": 25950 }, { "epoch": 7.3, "learning_rate": 9.488582763252429e-05, "loss": 0.0978, "step": 25980 }, { "epoch": 7.31, "learning_rate": 9.486708524661857e-05, "loss": 0.1136, "step": 26010 }, { "epoch": 7.32, "learning_rate": 9.484834286071284e-05, "loss": 0.0996, "step": 26040 }, { "epoch": 7.33, "learning_rate": 9.482960047480711e-05, "loss": 0.1053, "step": 26070 }, { "epoch": 7.34, "learning_rate": 9.481085808890139e-05, "loss": 0.1142, "step": 26100 }, { "epoch": 7.35, "learning_rate": 9.479211570299567e-05, "loss": 0.0979, "step": 26130 }, { "epoch": 7.35, "learning_rate": 9.477337331708994e-05, "loss": 0.1102, "step": 26160 }, { "epoch": 7.36, "learning_rate": 9.47546309311842e-05, "loss": 0.1011, "step": 26190 }, { "epoch": 7.37, "learning_rate": 9.473588854527849e-05, "loss": 0.1068, "step": 26220 }, { "epoch": 7.38, "learning_rate": 9.471714615937277e-05, "loss": 0.1188, "step": 26250 }, { "epoch": 7.39, "learning_rate": 9.469840377346703e-05, "loss": 0.0927, "step": 26280 }, { "epoch": 7.4, "learning_rate": 9.46796613875613e-05, "loss": 0.1174, "step": 26310 }, { "epoch": 7.41, "learning_rate": 9.466091900165558e-05, "loss": 0.0982, "step": 26340 }, { "epoch": 7.41, "learning_rate": 9.464217661574985e-05, "loss": 0.1112, "step": 26370 }, { "epoch": 7.42, "learning_rate": 9.462405897604099e-05, "loss": 0.1149, "step": 26400 }, { "epoch": 7.43, "learning_rate": 9.460531659013526e-05, "loss": 0.0922, "step": 26430 }, { "epoch": 7.44, "learning_rate": 9.458657420422954e-05, "loss": 0.1148, "step": 26460 }, { "epoch": 7.45, "learning_rate": 9.456783181832382e-05, "loss": 0.1004, "step": 26490 }, { "epoch": 7.46, "learning_rate": 9.454908943241809e-05, "loss": 0.1057, "step": 26520 }, { "epoch": 7.46, "learning_rate": 9.453034704651235e-05, "loss": 0.1195, "step": 26550 }, { "epoch": 7.47, "learning_rate": 9.451160466060664e-05, "loss": 0.095, "step": 26580 }, { "epoch": 7.48, "learning_rate": 9.449286227470092e-05, "loss": 0.1192, "step": 26610 }, { "epoch": 7.49, "learning_rate": 9.447411988879517e-05, "loss": 0.1084, "step": 26640 }, { "epoch": 7.5, "learning_rate": 9.445537750288945e-05, "loss": 0.1083, "step": 26670 }, { "epoch": 7.51, "learning_rate": 9.443663511698373e-05, "loss": 0.1119, "step": 26700 }, { "epoch": 7.51, "learning_rate": 9.4417892731078e-05, "loss": 0.096, "step": 26730 }, { "epoch": 7.52, "learning_rate": 9.439915034517228e-05, "loss": 0.1226, "step": 26760 }, { "epoch": 7.53, "learning_rate": 9.438040795926655e-05, "loss": 0.099, "step": 26790 }, { "epoch": 7.54, "learning_rate": 9.436166557336083e-05, "loss": 0.1103, "step": 26820 }, { "epoch": 7.55, "learning_rate": 9.43429231874551e-05, "loss": 0.1186, "step": 26850 }, { "epoch": 7.56, "learning_rate": 9.432418080154938e-05, "loss": 0.0976, "step": 26880 }, { "epoch": 7.57, "learning_rate": 9.430543841564366e-05, "loss": 0.1112, "step": 26910 }, { "epoch": 7.57, "learning_rate": 9.428669602973793e-05, "loss": 0.1035, "step": 26940 }, { "epoch": 7.58, "learning_rate": 9.42679536438322e-05, "loss": 0.1073, "step": 26970 }, { "epoch": 7.59, "learning_rate": 9.424921125792647e-05, "loss": 0.1147, "step": 27000 }, { "epoch": 7.6, "learning_rate": 9.423046887202076e-05, "loss": 0.0989, "step": 27030 }, { "epoch": 7.61, "learning_rate": 9.421172648611501e-05, "loss": 0.1166, "step": 27060 }, { "epoch": 7.62, "learning_rate": 9.419298410020929e-05, "loss": 0.0969, "step": 27090 }, { "epoch": 7.62, "learning_rate": 9.417424171430357e-05, "loss": 0.1039, "step": 27120 }, { "epoch": 7.63, "learning_rate": 9.415549932839784e-05, "loss": 0.1216, "step": 27150 }, { "epoch": 7.64, "learning_rate": 9.413675694249212e-05, "loss": 0.0946, "step": 27180 }, { "epoch": 7.65, "learning_rate": 9.411801455658639e-05, "loss": 0.1187, "step": 27210 }, { "epoch": 7.66, "learning_rate": 9.409927217068067e-05, "loss": 0.1028, "step": 27240 }, { "epoch": 7.67, "learning_rate": 9.408052978477494e-05, "loss": 0.1044, "step": 27270 }, { "epoch": 7.67, "learning_rate": 9.406178739886922e-05, "loss": 0.1126, "step": 27300 }, { "epoch": 7.68, "learning_rate": 9.40430450129635e-05, "loss": 0.0944, "step": 27330 }, { "epoch": 7.69, "learning_rate": 9.402430262705776e-05, "loss": 0.1097, "step": 27360 }, { "epoch": 7.7, "learning_rate": 9.400556024115203e-05, "loss": 0.1006, "step": 27390 }, { "epoch": 7.71, "learning_rate": 9.398681785524631e-05, "loss": 0.1033, "step": 27420 }, { "epoch": 7.72, "learning_rate": 9.39680754693406e-05, "loss": 0.1064, "step": 27450 }, { "epoch": 7.73, "learning_rate": 9.394933308343485e-05, "loss": 0.0932, "step": 27480 }, { "epoch": 7.73, "learning_rate": 9.393059069752913e-05, "loss": 0.1108, "step": 27510 }, { "epoch": 7.74, "learning_rate": 9.391184831162341e-05, "loss": 0.0994, "step": 27540 }, { "epoch": 7.75, "learning_rate": 9.389310592571768e-05, "loss": 0.1026, "step": 27570 }, { "epoch": 7.76, "learning_rate": 9.387436353981196e-05, "loss": 0.1104, "step": 27600 }, { "epoch": 7.77, "learning_rate": 9.385562115390623e-05, "loss": 0.0941, "step": 27630 }, { "epoch": 7.78, "learning_rate": 9.383687876800051e-05, "loss": 0.1146, "step": 27660 }, { "epoch": 7.78, "learning_rate": 9.381813638209477e-05, "loss": 0.106, "step": 27690 }, { "epoch": 7.79, "learning_rate": 9.379939399618906e-05, "loss": 0.1102, "step": 27720 }, { "epoch": 7.8, "learning_rate": 9.378065161028334e-05, "loss": 0.108, "step": 27750 }, { "epoch": 7.81, "learning_rate": 9.37619092243776e-05, "loss": 0.0949, "step": 27780 }, { "epoch": 7.82, "learning_rate": 9.374316683847187e-05, "loss": 0.1134, "step": 27810 }, { "epoch": 7.83, "learning_rate": 9.372442445256615e-05, "loss": 0.0981, "step": 27840 }, { "epoch": 7.84, "learning_rate": 9.370568206666043e-05, "loss": 0.1079, "step": 27870 }, { "epoch": 7.84, "learning_rate": 9.368693968075469e-05, "loss": 0.1165, "step": 27900 }, { "epoch": 7.85, "learning_rate": 9.366819729484897e-05, "loss": 0.0959, "step": 27930 }, { "epoch": 7.86, "learning_rate": 9.364945490894325e-05, "loss": 0.1193, "step": 27960 }, { "epoch": 7.87, "learning_rate": 9.363071252303752e-05, "loss": 0.1038, "step": 27990 }, { "epoch": 7.88, "learning_rate": 9.36119701371318e-05, "loss": 0.1072, "step": 28020 }, { "epoch": 7.89, "learning_rate": 9.359322775122606e-05, "loss": 0.1191, "step": 28050 }, { "epoch": 7.89, "learning_rate": 9.357448536532035e-05, "loss": 0.0997, "step": 28080 }, { "epoch": 7.9, "learning_rate": 9.355574297941461e-05, "loss": 0.1102, "step": 28110 }, { "epoch": 7.91, "learning_rate": 9.35370005935089e-05, "loss": 0.1058, "step": 28140 }, { "epoch": 7.92, "learning_rate": 9.351825820760317e-05, "loss": 0.0983, "step": 28170 }, { "epoch": 7.93, "learning_rate": 9.349951582169744e-05, "loss": 0.1127, "step": 28200 }, { "epoch": 7.94, "learning_rate": 9.348077343579171e-05, "loss": 0.0877, "step": 28230 }, { "epoch": 7.94, "learning_rate": 9.346203104988599e-05, "loss": 0.1073, "step": 28260 }, { "epoch": 7.95, "learning_rate": 9.344328866398027e-05, "loss": 0.0968, "step": 28290 }, { "epoch": 7.96, "learning_rate": 9.342454627807453e-05, "loss": 0.1089, "step": 28320 }, { "epoch": 7.97, "learning_rate": 9.34058038921688e-05, "loss": 0.1091, "step": 28350 }, { "epoch": 7.98, "learning_rate": 9.338706150626309e-05, "loss": 0.09, "step": 28380 }, { "epoch": 7.99, "learning_rate": 9.336831912035735e-05, "loss": 0.1115, "step": 28410 }, { "epoch": 8.0, "learning_rate": 9.334957673445164e-05, "loss": 0.1016, "step": 28440 }, { "epoch": 8.0, "eval_loss": 0.11488943547010422, "eval_runtime": 627.1988, "eval_samples_per_second": 25.563, "eval_steps_per_second": 0.8, "eval_wer": 0.11741023296439343, "step": 28456 }, { "epoch": 8.0, "learning_rate": 9.33308343485459e-05, "loss": 0.1083, "step": 28470 }, { "epoch": 8.01, "learning_rate": 9.331209196264018e-05, "loss": 0.0995, "step": 28500 }, { "epoch": 8.02, "learning_rate": 9.329334957673445e-05, "loss": 0.1002, "step": 28530 }, { "epoch": 8.03, "learning_rate": 9.327523193702559e-05, "loss": 0.1104, "step": 28560 }, { "epoch": 8.04, "learning_rate": 9.325648955111986e-05, "loss": 0.0921, "step": 28590 }, { "epoch": 8.05, "learning_rate": 9.323774716521414e-05, "loss": 0.1051, "step": 28620 }, { "epoch": 8.05, "learning_rate": 9.321900477930841e-05, "loss": 0.0953, "step": 28650 }, { "epoch": 8.06, "learning_rate": 9.320026239340268e-05, "loss": 0.1033, "step": 28680 }, { "epoch": 8.07, "learning_rate": 9.318214475369382e-05, "loss": 0.1058, "step": 28710 }, { "epoch": 8.08, "learning_rate": 9.316340236778808e-05, "loss": 0.092, "step": 28740 }, { "epoch": 8.09, "learning_rate": 9.314465998188237e-05, "loss": 0.1034, "step": 28770 }, { "epoch": 8.1, "learning_rate": 9.312591759597665e-05, "loss": 0.098, "step": 28800 }, { "epoch": 8.11, "learning_rate": 9.310717521007091e-05, "loss": 0.1031, "step": 28830 }, { "epoch": 8.11, "learning_rate": 9.308843282416518e-05, "loss": 0.1135, "step": 28860 }, { "epoch": 8.12, "learning_rate": 9.306969043825946e-05, "loss": 0.0926, "step": 28890 }, { "epoch": 8.13, "learning_rate": 9.305094805235374e-05, "loss": 0.1015, "step": 28920 }, { "epoch": 8.14, "learning_rate": 9.303220566644801e-05, "loss": 0.0998, "step": 28950 }, { "epoch": 8.15, "learning_rate": 9.301346328054228e-05, "loss": 0.0955, "step": 28980 }, { "epoch": 8.16, "learning_rate": 9.299472089463656e-05, "loss": 0.108, "step": 29010 }, { "epoch": 8.16, "learning_rate": 9.297597850873083e-05, "loss": 0.0934, "step": 29040 }, { "epoch": 8.17, "learning_rate": 9.295723612282511e-05, "loss": 0.1025, "step": 29070 }, { "epoch": 8.18, "learning_rate": 9.293849373691939e-05, "loss": 0.097, "step": 29100 }, { "epoch": 8.19, "learning_rate": 9.291975135101366e-05, "loss": 0.1069, "step": 29130 }, { "epoch": 8.2, "learning_rate": 9.290100896510792e-05, "loss": 0.1104, "step": 29160 }, { "epoch": 8.21, "learning_rate": 9.28822665792022e-05, "loss": 0.0895, "step": 29190 }, { "epoch": 8.21, "learning_rate": 9.286352419329648e-05, "loss": 0.1026, "step": 29220 }, { "epoch": 8.22, "learning_rate": 9.284478180739075e-05, "loss": 0.0924, "step": 29250 }, { "epoch": 8.23, "learning_rate": 9.282603942148502e-05, "loss": 0.0973, "step": 29280 }, { "epoch": 8.24, "learning_rate": 9.28072970355793e-05, "loss": 0.1098, "step": 29310 }, { "epoch": 8.25, "learning_rate": 9.278855464967358e-05, "loss": 0.0942, "step": 29340 }, { "epoch": 8.26, "learning_rate": 9.276981226376785e-05, "loss": 0.1048, "step": 29370 }, { "epoch": 8.27, "learning_rate": 9.275106987786212e-05, "loss": 0.0945, "step": 29400 }, { "epoch": 8.27, "learning_rate": 9.27323274919564e-05, "loss": 0.0995, "step": 29430 }, { "epoch": 8.28, "learning_rate": 9.271358510605066e-05, "loss": 0.1078, "step": 29460 }, { "epoch": 8.29, "learning_rate": 9.269484272014495e-05, "loss": 0.0921, "step": 29490 }, { "epoch": 8.3, "learning_rate": 9.267610033423923e-05, "loss": 0.1061, "step": 29520 }, { "epoch": 8.31, "learning_rate": 9.26573579483335e-05, "loss": 0.1074, "step": 29550 }, { "epoch": 8.32, "learning_rate": 9.263861556242776e-05, "loss": 0.1011, "step": 29580 }, { "epoch": 8.32, "learning_rate": 9.261987317652204e-05, "loss": 0.1112, "step": 29610 }, { "epoch": 8.33, "learning_rate": 9.260113079061632e-05, "loss": 0.0914, "step": 29640 }, { "epoch": 8.34, "learning_rate": 9.258238840471059e-05, "loss": 0.1067, "step": 29670 }, { "epoch": 8.35, "learning_rate": 9.256364601880486e-05, "loss": 0.0999, "step": 29700 }, { "epoch": 8.36, "learning_rate": 9.254490363289914e-05, "loss": 0.1004, "step": 29730 }, { "epoch": 8.37, "learning_rate": 9.252616124699342e-05, "loss": 0.1104, "step": 29760 }, { "epoch": 8.37, "learning_rate": 9.250741886108769e-05, "loss": 0.0894, "step": 29790 }, { "epoch": 8.38, "learning_rate": 9.248867647518196e-05, "loss": 0.1061, "step": 29820 }, { "epoch": 8.39, "learning_rate": 9.246993408927624e-05, "loss": 0.0998, "step": 29850 }, { "epoch": 8.4, "learning_rate": 9.24511917033705e-05, "loss": 0.1022, "step": 29880 }, { "epoch": 8.41, "learning_rate": 9.243244931746478e-05, "loss": 0.1088, "step": 29910 }, { "epoch": 8.42, "learning_rate": 9.241370693155907e-05, "loss": 0.0886, "step": 29940 }, { "epoch": 8.43, "learning_rate": 9.239496454565333e-05, "loss": 0.1035, "step": 29970 }, { "epoch": 8.43, "learning_rate": 9.23762221597476e-05, "loss": 0.1044, "step": 30000 }, { "epoch": 8.44, "learning_rate": 9.235747977384188e-05, "loss": 0.1073, "step": 30030 }, { "epoch": 8.45, "learning_rate": 9.233873738793616e-05, "loss": 0.108, "step": 30060 }, { "epoch": 8.46, "learning_rate": 9.231999500203043e-05, "loss": 0.0909, "step": 30090 }, { "epoch": 8.47, "learning_rate": 9.23012526161247e-05, "loss": 0.105, "step": 30120 }, { "epoch": 8.48, "learning_rate": 9.228251023021898e-05, "loss": 0.1061, "step": 30150 }, { "epoch": 8.48, "learning_rate": 9.226376784431326e-05, "loss": 0.0993, "step": 30180 }, { "epoch": 8.49, "learning_rate": 9.224502545840753e-05, "loss": 0.1154, "step": 30210 }, { "epoch": 8.5, "learning_rate": 9.22262830725018e-05, "loss": 0.0923, "step": 30240 }, { "epoch": 8.51, "learning_rate": 9.220754068659607e-05, "loss": 0.1011, "step": 30270 }, { "epoch": 8.52, "learning_rate": 9.218879830069036e-05, "loss": 0.0979, "step": 30300 }, { "epoch": 8.53, "learning_rate": 9.217005591478462e-05, "loss": 0.1008, "step": 30330 }, { "epoch": 8.54, "learning_rate": 9.21513135288789e-05, "loss": 0.1122, "step": 30360 }, { "epoch": 8.54, "learning_rate": 9.213257114297317e-05, "loss": 0.0901, "step": 30390 }, { "epoch": 8.55, "learning_rate": 9.211382875706744e-05, "loss": 0.105, "step": 30420 }, { "epoch": 8.56, "learning_rate": 9.209508637116172e-05, "loss": 0.1004, "step": 30450 }, { "epoch": 8.57, "learning_rate": 9.2076343985256e-05, "loss": 0.1007, "step": 30480 }, { "epoch": 8.58, "learning_rate": 9.205760159935027e-05, "loss": 0.1087, "step": 30510 }, { "epoch": 8.59, "learning_rate": 9.203885921344454e-05, "loss": 0.089, "step": 30540 }, { "epoch": 8.59, "learning_rate": 9.202011682753882e-05, "loss": 0.1043, "step": 30570 }, { "epoch": 8.6, "learning_rate": 9.20013744416331e-05, "loss": 0.0993, "step": 30600 }, { "epoch": 8.61, "learning_rate": 9.198263205572736e-05, "loss": 0.1034, "step": 30630 }, { "epoch": 8.62, "learning_rate": 9.196388966982163e-05, "loss": 0.1131, "step": 30660 }, { "epoch": 8.63, "learning_rate": 9.194514728391591e-05, "loss": 0.0932, "step": 30690 }, { "epoch": 8.64, "learning_rate": 9.19264048980102e-05, "loss": 0.1048, "step": 30720 }, { "epoch": 8.64, "learning_rate": 9.190766251210446e-05, "loss": 0.0999, "step": 30750 }, { "epoch": 8.65, "learning_rate": 9.188892012619874e-05, "loss": 0.0966, "step": 30780 }, { "epoch": 8.66, "learning_rate": 9.187017774029301e-05, "loss": 0.1145, "step": 30810 }, { "epoch": 8.67, "learning_rate": 9.185143535438728e-05, "loss": 0.091, "step": 30840 }, { "epoch": 8.68, "learning_rate": 9.183269296848156e-05, "loss": 0.1044, "step": 30870 }, { "epoch": 8.69, "learning_rate": 9.181395058257584e-05, "loss": 0.1011, "step": 30900 }, { "epoch": 8.7, "learning_rate": 9.179520819667011e-05, "loss": 0.1018, "step": 30930 }, { "epoch": 8.7, "learning_rate": 9.177646581076437e-05, "loss": 0.1124, "step": 30960 }, { "epoch": 8.71, "learning_rate": 9.175772342485866e-05, "loss": 0.0898, "step": 30990 }, { "epoch": 8.72, "learning_rate": 9.173898103895294e-05, "loss": 0.1051, "step": 31020 }, { "epoch": 8.73, "learning_rate": 9.17202386530472e-05, "loss": 0.0969, "step": 31050 }, { "epoch": 8.74, "learning_rate": 9.170149626714147e-05, "loss": 0.104, "step": 31080 }, { "epoch": 8.75, "learning_rate": 9.168275388123575e-05, "loss": 0.1103, "step": 31110 }, { "epoch": 8.75, "learning_rate": 9.166401149533003e-05, "loss": 0.0957, "step": 31140 }, { "epoch": 8.76, "learning_rate": 9.16452691094243e-05, "loss": 0.1092, "step": 31170 }, { "epoch": 8.77, "learning_rate": 9.162652672351858e-05, "loss": 0.0989, "step": 31200 }, { "epoch": 8.78, "learning_rate": 9.160778433761285e-05, "loss": 0.1058, "step": 31230 }, { "epoch": 8.79, "learning_rate": 9.158904195170712e-05, "loss": 0.1142, "step": 31260 }, { "epoch": 8.8, "learning_rate": 9.15702995658014e-05, "loss": 0.0938, "step": 31290 }, { "epoch": 8.81, "learning_rate": 9.155155717989568e-05, "loss": 0.1088, "step": 31320 }, { "epoch": 8.81, "learning_rate": 9.153281479398995e-05, "loss": 0.097, "step": 31350 }, { "epoch": 8.82, "learning_rate": 9.151407240808421e-05, "loss": 0.1025, "step": 31380 }, { "epoch": 8.83, "learning_rate": 9.14953300221785e-05, "loss": 0.1101, "step": 31410 }, { "epoch": 8.84, "learning_rate": 9.147658763627277e-05, "loss": 0.0961, "step": 31440 }, { "epoch": 8.85, "learning_rate": 9.145784525036704e-05, "loss": 0.1039, "step": 31470 }, { "epoch": 8.86, "learning_rate": 9.143910286446131e-05, "loss": 0.0936, "step": 31500 }, { "epoch": 8.86, "learning_rate": 9.142036047855559e-05, "loss": 0.1052, "step": 31530 }, { "epoch": 8.87, "learning_rate": 9.140161809264987e-05, "loss": 0.1137, "step": 31560 }, { "epoch": 8.88, "learning_rate": 9.138287570674414e-05, "loss": 0.0901, "step": 31590 }, { "epoch": 8.89, "learning_rate": 9.136413332083842e-05, "loss": 0.1114, "step": 31620 }, { "epoch": 8.9, "learning_rate": 9.134539093493269e-05, "loss": 0.1087, "step": 31650 }, { "epoch": 8.91, "learning_rate": 9.132664854902695e-05, "loss": 0.0996, "step": 31680 }, { "epoch": 8.91, "learning_rate": 9.130790616312124e-05, "loss": 0.1099, "step": 31710 }, { "epoch": 8.92, "learning_rate": 9.128916377721552e-05, "loss": 0.0931, "step": 31740 }, { "epoch": 8.93, "learning_rate": 9.127042139130978e-05, "loss": 0.1089, "step": 31770 }, { "epoch": 8.94, "learning_rate": 9.125167900540405e-05, "loss": 0.0992, "step": 31800 }, { "epoch": 8.95, "learning_rate": 9.123293661949833e-05, "loss": 0.0979, "step": 31830 }, { "epoch": 8.96, "learning_rate": 9.121419423359261e-05, "loss": 0.1147, "step": 31860 }, { "epoch": 8.97, "learning_rate": 9.119545184768688e-05, "loss": 0.0898, "step": 31890 }, { "epoch": 8.97, "learning_rate": 9.117670946178115e-05, "loss": 0.11, "step": 31920 }, { "epoch": 8.98, "learning_rate": 9.115796707587543e-05, "loss": 0.1, "step": 31950 }, { "epoch": 8.99, "learning_rate": 9.113922468996971e-05, "loss": 0.0993, "step": 31980 }, { "epoch": 9.0, "learning_rate": 9.112048230406398e-05, "loss": 0.1093, "step": 32010 }, { "epoch": 9.0, "eval_loss": 0.1185522973537445, "eval_runtime": 627.341, "eval_samples_per_second": 25.557, "eval_steps_per_second": 0.8, "eval_wer": 0.11861122105004572, "step": 32013 }, { "epoch": 9.01, "learning_rate": 9.110173991815826e-05, "loss": 0.0927, "step": 32040 }, { "epoch": 9.02, "learning_rate": 9.108299753225253e-05, "loss": 0.1062, "step": 32070 }, { "epoch": 9.02, "learning_rate": 9.10642551463468e-05, "loss": 0.0905, "step": 32100 }, { "epoch": 9.03, "learning_rate": 9.104551276044107e-05, "loss": 0.0989, "step": 32130 }, { "epoch": 9.04, "learning_rate": 9.102677037453536e-05, "loss": 0.0978, "step": 32160 }, { "epoch": 9.05, "learning_rate": 9.100802798862962e-05, "loss": 0.0939, "step": 32190 }, { "epoch": 9.06, "learning_rate": 9.098928560272389e-05, "loss": 0.1024, "step": 32220 }, { "epoch": 9.07, "learning_rate": 9.097054321681817e-05, "loss": 0.0957, "step": 32250 }, { "epoch": 9.08, "learning_rate": 9.095180083091245e-05, "loss": 0.1051, "step": 32280 }, { "epoch": 9.08, "learning_rate": 9.093305844500672e-05, "loss": 0.1007, "step": 32310 }, { "epoch": 9.09, "learning_rate": 9.091431605910099e-05, "loss": 0.0893, "step": 32340 }, { "epoch": 9.1, "learning_rate": 9.089557367319527e-05, "loss": 0.1098, "step": 32370 }, { "epoch": 9.11, "learning_rate": 9.087683128728955e-05, "loss": 0.0906, "step": 32400 }, { "epoch": 9.12, "learning_rate": 9.085808890138382e-05, "loss": 0.0999, "step": 32430 }, { "epoch": 9.13, "learning_rate": 9.08393465154781e-05, "loss": 0.0995, "step": 32460 }, { "epoch": 9.13, "learning_rate": 9.082060412957236e-05, "loss": 0.096, "step": 32490 }, { "epoch": 9.14, "learning_rate": 9.080186174366663e-05, "loss": 0.1018, "step": 32520 }, { "epoch": 9.15, "learning_rate": 9.078311935776091e-05, "loss": 0.0923, "step": 32550 }, { "epoch": 9.16, "learning_rate": 9.07643769718552e-05, "loss": 0.1083, "step": 32580 }, { "epoch": 9.17, "learning_rate": 9.074563458594946e-05, "loss": 0.1014, "step": 32610 }, { "epoch": 9.18, "learning_rate": 9.072689220004373e-05, "loss": 0.0928, "step": 32640 }, { "epoch": 9.18, "learning_rate": 9.070814981413801e-05, "loss": 0.1015, "step": 32670 }, { "epoch": 9.19, "learning_rate": 9.068940742823229e-05, "loss": 0.087, "step": 32700 }, { "epoch": 9.2, "learning_rate": 9.067066504232656e-05, "loss": 0.0975, "step": 32730 }, { "epoch": 9.21, "learning_rate": 9.065192265642083e-05, "loss": 0.1041, "step": 32760 }, { "epoch": 9.22, "learning_rate": 9.063380501671197e-05, "loss": 0.0955, "step": 32790 }, { "epoch": 9.23, "learning_rate": 9.061506263080623e-05, "loss": 0.1057, "step": 32820 }, { "epoch": 9.24, "learning_rate": 9.059632024490052e-05, "loss": 0.0912, "step": 32850 }, { "epoch": 9.24, "learning_rate": 9.057757785899478e-05, "loss": 0.1005, "step": 32880 }, { "epoch": 9.25, "learning_rate": 9.055883547308906e-05, "loss": 0.0988, "step": 32910 }, { "epoch": 9.26, "learning_rate": 9.054009308718333e-05, "loss": 0.0931, "step": 32940 }, { "epoch": 9.27, "learning_rate": 9.052135070127761e-05, "loss": 0.0993, "step": 32970 }, { "epoch": 9.28, "learning_rate": 9.050260831537188e-05, "loss": 0.0924, "step": 33000 }, { "epoch": 9.29, "learning_rate": 9.048386592946616e-05, "loss": 0.1019, "step": 33030 }, { "epoch": 9.29, "learning_rate": 9.046512354356044e-05, "loss": 0.1037, "step": 33060 }, { "epoch": 9.3, "learning_rate": 9.044638115765471e-05, "loss": 0.0935, "step": 33090 }, { "epoch": 9.31, "learning_rate": 9.042763877174898e-05, "loss": 0.1092, "step": 33120 }, { "epoch": 9.32, "learning_rate": 9.040889638584326e-05, "loss": 0.0934, "step": 33150 }, { "epoch": 9.33, "learning_rate": 9.039015399993754e-05, "loss": 0.0979, "step": 33180 }, { "epoch": 9.34, "learning_rate": 9.03714116140318e-05, "loss": 0.0993, "step": 33210 }, { "epoch": 9.34, "learning_rate": 9.035266922812607e-05, "loss": 0.097, "step": 33240 }, { "epoch": 9.35, "learning_rate": 9.033392684222035e-05, "loss": 0.1051, "step": 33270 }, { "epoch": 9.36, "learning_rate": 9.031518445631462e-05, "loss": 0.0935, "step": 33300 }, { "epoch": 9.37, "learning_rate": 9.02964420704089e-05, "loss": 0.1072, "step": 33330 }, { "epoch": 9.38, "learning_rate": 9.027769968450317e-05, "loss": 0.0984, "step": 33360 }, { "epoch": 9.39, "learning_rate": 9.025895729859745e-05, "loss": 0.0939, "step": 33390 }, { "epoch": 9.4, "learning_rate": 9.024021491269172e-05, "loss": 0.1067, "step": 33420 }, { "epoch": 9.4, "learning_rate": 9.0221472526786e-05, "loss": 0.0906, "step": 33450 }, { "epoch": 9.41, "learning_rate": 9.020273014088028e-05, "loss": 0.1041, "step": 33480 }, { "epoch": 9.42, "learning_rate": 9.018398775497455e-05, "loss": 0.1022, "step": 33510 }, { "epoch": 9.43, "learning_rate": 9.016524536906881e-05, "loss": 0.0975, "step": 33540 }, { "epoch": 9.44, "learning_rate": 9.01465029831631e-05, "loss": 0.1084, "step": 33570 }, { "epoch": 9.45, "learning_rate": 9.012776059725738e-05, "loss": 0.0915, "step": 33600 }, { "epoch": 9.45, "learning_rate": 9.010901821135164e-05, "loss": 0.1043, "step": 33630 }, { "epoch": 9.46, "learning_rate": 9.009027582544591e-05, "loss": 0.1025, "step": 33660 }, { "epoch": 9.47, "learning_rate": 9.007153343954019e-05, "loss": 0.0935, "step": 33690 }, { "epoch": 9.48, "learning_rate": 9.005279105363446e-05, "loss": 0.1033, "step": 33720 }, { "epoch": 9.49, "learning_rate": 9.003404866772874e-05, "loss": 0.0919, "step": 33750 }, { "epoch": 9.5, "learning_rate": 9.001530628182301e-05, "loss": 0.1023, "step": 33780 }, { "epoch": 9.51, "learning_rate": 8.999656389591729e-05, "loss": 0.1017, "step": 33810 }, { "epoch": 9.51, "learning_rate": 8.997782151001156e-05, "loss": 0.0952, "step": 33840 }, { "epoch": 9.52, "learning_rate": 8.995907912410584e-05, "loss": 0.1087, "step": 33870 }, { "epoch": 9.53, "learning_rate": 8.994033673820012e-05, "loss": 0.0983, "step": 33900 }, { "epoch": 9.54, "learning_rate": 8.992159435229439e-05, "loss": 0.1104, "step": 33930 }, { "epoch": 9.55, "learning_rate": 8.990285196638865e-05, "loss": 0.1017, "step": 33960 }, { "epoch": 9.56, "learning_rate": 8.988410958048293e-05, "loss": 0.0936, "step": 33990 }, { "epoch": 9.56, "learning_rate": 8.986536719457722e-05, "loss": 0.1063, "step": 34020 }, { "epoch": 9.57, "learning_rate": 8.984662480867148e-05, "loss": 0.0896, "step": 34050 }, { "epoch": 9.58, "learning_rate": 8.982788242276575e-05, "loss": 0.1027, "step": 34080 }, { "epoch": 9.59, "learning_rate": 8.980976478305688e-05, "loss": 0.1027, "step": 34110 }, { "epoch": 9.6, "learning_rate": 8.979102239715116e-05, "loss": 0.0974, "step": 34140 }, { "epoch": 9.61, "learning_rate": 8.977228001124544e-05, "loss": 0.1036, "step": 34170 }, { "epoch": 9.61, "learning_rate": 8.975353762533971e-05, "loss": 0.0923, "step": 34200 }, { "epoch": 9.62, "learning_rate": 8.973479523943399e-05, "loss": 0.1057, "step": 34230 }, { "epoch": 9.63, "learning_rate": 8.971605285352826e-05, "loss": 0.1012, "step": 34260 }, { "epoch": 9.64, "learning_rate": 8.969731046762254e-05, "loss": 0.0945, "step": 34290 }, { "epoch": 9.65, "learning_rate": 8.96785680817168e-05, "loss": 0.1056, "step": 34320 }, { "epoch": 9.66, "learning_rate": 8.965982569581108e-05, "loss": 0.0922, "step": 34350 }, { "epoch": 9.67, "learning_rate": 8.964108330990537e-05, "loss": 0.1059, "step": 34380 }, { "epoch": 9.67, "learning_rate": 8.962234092399962e-05, "loss": 0.0943, "step": 34410 }, { "epoch": 9.68, "learning_rate": 8.96035985380939e-05, "loss": 0.0954, "step": 34440 }, { "epoch": 9.69, "learning_rate": 8.958485615218818e-05, "loss": 0.1035, "step": 34470 }, { "epoch": 9.7, "learning_rate": 8.956611376628246e-05, "loss": 0.0901, "step": 34500 }, { "epoch": 9.71, "learning_rate": 8.954737138037672e-05, "loss": 0.1006, "step": 34530 }, { "epoch": 9.72, "learning_rate": 8.9528628994471e-05, "loss": 0.1073, "step": 34560 }, { "epoch": 9.72, "learning_rate": 8.950988660856528e-05, "loss": 0.0976, "step": 34590 }, { "epoch": 9.73, "learning_rate": 8.949114422265955e-05, "loss": 0.1036, "step": 34620 }, { "epoch": 9.74, "learning_rate": 8.947240183675383e-05, "loss": 0.0879, "step": 34650 }, { "epoch": 9.75, "learning_rate": 8.94536594508481e-05, "loss": 0.1058, "step": 34680 }, { "epoch": 9.76, "learning_rate": 8.943491706494237e-05, "loss": 0.1025, "step": 34710 }, { "epoch": 9.77, "learning_rate": 8.941617467903664e-05, "loss": 0.0967, "step": 34740 }, { "epoch": 9.77, "learning_rate": 8.939743229313092e-05, "loss": 0.1017, "step": 34770 }, { "epoch": 9.78, "learning_rate": 8.93786899072252e-05, "loss": 0.0916, "step": 34800 }, { "epoch": 9.79, "learning_rate": 8.935994752131946e-05, "loss": 0.1, "step": 34830 }, { "epoch": 9.8, "learning_rate": 8.934120513541374e-05, "loss": 0.0976, "step": 34860 }, { "epoch": 9.81, "learning_rate": 8.932246274950802e-05, "loss": 0.0907, "step": 34890 }, { "epoch": 9.82, "learning_rate": 8.93037203636023e-05, "loss": 0.1056, "step": 34920 }, { "epoch": 9.83, "learning_rate": 8.928497797769655e-05, "loss": 0.0882, "step": 34950 }, { "epoch": 9.83, "learning_rate": 8.926623559179084e-05, "loss": 0.104, "step": 34980 }, { "epoch": 9.84, "learning_rate": 8.924749320588512e-05, "loss": 0.1025, "step": 35010 }, { "epoch": 9.85, "learning_rate": 8.922875081997938e-05, "loss": 0.0919, "step": 35040 }, { "epoch": 9.86, "learning_rate": 8.921000843407367e-05, "loss": 0.1067, "step": 35070 }, { "epoch": 9.87, "learning_rate": 8.919126604816793e-05, "loss": 0.087, "step": 35100 }, { "epoch": 9.88, "learning_rate": 8.917252366226221e-05, "loss": 0.1095, "step": 35130 }, { "epoch": 9.88, "learning_rate": 8.915378127635648e-05, "loss": 0.1009, "step": 35160 }, { "epoch": 9.89, "learning_rate": 8.913503889045076e-05, "loss": 0.0953, "step": 35190 }, { "epoch": 9.9, "learning_rate": 8.911629650454504e-05, "loss": 0.1059, "step": 35220 }, { "epoch": 9.91, "learning_rate": 8.909755411863931e-05, "loss": 0.0921, "step": 35250 }, { "epoch": 9.92, "learning_rate": 8.907881173273358e-05, "loss": 0.1019, "step": 35280 }, { "epoch": 9.93, "learning_rate": 8.906006934682786e-05, "loss": 0.0956, "step": 35310 }, { "epoch": 9.94, "learning_rate": 8.904132696092214e-05, "loss": 0.0957, "step": 35340 }, { "epoch": 9.94, "learning_rate": 8.90225845750164e-05, "loss": 0.1062, "step": 35370 }, { "epoch": 9.95, "learning_rate": 8.900384218911067e-05, "loss": 0.0928, "step": 35400 }, { "epoch": 9.96, "learning_rate": 8.898509980320496e-05, "loss": 0.1012, "step": 35430 }, { "epoch": 9.97, "learning_rate": 8.896635741729922e-05, "loss": 0.099, "step": 35460 }, { "epoch": 9.98, "learning_rate": 8.89476150313935e-05, "loss": 0.0986, "step": 35490 }, { "epoch": 9.99, "learning_rate": 8.892887264548777e-05, "loss": 0.1049, "step": 35520 }, { "epoch": 9.99, "learning_rate": 8.891013025958205e-05, "loss": 0.0858, "step": 35550 }, { "epoch": 10.0, "eval_loss": 0.11820485442876816, "eval_runtime": 629.5769, "eval_samples_per_second": 25.466, "eval_steps_per_second": 0.797, "eval_wer": 0.1163866635732125, "step": 35570 }, { "epoch": 10.0, "learning_rate": 8.889138787367632e-05, "loss": 0.1056, "step": 35580 }, { "epoch": 10.01, "learning_rate": 8.88726454877706e-05, "loss": 0.0896, "step": 35610 }, { "epoch": 10.02, "learning_rate": 8.885390310186488e-05, "loss": 0.0959, "step": 35640 }, { "epoch": 10.03, "learning_rate": 8.883516071595915e-05, "loss": 0.1004, "step": 35670 }, { "epoch": 10.04, "learning_rate": 8.881641833005342e-05, "loss": 0.0846, "step": 35700 }, { "epoch": 10.04, "learning_rate": 8.87976759441477e-05, "loss": 0.1042, "step": 35730 }, { "epoch": 10.05, "learning_rate": 8.877893355824198e-05, "loss": 0.0917, "step": 35760 }, { "epoch": 10.06, "learning_rate": 8.876019117233623e-05, "loss": 0.1016, "step": 35790 }, { "epoch": 10.07, "learning_rate": 8.874144878643051e-05, "loss": 0.1079, "step": 35820 }, { "epoch": 10.08, "learning_rate": 8.87227064005248e-05, "loss": 0.0842, "step": 35850 }, { "epoch": 10.09, "learning_rate": 8.870396401461906e-05, "loss": 0.0951, "step": 35880 }, { "epoch": 10.1, "learning_rate": 8.868522162871334e-05, "loss": 0.0838, "step": 35910 }, { "epoch": 10.1, "learning_rate": 8.866647924280761e-05, "loss": 0.0944, "step": 35940 }, { "epoch": 10.11, "learning_rate": 8.864773685690189e-05, "loss": 0.1084, "step": 35970 }, { "epoch": 10.12, "learning_rate": 8.862899447099616e-05, "loss": 0.0872, "step": 36000 }, { "epoch": 10.13, "learning_rate": 8.861025208509044e-05, "loss": 0.0977, "step": 36030 }, { "epoch": 10.14, "learning_rate": 8.859150969918472e-05, "loss": 0.0863, "step": 36060 }, { "epoch": 10.15, "learning_rate": 8.857276731327899e-05, "loss": 0.0936, "step": 36090 }, { "epoch": 10.15, "learning_rate": 8.855402492737326e-05, "loss": 0.0998, "step": 36120 }, { "epoch": 10.16, "learning_rate": 8.853528254146754e-05, "loss": 0.0858, "step": 36150 }, { "epoch": 10.17, "learning_rate": 8.851654015556182e-05, "loss": 0.0964, "step": 36180 }, { "epoch": 10.18, "learning_rate": 8.849779776965607e-05, "loss": 0.0884, "step": 36210 }, { "epoch": 10.19, "learning_rate": 8.847905538375035e-05, "loss": 0.0993, "step": 36240 }, { "epoch": 10.2, "learning_rate": 8.846031299784463e-05, "loss": 0.1069, "step": 36270 }, { "epoch": 10.21, "learning_rate": 8.84415706119389e-05, "loss": 0.0834, "step": 36300 }, { "epoch": 10.21, "learning_rate": 8.842282822603318e-05, "loss": 0.1038, "step": 36330 }, { "epoch": 10.22, "learning_rate": 8.840408584012745e-05, "loss": 0.0878, "step": 36360 }, { "epoch": 10.23, "learning_rate": 8.838534345422173e-05, "loss": 0.0933, "step": 36390 }, { "epoch": 10.24, "learning_rate": 8.8366601068316e-05, "loss": 0.1074, "step": 36420 }, { "epoch": 10.25, "learning_rate": 8.834785868241028e-05, "loss": 0.085, "step": 36450 }, { "epoch": 10.26, "learning_rate": 8.832911629650455e-05, "loss": 0.1005, "step": 36480 }, { "epoch": 10.26, "learning_rate": 8.831037391059883e-05, "loss": 0.0899, "step": 36510 }, { "epoch": 10.27, "learning_rate": 8.82916315246931e-05, "loss": 0.0978, "step": 36540 }, { "epoch": 10.28, "learning_rate": 8.827288913878737e-05, "loss": 0.1049, "step": 36570 }, { "epoch": 10.29, "learning_rate": 8.825414675288166e-05, "loss": 0.0886, "step": 36600 }, { "epoch": 10.3, "learning_rate": 8.823540436697591e-05, "loss": 0.1042, "step": 36630 }, { "epoch": 10.31, "learning_rate": 8.821666198107019e-05, "loss": 0.0913, "step": 36660 }, { "epoch": 10.31, "learning_rate": 8.819791959516447e-05, "loss": 0.0982, "step": 36690 }, { "epoch": 10.32, "learning_rate": 8.817917720925874e-05, "loss": 0.1019, "step": 36720 }, { "epoch": 10.33, "learning_rate": 8.816043482335302e-05, "loss": 0.0887, "step": 36750 }, { "epoch": 10.34, "learning_rate": 8.814169243744729e-05, "loss": 0.1025, "step": 36780 }, { "epoch": 10.35, "learning_rate": 8.812295005154157e-05, "loss": 0.0927, "step": 36810 }, { "epoch": 10.36, "learning_rate": 8.810420766563584e-05, "loss": 0.0999, "step": 36840 }, { "epoch": 10.37, "learning_rate": 8.808546527973012e-05, "loss": 0.1032, "step": 36870 }, { "epoch": 10.37, "learning_rate": 8.806672289382438e-05, "loss": 0.0854, "step": 36900 }, { "epoch": 10.38, "learning_rate": 8.804798050791866e-05, "loss": 0.0997, "step": 36930 }, { "epoch": 10.39, "learning_rate": 8.802923812201293e-05, "loss": 0.0915, "step": 36960 }, { "epoch": 10.4, "learning_rate": 8.801049573610721e-05, "loss": 0.0953, "step": 36990 }, { "epoch": 10.41, "learning_rate": 8.79917533502015e-05, "loss": 0.1097, "step": 37020 }, { "epoch": 10.42, "learning_rate": 8.797301096429575e-05, "loss": 0.0804, "step": 37050 }, { "epoch": 10.42, "learning_rate": 8.795426857839003e-05, "loss": 0.1011, "step": 37080 }, { "epoch": 10.43, "learning_rate": 8.793552619248431e-05, "loss": 0.0904, "step": 37110 }, { "epoch": 10.44, "learning_rate": 8.791678380657858e-05, "loss": 0.0983, "step": 37140 }, { "epoch": 10.45, "learning_rate": 8.789804142067286e-05, "loss": 0.1082, "step": 37170 }, { "epoch": 10.46, "learning_rate": 8.787929903476713e-05, "loss": 0.082, "step": 37200 }, { "epoch": 10.47, "learning_rate": 8.786055664886141e-05, "loss": 0.1019, "step": 37230 }, { "epoch": 10.48, "learning_rate": 8.784181426295567e-05, "loss": 0.0875, "step": 37260 }, { "epoch": 10.48, "learning_rate": 8.782307187704996e-05, "loss": 0.0968, "step": 37290 }, { "epoch": 10.49, "learning_rate": 8.780432949114422e-05, "loss": 0.106, "step": 37320 }, { "epoch": 10.5, "learning_rate": 8.77855871052385e-05, "loss": 0.0803, "step": 37350 }, { "epoch": 10.51, "learning_rate": 8.776684471933277e-05, "loss": 0.1021, "step": 37380 }, { "epoch": 10.52, "learning_rate": 8.774810233342705e-05, "loss": 0.0858, "step": 37410 }, { "epoch": 10.53, "learning_rate": 8.772935994752133e-05, "loss": 0.0954, "step": 37440 }, { "epoch": 10.53, "learning_rate": 8.771061756161559e-05, "loss": 0.1046, "step": 37470 }, { "epoch": 10.54, "learning_rate": 8.769187517570987e-05, "loss": 0.087, "step": 37500 }, { "epoch": 10.55, "learning_rate": 8.767313278980415e-05, "loss": 0.097, "step": 37530 }, { "epoch": 10.56, "learning_rate": 8.765439040389843e-05, "loss": 0.0873, "step": 37560 }, { "epoch": 10.57, "learning_rate": 8.76356480179927e-05, "loss": 0.0994, "step": 37590 }, { "epoch": 10.58, "learning_rate": 8.761690563208696e-05, "loss": 0.1015, "step": 37620 }, { "epoch": 10.58, "learning_rate": 8.759816324618125e-05, "loss": 0.0864, "step": 37650 }, { "epoch": 10.59, "learning_rate": 8.757942086027551e-05, "loss": 0.1043, "step": 37680 }, { "epoch": 10.6, "learning_rate": 8.75606784743698e-05, "loss": 0.0927, "step": 37710 }, { "epoch": 10.61, "learning_rate": 8.754193608846406e-05, "loss": 0.098, "step": 37740 }, { "epoch": 10.62, "learning_rate": 8.752319370255834e-05, "loss": 0.1059, "step": 37770 }, { "epoch": 10.63, "learning_rate": 8.750445131665261e-05, "loss": 0.0854, "step": 37800 }, { "epoch": 10.64, "learning_rate": 8.748570893074689e-05, "loss": 0.1, "step": 37830 }, { "epoch": 10.64, "learning_rate": 8.746696654484117e-05, "loss": 0.0915, "step": 37860 }, { "epoch": 10.65, "learning_rate": 8.744822415893543e-05, "loss": 0.1021, "step": 37890 }, { "epoch": 10.66, "learning_rate": 8.74294817730297e-05, "loss": 0.1063, "step": 37920 }, { "epoch": 10.67, "learning_rate": 8.741073938712399e-05, "loss": 0.0844, "step": 37950 }, { "epoch": 10.68, "learning_rate": 8.739199700121827e-05, "loss": 0.1025, "step": 37980 }, { "epoch": 10.69, "learning_rate": 8.737325461531254e-05, "loss": 0.0892, "step": 38010 }, { "epoch": 10.69, "learning_rate": 8.73545122294068e-05, "loss": 0.0979, "step": 38040 }, { "epoch": 10.7, "learning_rate": 8.733576984350108e-05, "loss": 0.107, "step": 38070 }, { "epoch": 10.71, "learning_rate": 8.731702745759535e-05, "loss": 0.0868, "step": 38100 }, { "epoch": 10.72, "learning_rate": 8.729828507168963e-05, "loss": 0.1055, "step": 38130 }, { "epoch": 10.73, "learning_rate": 8.72795426857839e-05, "loss": 0.0902, "step": 38160 }, { "epoch": 10.74, "learning_rate": 8.726080029987818e-05, "loss": 0.0985, "step": 38190 }, { "epoch": 10.74, "learning_rate": 8.724205791397245e-05, "loss": 0.1018, "step": 38220 }, { "epoch": 10.75, "learning_rate": 8.722331552806673e-05, "loss": 0.0856, "step": 38250 }, { "epoch": 10.76, "learning_rate": 8.720457314216101e-05, "loss": 0.1081, "step": 38280 }, { "epoch": 10.77, "learning_rate": 8.718583075625528e-05, "loss": 0.0907, "step": 38310 }, { "epoch": 10.78, "learning_rate": 8.716708837034955e-05, "loss": 0.0984, "step": 38340 }, { "epoch": 10.79, "learning_rate": 8.714834598444383e-05, "loss": 0.0994, "step": 38370 }, { "epoch": 10.8, "learning_rate": 8.712960359853811e-05, "loss": 0.0851, "step": 38400 }, { "epoch": 10.8, "learning_rate": 8.711086121263237e-05, "loss": 0.104, "step": 38430 }, { "epoch": 10.81, "learning_rate": 8.709211882672664e-05, "loss": 0.0864, "step": 38460 }, { "epoch": 10.82, "learning_rate": 8.707337644082092e-05, "loss": 0.0923, "step": 38490 }, { "epoch": 10.83, "learning_rate": 8.705463405491519e-05, "loss": 0.1031, "step": 38520 }, { "epoch": 10.84, "learning_rate": 8.703589166900947e-05, "loss": 0.0839, "step": 38550 }, { "epoch": 10.85, "learning_rate": 8.701714928310374e-05, "loss": 0.0953, "step": 38580 }, { "epoch": 10.85, "learning_rate": 8.699840689719802e-05, "loss": 0.0898, "step": 38610 }, { "epoch": 10.86, "learning_rate": 8.697966451129229e-05, "loss": 0.0942, "step": 38640 }, { "epoch": 10.87, "learning_rate": 8.696092212538657e-05, "loss": 0.1079, "step": 38670 }, { "epoch": 10.88, "learning_rate": 8.694217973948085e-05, "loss": 0.0842, "step": 38700 }, { "epoch": 10.89, "learning_rate": 8.692343735357512e-05, "loss": 0.1018, "step": 38730 }, { "epoch": 10.9, "learning_rate": 8.690469496766938e-05, "loss": 0.0843, "step": 38760 }, { "epoch": 10.91, "learning_rate": 8.688595258176366e-05, "loss": 0.1039, "step": 38790 }, { "epoch": 10.91, "learning_rate": 8.686721019585795e-05, "loss": 0.1033, "step": 38820 }, { "epoch": 10.92, "learning_rate": 8.684846780995221e-05, "loss": 0.0854, "step": 38850 }, { "epoch": 10.93, "learning_rate": 8.682972542404648e-05, "loss": 0.1018, "step": 38880 }, { "epoch": 10.94, "learning_rate": 8.681098303814076e-05, "loss": 0.0897, "step": 38910 }, { "epoch": 10.95, "learning_rate": 8.679224065223503e-05, "loss": 0.1007, "step": 38940 }, { "epoch": 10.96, "learning_rate": 8.677349826632931e-05, "loss": 0.1023, "step": 38970 }, { "epoch": 10.96, "learning_rate": 8.675475588042358e-05, "loss": 0.0866, "step": 39000 }, { "epoch": 10.97, "learning_rate": 8.673663824071472e-05, "loss": 0.1016, "step": 39030 }, { "epoch": 10.98, "learning_rate": 8.671789585480899e-05, "loss": 0.0893, "step": 39060 }, { "epoch": 10.99, "learning_rate": 8.669915346890327e-05, "loss": 0.0963, "step": 39090 }, { "epoch": 11.0, "learning_rate": 8.668041108299753e-05, "loss": 0.102, "step": 39120 }, { "epoch": 11.0, "eval_loss": 0.11905849725008011, "eval_runtime": 629.8349, "eval_samples_per_second": 25.456, "eval_steps_per_second": 0.797, "eval_wer": 0.11857710207033968, "step": 39127 }, { "epoch": 11.01, "learning_rate": 8.666166869709182e-05, "loss": 0.0842, "step": 39150 }, { "epoch": 11.01, "learning_rate": 8.66429263111861e-05, "loss": 0.1001, "step": 39180 }, { "epoch": 11.02, "learning_rate": 8.662418392528035e-05, "loss": 0.0859, "step": 39210 }, { "epoch": 11.03, "learning_rate": 8.660544153937463e-05, "loss": 0.1002, "step": 39240 }, { "epoch": 11.04, "learning_rate": 8.658669915346891e-05, "loss": 0.0933, "step": 39270 }, { "epoch": 11.05, "learning_rate": 8.656795676756318e-05, "loss": 0.0919, "step": 39300 }, { "epoch": 11.06, "learning_rate": 8.654921438165745e-05, "loss": 0.0992, "step": 39330 }, { "epoch": 11.07, "learning_rate": 8.653047199575173e-05, "loss": 0.081, "step": 39360 }, { "epoch": 11.07, "learning_rate": 8.651172960984601e-05, "loss": 0.0935, "step": 39390 }, { "epoch": 11.08, "learning_rate": 8.649298722394028e-05, "loss": 0.0815, "step": 39420 }, { "epoch": 11.09, "learning_rate": 8.647424483803456e-05, "loss": 0.0923, "step": 39450 }, { "epoch": 11.1, "learning_rate": 8.645550245212882e-05, "loss": 0.0969, "step": 39480 }, { "epoch": 11.11, "learning_rate": 8.64367600662231e-05, "loss": 0.0873, "step": 39510 }, { "epoch": 11.12, "learning_rate": 8.641801768031737e-05, "loss": 0.0961, "step": 39540 }, { "epoch": 11.12, "learning_rate": 8.639927529441165e-05, "loss": 0.0933, "step": 39570 }, { "epoch": 11.13, "learning_rate": 8.638053290850593e-05, "loss": 0.0972, "step": 39600 }, { "epoch": 11.14, "learning_rate": 8.636179052260019e-05, "loss": 0.1017, "step": 39630 }, { "epoch": 11.15, "learning_rate": 8.634304813669447e-05, "loss": 0.0847, "step": 39660 }, { "epoch": 11.16, "learning_rate": 8.632430575078875e-05, "loss": 0.0971, "step": 39690 }, { "epoch": 11.17, "learning_rate": 8.630556336488302e-05, "loss": 0.09, "step": 39720 }, { "epoch": 11.18, "learning_rate": 8.628682097897729e-05, "loss": 0.0889, "step": 39750 }, { "epoch": 11.18, "learning_rate": 8.626807859307157e-05, "loss": 0.1016, "step": 39780 }, { "epoch": 11.19, "learning_rate": 8.624933620716585e-05, "loss": 0.0859, "step": 39810 }, { "epoch": 11.2, "learning_rate": 8.623059382126011e-05, "loss": 0.1014, "step": 39840 }, { "epoch": 11.21, "learning_rate": 8.62118514353544e-05, "loss": 0.0945, "step": 39870 }, { "epoch": 11.22, "learning_rate": 8.619310904944866e-05, "loss": 0.0887, "step": 39900 }, { "epoch": 11.23, "learning_rate": 8.617436666354294e-05, "loss": 0.0987, "step": 39930 }, { "epoch": 11.23, "learning_rate": 8.615562427763721e-05, "loss": 0.0808, "step": 39960 }, { "epoch": 11.24, "learning_rate": 8.613688189173149e-05, "loss": 0.1018, "step": 39990 }, { "epoch": 11.25, "learning_rate": 8.611813950582577e-05, "loss": 0.0971, "step": 40020 }, { "epoch": 11.26, "learning_rate": 8.609939711992003e-05, "loss": 0.0955, "step": 40050 }, { "epoch": 11.27, "learning_rate": 8.608065473401431e-05, "loss": 0.1036, "step": 40080 }, { "epoch": 11.28, "learning_rate": 8.606191234810859e-05, "loss": 0.0821, "step": 40110 }, { "epoch": 11.28, "learning_rate": 8.604316996220286e-05, "loss": 0.097, "step": 40140 }, { "epoch": 11.29, "learning_rate": 8.602442757629712e-05, "loss": 0.0943, "step": 40170 }, { "epoch": 11.3, "learning_rate": 8.60056851903914e-05, "loss": 0.0939, "step": 40200 }, { "epoch": 11.31, "learning_rate": 8.598694280448569e-05, "loss": 0.1064, "step": 40230 }, { "epoch": 11.32, "learning_rate": 8.596820041857995e-05, "loss": 0.0813, "step": 40260 }, { "epoch": 11.33, "learning_rate": 8.594945803267423e-05, "loss": 0.0943, "step": 40290 }, { "epoch": 11.34, "learning_rate": 8.59307156467685e-05, "loss": 0.0898, "step": 40320 }, { "epoch": 11.34, "learning_rate": 8.591197326086278e-05, "loss": 0.0902, "step": 40350 }, { "epoch": 11.35, "learning_rate": 8.589323087495705e-05, "loss": 0.1028, "step": 40380 }, { "epoch": 11.36, "learning_rate": 8.587448848905133e-05, "loss": 0.0828, "step": 40410 }, { "epoch": 11.37, "learning_rate": 8.585574610314561e-05, "loss": 0.0964, "step": 40440 }, { "epoch": 11.38, "learning_rate": 8.583700371723987e-05, "loss": 0.089, "step": 40470 }, { "epoch": 11.39, "learning_rate": 8.581826133133415e-05, "loss": 0.0955, "step": 40500 }, { "epoch": 11.39, "learning_rate": 8.579951894542843e-05, "loss": 0.1037, "step": 40530 }, { "epoch": 11.4, "learning_rate": 8.57807765595227e-05, "loss": 0.0833, "step": 40560 }, { "epoch": 11.41, "learning_rate": 8.576203417361696e-05, "loss": 0.0963, "step": 40590 }, { "epoch": 11.42, "learning_rate": 8.574329178771124e-05, "loss": 0.0885, "step": 40620 }, { "epoch": 11.43, "learning_rate": 8.572454940180552e-05, "loss": 0.0929, "step": 40650 }, { "epoch": 11.44, "learning_rate": 8.570580701589979e-05, "loss": 0.1005, "step": 40680 }, { "epoch": 11.44, "learning_rate": 8.568706462999407e-05, "loss": 0.083, "step": 40710 }, { "epoch": 11.45, "learning_rate": 8.566832224408834e-05, "loss": 0.0974, "step": 40740 }, { "epoch": 11.46, "learning_rate": 8.564957985818262e-05, "loss": 0.0894, "step": 40770 }, { "epoch": 11.47, "learning_rate": 8.563083747227689e-05, "loss": 0.0891, "step": 40800 }, { "epoch": 11.48, "learning_rate": 8.561209508637117e-05, "loss": 0.0977, "step": 40830 }, { "epoch": 11.49, "learning_rate": 8.559335270046544e-05, "loss": 0.0794, "step": 40860 }, { "epoch": 11.5, "learning_rate": 8.55746103145597e-05, "loss": 0.0966, "step": 40890 }, { "epoch": 11.5, "learning_rate": 8.555586792865399e-05, "loss": 0.0915, "step": 40920 }, { "epoch": 11.51, "learning_rate": 8.553712554274827e-05, "loss": 0.091, "step": 40950 }, { "epoch": 11.52, "learning_rate": 8.551838315684255e-05, "loss": 0.1046, "step": 40980 }, { "epoch": 11.53, "learning_rate": 8.54996407709368e-05, "loss": 0.0763, "step": 41010 }, { "epoch": 11.54, "learning_rate": 8.548152313122794e-05, "loss": 0.1007, "step": 41040 }, { "epoch": 11.55, "learning_rate": 8.546278074532221e-05, "loss": 0.0859, "step": 41070 }, { "epoch": 11.55, "learning_rate": 8.544403835941649e-05, "loss": 0.0962, "step": 41100 }, { "epoch": 11.56, "learning_rate": 8.542529597351077e-05, "loss": 0.1012, "step": 41130 }, { "epoch": 11.57, "learning_rate": 8.540655358760504e-05, "loss": 0.0849, "step": 41160 }, { "epoch": 11.58, "learning_rate": 8.538781120169932e-05, "loss": 0.0986, "step": 41190 }, { "epoch": 11.59, "learning_rate": 8.536906881579359e-05, "loss": 0.0927, "step": 41220 }, { "epoch": 11.6, "learning_rate": 8.535032642988785e-05, "loss": 0.0907, "step": 41250 }, { "epoch": 11.61, "learning_rate": 8.533158404398214e-05, "loss": 0.1029, "step": 41280 }, { "epoch": 11.61, "learning_rate": 8.531284165807642e-05, "loss": 0.0873, "step": 41310 }, { "epoch": 11.62, "learning_rate": 8.529409927217068e-05, "loss": 0.1019, "step": 41340 }, { "epoch": 11.63, "learning_rate": 8.527535688626495e-05, "loss": 0.0907, "step": 41370 }, { "epoch": 11.64, "learning_rate": 8.525661450035923e-05, "loss": 0.0963, "step": 41400 }, { "epoch": 11.65, "learning_rate": 8.523787211445351e-05, "loss": 0.1014, "step": 41430 }, { "epoch": 11.66, "learning_rate": 8.521912972854778e-05, "loss": 0.083, "step": 41460 }, { "epoch": 11.66, "learning_rate": 8.520038734264205e-05, "loss": 0.0959, "step": 41490 }, { "epoch": 11.67, "learning_rate": 8.518164495673633e-05, "loss": 0.0912, "step": 41520 }, { "epoch": 11.68, "learning_rate": 8.516290257083061e-05, "loss": 0.0932, "step": 41550 }, { "epoch": 11.69, "learning_rate": 8.514416018492488e-05, "loss": 0.1018, "step": 41580 }, { "epoch": 11.7, "learning_rate": 8.512541779901915e-05, "loss": 0.0815, "step": 41610 }, { "epoch": 11.71, "learning_rate": 8.510667541311343e-05, "loss": 0.0983, "step": 41640 }, { "epoch": 11.71, "learning_rate": 8.50879330272077e-05, "loss": 0.0904, "step": 41670 }, { "epoch": 11.72, "learning_rate": 8.506919064130197e-05, "loss": 0.095, "step": 41700 }, { "epoch": 11.73, "learning_rate": 8.505044825539626e-05, "loss": 0.1045, "step": 41730 }, { "epoch": 11.74, "learning_rate": 8.503170586949052e-05, "loss": 0.0825, "step": 41760 }, { "epoch": 11.75, "learning_rate": 8.501358822978166e-05, "loss": 0.0984, "step": 41790 }, { "epoch": 11.76, "learning_rate": 8.499484584387593e-05, "loss": 0.0876, "step": 41820 }, { "epoch": 11.77, "learning_rate": 8.49761034579702e-05, "loss": 0.0913, "step": 41850 }, { "epoch": 11.77, "learning_rate": 8.495736107206448e-05, "loss": 0.1007, "step": 41880 }, { "epoch": 11.78, "learning_rate": 8.493861868615876e-05, "loss": 0.0851, "step": 41910 }, { "epoch": 11.79, "learning_rate": 8.491987630025303e-05, "loss": 0.0994, "step": 41940 }, { "epoch": 11.8, "learning_rate": 8.49011339143473e-05, "loss": 0.0858, "step": 41970 }, { "epoch": 11.81, "learning_rate": 8.488239152844158e-05, "loss": 0.0924, "step": 42000 }, { "epoch": 11.82, "learning_rate": 8.486364914253584e-05, "loss": 0.1027, "step": 42030 }, { "epoch": 11.82, "learning_rate": 8.484490675663012e-05, "loss": 0.0808, "step": 42060 }, { "epoch": 11.83, "learning_rate": 8.482678911692125e-05, "loss": 0.0959, "step": 42090 }, { "epoch": 11.84, "learning_rate": 8.480804673101553e-05, "loss": 0.0849, "step": 42120 }, { "epoch": 11.85, "learning_rate": 8.47893043451098e-05, "loss": 0.0916, "step": 42150 }, { "epoch": 11.86, "learning_rate": 8.477056195920408e-05, "loss": 0.101, "step": 42180 }, { "epoch": 11.87, "learning_rate": 8.475181957329835e-05, "loss": 0.085, "step": 42210 }, { "epoch": 11.88, "learning_rate": 8.473307718739263e-05, "loss": 0.0929, "step": 42240 }, { "epoch": 11.88, "learning_rate": 8.471433480148691e-05, "loss": 0.0869, "step": 42270 }, { "epoch": 11.89, "learning_rate": 8.469559241558116e-05, "loss": 0.0961, "step": 42300 }, { "epoch": 11.9, "learning_rate": 8.467685002967545e-05, "loss": 0.098, "step": 42330 }, { "epoch": 11.91, "learning_rate": 8.465810764376973e-05, "loss": 0.0841, "step": 42360 }, { "epoch": 11.92, "learning_rate": 8.4639365257864e-05, "loss": 0.0983, "step": 42390 }, { "epoch": 11.93, "learning_rate": 8.462062287195826e-05, "loss": 0.0851, "step": 42420 }, { "epoch": 11.93, "learning_rate": 8.460188048605254e-05, "loss": 0.0933, "step": 42450 }, { "epoch": 11.94, "learning_rate": 8.458313810014682e-05, "loss": 0.0984, "step": 42480 }, { "epoch": 11.95, "learning_rate": 8.456439571424109e-05, "loss": 0.0844, "step": 42510 }, { "epoch": 11.96, "learning_rate": 8.454565332833537e-05, "loss": 0.096, "step": 42540 }, { "epoch": 11.97, "learning_rate": 8.452691094242964e-05, "loss": 0.0872, "step": 42570 }, { "epoch": 11.98, "learning_rate": 8.450816855652392e-05, "loss": 0.0938, "step": 42600 }, { "epoch": 11.98, "learning_rate": 8.448942617061819e-05, "loss": 0.1016, "step": 42630 }, { "epoch": 11.99, "learning_rate": 8.447068378471247e-05, "loss": 0.0834, "step": 42660 }, { "epoch": 12.0, "eval_loss": 0.1160648763179779, "eval_runtime": 629.8644, "eval_samples_per_second": 25.455, "eval_steps_per_second": 0.797, "eval_wer": 0.10961745799953598, "step": 42684 }, { "epoch": 12.0, "learning_rate": 8.445194139880675e-05, "loss": 0.1065, "step": 42690 }, { "epoch": 12.01, "learning_rate": 8.4433199012901e-05, "loss": 0.0817, "step": 42720 }, { "epoch": 12.02, "learning_rate": 8.441445662699528e-05, "loss": 0.0949, "step": 42750 }, { "epoch": 12.03, "learning_rate": 8.439571424108957e-05, "loss": 0.0901, "step": 42780 }, { "epoch": 12.04, "learning_rate": 8.437697185518383e-05, "loss": 0.0852, "step": 42810 }, { "epoch": 12.04, "learning_rate": 8.43582294692781e-05, "loss": 0.095, "step": 42840 }, { "epoch": 12.05, "learning_rate": 8.433948708337238e-05, "loss": 0.0805, "step": 42870 }, { "epoch": 12.06, "learning_rate": 8.432074469746666e-05, "loss": 0.094, "step": 42900 }, { "epoch": 12.07, "learning_rate": 8.430200231156093e-05, "loss": 0.0886, "step": 42930 }, { "epoch": 12.08, "learning_rate": 8.428325992565521e-05, "loss": 0.0873, "step": 42960 }, { "epoch": 12.09, "learning_rate": 8.426451753974948e-05, "loss": 0.0949, "step": 42990 }, { "epoch": 12.09, "learning_rate": 8.424577515384376e-05, "loss": 0.0842, "step": 43020 }, { "epoch": 12.1, "learning_rate": 8.422703276793803e-05, "loss": 0.0899, "step": 43050 }, { "epoch": 12.11, "learning_rate": 8.420829038203231e-05, "loss": 0.0871, "step": 43080 }, { "epoch": 12.12, "learning_rate": 8.418954799612657e-05, "loss": 0.0824, "step": 43110 }, { "epoch": 12.13, "learning_rate": 8.417080561022084e-05, "loss": 0.0907, "step": 43140 }, { "epoch": 12.14, "learning_rate": 8.415206322431512e-05, "loss": 0.0786, "step": 43170 }, { "epoch": 12.15, "learning_rate": 8.41333208384094e-05, "loss": 0.0969, "step": 43200 }, { "epoch": 12.15, "learning_rate": 8.411457845250369e-05, "loss": 0.0896, "step": 43230 }, { "epoch": 12.16, "learning_rate": 8.409583606659794e-05, "loss": 0.0874, "step": 43260 }, { "epoch": 12.17, "learning_rate": 8.407709368069222e-05, "loss": 0.0962, "step": 43290 }, { "epoch": 12.18, "learning_rate": 8.40583512947865e-05, "loss": 0.0849, "step": 43320 }, { "epoch": 12.19, "learning_rate": 8.403960890888077e-05, "loss": 0.0933, "step": 43350 }, { "epoch": 12.2, "learning_rate": 8.402086652297505e-05, "loss": 0.0884, "step": 43380 }, { "epoch": 12.2, "learning_rate": 8.400212413706932e-05, "loss": 0.0829, "step": 43410 }, { "epoch": 12.21, "learning_rate": 8.39833817511636e-05, "loss": 0.0994, "step": 43440 }, { "epoch": 12.22, "learning_rate": 8.396463936525787e-05, "loss": 0.0825, "step": 43470 }, { "epoch": 12.23, "learning_rate": 8.394589697935215e-05, "loss": 0.0958, "step": 43500 }, { "epoch": 12.24, "learning_rate": 8.392715459344641e-05, "loss": 0.0949, "step": 43530 }, { "epoch": 12.25, "learning_rate": 8.390841220754068e-05, "loss": 0.0913, "step": 43560 }, { "epoch": 12.25, "learning_rate": 8.388966982163496e-05, "loss": 0.1043, "step": 43590 }, { "epoch": 12.26, "learning_rate": 8.387092743572924e-05, "loss": 0.0779, "step": 43620 }, { "epoch": 12.27, "learning_rate": 8.385218504982352e-05, "loss": 0.0942, "step": 43650 }, { "epoch": 12.28, "learning_rate": 8.383344266391778e-05, "loss": 0.0872, "step": 43680 }, { "epoch": 12.29, "learning_rate": 8.381470027801206e-05, "loss": 0.086, "step": 43710 }, { "epoch": 12.3, "learning_rate": 8.379595789210634e-05, "loss": 0.0961, "step": 43740 }, { "epoch": 12.31, "learning_rate": 8.377721550620061e-05, "loss": 0.0819, "step": 43770 }, { "epoch": 12.31, "learning_rate": 8.375847312029489e-05, "loss": 0.0947, "step": 43800 }, { "epoch": 12.32, "learning_rate": 8.373973073438916e-05, "loss": 0.0934, "step": 43830 }, { "epoch": 12.33, "learning_rate": 8.372098834848344e-05, "loss": 0.0897, "step": 43860 }, { "epoch": 12.34, "learning_rate": 8.37022459625777e-05, "loss": 0.1006, "step": 43890 }, { "epoch": 12.35, "learning_rate": 8.368350357667198e-05, "loss": 0.081, "step": 43920 }, { "epoch": 12.36, "learning_rate": 8.366476119076625e-05, "loss": 0.1011, "step": 43950 }, { "epoch": 12.36, "learning_rate": 8.364601880486053e-05, "loss": 0.0887, "step": 43980 }, { "epoch": 12.37, "learning_rate": 8.36272764189548e-05, "loss": 0.0867, "step": 44010 }, { "epoch": 12.38, "learning_rate": 8.360853403304908e-05, "loss": 0.0979, "step": 44040 }, { "epoch": 12.39, "learning_rate": 8.358979164714336e-05, "loss": 0.0821, "step": 44070 }, { "epoch": 12.4, "learning_rate": 8.357104926123762e-05, "loss": 0.0944, "step": 44100 }, { "epoch": 12.41, "learning_rate": 8.35523068753319e-05, "loss": 0.0895, "step": 44130 }, { "epoch": 12.41, "learning_rate": 8.353356448942618e-05, "loss": 0.0874, "step": 44160 }, { "epoch": 12.42, "learning_rate": 8.351482210352045e-05, "loss": 0.0974, "step": 44190 }, { "epoch": 12.43, "learning_rate": 8.349607971761473e-05, "loss": 0.0825, "step": 44220 }, { "epoch": 12.44, "learning_rate": 8.3477337331709e-05, "loss": 0.0979, "step": 44250 }, { "epoch": 12.45, "learning_rate": 8.345859494580327e-05, "loss": 0.094, "step": 44280 }, { "epoch": 12.46, "learning_rate": 8.343985255989754e-05, "loss": 0.0857, "step": 44310 }, { "epoch": 12.47, "learning_rate": 8.342111017399182e-05, "loss": 0.0988, "step": 44340 }, { "epoch": 12.47, "learning_rate": 8.340236778808609e-05, "loss": 0.0818, "step": 44370 }, { "epoch": 12.48, "learning_rate": 8.338362540218037e-05, "loss": 0.0924, "step": 44400 }, { "epoch": 12.49, "learning_rate": 8.336488301627464e-05, "loss": 0.0896, "step": 44430 }, { "epoch": 12.5, "learning_rate": 8.334614063036892e-05, "loss": 0.0871, "step": 44460 }, { "epoch": 12.51, "learning_rate": 8.33273982444632e-05, "loss": 0.0974, "step": 44490 }, { "epoch": 12.52, "learning_rate": 8.330865585855745e-05, "loss": 0.0854, "step": 44520 }, { "epoch": 12.52, "learning_rate": 8.328991347265174e-05, "loss": 0.0928, "step": 44550 }, { "epoch": 12.53, "learning_rate": 8.327117108674602e-05, "loss": 0.0895, "step": 44580 }, { "epoch": 12.54, "learning_rate": 8.325242870084028e-05, "loss": 0.0887, "step": 44610 }, { "epoch": 12.55, "learning_rate": 8.323368631493457e-05, "loss": 0.0931, "step": 44640 }, { "epoch": 12.56, "learning_rate": 8.321494392902883e-05, "loss": 0.0804, "step": 44670 }, { "epoch": 12.57, "learning_rate": 8.319620154312311e-05, "loss": 0.0916, "step": 44700 }, { "epoch": 12.58, "learning_rate": 8.317745915721738e-05, "loss": 0.0901, "step": 44730 }, { "epoch": 12.58, "learning_rate": 8.315871677131166e-05, "loss": 0.0874, "step": 44760 }, { "epoch": 12.59, "learning_rate": 8.313997438540593e-05, "loss": 0.0987, "step": 44790 }, { "epoch": 12.6, "learning_rate": 8.312123199950021e-05, "loss": 0.0831, "step": 44820 }, { "epoch": 12.61, "learning_rate": 8.310248961359448e-05, "loss": 0.0897, "step": 44850 }, { "epoch": 12.62, "learning_rate": 8.308374722768876e-05, "loss": 0.0943, "step": 44880 }, { "epoch": 12.63, "learning_rate": 8.306500484178304e-05, "loss": 0.0872, "step": 44910 }, { "epoch": 12.63, "learning_rate": 8.30462624558773e-05, "loss": 0.0944, "step": 44940 }, { "epoch": 12.64, "learning_rate": 8.302752006997157e-05, "loss": 0.081, "step": 44970 }, { "epoch": 12.65, "learning_rate": 8.300877768406586e-05, "loss": 0.0945, "step": 45000 }, { "epoch": 12.66, "learning_rate": 8.299003529816012e-05, "loss": 0.0957, "step": 45030 }, { "epoch": 12.67, "learning_rate": 8.29712929122544e-05, "loss": 0.086, "step": 45060 }, { "epoch": 12.68, "learning_rate": 8.295255052634867e-05, "loss": 0.0991, "step": 45090 }, { "epoch": 12.68, "learning_rate": 8.293380814044295e-05, "loss": 0.0807, "step": 45120 }, { "epoch": 12.69, "learning_rate": 8.291506575453722e-05, "loss": 0.0939, "step": 45150 }, { "epoch": 12.7, "learning_rate": 8.28963233686315e-05, "loss": 0.0891, "step": 45180 }, { "epoch": 12.71, "learning_rate": 8.287758098272577e-05, "loss": 0.0857, "step": 45210 }, { "epoch": 12.72, "learning_rate": 8.285883859682005e-05, "loss": 0.097, "step": 45240 }, { "epoch": 12.73, "learning_rate": 8.284009621091432e-05, "loss": 0.0795, "step": 45270 }, { "epoch": 12.74, "learning_rate": 8.28213538250086e-05, "loss": 0.0904, "step": 45300 }, { "epoch": 12.74, "learning_rate": 8.280261143910288e-05, "loss": 0.0901, "step": 45330 }, { "epoch": 12.75, "learning_rate": 8.278386905319713e-05, "loss": 0.0861, "step": 45360 }, { "epoch": 12.76, "learning_rate": 8.276512666729141e-05, "loss": 0.1011, "step": 45390 }, { "epoch": 12.77, "learning_rate": 8.27463842813857e-05, "loss": 0.081, "step": 45420 }, { "epoch": 12.78, "learning_rate": 8.272764189547996e-05, "loss": 0.0884, "step": 45450 }, { "epoch": 12.79, "learning_rate": 8.270889950957424e-05, "loss": 0.09, "step": 45480 }, { "epoch": 12.79, "learning_rate": 8.269015712366851e-05, "loss": 0.0878, "step": 45510 }, { "epoch": 12.8, "learning_rate": 8.267141473776279e-05, "loss": 0.1015, "step": 45540 }, { "epoch": 12.81, "learning_rate": 8.265267235185706e-05, "loss": 0.0795, "step": 45570 }, { "epoch": 12.82, "learning_rate": 8.263392996595134e-05, "loss": 0.0869, "step": 45600 }, { "epoch": 12.83, "learning_rate": 8.261518758004561e-05, "loss": 0.0932, "step": 45630 }, { "epoch": 12.84, "learning_rate": 8.259644519413989e-05, "loss": 0.0875, "step": 45660 }, { "epoch": 12.84, "learning_rate": 8.257770280823416e-05, "loss": 0.0951, "step": 45690 }, { "epoch": 12.85, "learning_rate": 8.255896042232844e-05, "loss": 0.0784, "step": 45720 }, { "epoch": 12.86, "learning_rate": 8.254021803642272e-05, "loss": 0.0984, "step": 45750 }, { "epoch": 12.87, "learning_rate": 8.252147565051697e-05, "loss": 0.0858, "step": 45780 }, { "epoch": 12.88, "learning_rate": 8.250273326461125e-05, "loss": 0.0857, "step": 45810 }, { "epoch": 12.89, "learning_rate": 8.248399087870553e-05, "loss": 0.0948, "step": 45840 }, { "epoch": 12.9, "learning_rate": 8.24652484927998e-05, "loss": 0.0873, "step": 45870 }, { "epoch": 12.9, "learning_rate": 8.244650610689408e-05, "loss": 0.0934, "step": 45900 }, { "epoch": 12.91, "learning_rate": 8.242776372098835e-05, "loss": 0.0895, "step": 45930 }, { "epoch": 12.92, "learning_rate": 8.240902133508263e-05, "loss": 0.0874, "step": 45960 }, { "epoch": 12.93, "learning_rate": 8.23902789491769e-05, "loss": 0.097, "step": 45990 }, { "epoch": 12.94, "learning_rate": 8.237153656327118e-05, "loss": 0.0841, "step": 46020 }, { "epoch": 12.95, "learning_rate": 8.235279417736545e-05, "loss": 0.0915, "step": 46050 }, { "epoch": 12.95, "learning_rate": 8.233405179145973e-05, "loss": 0.0909, "step": 46080 }, { "epoch": 12.96, "learning_rate": 8.2315309405554e-05, "loss": 0.0887, "step": 46110 }, { "epoch": 12.97, "learning_rate": 8.229656701964827e-05, "loss": 0.0965, "step": 46140 }, { "epoch": 12.98, "learning_rate": 8.227782463374256e-05, "loss": 0.0817, "step": 46170 }, { "epoch": 12.99, "learning_rate": 8.225908224783681e-05, "loss": 0.093, "step": 46200 }, { "epoch": 13.0, "learning_rate": 8.224033986193109e-05, "loss": 0.0916, "step": 46230 }, { "epoch": 13.0, "eval_loss": 0.11473153531551361, "eval_runtime": 629.489, "eval_samples_per_second": 25.47, "eval_steps_per_second": 0.797, "eval_wer": 0.11070926535012897, "step": 46241 }, { "epoch": 13.01, "learning_rate": 8.222159747602537e-05, "loss": 0.0861, "step": 46260 }, { "epoch": 13.01, "learning_rate": 8.220285509011965e-05, "loss": 0.0928, "step": 46290 }, { "epoch": 13.02, "learning_rate": 8.218411270421392e-05, "loss": 0.0836, "step": 46320 }, { "epoch": 13.03, "learning_rate": 8.216537031830819e-05, "loss": 0.0949, "step": 46350 }, { "epoch": 13.04, "learning_rate": 8.214662793240247e-05, "loss": 0.0837, "step": 46380 }, { "epoch": 13.05, "learning_rate": 8.212788554649674e-05, "loss": 0.087, "step": 46410 }, { "epoch": 13.06, "learning_rate": 8.210914316059102e-05, "loss": 0.0893, "step": 46440 }, { "epoch": 13.06, "learning_rate": 8.209040077468528e-05, "loss": 0.0818, "step": 46470 }, { "epoch": 13.07, "learning_rate": 8.207165838877957e-05, "loss": 0.0956, "step": 46500 }, { "epoch": 13.08, "learning_rate": 8.205291600287383e-05, "loss": 0.0796, "step": 46530 }, { "epoch": 13.09, "learning_rate": 8.203417361696811e-05, "loss": 0.0904, "step": 46560 }, { "epoch": 13.1, "learning_rate": 8.20154312310624e-05, "loss": 0.0931, "step": 46590 }, { "epoch": 13.11, "learning_rate": 8.199668884515665e-05, "loss": 0.0782, "step": 46620 }, { "epoch": 13.11, "learning_rate": 8.197794645925093e-05, "loss": 0.0967, "step": 46650 }, { "epoch": 13.12, "learning_rate": 8.195920407334521e-05, "loss": 0.0818, "step": 46680 }, { "epoch": 13.13, "learning_rate": 8.194046168743949e-05, "loss": 0.0818, "step": 46710 }, { "epoch": 13.14, "learning_rate": 8.192171930153375e-05, "loss": 0.0909, "step": 46740 }, { "epoch": 13.15, "learning_rate": 8.190297691562803e-05, "loss": 0.081, "step": 46770 }, { "epoch": 13.16, "learning_rate": 8.188423452972231e-05, "loss": 0.0946, "step": 46800 }, { "epoch": 13.17, "learning_rate": 8.186549214381657e-05, "loss": 0.0831, "step": 46830 }, { "epoch": 13.17, "learning_rate": 8.184674975791086e-05, "loss": 0.0902, "step": 46860 }, { "epoch": 13.18, "learning_rate": 8.182800737200512e-05, "loss": 0.0988, "step": 46890 }, { "epoch": 13.19, "learning_rate": 8.18092649860994e-05, "loss": 0.0827, "step": 46920 }, { "epoch": 13.2, "learning_rate": 8.179052260019367e-05, "loss": 0.0959, "step": 46950 }, { "epoch": 13.21, "learning_rate": 8.177178021428795e-05, "loss": 0.0779, "step": 46980 }, { "epoch": 13.22, "learning_rate": 8.175303782838223e-05, "loss": 0.0918, "step": 47010 }, { "epoch": 13.22, "learning_rate": 8.17342954424765e-05, "loss": 0.0885, "step": 47040 }, { "epoch": 13.23, "learning_rate": 8.171555305657077e-05, "loss": 0.0809, "step": 47070 }, { "epoch": 13.24, "learning_rate": 8.169681067066505e-05, "loss": 0.0892, "step": 47100 }, { "epoch": 13.25, "learning_rate": 8.167806828475933e-05, "loss": 0.0831, "step": 47130 }, { "epoch": 13.26, "learning_rate": 8.165932589885358e-05, "loss": 0.091, "step": 47160 }, { "epoch": 13.27, "learning_rate": 8.164058351294786e-05, "loss": 0.0906, "step": 47190 }, { "epoch": 13.28, "learning_rate": 8.162184112704215e-05, "loss": 0.076, "step": 47220 }, { "epoch": 13.28, "learning_rate": 8.160309874113641e-05, "loss": 0.0933, "step": 47250 }, { "epoch": 13.29, "learning_rate": 8.15843563552307e-05, "loss": 0.0812, "step": 47280 }, { "epoch": 13.3, "learning_rate": 8.156561396932496e-05, "loss": 0.088, "step": 47310 }, { "epoch": 13.31, "learning_rate": 8.154687158341924e-05, "loss": 0.0907, "step": 47340 }, { "epoch": 13.32, "learning_rate": 8.152812919751351e-05, "loss": 0.0826, "step": 47370 }, { "epoch": 13.33, "learning_rate": 8.150938681160779e-05, "loss": 0.0933, "step": 47400 }, { "epoch": 13.33, "learning_rate": 8.149064442570207e-05, "loss": 0.0832, "step": 47430 }, { "epoch": 13.34, "learning_rate": 8.147190203979634e-05, "loss": 0.0882, "step": 47460 }, { "epoch": 13.35, "learning_rate": 8.14531596538906e-05, "loss": 0.0929, "step": 47490 }, { "epoch": 13.36, "learning_rate": 8.143441726798489e-05, "loss": 0.0805, "step": 47520 }, { "epoch": 13.37, "learning_rate": 8.141629962827602e-05, "loss": 0.0915, "step": 47550 }, { "epoch": 13.38, "learning_rate": 8.13975572423703e-05, "loss": 0.0825, "step": 47580 }, { "epoch": 13.38, "learning_rate": 8.137881485646456e-05, "loss": 0.0881, "step": 47610 }, { "epoch": 13.39, "learning_rate": 8.136007247055883e-05, "loss": 0.0948, "step": 47640 }, { "epoch": 13.4, "learning_rate": 8.134133008465311e-05, "loss": 0.079, "step": 47670 }, { "epoch": 13.41, "learning_rate": 8.132258769874739e-05, "loss": 0.0912, "step": 47700 }, { "epoch": 13.42, "learning_rate": 8.130384531284166e-05, "loss": 0.0813, "step": 47730 }, { "epoch": 13.43, "learning_rate": 8.128510292693594e-05, "loss": 0.0904, "step": 47760 }, { "epoch": 13.44, "learning_rate": 8.126636054103021e-05, "loss": 0.0906, "step": 47790 }, { "epoch": 13.44, "learning_rate": 8.124761815512449e-05, "loss": 0.081, "step": 47820 }, { "epoch": 13.45, "learning_rate": 8.122887576921876e-05, "loss": 0.0943, "step": 47850 }, { "epoch": 13.46, "learning_rate": 8.121013338331304e-05, "loss": 0.0856, "step": 47880 }, { "epoch": 13.47, "learning_rate": 8.11913909974073e-05, "loss": 0.0926, "step": 47910 }, { "epoch": 13.48, "learning_rate": 8.117264861150157e-05, "loss": 0.0904, "step": 47940 }, { "epoch": 13.49, "learning_rate": 8.115390622559585e-05, "loss": 0.0777, "step": 47970 }, { "epoch": 13.49, "learning_rate": 8.113516383969013e-05, "loss": 0.0937, "step": 48000 }, { "epoch": 13.5, "learning_rate": 8.11164214537844e-05, "loss": 0.0818, "step": 48030 }, { "epoch": 13.51, "learning_rate": 8.109767906787867e-05, "loss": 0.0923, "step": 48060 }, { "epoch": 13.52, "learning_rate": 8.107893668197295e-05, "loss": 0.0971, "step": 48090 }, { "epoch": 13.53, "learning_rate": 8.106019429606723e-05, "loss": 0.0824, "step": 48120 }, { "epoch": 13.54, "learning_rate": 8.10414519101615e-05, "loss": 0.0986, "step": 48150 }, { "epoch": 13.55, "learning_rate": 8.102270952425578e-05, "loss": 0.0822, "step": 48180 }, { "epoch": 13.55, "learning_rate": 8.100396713835005e-05, "loss": 0.0884, "step": 48210 }, { "epoch": 13.56, "learning_rate": 8.098522475244433e-05, "loss": 0.0895, "step": 48240 }, { "epoch": 13.57, "learning_rate": 8.09664823665386e-05, "loss": 0.0801, "step": 48270 }, { "epoch": 13.58, "learning_rate": 8.094773998063288e-05, "loss": 0.0971, "step": 48300 }, { "epoch": 13.59, "learning_rate": 8.092899759472714e-05, "loss": 0.0858, "step": 48330 }, { "epoch": 13.6, "learning_rate": 8.091025520882141e-05, "loss": 0.0889, "step": 48360 }, { "epoch": 13.6, "learning_rate": 8.089151282291569e-05, "loss": 0.0944, "step": 48390 }, { "epoch": 13.61, "learning_rate": 8.087277043700997e-05, "loss": 0.0848, "step": 48420 }, { "epoch": 13.62, "learning_rate": 8.085402805110424e-05, "loss": 0.0897, "step": 48450 }, { "epoch": 13.63, "learning_rate": 8.083528566519851e-05, "loss": 0.0812, "step": 48480 }, { "epoch": 13.64, "learning_rate": 8.081654327929279e-05, "loss": 0.0942, "step": 48510 }, { "epoch": 13.65, "learning_rate": 8.079780089338707e-05, "loss": 0.0925, "step": 48540 }, { "epoch": 13.65, "learning_rate": 8.077905850748134e-05, "loss": 0.0806, "step": 48570 }, { "epoch": 13.66, "learning_rate": 8.076031612157562e-05, "loss": 0.091, "step": 48600 }, { "epoch": 13.67, "learning_rate": 8.074157373566989e-05, "loss": 0.0816, "step": 48630 }, { "epoch": 13.68, "learning_rate": 8.072283134976417e-05, "loss": 0.0859, "step": 48660 }, { "epoch": 13.69, "learning_rate": 8.070408896385843e-05, "loss": 0.0956, "step": 48690 }, { "epoch": 13.7, "learning_rate": 8.068534657795272e-05, "loss": 0.0816, "step": 48720 }, { "epoch": 13.71, "learning_rate": 8.066660419204698e-05, "loss": 0.0919, "step": 48750 }, { "epoch": 13.71, "learning_rate": 8.064786180614125e-05, "loss": 0.0798, "step": 48780 }, { "epoch": 13.72, "learning_rate": 8.062911942023553e-05, "loss": 0.0891, "step": 48810 }, { "epoch": 13.73, "learning_rate": 8.061037703432981e-05, "loss": 0.0939, "step": 48840 }, { "epoch": 13.74, "learning_rate": 8.059163464842408e-05, "loss": 0.0796, "step": 48870 }, { "epoch": 13.75, "learning_rate": 8.057289226251835e-05, "loss": 0.0913, "step": 48900 }, { "epoch": 13.76, "learning_rate": 8.055414987661263e-05, "loss": 0.0841, "step": 48930 }, { "epoch": 13.76, "learning_rate": 8.053540749070691e-05, "loss": 0.0827, "step": 48960 }, { "epoch": 13.77, "learning_rate": 8.051666510480118e-05, "loss": 0.0944, "step": 48990 }, { "epoch": 13.78, "learning_rate": 8.049792271889546e-05, "loss": 0.0816, "step": 49020 }, { "epoch": 13.79, "learning_rate": 8.047918033298972e-05, "loss": 0.0923, "step": 49050 }, { "epoch": 13.8, "learning_rate": 8.0460437947084e-05, "loss": 0.0796, "step": 49080 }, { "epoch": 13.81, "learning_rate": 8.044169556117827e-05, "loss": 0.0896, "step": 49110 }, { "epoch": 13.81, "learning_rate": 8.042295317527255e-05, "loss": 0.091, "step": 49140 }, { "epoch": 13.82, "learning_rate": 8.040421078936682e-05, "loss": 0.0853, "step": 49170 }, { "epoch": 13.83, "learning_rate": 8.038546840346109e-05, "loss": 0.0954, "step": 49200 }, { "epoch": 13.84, "learning_rate": 8.036672601755537e-05, "loss": 0.084, "step": 49230 }, { "epoch": 13.85, "learning_rate": 8.034798363164965e-05, "loss": 0.0951, "step": 49260 }, { "epoch": 13.86, "learning_rate": 8.032924124574392e-05, "loss": 0.0924, "step": 49290 }, { "epoch": 13.87, "learning_rate": 8.031049885983819e-05, "loss": 0.0813, "step": 49320 }, { "epoch": 13.87, "learning_rate": 8.029175647393247e-05, "loss": 0.0953, "step": 49350 }, { "epoch": 13.88, "learning_rate": 8.027301408802675e-05, "loss": 0.0834, "step": 49380 }, { "epoch": 13.89, "learning_rate": 8.025427170212101e-05, "loss": 0.0869, "step": 49410 }, { "epoch": 13.9, "learning_rate": 8.02355293162153e-05, "loss": 0.0927, "step": 49440 }, { "epoch": 13.91, "learning_rate": 8.021678693030956e-05, "loss": 0.0817, "step": 49470 }, { "epoch": 13.92, "learning_rate": 8.019804454440384e-05, "loss": 0.0902, "step": 49500 }, { "epoch": 13.92, "learning_rate": 8.017930215849811e-05, "loss": 0.0805, "step": 49530 }, { "epoch": 13.93, "learning_rate": 8.016055977259239e-05, "loss": 0.0897, "step": 49560 }, { "epoch": 13.94, "learning_rate": 8.014181738668666e-05, "loss": 0.0919, "step": 49590 }, { "epoch": 13.95, "learning_rate": 8.012307500078093e-05, "loss": 0.0787, "step": 49620 }, { "epoch": 13.96, "learning_rate": 8.010433261487521e-05, "loss": 0.0947, "step": 49650 }, { "epoch": 13.97, "learning_rate": 8.008559022896949e-05, "loss": 0.0821, "step": 49680 }, { "epoch": 13.98, "learning_rate": 8.006684784306377e-05, "loss": 0.0905, "step": 49710 }, { "epoch": 13.98, "learning_rate": 8.004810545715802e-05, "loss": 0.0873, "step": 49740 }, { "epoch": 13.99, "learning_rate": 8.00293630712523e-05, "loss": 0.0811, "step": 49770 }, { "epoch": 14.0, "eval_loss": 0.1173907220363617, "eval_runtime": 631.7038, "eval_samples_per_second": 25.381, "eval_steps_per_second": 0.795, "eval_wer": 0.11362302621702401, "step": 49798 }, { "epoch": 14.0, "learning_rate": 8.001062068534659e-05, "loss": 0.1005, "step": 49800 }, { "epoch": 14.01, "learning_rate": 7.999187829944085e-05, "loss": 0.0736, "step": 49830 }, { "epoch": 14.02, "learning_rate": 7.997313591353513e-05, "loss": 0.0886, "step": 49860 }, { "epoch": 14.03, "learning_rate": 7.99543935276294e-05, "loss": 0.0771, "step": 49890 }, { "epoch": 14.03, "learning_rate": 7.993565114172368e-05, "loss": 0.0816, "step": 49920 }, { "epoch": 14.04, "learning_rate": 7.991690875581795e-05, "loss": 0.0934, "step": 49950 }, { "epoch": 14.05, "learning_rate": 7.989816636991223e-05, "loss": 0.0765, "step": 49980 }, { "epoch": 14.06, "learning_rate": 7.98794239840065e-05, "loss": 0.0926, "step": 50010 }, { "epoch": 14.07, "learning_rate": 7.986130634429764e-05, "loss": 0.0839, "step": 50040 }, { "epoch": 14.08, "learning_rate": 7.984256395839191e-05, "loss": 0.0827, "step": 50070 }, { "epoch": 14.08, "learning_rate": 7.982382157248617e-05, "loss": 0.0953, "step": 50100 }, { "epoch": 14.09, "learning_rate": 7.980507918658046e-05, "loss": 0.0752, "step": 50130 }, { "epoch": 14.1, "learning_rate": 7.978633680067474e-05, "loss": 0.0905, "step": 50160 }, { "epoch": 14.11, "learning_rate": 7.9767594414769e-05, "loss": 0.0793, "step": 50190 }, { "epoch": 14.12, "learning_rate": 7.974885202886327e-05, "loss": 0.0884, "step": 50220 }, { "epoch": 14.13, "learning_rate": 7.973010964295755e-05, "loss": 0.0951, "step": 50250 }, { "epoch": 14.14, "learning_rate": 7.971136725705183e-05, "loss": 0.0748, "step": 50280 }, { "epoch": 14.14, "learning_rate": 7.96926248711461e-05, "loss": 0.0875, "step": 50310 }, { "epoch": 14.15, "learning_rate": 7.967388248524037e-05, "loss": 0.0817, "step": 50340 }, { "epoch": 14.16, "learning_rate": 7.965514009933465e-05, "loss": 0.0817, "step": 50370 }, { "epoch": 14.17, "learning_rate": 7.963639771342892e-05, "loss": 0.091, "step": 50400 }, { "epoch": 14.18, "learning_rate": 7.96176553275232e-05, "loss": 0.0767, "step": 50430 }, { "epoch": 14.19, "learning_rate": 7.959891294161748e-05, "loss": 0.09, "step": 50460 }, { "epoch": 14.19, "learning_rate": 7.958017055571175e-05, "loss": 0.0803, "step": 50490 }, { "epoch": 14.2, "learning_rate": 7.956142816980601e-05, "loss": 0.0905, "step": 50520 }, { "epoch": 14.21, "learning_rate": 7.95426857839003e-05, "loss": 0.0886, "step": 50550 }, { "epoch": 14.22, "learning_rate": 7.952394339799458e-05, "loss": 0.077, "step": 50580 }, { "epoch": 14.23, "learning_rate": 7.950520101208884e-05, "loss": 0.0931, "step": 50610 }, { "epoch": 14.24, "learning_rate": 7.948645862618311e-05, "loss": 0.083, "step": 50640 }, { "epoch": 14.25, "learning_rate": 7.946771624027739e-05, "loss": 0.088, "step": 50670 }, { "epoch": 14.25, "learning_rate": 7.944897385437167e-05, "loss": 0.0911, "step": 50700 }, { "epoch": 14.26, "learning_rate": 7.943023146846594e-05, "loss": 0.0779, "step": 50730 }, { "epoch": 14.27, "learning_rate": 7.94114890825602e-05, "loss": 0.0882, "step": 50760 }, { "epoch": 14.28, "learning_rate": 7.939274669665449e-05, "loss": 0.081, "step": 50790 }, { "epoch": 14.29, "learning_rate": 7.937400431074877e-05, "loss": 0.08, "step": 50820 }, { "epoch": 14.3, "learning_rate": 7.935526192484304e-05, "loss": 0.0957, "step": 50850 }, { "epoch": 14.3, "learning_rate": 7.933651953893732e-05, "loss": 0.0756, "step": 50880 }, { "epoch": 14.31, "learning_rate": 7.931777715303158e-05, "loss": 0.0878, "step": 50910 }, { "epoch": 14.32, "learning_rate": 7.929903476712585e-05, "loss": 0.0808, "step": 50940 }, { "epoch": 14.33, "learning_rate": 7.928029238122013e-05, "loss": 0.0871, "step": 50970 }, { "epoch": 14.34, "learning_rate": 7.926154999531441e-05, "loss": 0.089, "step": 51000 }, { "epoch": 14.35, "learning_rate": 7.924280760940868e-05, "loss": 0.0732, "step": 51030 }, { "epoch": 14.35, "learning_rate": 7.922406522350295e-05, "loss": 0.0866, "step": 51060 }, { "epoch": 14.36, "learning_rate": 7.920532283759723e-05, "loss": 0.084, "step": 51090 }, { "epoch": 14.37, "learning_rate": 7.918658045169151e-05, "loss": 0.0905, "step": 51120 }, { "epoch": 14.38, "learning_rate": 7.916783806578578e-05, "loss": 0.0965, "step": 51150 }, { "epoch": 14.39, "learning_rate": 7.914909567988005e-05, "loss": 0.0761, "step": 51180 }, { "epoch": 14.4, "learning_rate": 7.913035329397433e-05, "loss": 0.0914, "step": 51210 }, { "epoch": 14.41, "learning_rate": 7.911161090806861e-05, "loss": 0.0851, "step": 51240 }, { "epoch": 14.41, "learning_rate": 7.909286852216287e-05, "loss": 0.0879, "step": 51270 }, { "epoch": 14.42, "learning_rate": 7.907412613625716e-05, "loss": 0.0961, "step": 51300 }, { "epoch": 14.43, "learning_rate": 7.905538375035142e-05, "loss": 0.0748, "step": 51330 }, { "epoch": 14.44, "learning_rate": 7.903664136444569e-05, "loss": 0.0873, "step": 51360 }, { "epoch": 14.45, "learning_rate": 7.901789897853997e-05, "loss": 0.081, "step": 51390 }, { "epoch": 14.46, "learning_rate": 7.899915659263425e-05, "loss": 0.0856, "step": 51420 }, { "epoch": 14.46, "learning_rate": 7.898041420672852e-05, "loss": 0.0935, "step": 51450 }, { "epoch": 14.47, "learning_rate": 7.896167182082279e-05, "loss": 0.0782, "step": 51480 }, { "epoch": 14.48, "learning_rate": 7.894292943491707e-05, "loss": 0.0931, "step": 51510 }, { "epoch": 14.49, "learning_rate": 7.892418704901135e-05, "loss": 0.083, "step": 51540 }, { "epoch": 14.5, "learning_rate": 7.890544466310562e-05, "loss": 0.084, "step": 51570 }, { "epoch": 14.51, "learning_rate": 7.888670227719988e-05, "loss": 0.097, "step": 51600 }, { "epoch": 14.51, "learning_rate": 7.886795989129416e-05, "loss": 0.0767, "step": 51630 }, { "epoch": 14.52, "learning_rate": 7.884921750538845e-05, "loss": 0.0904, "step": 51660 }, { "epoch": 14.53, "learning_rate": 7.883047511948271e-05, "loss": 0.078, "step": 51690 }, { "epoch": 14.54, "learning_rate": 7.8811732733577e-05, "loss": 0.0922, "step": 51720 }, { "epoch": 14.55, "learning_rate": 7.879299034767126e-05, "loss": 0.0937, "step": 51750 }, { "epoch": 14.56, "learning_rate": 7.877424796176553e-05, "loss": 0.079, "step": 51780 }, { "epoch": 14.57, "learning_rate": 7.875550557585981e-05, "loss": 0.0961, "step": 51810 }, { "epoch": 14.57, "learning_rate": 7.873676318995409e-05, "loss": 0.0843, "step": 51840 }, { "epoch": 14.58, "learning_rate": 7.871802080404836e-05, "loss": 0.0878, "step": 51870 }, { "epoch": 14.59, "learning_rate": 7.869927841814263e-05, "loss": 0.094, "step": 51900 }, { "epoch": 14.6, "learning_rate": 7.868053603223691e-05, "loss": 0.0784, "step": 51930 }, { "epoch": 14.61, "learning_rate": 7.866179364633119e-05, "loss": 0.0955, "step": 51960 }, { "epoch": 14.62, "learning_rate": 7.864305126042546e-05, "loss": 0.0821, "step": 51990 }, { "epoch": 14.62, "learning_rate": 7.862430887451972e-05, "loss": 0.089, "step": 52020 }, { "epoch": 14.63, "learning_rate": 7.8605566488614e-05, "loss": 0.0965, "step": 52050 }, { "epoch": 14.64, "learning_rate": 7.858682410270828e-05, "loss": 0.0806, "step": 52080 }, { "epoch": 14.65, "learning_rate": 7.856808171680255e-05, "loss": 0.0959, "step": 52110 }, { "epoch": 14.66, "learning_rate": 7.854933933089683e-05, "loss": 0.0791, "step": 52140 }, { "epoch": 14.67, "learning_rate": 7.85305969449911e-05, "loss": 0.0813, "step": 52170 }, { "epoch": 14.68, "learning_rate": 7.851185455908537e-05, "loss": 0.0952, "step": 52200 }, { "epoch": 14.68, "learning_rate": 7.849311217317965e-05, "loss": 0.0775, "step": 52230 }, { "epoch": 14.69, "learning_rate": 7.847436978727393e-05, "loss": 0.0922, "step": 52260 }, { "epoch": 14.7, "learning_rate": 7.84556274013682e-05, "loss": 0.0799, "step": 52290 }, { "epoch": 14.71, "learning_rate": 7.843688501546246e-05, "loss": 0.0875, "step": 52320 }, { "epoch": 14.72, "learning_rate": 7.84187673757536e-05, "loss": 0.095, "step": 52350 }, { "epoch": 14.73, "learning_rate": 7.840002498984787e-05, "loss": 0.0759, "step": 52380 }, { "epoch": 14.73, "learning_rate": 7.838128260394215e-05, "loss": 0.0883, "step": 52410 }, { "epoch": 14.74, "learning_rate": 7.836254021803643e-05, "loss": 0.0788, "step": 52440 }, { "epoch": 14.75, "learning_rate": 7.83437978321307e-05, "loss": 0.0862, "step": 52470 }, { "epoch": 14.76, "learning_rate": 7.832505544622497e-05, "loss": 0.0953, "step": 52500 }, { "epoch": 14.77, "learning_rate": 7.830631306031925e-05, "loss": 0.0753, "step": 52530 }, { "epoch": 14.78, "learning_rate": 7.828757067441352e-05, "loss": 0.0885, "step": 52560 }, { "epoch": 14.78, "learning_rate": 7.82688282885078e-05, "loss": 0.0845, "step": 52590 }, { "epoch": 14.79, "learning_rate": 7.825008590260208e-05, "loss": 0.0848, "step": 52620 }, { "epoch": 14.8, "learning_rate": 7.823134351669635e-05, "loss": 0.0943, "step": 52650 }, { "epoch": 14.81, "learning_rate": 7.821260113079061e-05, "loss": 0.0713, "step": 52680 }, { "epoch": 14.82, "learning_rate": 7.81938587448849e-05, "loss": 0.0952, "step": 52710 }, { "epoch": 14.83, "learning_rate": 7.817511635897918e-05, "loss": 0.0814, "step": 52740 }, { "epoch": 14.84, "learning_rate": 7.815637397307344e-05, "loss": 0.0847, "step": 52770 }, { "epoch": 14.84, "learning_rate": 7.813763158716771e-05, "loss": 0.0882, "step": 52800 }, { "epoch": 14.85, "learning_rate": 7.811888920126199e-05, "loss": 0.0745, "step": 52830 }, { "epoch": 14.86, "learning_rate": 7.810014681535627e-05, "loss": 0.086, "step": 52860 }, { "epoch": 14.87, "learning_rate": 7.808140442945054e-05, "loss": 0.082, "step": 52890 }, { "epoch": 14.88, "learning_rate": 7.806266204354481e-05, "loss": 0.087, "step": 52920 }, { "epoch": 14.89, "learning_rate": 7.804391965763909e-05, "loss": 0.0939, "step": 52950 }, { "epoch": 14.89, "learning_rate": 7.802517727173336e-05, "loss": 0.0783, "step": 52980 }, { "epoch": 14.9, "learning_rate": 7.800643488582764e-05, "loss": 0.0911, "step": 53010 }, { "epoch": 14.91, "learning_rate": 7.79876924999219e-05, "loss": 0.0812, "step": 53040 }, { "epoch": 14.92, "learning_rate": 7.796895011401619e-05, "loss": 0.0883, "step": 53070 }, { "epoch": 14.93, "learning_rate": 7.795020772811045e-05, "loss": 0.0946, "step": 53100 }, { "epoch": 14.94, "learning_rate": 7.793146534220473e-05, "loss": 0.08, "step": 53130 }, { "epoch": 14.95, "learning_rate": 7.791272295629902e-05, "loss": 0.0946, "step": 53160 }, { "epoch": 14.95, "learning_rate": 7.789398057039328e-05, "loss": 0.0825, "step": 53190 }, { "epoch": 14.96, "learning_rate": 7.787523818448755e-05, "loss": 0.0829, "step": 53220 }, { "epoch": 14.97, "learning_rate": 7.785649579858183e-05, "loss": 0.0883, "step": 53250 }, { "epoch": 14.98, "learning_rate": 7.783775341267611e-05, "loss": 0.0762, "step": 53280 }, { "epoch": 14.99, "learning_rate": 7.781901102677038e-05, "loss": 0.0883, "step": 53310 }, { "epoch": 15.0, "learning_rate": 7.780026864086465e-05, "loss": 0.0814, "step": 53340 }, { "epoch": 15.0, "eval_loss": 0.11322180926799774, "eval_runtime": 632.5147, "eval_samples_per_second": 25.348, "eval_steps_per_second": 0.794, "eval_wer": 0.111405292536132, "step": 53355 }, { "epoch": 15.0, "learning_rate": 7.778152625495893e-05, "loss": 0.0883, "step": 53370 }, { "epoch": 15.01, "learning_rate": 7.77627838690532e-05, "loss": 0.0827, "step": 53400 }, { "epoch": 15.02, "learning_rate": 7.774404148314748e-05, "loss": 0.0796, "step": 53430 }, { "epoch": 15.03, "learning_rate": 7.772529909724174e-05, "loss": 0.0921, "step": 53460 }, { "epoch": 15.04, "learning_rate": 7.770655671133602e-05, "loss": 0.0729, "step": 53490 }, { "epoch": 15.05, "learning_rate": 7.768781432543029e-05, "loss": 0.0852, "step": 53520 }, { "epoch": 15.05, "learning_rate": 7.766907193952457e-05, "loss": 0.0831, "step": 53550 }, { "epoch": 15.06, "learning_rate": 7.765032955361885e-05, "loss": 0.0817, "step": 53580 }, { "epoch": 15.07, "learning_rate": 7.763158716771312e-05, "loss": 0.0898, "step": 53610 }, { "epoch": 15.08, "learning_rate": 7.761284478180739e-05, "loss": 0.0737, "step": 53640 }, { "epoch": 15.09, "learning_rate": 7.759410239590167e-05, "loss": 0.0815, "step": 53670 }, { "epoch": 15.1, "learning_rate": 7.757536000999595e-05, "loss": 0.08, "step": 53700 }, { "epoch": 15.11, "learning_rate": 7.755661762409022e-05, "loss": 0.0801, "step": 53730 }, { "epoch": 15.11, "learning_rate": 7.753787523818449e-05, "loss": 0.0874, "step": 53760 }, { "epoch": 15.12, "learning_rate": 7.751913285227877e-05, "loss": 0.0756, "step": 53790 }, { "epoch": 15.13, "learning_rate": 7.750039046637303e-05, "loss": 0.0854, "step": 53820 }, { "epoch": 15.14, "learning_rate": 7.748164808046732e-05, "loss": 0.0827, "step": 53850 }, { "epoch": 15.15, "learning_rate": 7.746290569456158e-05, "loss": 0.0835, "step": 53880 }, { "epoch": 15.16, "learning_rate": 7.744416330865586e-05, "loss": 0.0916, "step": 53910 }, { "epoch": 15.16, "learning_rate": 7.742542092275013e-05, "loss": 0.0763, "step": 53940 }, { "epoch": 15.17, "learning_rate": 7.740667853684441e-05, "loss": 0.0874, "step": 53970 }, { "epoch": 15.18, "learning_rate": 7.738793615093869e-05, "loss": 0.0863, "step": 54000 }, { "epoch": 15.19, "learning_rate": 7.736919376503296e-05, "loss": 0.0826, "step": 54030 }, { "epoch": 15.2, "learning_rate": 7.735045137912723e-05, "loss": 0.0904, "step": 54060 }, { "epoch": 15.21, "learning_rate": 7.733170899322151e-05, "loss": 0.0751, "step": 54090 }, { "epoch": 15.22, "learning_rate": 7.731296660731579e-05, "loss": 0.0875, "step": 54120 }, { "epoch": 15.22, "learning_rate": 7.729422422141006e-05, "loss": 0.0827, "step": 54150 }, { "epoch": 15.23, "learning_rate": 7.727548183550432e-05, "loss": 0.0795, "step": 54180 }, { "epoch": 15.24, "learning_rate": 7.72567394495986e-05, "loss": 0.098, "step": 54210 }, { "epoch": 15.25, "learning_rate": 7.723799706369289e-05, "loss": 0.0755, "step": 54240 }, { "epoch": 15.26, "learning_rate": 7.721925467778715e-05, "loss": 0.0872, "step": 54270 }, { "epoch": 15.27, "learning_rate": 7.720051229188142e-05, "loss": 0.0763, "step": 54300 }, { "epoch": 15.27, "learning_rate": 7.71817699059757e-05, "loss": 0.0825, "step": 54330 }, { "epoch": 15.28, "learning_rate": 7.716302752006997e-05, "loss": 0.0878, "step": 54360 }, { "epoch": 15.29, "learning_rate": 7.714428513416425e-05, "loss": 0.0728, "step": 54390 }, { "epoch": 15.3, "learning_rate": 7.712554274825853e-05, "loss": 0.0811, "step": 54420 }, { "epoch": 15.31, "learning_rate": 7.71068003623528e-05, "loss": 0.0822, "step": 54450 }, { "epoch": 15.32, "learning_rate": 7.708805797644707e-05, "loss": 0.0817, "step": 54480 }, { "epoch": 15.32, "learning_rate": 7.706931559054135e-05, "loss": 0.0834, "step": 54510 }, { "epoch": 15.33, "learning_rate": 7.705057320463563e-05, "loss": 0.069, "step": 54540 }, { "epoch": 15.34, "learning_rate": 7.70318308187299e-05, "loss": 0.0891, "step": 54570 }, { "epoch": 15.35, "learning_rate": 7.701308843282416e-05, "loss": 0.084, "step": 54600 }, { "epoch": 15.36, "learning_rate": 7.699434604691844e-05, "loss": 0.0767, "step": 54630 }, { "epoch": 15.37, "learning_rate": 7.697560366101272e-05, "loss": 0.0847, "step": 54660 }, { "epoch": 15.38, "learning_rate": 7.695686127510699e-05, "loss": 0.072, "step": 54690 }, { "epoch": 15.38, "learning_rate": 7.693811888920126e-05, "loss": 0.0833, "step": 54720 }, { "epoch": 15.39, "learning_rate": 7.691937650329554e-05, "loss": 0.0797, "step": 54750 }, { "epoch": 15.4, "learning_rate": 7.690063411738981e-05, "loss": 0.0854, "step": 54780 }, { "epoch": 15.41, "learning_rate": 7.688189173148409e-05, "loss": 0.0862, "step": 54810 }, { "epoch": 15.42, "learning_rate": 7.686314934557837e-05, "loss": 0.075, "step": 54840 }, { "epoch": 15.43, "learning_rate": 7.684440695967264e-05, "loss": 0.0875, "step": 54870 }, { "epoch": 15.43, "learning_rate": 7.68256645737669e-05, "loss": 0.0819, "step": 54900 }, { "epoch": 15.44, "learning_rate": 7.680692218786119e-05, "loss": 0.0798, "step": 54930 }, { "epoch": 15.45, "learning_rate": 7.678817980195547e-05, "loss": 0.0926, "step": 54960 }, { "epoch": 15.46, "learning_rate": 7.676943741604973e-05, "loss": 0.068, "step": 54990 }, { "epoch": 15.47, "learning_rate": 7.6750695030144e-05, "loss": 0.0866, "step": 55020 }, { "epoch": 15.48, "learning_rate": 7.673195264423828e-05, "loss": 0.0796, "step": 55050 }, { "epoch": 15.48, "learning_rate": 7.671321025833256e-05, "loss": 0.0793, "step": 55080 }, { "epoch": 15.49, "learning_rate": 7.669446787242683e-05, "loss": 0.0862, "step": 55110 }, { "epoch": 15.5, "learning_rate": 7.66757254865211e-05, "loss": 0.0715, "step": 55140 }, { "epoch": 15.51, "learning_rate": 7.665698310061538e-05, "loss": 0.0907, "step": 55170 }, { "epoch": 15.52, "learning_rate": 7.663824071470965e-05, "loss": 0.0794, "step": 55200 }, { "epoch": 15.53, "learning_rate": 7.661949832880393e-05, "loss": 0.0794, "step": 55230 }, { "epoch": 15.54, "learning_rate": 7.660075594289821e-05, "loss": 0.0878, "step": 55260 }, { "epoch": 15.54, "learning_rate": 7.658201355699248e-05, "loss": 0.0693, "step": 55290 }, { "epoch": 15.55, "learning_rate": 7.656327117108674e-05, "loss": 0.0834, "step": 55320 }, { "epoch": 15.56, "learning_rate": 7.654452878518102e-05, "loss": 0.0798, "step": 55350 }, { "epoch": 15.57, "learning_rate": 7.65257863992753e-05, "loss": 0.0784, "step": 55380 }, { "epoch": 15.58, "learning_rate": 7.650704401336957e-05, "loss": 0.0943, "step": 55410 }, { "epoch": 15.59, "learning_rate": 7.648830162746384e-05, "loss": 0.079, "step": 55440 }, { "epoch": 15.59, "learning_rate": 7.646955924155812e-05, "loss": 0.0829, "step": 55470 }, { "epoch": 15.6, "learning_rate": 7.64508168556524e-05, "loss": 0.0832, "step": 55500 }, { "epoch": 15.61, "learning_rate": 7.643207446974667e-05, "loss": 0.0839, "step": 55530 }, { "epoch": 15.62, "learning_rate": 7.641333208384094e-05, "loss": 0.0917, "step": 55560 }, { "epoch": 15.63, "learning_rate": 7.639458969793522e-05, "loss": 0.0779, "step": 55590 }, { "epoch": 15.64, "learning_rate": 7.637584731202949e-05, "loss": 0.0846, "step": 55620 }, { "epoch": 15.65, "learning_rate": 7.635710492612377e-05, "loss": 0.079, "step": 55650 }, { "epoch": 15.65, "learning_rate": 7.633836254021805e-05, "loss": 0.0813, "step": 55680 }, { "epoch": 15.66, "learning_rate": 7.631962015431231e-05, "loss": 0.0871, "step": 55710 }, { "epoch": 15.67, "learning_rate": 7.630087776840658e-05, "loss": 0.0716, "step": 55740 }, { "epoch": 15.68, "learning_rate": 7.628213538250086e-05, "loss": 0.0888, "step": 55770 }, { "epoch": 15.69, "learning_rate": 7.626339299659514e-05, "loss": 0.0843, "step": 55800 }, { "epoch": 15.7, "learning_rate": 7.624465061068941e-05, "loss": 0.0837, "step": 55830 }, { "epoch": 15.7, "learning_rate": 7.622590822478368e-05, "loss": 0.0913, "step": 55860 }, { "epoch": 15.71, "learning_rate": 7.620716583887796e-05, "loss": 0.0767, "step": 55890 }, { "epoch": 15.72, "learning_rate": 7.618842345297224e-05, "loss": 0.0822, "step": 55920 }, { "epoch": 15.73, "learning_rate": 7.616968106706651e-05, "loss": 0.0824, "step": 55950 }, { "epoch": 15.74, "learning_rate": 7.615093868116078e-05, "loss": 0.0802, "step": 55980 }, { "epoch": 15.75, "learning_rate": 7.613219629525506e-05, "loss": 0.0896, "step": 56010 }, { "epoch": 15.75, "learning_rate": 7.611345390934932e-05, "loss": 0.0744, "step": 56040 }, { "epoch": 15.76, "learning_rate": 7.60947115234436e-05, "loss": 0.0874, "step": 56070 }, { "epoch": 15.77, "learning_rate": 7.607596913753789e-05, "loss": 0.0843, "step": 56100 }, { "epoch": 15.78, "learning_rate": 7.605722675163215e-05, "loss": 0.0824, "step": 56130 }, { "epoch": 15.79, "learning_rate": 7.603848436572642e-05, "loss": 0.0829, "step": 56160 }, { "epoch": 15.8, "learning_rate": 7.60197419798207e-05, "loss": 0.0741, "step": 56190 }, { "epoch": 15.81, "learning_rate": 7.600099959391498e-05, "loss": 0.0848, "step": 56220 }, { "epoch": 15.81, "learning_rate": 7.598225720800925e-05, "loss": 0.0778, "step": 56250 }, { "epoch": 15.82, "learning_rate": 7.596351482210352e-05, "loss": 0.0817, "step": 56280 }, { "epoch": 15.83, "learning_rate": 7.59447724361978e-05, "loss": 0.0897, "step": 56310 }, { "epoch": 15.84, "learning_rate": 7.592603005029208e-05, "loss": 0.0732, "step": 56340 }, { "epoch": 15.85, "learning_rate": 7.590728766438635e-05, "loss": 0.0873, "step": 56370 }, { "epoch": 15.86, "learning_rate": 7.588854527848061e-05, "loss": 0.0847, "step": 56400 }, { "epoch": 15.86, "learning_rate": 7.58698028925749e-05, "loss": 0.0816, "step": 56430 }, { "epoch": 15.87, "learning_rate": 7.585168525286602e-05, "loss": 0.093, "step": 56460 }, { "epoch": 15.88, "learning_rate": 7.58329428669603e-05, "loss": 0.0765, "step": 56490 }, { "epoch": 15.89, "learning_rate": 7.581420048105457e-05, "loss": 0.0946, "step": 56520 }, { "epoch": 15.9, "learning_rate": 7.579545809514885e-05, "loss": 0.0853, "step": 56550 }, { "epoch": 15.91, "learning_rate": 7.577671570924313e-05, "loss": 0.0813, "step": 56580 }, { "epoch": 15.91, "learning_rate": 7.57579733233374e-05, "loss": 0.0905, "step": 56610 }, { "epoch": 15.92, "learning_rate": 7.573923093743167e-05, "loss": 0.075, "step": 56640 }, { "epoch": 15.93, "learning_rate": 7.572048855152595e-05, "loss": 0.0863, "step": 56670 }, { "epoch": 15.94, "learning_rate": 7.570174616562023e-05, "loss": 0.0818, "step": 56700 }, { "epoch": 15.95, "learning_rate": 7.568300377971448e-05, "loss": 0.0797, "step": 56730 }, { "epoch": 15.96, "learning_rate": 7.566426139380876e-05, "loss": 0.0891, "step": 56760 }, { "epoch": 15.97, "learning_rate": 7.564551900790305e-05, "loss": 0.0777, "step": 56790 }, { "epoch": 15.97, "learning_rate": 7.562677662199731e-05, "loss": 0.0888, "step": 56820 }, { "epoch": 15.98, "learning_rate": 7.56080342360916e-05, "loss": 0.084, "step": 56850 }, { "epoch": 15.99, "learning_rate": 7.558929185018586e-05, "loss": 0.0817, "step": 56880 }, { "epoch": 16.0, "learning_rate": 7.557054946428014e-05, "loss": 0.0865, "step": 56910 }, { "epoch": 16.0, "eval_loss": 0.11335010826587677, "eval_runtime": 631.0736, "eval_samples_per_second": 25.406, "eval_steps_per_second": 0.795, "eval_wer": 0.10965840077518321, "step": 56912 }, { "epoch": 16.01, "learning_rate": 7.555180707837441e-05, "loss": 0.0725, "step": 56940 }, { "epoch": 16.02, "learning_rate": 7.553306469246869e-05, "loss": 0.0876, "step": 56970 }, { "epoch": 16.02, "learning_rate": 7.551432230656297e-05, "loss": 0.0761, "step": 57000 }, { "epoch": 16.03, "learning_rate": 7.549557992065724e-05, "loss": 0.0835, "step": 57030 }, { "epoch": 16.04, "learning_rate": 7.54768375347515e-05, "loss": 0.0822, "step": 57060 }, { "epoch": 16.05, "learning_rate": 7.545809514884579e-05, "loss": 0.0788, "step": 57090 }, { "epoch": 16.06, "learning_rate": 7.543935276294007e-05, "loss": 0.0917, "step": 57120 }, { "epoch": 16.07, "learning_rate": 7.542061037703432e-05, "loss": 0.0746, "step": 57150 }, { "epoch": 16.08, "learning_rate": 7.54018679911286e-05, "loss": 0.0875, "step": 57180 }, { "epoch": 16.08, "learning_rate": 7.538312560522288e-05, "loss": 0.0808, "step": 57210 }, { "epoch": 16.09, "learning_rate": 7.536438321931715e-05, "loss": 0.0729, "step": 57240 }, { "epoch": 16.1, "learning_rate": 7.534564083341143e-05, "loss": 0.0799, "step": 57270 }, { "epoch": 16.11, "learning_rate": 7.53268984475057e-05, "loss": 0.0743, "step": 57300 }, { "epoch": 16.12, "learning_rate": 7.530815606159998e-05, "loss": 0.0852, "step": 57330 }, { "epoch": 16.13, "learning_rate": 7.528941367569425e-05, "loss": 0.0868, "step": 57360 }, { "epoch": 16.13, "learning_rate": 7.527067128978853e-05, "loss": 0.0761, "step": 57390 }, { "epoch": 16.14, "learning_rate": 7.52519289038828e-05, "loss": 0.0889, "step": 57420 }, { "epoch": 16.15, "learning_rate": 7.523318651797708e-05, "loss": 0.0749, "step": 57450 }, { "epoch": 16.16, "learning_rate": 7.521444413207135e-05, "loss": 0.0825, "step": 57480 }, { "epoch": 16.17, "learning_rate": 7.519570174616563e-05, "loss": 0.0816, "step": 57510 }, { "epoch": 16.18, "learning_rate": 7.517695936025991e-05, "loss": 0.0757, "step": 57540 }, { "epoch": 16.18, "learning_rate": 7.515821697435416e-05, "loss": 0.0887, "step": 57570 }, { "epoch": 16.19, "learning_rate": 7.513947458844844e-05, "loss": 0.0732, "step": 57600 }, { "epoch": 16.2, "learning_rate": 7.512073220254272e-05, "loss": 0.0765, "step": 57630 }, { "epoch": 16.21, "learning_rate": 7.510198981663699e-05, "loss": 0.0843, "step": 57660 }, { "epoch": 16.22, "learning_rate": 7.508324743073127e-05, "loss": 0.0758, "step": 57690 }, { "epoch": 16.23, "learning_rate": 7.506450504482554e-05, "loss": 0.0916, "step": 57720 }, { "epoch": 16.24, "learning_rate": 7.504576265891982e-05, "loss": 0.0736, "step": 57750 }, { "epoch": 16.24, "learning_rate": 7.502702027301409e-05, "loss": 0.0851, "step": 57780 }, { "epoch": 16.25, "learning_rate": 7.500827788710837e-05, "loss": 0.0807, "step": 57810 }, { "epoch": 16.26, "learning_rate": 7.498953550120264e-05, "loss": 0.0731, "step": 57840 }, { "epoch": 16.27, "learning_rate": 7.497079311529692e-05, "loss": 0.0856, "step": 57870 }, { "epoch": 16.28, "learning_rate": 7.495205072939118e-05, "loss": 0.0746, "step": 57900 }, { "epoch": 16.29, "learning_rate": 7.493330834348547e-05, "loss": 0.0786, "step": 57930 }, { "epoch": 16.29, "learning_rate": 7.491456595757975e-05, "loss": 0.0825, "step": 57960 }, { "epoch": 16.3, "learning_rate": 7.4895823571674e-05, "loss": 0.0801, "step": 57990 }, { "epoch": 16.31, "learning_rate": 7.487708118576828e-05, "loss": 0.0861, "step": 58020 }, { "epoch": 16.32, "learning_rate": 7.485833879986256e-05, "loss": 0.073, "step": 58050 }, { "epoch": 16.33, "learning_rate": 7.483959641395684e-05, "loss": 0.0867, "step": 58080 }, { "epoch": 16.34, "learning_rate": 7.482085402805111e-05, "loss": 0.0837, "step": 58110 }, { "epoch": 16.35, "learning_rate": 7.480211164214538e-05, "loss": 0.0742, "step": 58140 }, { "epoch": 16.35, "learning_rate": 7.478336925623966e-05, "loss": 0.0841, "step": 58170 }, { "epoch": 16.36, "learning_rate": 7.476462687033393e-05, "loss": 0.076, "step": 58200 }, { "epoch": 16.37, "learning_rate": 7.474588448442821e-05, "loss": 0.0824, "step": 58230 }, { "epoch": 16.38, "learning_rate": 7.472714209852247e-05, "loss": 0.0785, "step": 58260 }, { "epoch": 16.39, "learning_rate": 7.470839971261676e-05, "loss": 0.0758, "step": 58290 }, { "epoch": 16.4, "learning_rate": 7.468965732671102e-05, "loss": 0.0863, "step": 58320 }, { "epoch": 16.4, "learning_rate": 7.46709149408053e-05, "loss": 0.0778, "step": 58350 }, { "epoch": 16.41, "learning_rate": 7.465217255489958e-05, "loss": 0.0795, "step": 58380 }, { "epoch": 16.42, "learning_rate": 7.463343016899385e-05, "loss": 0.0839, "step": 58410 }, { "epoch": 16.43, "learning_rate": 7.461468778308812e-05, "loss": 0.0761, "step": 58440 }, { "epoch": 16.44, "learning_rate": 7.45959453971824e-05, "loss": 0.0846, "step": 58470 }, { "epoch": 16.45, "learning_rate": 7.457720301127668e-05, "loss": 0.0739, "step": 58500 }, { "epoch": 16.45, "learning_rate": 7.455846062537095e-05, "loss": 0.088, "step": 58530 }, { "epoch": 16.46, "learning_rate": 7.454034298566208e-05, "loss": 0.0839, "step": 58560 }, { "epoch": 16.47, "learning_rate": 7.452160059975634e-05, "loss": 0.0762, "step": 58590 }, { "epoch": 16.48, "learning_rate": 7.450285821385062e-05, "loss": 0.0822, "step": 58620 }, { "epoch": 16.49, "learning_rate": 7.44841158279449e-05, "loss": 0.0745, "step": 58650 }, { "epoch": 16.5, "learning_rate": 7.446537344203917e-05, "loss": 0.0805, "step": 58680 }, { "epoch": 16.51, "learning_rate": 7.444663105613345e-05, "loss": 0.0806, "step": 58710 }, { "epoch": 16.51, "learning_rate": 7.442788867022772e-05, "loss": 0.0756, "step": 58740 }, { "epoch": 16.52, "learning_rate": 7.440914628432199e-05, "loss": 0.0866, "step": 58770 }, { "epoch": 16.53, "learning_rate": 7.439040389841627e-05, "loss": 0.0762, "step": 58800 }, { "epoch": 16.54, "learning_rate": 7.437166151251055e-05, "loss": 0.0832, "step": 58830 }, { "epoch": 16.55, "learning_rate": 7.435291912660483e-05, "loss": 0.0779, "step": 58860 }, { "epoch": 16.56, "learning_rate": 7.433417674069909e-05, "loss": 0.0738, "step": 58890 }, { "epoch": 16.56, "learning_rate": 7.431543435479337e-05, "loss": 0.0825, "step": 58920 }, { "epoch": 16.57, "learning_rate": 7.429669196888765e-05, "loss": 0.0772, "step": 58950 }, { "epoch": 16.58, "learning_rate": 7.427794958298191e-05, "loss": 0.0841, "step": 58980 }, { "epoch": 16.59, "learning_rate": 7.425920719707618e-05, "loss": 0.084, "step": 59010 }, { "epoch": 16.6, "learning_rate": 7.424046481117046e-05, "loss": 0.0756, "step": 59040 }, { "epoch": 16.61, "learning_rate": 7.422172242526474e-05, "loss": 0.0815, "step": 59070 }, { "epoch": 16.62, "learning_rate": 7.420298003935901e-05, "loss": 0.0771, "step": 59100 }, { "epoch": 16.62, "learning_rate": 7.418423765345329e-05, "loss": 0.0805, "step": 59130 }, { "epoch": 16.63, "learning_rate": 7.416549526754756e-05, "loss": 0.083, "step": 59160 }, { "epoch": 16.64, "learning_rate": 7.414675288164184e-05, "loss": 0.0782, "step": 59190 }, { "epoch": 16.65, "learning_rate": 7.412801049573611e-05, "loss": 0.0888, "step": 59220 }, { "epoch": 16.66, "learning_rate": 7.410926810983039e-05, "loss": 0.0732, "step": 59250 }, { "epoch": 16.67, "learning_rate": 7.409052572392467e-05, "loss": 0.081, "step": 59280 }, { "epoch": 16.67, "learning_rate": 7.407178333801892e-05, "loss": 0.0761, "step": 59310 }, { "epoch": 16.68, "learning_rate": 7.40530409521132e-05, "loss": 0.0746, "step": 59340 }, { "epoch": 16.69, "learning_rate": 7.403429856620749e-05, "loss": 0.0844, "step": 59370 }, { "epoch": 16.7, "learning_rate": 7.401555618030175e-05, "loss": 0.0739, "step": 59400 }, { "epoch": 16.71, "learning_rate": 7.399681379439602e-05, "loss": 0.0863, "step": 59430 }, { "epoch": 16.72, "learning_rate": 7.39780714084903e-05, "loss": 0.0837, "step": 59460 }, { "epoch": 16.72, "learning_rate": 7.395932902258458e-05, "loss": 0.0738, "step": 59490 }, { "epoch": 16.73, "learning_rate": 7.394058663667885e-05, "loss": 0.085, "step": 59520 }, { "epoch": 16.74, "learning_rate": 7.392184425077313e-05, "loss": 0.0736, "step": 59550 }, { "epoch": 16.75, "learning_rate": 7.39031018648674e-05, "loss": 0.0792, "step": 59580 }, { "epoch": 16.76, "learning_rate": 7.388435947896168e-05, "loss": 0.0807, "step": 59610 }, { "epoch": 16.77, "learning_rate": 7.386561709305595e-05, "loss": 0.0703, "step": 59640 }, { "epoch": 16.78, "learning_rate": 7.384687470715023e-05, "loss": 0.0869, "step": 59670 }, { "epoch": 16.78, "learning_rate": 7.382813232124451e-05, "loss": 0.0718, "step": 59700 }, { "epoch": 16.79, "learning_rate": 7.380938993533876e-05, "loss": 0.0829, "step": 59730 }, { "epoch": 16.8, "learning_rate": 7.379064754943304e-05, "loss": 0.0795, "step": 59760 }, { "epoch": 16.81, "learning_rate": 7.377190516352732e-05, "loss": 0.0728, "step": 59790 }, { "epoch": 16.82, "learning_rate": 7.375316277762159e-05, "loss": 0.0846, "step": 59820 }, { "epoch": 16.83, "learning_rate": 7.373442039171586e-05, "loss": 0.0729, "step": 59850 }, { "epoch": 16.83, "learning_rate": 7.371567800581014e-05, "loss": 0.0789, "step": 59880 }, { "epoch": 16.84, "learning_rate": 7.369693561990442e-05, "loss": 0.0832, "step": 59910 }, { "epoch": 16.85, "learning_rate": 7.367819323399869e-05, "loss": 0.0723, "step": 59940 }, { "epoch": 16.86, "learning_rate": 7.365945084809297e-05, "loss": 0.0783, "step": 59970 }, { "epoch": 16.87, "learning_rate": 7.364070846218724e-05, "loss": 0.0742, "step": 60000 }, { "epoch": 16.88, "learning_rate": 7.362196607628152e-05, "loss": 0.0792, "step": 60030 }, { "epoch": 16.88, "learning_rate": 7.360322369037579e-05, "loss": 0.0826, "step": 60060 }, { "epoch": 16.89, "learning_rate": 7.358448130447007e-05, "loss": 0.0771, "step": 60090 }, { "epoch": 16.9, "learning_rate": 7.356573891856435e-05, "loss": 0.0814, "step": 60120 }, { "epoch": 16.91, "learning_rate": 7.35469965326586e-05, "loss": 0.0756, "step": 60150 }, { "epoch": 16.92, "learning_rate": 7.352825414675288e-05, "loss": 0.0816, "step": 60180 }, { "epoch": 16.93, "learning_rate": 7.350951176084716e-05, "loss": 0.0811, "step": 60210 }, { "epoch": 16.94, "learning_rate": 7.349076937494143e-05, "loss": 0.0722, "step": 60240 }, { "epoch": 16.94, "learning_rate": 7.34720269890357e-05, "loss": 0.0808, "step": 60270 }, { "epoch": 16.95, "learning_rate": 7.345328460312998e-05, "loss": 0.0714, "step": 60300 }, { "epoch": 16.96, "learning_rate": 7.343454221722426e-05, "loss": 0.0755, "step": 60330 }, { "epoch": 16.97, "learning_rate": 7.341579983131853e-05, "loss": 0.0794, "step": 60360 }, { "epoch": 16.98, "learning_rate": 7.339705744541281e-05, "loss": 0.0736, "step": 60390 }, { "epoch": 16.99, "learning_rate": 7.337831505950708e-05, "loss": 0.0825, "step": 60420 }, { "epoch": 16.99, "learning_rate": 7.335957267360136e-05, "loss": 0.0701, "step": 60450 }, { "epoch": 17.0, "eval_loss": 0.1095786765217781, "eval_runtime": 631.7392, "eval_samples_per_second": 25.379, "eval_steps_per_second": 0.795, "eval_wer": 0.1054412948835178, "step": 60469 }, { "epoch": 17.0, "learning_rate": 7.334083028769562e-05, "loss": 0.0849, "step": 60480 }, { "epoch": 17.01, "learning_rate": 7.33220879017899e-05, "loss": 0.073, "step": 60510 }, { "epoch": 17.02, "learning_rate": 7.330334551588419e-05, "loss": 0.0751, "step": 60540 }, { "epoch": 17.03, "learning_rate": 7.328522787617531e-05, "loss": 0.0886, "step": 60570 }, { "epoch": 17.04, "learning_rate": 7.326648549026958e-05, "loss": 0.0696, "step": 60600 }, { "epoch": 17.05, "learning_rate": 7.324774310436385e-05, "loss": 0.0775, "step": 60630 }, { "epoch": 17.05, "learning_rate": 7.322900071845813e-05, "loss": 0.075, "step": 60660 }, { "epoch": 17.06, "learning_rate": 7.321025833255241e-05, "loss": 0.0763, "step": 60690 }, { "epoch": 17.07, "learning_rate": 7.319151594664668e-05, "loss": 0.0847, "step": 60720 }, { "epoch": 17.08, "learning_rate": 7.317277356074095e-05, "loss": 0.0705, "step": 60750 }, { "epoch": 17.09, "learning_rate": 7.315403117483523e-05, "loss": 0.0852, "step": 60780 }, { "epoch": 17.1, "learning_rate": 7.313528878892951e-05, "loss": 0.0728, "step": 60810 }, { "epoch": 17.1, "learning_rate": 7.311654640302377e-05, "loss": 0.0773, "step": 60840 }, { "epoch": 17.11, "learning_rate": 7.309780401711806e-05, "loss": 0.0868, "step": 60870 }, { "epoch": 17.12, "learning_rate": 7.307906163121232e-05, "loss": 0.0669, "step": 60900 }, { "epoch": 17.13, "learning_rate": 7.306031924530659e-05, "loss": 0.0827, "step": 60930 }, { "epoch": 17.14, "learning_rate": 7.304157685940087e-05, "loss": 0.0748, "step": 60960 }, { "epoch": 17.15, "learning_rate": 7.302283447349515e-05, "loss": 0.0782, "step": 60990 }, { "epoch": 17.15, "learning_rate": 7.300409208758942e-05, "loss": 0.0853, "step": 61020 }, { "epoch": 17.16, "learning_rate": 7.298534970168369e-05, "loss": 0.0705, "step": 61050 }, { "epoch": 17.17, "learning_rate": 7.296660731577797e-05, "loss": 0.0813, "step": 61080 }, { "epoch": 17.18, "learning_rate": 7.294786492987225e-05, "loss": 0.0703, "step": 61110 }, { "epoch": 17.19, "learning_rate": 7.292912254396652e-05, "loss": 0.0765, "step": 61140 }, { "epoch": 17.2, "learning_rate": 7.291038015806078e-05, "loss": 0.0864, "step": 61170 }, { "epoch": 17.21, "learning_rate": 7.289163777215507e-05, "loss": 0.0637, "step": 61200 }, { "epoch": 17.21, "learning_rate": 7.287289538624935e-05, "loss": 0.0846, "step": 61230 }, { "epoch": 17.22, "learning_rate": 7.285415300034361e-05, "loss": 0.0713, "step": 61260 }, { "epoch": 17.23, "learning_rate": 7.28354106144379e-05, "loss": 0.0796, "step": 61290 }, { "epoch": 17.24, "learning_rate": 7.281666822853216e-05, "loss": 0.0836, "step": 61320 }, { "epoch": 17.25, "learning_rate": 7.279792584262643e-05, "loss": 0.071, "step": 61350 }, { "epoch": 17.26, "learning_rate": 7.277918345672071e-05, "loss": 0.0842, "step": 61380 }, { "epoch": 17.26, "learning_rate": 7.276044107081499e-05, "loss": 0.0715, "step": 61410 }, { "epoch": 17.27, "learning_rate": 7.274169868490926e-05, "loss": 0.0776, "step": 61440 }, { "epoch": 17.28, "learning_rate": 7.272295629900353e-05, "loss": 0.0912, "step": 61470 }, { "epoch": 17.29, "learning_rate": 7.270421391309781e-05, "loss": 0.0693, "step": 61500 }, { "epoch": 17.3, "learning_rate": 7.268547152719209e-05, "loss": 0.0826, "step": 61530 }, { "epoch": 17.31, "learning_rate": 7.266672914128636e-05, "loss": 0.071, "step": 61560 }, { "epoch": 17.32, "learning_rate": 7.264798675538062e-05, "loss": 0.0761, "step": 61590 }, { "epoch": 17.32, "learning_rate": 7.26292443694749e-05, "loss": 0.0866, "step": 61620 }, { "epoch": 17.33, "learning_rate": 7.261050198356918e-05, "loss": 0.0686, "step": 61650 }, { "epoch": 17.34, "learning_rate": 7.259175959766345e-05, "loss": 0.0813, "step": 61680 }, { "epoch": 17.35, "learning_rate": 7.257301721175773e-05, "loss": 0.0735, "step": 61710 }, { "epoch": 17.36, "learning_rate": 7.2554274825852e-05, "loss": 0.0763, "step": 61740 }, { "epoch": 17.37, "learning_rate": 7.253553243994627e-05, "loss": 0.0875, "step": 61770 }, { "epoch": 17.37, "learning_rate": 7.251679005404055e-05, "loss": 0.0685, "step": 61800 }, { "epoch": 17.38, "learning_rate": 7.249804766813483e-05, "loss": 0.083, "step": 61830 }, { "epoch": 17.39, "learning_rate": 7.24793052822291e-05, "loss": 0.0742, "step": 61860 }, { "epoch": 17.4, "learning_rate": 7.246056289632336e-05, "loss": 0.0777, "step": 61890 }, { "epoch": 17.41, "learning_rate": 7.244182051041765e-05, "loss": 0.0847, "step": 61920 }, { "epoch": 17.42, "learning_rate": 7.242307812451193e-05, "loss": 0.0699, "step": 61950 }, { "epoch": 17.42, "learning_rate": 7.24043357386062e-05, "loss": 0.0814, "step": 61980 }, { "epoch": 17.43, "learning_rate": 7.238559335270046e-05, "loss": 0.0703, "step": 62010 }, { "epoch": 17.44, "learning_rate": 7.236685096679474e-05, "loss": 0.0774, "step": 62040 }, { "epoch": 17.45, "learning_rate": 7.234810858088902e-05, "loss": 0.0904, "step": 62070 }, { "epoch": 17.46, "learning_rate": 7.232936619498329e-05, "loss": 0.0735, "step": 62100 }, { "epoch": 17.47, "learning_rate": 7.231062380907757e-05, "loss": 0.0807, "step": 62130 }, { "epoch": 17.48, "learning_rate": 7.229188142317184e-05, "loss": 0.0728, "step": 62160 }, { "epoch": 17.48, "learning_rate": 7.22731390372661e-05, "loss": 0.0834, "step": 62190 }, { "epoch": 17.49, "learning_rate": 7.225439665136039e-05, "loss": 0.0892, "step": 62220 }, { "epoch": 17.5, "learning_rate": 7.223565426545467e-05, "loss": 0.0714, "step": 62250 }, { "epoch": 17.51, "learning_rate": 7.221691187954894e-05, "loss": 0.0876, "step": 62280 }, { "epoch": 17.52, "learning_rate": 7.21981694936432e-05, "loss": 0.0767, "step": 62310 }, { "epoch": 17.53, "learning_rate": 7.217942710773748e-05, "loss": 0.0747, "step": 62340 }, { "epoch": 17.53, "learning_rate": 7.216068472183177e-05, "loss": 0.0803, "step": 62370 }, { "epoch": 17.54, "learning_rate": 7.214194233592603e-05, "loss": 0.069, "step": 62400 }, { "epoch": 17.55, "learning_rate": 7.21231999500203e-05, "loss": 0.0822, "step": 62430 }, { "epoch": 17.56, "learning_rate": 7.210445756411458e-05, "loss": 0.0727, "step": 62460 }, { "epoch": 17.57, "learning_rate": 7.208571517820886e-05, "loss": 0.075, "step": 62490 }, { "epoch": 17.58, "learning_rate": 7.206697279230313e-05, "loss": 0.0832, "step": 62520 }, { "epoch": 17.58, "learning_rate": 7.20482304063974e-05, "loss": 0.0697, "step": 62550 }, { "epoch": 17.59, "learning_rate": 7.202948802049168e-05, "loss": 0.0852, "step": 62580 }, { "epoch": 17.6, "learning_rate": 7.201074563458596e-05, "loss": 0.0754, "step": 62610 }, { "epoch": 17.61, "learning_rate": 7.199200324868023e-05, "loss": 0.0752, "step": 62640 }, { "epoch": 17.62, "learning_rate": 7.197326086277451e-05, "loss": 0.0795, "step": 62670 }, { "epoch": 17.63, "learning_rate": 7.195514322306563e-05, "loss": 0.071, "step": 62700 }, { "epoch": 17.64, "learning_rate": 7.193640083715992e-05, "loss": 0.0865, "step": 62730 }, { "epoch": 17.64, "learning_rate": 7.191765845125418e-05, "loss": 0.0715, "step": 62760 }, { "epoch": 17.65, "learning_rate": 7.189891606534845e-05, "loss": 0.0827, "step": 62790 }, { "epoch": 17.66, "learning_rate": 7.188017367944273e-05, "loss": 0.0856, "step": 62820 }, { "epoch": 17.67, "learning_rate": 7.186143129353701e-05, "loss": 0.0703, "step": 62850 }, { "epoch": 17.68, "learning_rate": 7.184331365382814e-05, "loss": 0.083, "step": 62880 }, { "epoch": 17.69, "learning_rate": 7.182457126792241e-05, "loss": 0.0741, "step": 62910 }, { "epoch": 17.69, "learning_rate": 7.180582888201667e-05, "loss": 0.0774, "step": 62940 }, { "epoch": 17.7, "learning_rate": 7.178708649611096e-05, "loss": 0.085, "step": 62970 }, { "epoch": 17.71, "learning_rate": 7.176834411020524e-05, "loss": 0.0715, "step": 63000 }, { "epoch": 17.72, "learning_rate": 7.17496017242995e-05, "loss": 0.0827, "step": 63030 }, { "epoch": 17.73, "learning_rate": 7.173085933839378e-05, "loss": 0.0761, "step": 63060 }, { "epoch": 17.74, "learning_rate": 7.171211695248805e-05, "loss": 0.0745, "step": 63090 }, { "epoch": 17.75, "learning_rate": 7.169337456658233e-05, "loss": 0.0882, "step": 63120 }, { "epoch": 17.75, "learning_rate": 7.16746321806766e-05, "loss": 0.0695, "step": 63150 }, { "epoch": 17.76, "learning_rate": 7.165588979477088e-05, "loss": 0.0864, "step": 63180 }, { "epoch": 17.77, "learning_rate": 7.163714740886516e-05, "loss": 0.0712, "step": 63210 }, { "epoch": 17.78, "learning_rate": 7.161840502295942e-05, "loss": 0.0758, "step": 63240 }, { "epoch": 17.79, "learning_rate": 7.15996626370537e-05, "loss": 0.0815, "step": 63270 }, { "epoch": 17.8, "learning_rate": 7.158092025114798e-05, "loss": 0.0707, "step": 63300 }, { "epoch": 17.8, "learning_rate": 7.156217786524225e-05, "loss": 0.0863, "step": 63330 }, { "epoch": 17.81, "learning_rate": 7.154343547933651e-05, "loss": 0.0762, "step": 63360 }, { "epoch": 17.82, "learning_rate": 7.15246930934308e-05, "loss": 0.0778, "step": 63390 }, { "epoch": 17.83, "learning_rate": 7.150595070752508e-05, "loss": 0.0935, "step": 63420 }, { "epoch": 17.84, "learning_rate": 7.148720832161934e-05, "loss": 0.0699, "step": 63450 }, { "epoch": 17.85, "learning_rate": 7.146846593571362e-05, "loss": 0.0895, "step": 63480 }, { "epoch": 17.85, "learning_rate": 7.144972354980789e-05, "loss": 0.0716, "step": 63510 }, { "epoch": 17.86, "learning_rate": 7.143098116390217e-05, "loss": 0.078, "step": 63540 }, { "epoch": 17.87, "learning_rate": 7.141223877799644e-05, "loss": 0.086, "step": 63570 }, { "epoch": 17.88, "learning_rate": 7.139349639209072e-05, "loss": 0.0707, "step": 63600 }, { "epoch": 17.89, "learning_rate": 7.1374754006185e-05, "loss": 0.0843, "step": 63630 }, { "epoch": 17.9, "learning_rate": 7.135601162027926e-05, "loss": 0.0736, "step": 63660 }, { "epoch": 17.91, "learning_rate": 7.133726923437354e-05, "loss": 0.0799, "step": 63690 }, { "epoch": 17.91, "learning_rate": 7.131852684846782e-05, "loss": 0.0843, "step": 63720 }, { "epoch": 17.92, "learning_rate": 7.12997844625621e-05, "loss": 0.0764, "step": 63750 }, { "epoch": 17.93, "learning_rate": 7.128104207665635e-05, "loss": 0.0853, "step": 63780 }, { "epoch": 17.94, "learning_rate": 7.126229969075063e-05, "loss": 0.0718, "step": 63810 }, { "epoch": 17.95, "learning_rate": 7.124355730484491e-05, "loss": 0.0764, "step": 63840 }, { "epoch": 17.96, "learning_rate": 7.122481491893918e-05, "loss": 0.0894, "step": 63870 }, { "epoch": 17.96, "learning_rate": 7.120607253303346e-05, "loss": 0.0675, "step": 63900 }, { "epoch": 17.97, "learning_rate": 7.118733014712773e-05, "loss": 0.0774, "step": 63930 }, { "epoch": 17.98, "learning_rate": 7.116858776122201e-05, "loss": 0.0727, "step": 63960 }, { "epoch": 17.99, "learning_rate": 7.114984537531628e-05, "loss": 0.0752, "step": 63990 }, { "epoch": 18.0, "learning_rate": 7.113110298941056e-05, "loss": 0.0891, "step": 64020 }, { "epoch": 18.0, "eval_loss": 0.11096266657114029, "eval_runtime": 631.8647, "eval_samples_per_second": 25.374, "eval_steps_per_second": 0.794, "eval_wer": 0.10757714301311534, "step": 64026 }, { "epoch": 18.01, "learning_rate": 7.111236060350484e-05, "loss": 0.0713, "step": 64050 }, { "epoch": 18.02, "learning_rate": 7.10936182175991e-05, "loss": 0.0849, "step": 64080 }, { "epoch": 18.02, "learning_rate": 7.107487583169337e-05, "loss": 0.0712, "step": 64110 }, { "epoch": 18.03, "learning_rate": 7.105613344578766e-05, "loss": 0.084, "step": 64140 }, { "epoch": 18.04, "learning_rate": 7.103739105988194e-05, "loss": 0.0746, "step": 64170 }, { "epoch": 18.05, "learning_rate": 7.101864867397619e-05, "loss": 0.072, "step": 64200 }, { "epoch": 18.06, "learning_rate": 7.099990628807047e-05, "loss": 0.0888, "step": 64230 }, { "epoch": 18.07, "learning_rate": 7.098116390216475e-05, "loss": 0.0688, "step": 64260 }, { "epoch": 18.07, "learning_rate": 7.096242151625902e-05, "loss": 0.0824, "step": 64290 }, { "epoch": 18.08, "learning_rate": 7.09436791303533e-05, "loss": 0.0756, "step": 64320 }, { "epoch": 18.09, "learning_rate": 7.092493674444757e-05, "loss": 0.0737, "step": 64350 }, { "epoch": 18.1, "learning_rate": 7.090619435854185e-05, "loss": 0.0816, "step": 64380 }, { "epoch": 18.11, "learning_rate": 7.088745197263612e-05, "loss": 0.07, "step": 64410 }, { "epoch": 18.12, "learning_rate": 7.08687095867304e-05, "loss": 0.0768, "step": 64440 }, { "epoch": 18.12, "learning_rate": 7.084996720082467e-05, "loss": 0.074, "step": 64470 }, { "epoch": 18.13, "learning_rate": 7.083122481491895e-05, "loss": 0.0739, "step": 64500 }, { "epoch": 18.14, "learning_rate": 7.081248242901321e-05, "loss": 0.0799, "step": 64530 }, { "epoch": 18.15, "learning_rate": 7.07937400431075e-05, "loss": 0.069, "step": 64560 }, { "epoch": 18.16, "learning_rate": 7.077499765720178e-05, "loss": 0.0774, "step": 64590 }, { "epoch": 18.17, "learning_rate": 7.075625527129603e-05, "loss": 0.0779, "step": 64620 }, { "epoch": 18.18, "learning_rate": 7.073751288539031e-05, "loss": 0.0785, "step": 64650 }, { "epoch": 18.18, "learning_rate": 7.071877049948459e-05, "loss": 0.0852, "step": 64680 }, { "epoch": 18.19, "learning_rate": 7.070002811357886e-05, "loss": 0.0702, "step": 64710 }, { "epoch": 18.2, "learning_rate": 7.068128572767314e-05, "loss": 0.0814, "step": 64740 }, { "epoch": 18.21, "learning_rate": 7.066254334176741e-05, "loss": 0.0741, "step": 64770 }, { "epoch": 18.22, "learning_rate": 7.064380095586169e-05, "loss": 0.0806, "step": 64800 }, { "epoch": 18.23, "learning_rate": 7.062505856995596e-05, "loss": 0.0827, "step": 64830 }, { "epoch": 18.23, "learning_rate": 7.060631618405024e-05, "loss": 0.0712, "step": 64860 }, { "epoch": 18.24, "learning_rate": 7.05875737981445e-05, "loss": 0.0786, "step": 64890 }, { "epoch": 18.25, "learning_rate": 7.056883141223878e-05, "loss": 0.0775, "step": 64920 }, { "epoch": 18.26, "learning_rate": 7.055008902633305e-05, "loss": 0.0702, "step": 64950 }, { "epoch": 18.27, "learning_rate": 7.053134664042733e-05, "loss": 0.0864, "step": 64980 }, { "epoch": 18.28, "learning_rate": 7.051322900071846e-05, "loss": 0.0695, "step": 65010 }, { "epoch": 18.29, "learning_rate": 7.049448661481274e-05, "loss": 0.0781, "step": 65040 }, { "epoch": 18.29, "learning_rate": 7.047574422890701e-05, "loss": 0.0763, "step": 65070 }, { "epoch": 18.3, "learning_rate": 7.045700184300128e-05, "loss": 0.0721, "step": 65100 }, { "epoch": 18.31, "learning_rate": 7.043825945709556e-05, "loss": 0.0787, "step": 65130 }, { "epoch": 18.32, "learning_rate": 7.041951707118984e-05, "loss": 0.0721, "step": 65160 }, { "epoch": 18.33, "learning_rate": 7.04007746852841e-05, "loss": 0.0787, "step": 65190 }, { "epoch": 18.34, "learning_rate": 7.038203229937837e-05, "loss": 0.0802, "step": 65220 }, { "epoch": 18.34, "learning_rate": 7.036328991347265e-05, "loss": 0.0771, "step": 65250 }, { "epoch": 18.35, "learning_rate": 7.034454752756694e-05, "loss": 0.0839, "step": 65280 }, { "epoch": 18.36, "learning_rate": 7.03258051416612e-05, "loss": 0.0652, "step": 65310 }, { "epoch": 18.37, "learning_rate": 7.030706275575548e-05, "loss": 0.0793, "step": 65340 }, { "epoch": 18.38, "learning_rate": 7.028832036984975e-05, "loss": 0.0745, "step": 65370 }, { "epoch": 18.39, "learning_rate": 7.026957798394402e-05, "loss": 0.073, "step": 65400 }, { "epoch": 18.39, "learning_rate": 7.02508355980383e-05, "loss": 0.0829, "step": 65430 }, { "epoch": 18.4, "learning_rate": 7.023209321213258e-05, "loss": 0.071, "step": 65460 }, { "epoch": 18.41, "learning_rate": 7.021335082622685e-05, "loss": 0.0768, "step": 65490 }, { "epoch": 18.42, "learning_rate": 7.019460844032111e-05, "loss": 0.0708, "step": 65520 }, { "epoch": 18.43, "learning_rate": 7.01758660544154e-05, "loss": 0.0787, "step": 65550 }, { "epoch": 18.44, "learning_rate": 7.015712366850968e-05, "loss": 0.0843, "step": 65580 }, { "epoch": 18.45, "learning_rate": 7.013838128260394e-05, "loss": 0.0689, "step": 65610 }, { "epoch": 18.45, "learning_rate": 7.011963889669821e-05, "loss": 0.0751, "step": 65640 }, { "epoch": 18.46, "learning_rate": 7.010089651079249e-05, "loss": 0.071, "step": 65670 }, { "epoch": 18.47, "learning_rate": 7.008215412488677e-05, "loss": 0.0748, "step": 65700 }, { "epoch": 18.48, "learning_rate": 7.006341173898104e-05, "loss": 0.0827, "step": 65730 }, { "epoch": 18.49, "learning_rate": 7.004466935307532e-05, "loss": 0.07, "step": 65760 }, { "epoch": 18.5, "learning_rate": 7.002592696716959e-05, "loss": 0.0818, "step": 65790 }, { "epoch": 18.5, "learning_rate": 7.000718458126386e-05, "loss": 0.0764, "step": 65820 }, { "epoch": 18.51, "learning_rate": 6.998844219535814e-05, "loss": 0.0714, "step": 65850 }, { "epoch": 18.52, "learning_rate": 6.996969980945242e-05, "loss": 0.0827, "step": 65880 }, { "epoch": 18.53, "learning_rate": 6.995095742354669e-05, "loss": 0.0721, "step": 65910 }, { "epoch": 18.54, "learning_rate": 6.993221503764095e-05, "loss": 0.0817, "step": 65940 }, { "epoch": 18.55, "learning_rate": 6.991347265173523e-05, "loss": 0.0746, "step": 65970 }, { "epoch": 18.55, "learning_rate": 6.989473026582952e-05, "loss": 0.0753, "step": 66000 }, { "epoch": 18.56, "learning_rate": 6.987598787992378e-05, "loss": 0.0887, "step": 66030 }, { "epoch": 18.57, "learning_rate": 6.985724549401805e-05, "loss": 0.0671, "step": 66060 }, { "epoch": 18.58, "learning_rate": 6.983850310811233e-05, "loss": 0.0833, "step": 66090 }, { "epoch": 18.59, "learning_rate": 6.981976072220661e-05, "loss": 0.0769, "step": 66120 }, { "epoch": 18.6, "learning_rate": 6.980101833630088e-05, "loss": 0.0754, "step": 66150 }, { "epoch": 18.61, "learning_rate": 6.978227595039516e-05, "loss": 0.0855, "step": 66180 }, { "epoch": 18.61, "learning_rate": 6.976353356448943e-05, "loss": 0.0675, "step": 66210 }, { "epoch": 18.62, "learning_rate": 6.97447911785837e-05, "loss": 0.0819, "step": 66240 }, { "epoch": 18.63, "learning_rate": 6.972604879267798e-05, "loss": 0.0741, "step": 66270 }, { "epoch": 18.64, "learning_rate": 6.970730640677226e-05, "loss": 0.075, "step": 66300 }, { "epoch": 18.65, "learning_rate": 6.968856402086652e-05, "loss": 0.0836, "step": 66330 }, { "epoch": 18.66, "learning_rate": 6.966982163496079e-05, "loss": 0.0685, "step": 66360 }, { "epoch": 18.66, "learning_rate": 6.965107924905507e-05, "loss": 0.0776, "step": 66390 }, { "epoch": 18.67, "learning_rate": 6.963233686314935e-05, "loss": 0.0784, "step": 66420 }, { "epoch": 18.68, "learning_rate": 6.961359447724362e-05, "loss": 0.076, "step": 66450 }, { "epoch": 18.69, "learning_rate": 6.959485209133789e-05, "loss": 0.0871, "step": 66480 }, { "epoch": 18.7, "learning_rate": 6.957610970543217e-05, "loss": 0.0686, "step": 66510 }, { "epoch": 18.71, "learning_rate": 6.955736731952645e-05, "loss": 0.0764, "step": 66540 }, { "epoch": 18.72, "learning_rate": 6.953862493362072e-05, "loss": 0.0749, "step": 66570 }, { "epoch": 18.72, "learning_rate": 6.9519882547715e-05, "loss": 0.0771, "step": 66600 }, { "epoch": 18.73, "learning_rate": 6.950114016180927e-05, "loss": 0.0862, "step": 66630 }, { "epoch": 18.74, "learning_rate": 6.948239777590353e-05, "loss": 0.0667, "step": 66660 }, { "epoch": 18.75, "learning_rate": 6.946365538999782e-05, "loss": 0.0809, "step": 66690 }, { "epoch": 18.76, "learning_rate": 6.94449130040921e-05, "loss": 0.0769, "step": 66720 }, { "epoch": 18.77, "learning_rate": 6.942617061818636e-05, "loss": 0.0756, "step": 66750 }, { "epoch": 18.77, "learning_rate": 6.940742823228063e-05, "loss": 0.0835, "step": 66780 }, { "epoch": 18.78, "learning_rate": 6.938868584637491e-05, "loss": 0.072, "step": 66810 }, { "epoch": 18.79, "learning_rate": 6.936994346046919e-05, "loss": 0.0859, "step": 66840 }, { "epoch": 18.8, "learning_rate": 6.935120107456346e-05, "loss": 0.0747, "step": 66870 }, { "epoch": 18.81, "learning_rate": 6.933245868865773e-05, "loss": 0.0723, "step": 66900 }, { "epoch": 18.82, "learning_rate": 6.931371630275201e-05, "loss": 0.079, "step": 66930 }, { "epoch": 18.82, "learning_rate": 6.929497391684629e-05, "loss": 0.0697, "step": 66960 }, { "epoch": 18.83, "learning_rate": 6.927623153094056e-05, "loss": 0.0786, "step": 66990 }, { "epoch": 18.84, "learning_rate": 6.925748914503484e-05, "loss": 0.0785, "step": 67020 }, { "epoch": 18.85, "learning_rate": 6.92387467591291e-05, "loss": 0.0776, "step": 67050 }, { "epoch": 18.86, "learning_rate": 6.922000437322337e-05, "loss": 0.0874, "step": 67080 }, { "epoch": 18.87, "learning_rate": 6.920126198731765e-05, "loss": 0.0705, "step": 67110 }, { "epoch": 18.88, "learning_rate": 6.918251960141193e-05, "loss": 0.0799, "step": 67140 }, { "epoch": 18.88, "learning_rate": 6.916377721550622e-05, "loss": 0.0753, "step": 67170 }, { "epoch": 18.89, "learning_rate": 6.914503482960047e-05, "loss": 0.0758, "step": 67200 }, { "epoch": 18.9, "learning_rate": 6.912629244369475e-05, "loss": 0.0837, "step": 67230 }, { "epoch": 18.91, "learning_rate": 6.910755005778903e-05, "loss": 0.0687, "step": 67260 }, { "epoch": 18.92, "learning_rate": 6.90888076718833e-05, "loss": 0.0788, "step": 67290 }, { "epoch": 18.93, "learning_rate": 6.907006528597757e-05, "loss": 0.0696, "step": 67320 }, { "epoch": 18.93, "learning_rate": 6.905132290007185e-05, "loss": 0.074, "step": 67350 }, { "epoch": 18.94, "learning_rate": 6.903258051416613e-05, "loss": 0.078, "step": 67380 }, { "epoch": 18.95, "learning_rate": 6.90138381282604e-05, "loss": 0.0681, "step": 67410 }, { "epoch": 18.96, "learning_rate": 6.899509574235468e-05, "loss": 0.0798, "step": 67440 }, { "epoch": 18.97, "learning_rate": 6.897635335644894e-05, "loss": 0.0725, "step": 67470 }, { "epoch": 18.98, "learning_rate": 6.895823571674009e-05, "loss": 0.0733, "step": 67500 }, { "epoch": 18.98, "learning_rate": 6.893949333083435e-05, "loss": 0.0848, "step": 67530 }, { "epoch": 18.99, "learning_rate": 6.892075094492862e-05, "loss": 0.071, "step": 67560 }, { "epoch": 19.0, "eval_loss": 0.11411216855049133, "eval_runtime": 631.0775, "eval_samples_per_second": 25.406, "eval_steps_per_second": 0.795, "eval_wer": 0.10739290052270277, "step": 67583 }, { "epoch": 19.0, "learning_rate": 6.89020085590229e-05, "loss": 0.0792, "step": 67590 }, { "epoch": 19.01, "learning_rate": 6.888326617311718e-05, "loss": 0.0661, "step": 67620 }, { "epoch": 19.02, "learning_rate": 6.886452378721145e-05, "loss": 0.0769, "step": 67650 }, { "epoch": 19.03, "learning_rate": 6.884578140130572e-05, "loss": 0.0759, "step": 67680 }, { "epoch": 19.04, "learning_rate": 6.88270390154e-05, "loss": 0.069, "step": 67710 }, { "epoch": 19.04, "learning_rate": 6.880829662949428e-05, "loss": 0.0822, "step": 67740 }, { "epoch": 19.05, "learning_rate": 6.878955424358855e-05, "loss": 0.0713, "step": 67770 }, { "epoch": 19.06, "learning_rate": 6.877081185768281e-05, "loss": 0.0794, "step": 67800 }, { "epoch": 19.07, "learning_rate": 6.87520694717771e-05, "loss": 0.0757, "step": 67830 }, { "epoch": 19.08, "learning_rate": 6.873332708587136e-05, "loss": 0.0695, "step": 67860 }, { "epoch": 19.09, "learning_rate": 6.871458469996564e-05, "loss": 0.077, "step": 67890 }, { "epoch": 19.09, "learning_rate": 6.869584231405992e-05, "loss": 0.072, "step": 67920 }, { "epoch": 19.1, "learning_rate": 6.867709992815419e-05, "loss": 0.0781, "step": 67950 }, { "epoch": 19.11, "learning_rate": 6.865835754224846e-05, "loss": 0.075, "step": 67980 }, { "epoch": 19.12, "learning_rate": 6.863961515634274e-05, "loss": 0.0725, "step": 68010 }, { "epoch": 19.13, "learning_rate": 6.862087277043702e-05, "loss": 0.0776, "step": 68040 }, { "epoch": 19.14, "learning_rate": 6.860213038453129e-05, "loss": 0.069, "step": 68070 }, { "epoch": 19.15, "learning_rate": 6.858338799862556e-05, "loss": 0.0821, "step": 68100 }, { "epoch": 19.15, "learning_rate": 6.856464561271984e-05, "loss": 0.0748, "step": 68130 }, { "epoch": 19.16, "learning_rate": 6.854590322681412e-05, "loss": 0.0672, "step": 68160 }, { "epoch": 19.17, "learning_rate": 6.852716084090838e-05, "loss": 0.0828, "step": 68190 }, { "epoch": 19.18, "learning_rate": 6.850841845500265e-05, "loss": 0.0701, "step": 68220 }, { "epoch": 19.19, "learning_rate": 6.848967606909693e-05, "loss": 0.0745, "step": 68250 }, { "epoch": 19.2, "learning_rate": 6.847093368319121e-05, "loss": 0.0738, "step": 68280 }, { "epoch": 19.2, "learning_rate": 6.845219129728548e-05, "loss": 0.0706, "step": 68310 }, { "epoch": 19.21, "learning_rate": 6.843344891137976e-05, "loss": 0.0788, "step": 68340 }, { "epoch": 19.22, "learning_rate": 6.841470652547403e-05, "loss": 0.0682, "step": 68370 }, { "epoch": 19.23, "learning_rate": 6.83959641395683e-05, "loss": 0.077, "step": 68400 }, { "epoch": 19.24, "learning_rate": 6.837722175366258e-05, "loss": 0.0796, "step": 68430 }, { "epoch": 19.25, "learning_rate": 6.835847936775686e-05, "loss": 0.071, "step": 68460 }, { "epoch": 19.25, "learning_rate": 6.833973698185113e-05, "loss": 0.0796, "step": 68490 }, { "epoch": 19.26, "learning_rate": 6.83209945959454e-05, "loss": 0.0697, "step": 68520 }, { "epoch": 19.27, "learning_rate": 6.830225221003968e-05, "loss": 0.0737, "step": 68550 }, { "epoch": 19.28, "learning_rate": 6.828350982413396e-05, "loss": 0.0736, "step": 68580 }, { "epoch": 19.29, "learning_rate": 6.826476743822822e-05, "loss": 0.0753, "step": 68610 }, { "epoch": 19.3, "learning_rate": 6.824602505232249e-05, "loss": 0.0804, "step": 68640 }, { "epoch": 19.31, "learning_rate": 6.822728266641677e-05, "loss": 0.0669, "step": 68670 }, { "epoch": 19.31, "learning_rate": 6.820854028051105e-05, "loss": 0.0748, "step": 68700 }, { "epoch": 19.32, "learning_rate": 6.818979789460532e-05, "loss": 0.0714, "step": 68730 }, { "epoch": 19.33, "learning_rate": 6.81710555086996e-05, "loss": 0.0694, "step": 68760 }, { "epoch": 19.34, "learning_rate": 6.815231312279387e-05, "loss": 0.0826, "step": 68790 }, { "epoch": 19.35, "learning_rate": 6.813357073688814e-05, "loss": 0.0699, "step": 68820 }, { "epoch": 19.36, "learning_rate": 6.811482835098242e-05, "loss": 0.0767, "step": 68850 }, { "epoch": 19.36, "learning_rate": 6.80960859650767e-05, "loss": 0.0759, "step": 68880 }, { "epoch": 19.37, "learning_rate": 6.807734357917097e-05, "loss": 0.0722, "step": 68910 }, { "epoch": 19.38, "learning_rate": 6.805860119326523e-05, "loss": 0.0778, "step": 68940 }, { "epoch": 19.39, "learning_rate": 6.803985880735951e-05, "loss": 0.0665, "step": 68970 }, { "epoch": 19.4, "learning_rate": 6.80211164214538e-05, "loss": 0.0742, "step": 69000 }, { "epoch": 19.41, "learning_rate": 6.800237403554806e-05, "loss": 0.076, "step": 69030 }, { "epoch": 19.42, "learning_rate": 6.798363164964233e-05, "loss": 0.0732, "step": 69060 }, { "epoch": 19.42, "learning_rate": 6.796488926373661e-05, "loss": 0.0808, "step": 69090 }, { "epoch": 19.43, "learning_rate": 6.794614687783089e-05, "loss": 0.0655, "step": 69120 }, { "epoch": 19.44, "learning_rate": 6.792740449192516e-05, "loss": 0.0749, "step": 69150 }, { "epoch": 19.45, "learning_rate": 6.790866210601944e-05, "loss": 0.0761, "step": 69180 }, { "epoch": 19.46, "learning_rate": 6.788991972011371e-05, "loss": 0.0735, "step": 69210 }, { "epoch": 19.47, "learning_rate": 6.787117733420797e-05, "loss": 0.0796, "step": 69240 }, { "epoch": 19.47, "learning_rate": 6.785243494830226e-05, "loss": 0.0688, "step": 69270 }, { "epoch": 19.48, "learning_rate": 6.783369256239654e-05, "loss": 0.071, "step": 69300 }, { "epoch": 19.49, "learning_rate": 6.78149501764908e-05, "loss": 0.0748, "step": 69330 }, { "epoch": 19.5, "learning_rate": 6.779620779058507e-05, "loss": 0.0683, "step": 69360 }, { "epoch": 19.51, "learning_rate": 6.777746540467935e-05, "loss": 0.0797, "step": 69390 }, { "epoch": 19.52, "learning_rate": 6.775872301877363e-05, "loss": 0.0685, "step": 69420 }, { "epoch": 19.52, "learning_rate": 6.77399806328679e-05, "loss": 0.0806, "step": 69450 }, { "epoch": 19.53, "learning_rate": 6.772123824696217e-05, "loss": 0.0753, "step": 69480 }, { "epoch": 19.54, "learning_rate": 6.770249586105645e-05, "loss": 0.0716, "step": 69510 }, { "epoch": 19.55, "learning_rate": 6.768375347515073e-05, "loss": 0.0764, "step": 69540 }, { "epoch": 19.56, "learning_rate": 6.7665011089245e-05, "loss": 0.0662, "step": 69570 }, { "epoch": 19.57, "learning_rate": 6.764626870333926e-05, "loss": 0.0742, "step": 69600 }, { "epoch": 19.58, "learning_rate": 6.762752631743355e-05, "loss": 0.0755, "step": 69630 }, { "epoch": 19.58, "learning_rate": 6.760878393152781e-05, "loss": 0.0695, "step": 69660 }, { "epoch": 19.59, "learning_rate": 6.75900415456221e-05, "loss": 0.0789, "step": 69690 }, { "epoch": 19.6, "learning_rate": 6.757129915971638e-05, "loss": 0.0675, "step": 69720 }, { "epoch": 19.61, "learning_rate": 6.755255677381064e-05, "loss": 0.0775, "step": 69750 }, { "epoch": 19.62, "learning_rate": 6.753381438790491e-05, "loss": 0.0748, "step": 69780 }, { "epoch": 19.63, "learning_rate": 6.751507200199919e-05, "loss": 0.0748, "step": 69810 }, { "epoch": 19.63, "learning_rate": 6.749632961609347e-05, "loss": 0.0823, "step": 69840 }, { "epoch": 19.64, "learning_rate": 6.747758723018774e-05, "loss": 0.067, "step": 69870 }, { "epoch": 19.65, "learning_rate": 6.745884484428201e-05, "loss": 0.0791, "step": 69900 }, { "epoch": 19.66, "learning_rate": 6.744010245837629e-05, "loss": 0.0775, "step": 69930 }, { "epoch": 19.67, "learning_rate": 6.742136007247057e-05, "loss": 0.0684, "step": 69960 }, { "epoch": 19.68, "learning_rate": 6.740261768656484e-05, "loss": 0.082, "step": 69990 }, { "epoch": 19.69, "learning_rate": 6.73838753006591e-05, "loss": 0.068, "step": 70020 }, { "epoch": 19.69, "learning_rate": 6.736513291475338e-05, "loss": 0.076, "step": 70050 }, { "epoch": 19.7, "learning_rate": 6.734639052884765e-05, "loss": 0.0774, "step": 70080 }, { "epoch": 19.71, "learning_rate": 6.732764814294193e-05, "loss": 0.0734, "step": 70110 }, { "epoch": 19.72, "learning_rate": 6.730890575703621e-05, "loss": 0.0791, "step": 70140 }, { "epoch": 19.73, "learning_rate": 6.729016337113048e-05, "loss": 0.0675, "step": 70170 }, { "epoch": 19.74, "learning_rate": 6.727142098522475e-05, "loss": 0.0778, "step": 70200 }, { "epoch": 19.74, "learning_rate": 6.725267859931903e-05, "loss": 0.0786, "step": 70230 }, { "epoch": 19.75, "learning_rate": 6.723393621341331e-05, "loss": 0.0687, "step": 70260 }, { "epoch": 19.76, "learning_rate": 6.721519382750758e-05, "loss": 0.0832, "step": 70290 }, { "epoch": 19.77, "learning_rate": 6.719645144160185e-05, "loss": 0.0673, "step": 70320 }, { "epoch": 19.78, "learning_rate": 6.717770905569613e-05, "loss": 0.0807, "step": 70350 }, { "epoch": 19.79, "learning_rate": 6.715896666979041e-05, "loss": 0.0735, "step": 70380 }, { "epoch": 19.79, "learning_rate": 6.714022428388467e-05, "loss": 0.0684, "step": 70410 }, { "epoch": 19.8, "learning_rate": 6.712148189797894e-05, "loss": 0.0847, "step": 70440 }, { "epoch": 19.81, "learning_rate": 6.710273951207322e-05, "loss": 0.0683, "step": 70470 }, { "epoch": 19.82, "learning_rate": 6.708399712616749e-05, "loss": 0.0744, "step": 70500 }, { "epoch": 19.83, "learning_rate": 6.706525474026177e-05, "loss": 0.0729, "step": 70530 }, { "epoch": 19.84, "learning_rate": 6.704651235435605e-05, "loss": 0.0745, "step": 70560 }, { "epoch": 19.85, "learning_rate": 6.702776996845032e-05, "loss": 0.0777, "step": 70590 }, { "epoch": 19.85, "learning_rate": 6.700902758254459e-05, "loss": 0.0661, "step": 70620 }, { "epoch": 19.86, "learning_rate": 6.699028519663887e-05, "loss": 0.0773, "step": 70650 }, { "epoch": 19.87, "learning_rate": 6.697154281073315e-05, "loss": 0.0748, "step": 70680 }, { "epoch": 19.88, "learning_rate": 6.695280042482742e-05, "loss": 0.0717, "step": 70710 }, { "epoch": 19.89, "learning_rate": 6.693405803892168e-05, "loss": 0.081, "step": 70740 }, { "epoch": 19.9, "learning_rate": 6.691531565301597e-05, "loss": 0.0682, "step": 70770 }, { "epoch": 19.9, "learning_rate": 6.689657326711025e-05, "loss": 0.0766, "step": 70800 }, { "epoch": 19.91, "learning_rate": 6.687783088120451e-05, "loss": 0.0731, "step": 70830 }, { "epoch": 19.92, "learning_rate": 6.685908849529878e-05, "loss": 0.07, "step": 70860 }, { "epoch": 19.93, "learning_rate": 6.684034610939306e-05, "loss": 0.0782, "step": 70890 }, { "epoch": 19.94, "learning_rate": 6.682160372348733e-05, "loss": 0.0678, "step": 70920 }, { "epoch": 19.95, "learning_rate": 6.680286133758161e-05, "loss": 0.0755, "step": 70950 }, { "epoch": 19.95, "learning_rate": 6.678411895167589e-05, "loss": 0.0763, "step": 70980 }, { "epoch": 19.96, "learning_rate": 6.676537656577016e-05, "loss": 0.0731, "step": 71010 }, { "epoch": 19.97, "learning_rate": 6.674663417986443e-05, "loss": 0.0806, "step": 71040 }, { "epoch": 19.98, "learning_rate": 6.672789179395871e-05, "loss": 0.0644, "step": 71070 }, { "epoch": 19.99, "learning_rate": 6.670914940805299e-05, "loss": 0.0751, "step": 71100 }, { "epoch": 20.0, "learning_rate": 6.669103176834412e-05, "loss": 0.0726, "step": 71130 }, { "epoch": 20.0, "eval_loss": 0.10938318818807602, "eval_runtime": 632.7086, "eval_samples_per_second": 25.34, "eval_steps_per_second": 0.793, "eval_wer": 0.10929673959029929, "step": 71140 }, { "epoch": 20.01, "learning_rate": 6.66722893824384e-05, "loss": 0.0718, "step": 71160 }, { "epoch": 20.01, "learning_rate": 6.665354699653265e-05, "loss": 0.0843, "step": 71190 }, { "epoch": 20.02, "learning_rate": 6.663480461062693e-05, "loss": 0.0637, "step": 71220 }, { "epoch": 20.03, "learning_rate": 6.661606222472121e-05, "loss": 0.0759, "step": 71250 }, { "epoch": 20.04, "learning_rate": 6.659731983881548e-05, "loss": 0.068, "step": 71280 }, { "epoch": 20.05, "learning_rate": 6.657857745290976e-05, "loss": 0.0724, "step": 71310 }, { "epoch": 20.06, "learning_rate": 6.655983506700403e-05, "loss": 0.0815, "step": 71340 }, { "epoch": 20.06, "learning_rate": 6.654109268109831e-05, "loss": 0.0639, "step": 71370 }, { "epoch": 20.07, "learning_rate": 6.652235029519258e-05, "loss": 0.0768, "step": 71400 }, { "epoch": 20.08, "learning_rate": 6.650360790928686e-05, "loss": 0.0674, "step": 71430 }, { "epoch": 20.09, "learning_rate": 6.648486552338114e-05, "loss": 0.0714, "step": 71460 }, { "epoch": 20.1, "learning_rate": 6.64661231374754e-05, "loss": 0.0785, "step": 71490 }, { "epoch": 20.11, "learning_rate": 6.644738075156967e-05, "loss": 0.0628, "step": 71520 }, { "epoch": 20.12, "learning_rate": 6.642863836566395e-05, "loss": 0.0787, "step": 71550 }, { "epoch": 20.12, "learning_rate": 6.640989597975824e-05, "loss": 0.0656, "step": 71580 }, { "epoch": 20.13, "learning_rate": 6.639115359385249e-05, "loss": 0.0701, "step": 71610 }, { "epoch": 20.14, "learning_rate": 6.637241120794677e-05, "loss": 0.0743, "step": 71640 }, { "epoch": 20.15, "learning_rate": 6.635366882204105e-05, "loss": 0.0632, "step": 71670 }, { "epoch": 20.16, "learning_rate": 6.633492643613533e-05, "loss": 0.0758, "step": 71700 }, { "epoch": 20.17, "learning_rate": 6.63161840502296e-05, "loss": 0.0652, "step": 71730 }, { "epoch": 20.17, "learning_rate": 6.629744166432387e-05, "loss": 0.0769, "step": 71760 }, { "epoch": 20.18, "learning_rate": 6.627869927841815e-05, "loss": 0.0761, "step": 71790 }, { "epoch": 20.19, "learning_rate": 6.625995689251242e-05, "loss": 0.0657, "step": 71820 }, { "epoch": 20.2, "learning_rate": 6.62412145066067e-05, "loss": 0.0763, "step": 71850 }, { "epoch": 20.21, "learning_rate": 6.622247212070098e-05, "loss": 0.0649, "step": 71880 }, { "epoch": 20.22, "learning_rate": 6.620372973479524e-05, "loss": 0.0711, "step": 71910 }, { "epoch": 20.22, "learning_rate": 6.618498734888951e-05, "loss": 0.0837, "step": 71940 }, { "epoch": 20.23, "learning_rate": 6.616624496298379e-05, "loss": 0.0623, "step": 71970 }, { "epoch": 20.24, "learning_rate": 6.614750257707807e-05, "loss": 0.0737, "step": 72000 }, { "epoch": 20.25, "learning_rate": 6.612876019117233e-05, "loss": 0.0678, "step": 72030 }, { "epoch": 20.26, "learning_rate": 6.611001780526661e-05, "loss": 0.0704, "step": 72060 }, { "epoch": 20.27, "learning_rate": 6.609127541936089e-05, "loss": 0.0771, "step": 72090 }, { "epoch": 20.28, "learning_rate": 6.607253303345517e-05, "loss": 0.0639, "step": 72120 }, { "epoch": 20.28, "learning_rate": 6.605379064754944e-05, "loss": 0.0759, "step": 72150 }, { "epoch": 20.29, "learning_rate": 6.60350482616437e-05, "loss": 0.0701, "step": 72180 }, { "epoch": 20.3, "learning_rate": 6.601630587573799e-05, "loss": 0.07, "step": 72210 }, { "epoch": 20.31, "learning_rate": 6.599756348983225e-05, "loss": 0.0784, "step": 72240 }, { "epoch": 20.32, "learning_rate": 6.597882110392653e-05, "loss": 0.0676, "step": 72270 }, { "epoch": 20.33, "learning_rate": 6.596007871802082e-05, "loss": 0.0814, "step": 72300 }, { "epoch": 20.33, "learning_rate": 6.594133633211508e-05, "loss": 0.0678, "step": 72330 }, { "epoch": 20.34, "learning_rate": 6.592259394620935e-05, "loss": 0.0718, "step": 72360 }, { "epoch": 20.35, "learning_rate": 6.590385156030363e-05, "loss": 0.0836, "step": 72390 }, { "epoch": 20.36, "learning_rate": 6.588510917439791e-05, "loss": 0.0626, "step": 72420 }, { "epoch": 20.37, "learning_rate": 6.586636678849218e-05, "loss": 0.0782, "step": 72450 }, { "epoch": 20.38, "learning_rate": 6.584762440258645e-05, "loss": 0.0696, "step": 72480 }, { "epoch": 20.39, "learning_rate": 6.582888201668073e-05, "loss": 0.069, "step": 72510 }, { "epoch": 20.39, "learning_rate": 6.581013963077501e-05, "loss": 0.0799, "step": 72540 }, { "epoch": 20.4, "learning_rate": 6.579139724486928e-05, "loss": 0.0639, "step": 72570 }, { "epoch": 20.41, "learning_rate": 6.577265485896354e-05, "loss": 0.0775, "step": 72600 }, { "epoch": 20.42, "learning_rate": 6.575391247305782e-05, "loss": 0.0689, "step": 72630 }, { "epoch": 20.43, "learning_rate": 6.573517008715209e-05, "loss": 0.0757, "step": 72660 }, { "epoch": 20.44, "learning_rate": 6.571642770124637e-05, "loss": 0.0819, "step": 72690 }, { "epoch": 20.44, "learning_rate": 6.569768531534065e-05, "loss": 0.0691, "step": 72720 }, { "epoch": 20.45, "learning_rate": 6.567894292943492e-05, "loss": 0.08, "step": 72750 }, { "epoch": 20.46, "learning_rate": 6.566020054352919e-05, "loss": 0.0654, "step": 72780 }, { "epoch": 20.47, "learning_rate": 6.564145815762347e-05, "loss": 0.0697, "step": 72810 }, { "epoch": 20.48, "learning_rate": 6.562271577171775e-05, "loss": 0.0783, "step": 72840 }, { "epoch": 20.49, "learning_rate": 6.560397338581202e-05, "loss": 0.0692, "step": 72870 }, { "epoch": 20.49, "learning_rate": 6.558523099990629e-05, "loss": 0.0761, "step": 72900 }, { "epoch": 20.5, "learning_rate": 6.556648861400057e-05, "loss": 0.0662, "step": 72930 }, { "epoch": 20.51, "learning_rate": 6.554774622809485e-05, "loss": 0.0752, "step": 72960 }, { "epoch": 20.52, "learning_rate": 6.552900384218912e-05, "loss": 0.0795, "step": 72990 }, { "epoch": 20.53, "learning_rate": 6.551026145628338e-05, "loss": 0.0593, "step": 73020 }, { "epoch": 20.54, "learning_rate": 6.549151907037766e-05, "loss": 0.0788, "step": 73050 }, { "epoch": 20.55, "learning_rate": 6.547277668447193e-05, "loss": 0.0711, "step": 73080 }, { "epoch": 20.55, "learning_rate": 6.545403429856621e-05, "loss": 0.072, "step": 73110 }, { "epoch": 20.56, "learning_rate": 6.543529191266049e-05, "loss": 0.0816, "step": 73140 }, { "epoch": 20.57, "learning_rate": 6.541654952675476e-05, "loss": 0.0643, "step": 73170 }, { "epoch": 20.58, "learning_rate": 6.539780714084903e-05, "loss": 0.0759, "step": 73200 }, { "epoch": 20.59, "learning_rate": 6.537906475494331e-05, "loss": 0.07, "step": 73230 }, { "epoch": 20.6, "learning_rate": 6.536094711523444e-05, "loss": 0.0754, "step": 73260 }, { "epoch": 20.6, "learning_rate": 6.534220472932872e-05, "loss": 0.0787, "step": 73290 }, { "epoch": 20.61, "learning_rate": 6.5323462343423e-05, "loss": 0.0665, "step": 73320 }, { "epoch": 20.62, "learning_rate": 6.530471995751725e-05, "loss": 0.0778, "step": 73350 }, { "epoch": 20.63, "learning_rate": 6.528597757161153e-05, "loss": 0.0681, "step": 73380 }, { "epoch": 20.64, "learning_rate": 6.526723518570581e-05, "loss": 0.0757, "step": 73410 }, { "epoch": 20.65, "learning_rate": 6.524849279980008e-05, "loss": 0.0797, "step": 73440 }, { "epoch": 20.65, "learning_rate": 6.522975041389436e-05, "loss": 0.0645, "step": 73470 }, { "epoch": 20.66, "learning_rate": 6.521100802798863e-05, "loss": 0.0796, "step": 73500 }, { "epoch": 20.67, "learning_rate": 6.519226564208291e-05, "loss": 0.0662, "step": 73530 }, { "epoch": 20.68, "learning_rate": 6.517352325617718e-05, "loss": 0.0715, "step": 73560 }, { "epoch": 20.69, "learning_rate": 6.515478087027146e-05, "loss": 0.0764, "step": 73590 }, { "epoch": 20.7, "learning_rate": 6.513603848436573e-05, "loss": 0.0633, "step": 73620 }, { "epoch": 20.71, "learning_rate": 6.511729609846001e-05, "loss": 0.0814, "step": 73650 }, { "epoch": 20.71, "learning_rate": 6.509855371255427e-05, "loss": 0.0667, "step": 73680 }, { "epoch": 20.72, "learning_rate": 6.507981132664856e-05, "loss": 0.0737, "step": 73710 }, { "epoch": 20.73, "learning_rate": 6.506106894074284e-05, "loss": 0.0809, "step": 73740 }, { "epoch": 20.74, "learning_rate": 6.504232655483709e-05, "loss": 0.0629, "step": 73770 }, { "epoch": 20.75, "learning_rate": 6.502358416893137e-05, "loss": 0.0815, "step": 73800 }, { "epoch": 20.76, "learning_rate": 6.500484178302565e-05, "loss": 0.0656, "step": 73830 }, { "epoch": 20.76, "learning_rate": 6.498609939711992e-05, "loss": 0.0706, "step": 73860 }, { "epoch": 20.77, "learning_rate": 6.49673570112142e-05, "loss": 0.077, "step": 73890 }, { "epoch": 20.78, "learning_rate": 6.494861462530847e-05, "loss": 0.0618, "step": 73920 }, { "epoch": 20.79, "learning_rate": 6.492987223940275e-05, "loss": 0.0761, "step": 73950 }, { "epoch": 20.8, "learning_rate": 6.491112985349702e-05, "loss": 0.0671, "step": 73980 }, { "epoch": 20.81, "learning_rate": 6.48923874675913e-05, "loss": 0.0702, "step": 74010 }, { "epoch": 20.82, "learning_rate": 6.487364508168557e-05, "loss": 0.0794, "step": 74040 }, { "epoch": 20.82, "learning_rate": 6.485490269577985e-05, "loss": 0.0656, "step": 74070 }, { "epoch": 20.83, "learning_rate": 6.483616030987411e-05, "loss": 0.0802, "step": 74100 }, { "epoch": 20.84, "learning_rate": 6.48174179239684e-05, "loss": 0.067, "step": 74130 }, { "epoch": 20.85, "learning_rate": 6.479867553806268e-05, "loss": 0.0695, "step": 74160 }, { "epoch": 20.86, "learning_rate": 6.477993315215693e-05, "loss": 0.0764, "step": 74190 }, { "epoch": 20.87, "learning_rate": 6.476119076625121e-05, "loss": 0.0639, "step": 74220 }, { "epoch": 20.87, "learning_rate": 6.474244838034549e-05, "loss": 0.0817, "step": 74250 }, { "epoch": 20.88, "learning_rate": 6.472370599443976e-05, "loss": 0.0686, "step": 74280 }, { "epoch": 20.89, "learning_rate": 6.470496360853404e-05, "loss": 0.0747, "step": 74310 }, { "epoch": 20.9, "learning_rate": 6.468622122262831e-05, "loss": 0.0826, "step": 74340 }, { "epoch": 20.91, "learning_rate": 6.466747883672259e-05, "loss": 0.0697, "step": 74370 }, { "epoch": 20.92, "learning_rate": 6.464873645081686e-05, "loss": 0.08, "step": 74400 }, { "epoch": 20.92, "learning_rate": 6.462999406491114e-05, "loss": 0.0681, "step": 74430 }, { "epoch": 20.93, "learning_rate": 6.46112516790054e-05, "loss": 0.0737, "step": 74460 }, { "epoch": 20.94, "learning_rate": 6.459250929309968e-05, "loss": 0.0777, "step": 74490 }, { "epoch": 20.95, "learning_rate": 6.457376690719395e-05, "loss": 0.0633, "step": 74520 }, { "epoch": 20.96, "learning_rate": 6.455502452128823e-05, "loss": 0.0784, "step": 74550 }, { "epoch": 20.97, "learning_rate": 6.453628213538251e-05, "loss": 0.0677, "step": 74580 }, { "epoch": 20.98, "learning_rate": 6.451753974947677e-05, "loss": 0.0742, "step": 74610 }, { "epoch": 20.98, "learning_rate": 6.449879736357105e-05, "loss": 0.0751, "step": 74640 }, { "epoch": 20.99, "learning_rate": 6.448005497766533e-05, "loss": 0.0647, "step": 74670 }, { "epoch": 21.0, "eval_loss": 0.10879692435264587, "eval_runtime": 632.1305, "eval_samples_per_second": 25.363, "eval_steps_per_second": 0.794, "eval_wer": 0.10948780587665306, "step": 74697 }, { "epoch": 21.0, "learning_rate": 6.44613125917596e-05, "loss": 0.0789, "step": 74700 }, { "epoch": 21.01, "learning_rate": 6.444257020585388e-05, "loss": 0.0664, "step": 74730 }, { "epoch": 21.02, "learning_rate": 6.442382781994815e-05, "loss": 0.0746, "step": 74760 }, { "epoch": 21.03, "learning_rate": 6.440508543404243e-05, "loss": 0.067, "step": 74790 }, { "epoch": 21.03, "learning_rate": 6.43863430481367e-05, "loss": 0.0695, "step": 74820 }, { "epoch": 21.04, "learning_rate": 6.436760066223098e-05, "loss": 0.076, "step": 74850 }, { "epoch": 21.05, "learning_rate": 6.434885827632524e-05, "loss": 0.063, "step": 74880 }, { "epoch": 21.06, "learning_rate": 6.433011589041952e-05, "loss": 0.074, "step": 74910 }, { "epoch": 21.07, "learning_rate": 6.431137350451379e-05, "loss": 0.0667, "step": 74940 }, { "epoch": 21.08, "learning_rate": 6.429263111860807e-05, "loss": 0.0668, "step": 74970 }, { "epoch": 21.09, "learning_rate": 6.427388873270235e-05, "loss": 0.0764, "step": 75000 }, { "epoch": 21.09, "learning_rate": 6.42551463467966e-05, "loss": 0.0628, "step": 75030 }, { "epoch": 21.1, "learning_rate": 6.423640396089089e-05, "loss": 0.0738, "step": 75060 }, { "epoch": 21.11, "learning_rate": 6.421766157498517e-05, "loss": 0.0686, "step": 75090 }, { "epoch": 21.12, "learning_rate": 6.419891918907944e-05, "loss": 0.0706, "step": 75120 }, { "epoch": 21.13, "learning_rate": 6.41801768031737e-05, "loss": 0.076, "step": 75150 }, { "epoch": 21.14, "learning_rate": 6.416143441726798e-05, "loss": 0.0645, "step": 75180 }, { "epoch": 21.14, "learning_rate": 6.414269203136227e-05, "loss": 0.0768, "step": 75210 }, { "epoch": 21.15, "learning_rate": 6.412394964545653e-05, "loss": 0.0682, "step": 75240 }, { "epoch": 21.16, "learning_rate": 6.410520725955081e-05, "loss": 0.0743, "step": 75270 }, { "epoch": 21.17, "learning_rate": 6.408646487364508e-05, "loss": 0.0767, "step": 75300 }, { "epoch": 21.18, "learning_rate": 6.406772248773936e-05, "loss": 0.0631, "step": 75330 }, { "epoch": 21.19, "learning_rate": 6.404898010183363e-05, "loss": 0.071, "step": 75360 }, { "epoch": 21.19, "learning_rate": 6.403023771592791e-05, "loss": 0.0711, "step": 75390 }, { "epoch": 21.2, "learning_rate": 6.401149533002219e-05, "loss": 0.0755, "step": 75420 }, { "epoch": 21.21, "learning_rate": 6.399275294411645e-05, "loss": 0.0772, "step": 75450 }, { "epoch": 21.22, "learning_rate": 6.397401055821073e-05, "loss": 0.065, "step": 75480 }, { "epoch": 21.23, "learning_rate": 6.395526817230501e-05, "loss": 0.0749, "step": 75510 }, { "epoch": 21.24, "learning_rate": 6.393652578639929e-05, "loss": 0.0694, "step": 75540 }, { "epoch": 21.25, "learning_rate": 6.391778340049354e-05, "loss": 0.0693, "step": 75570 }, { "epoch": 21.25, "learning_rate": 6.389904101458782e-05, "loss": 0.0739, "step": 75600 }, { "epoch": 21.26, "learning_rate": 6.38802986286821e-05, "loss": 0.0633, "step": 75630 }, { "epoch": 21.27, "learning_rate": 6.386155624277637e-05, "loss": 0.0772, "step": 75660 }, { "epoch": 21.28, "learning_rate": 6.384281385687065e-05, "loss": 0.0679, "step": 75690 }, { "epoch": 21.29, "learning_rate": 6.382407147096492e-05, "loss": 0.0731, "step": 75720 }, { "epoch": 21.3, "learning_rate": 6.38053290850592e-05, "loss": 0.0798, "step": 75750 }, { "epoch": 21.3, "learning_rate": 6.378658669915347e-05, "loss": 0.0637, "step": 75780 }, { "epoch": 21.31, "learning_rate": 6.376784431324775e-05, "loss": 0.0739, "step": 75810 }, { "epoch": 21.32, "learning_rate": 6.374910192734203e-05, "loss": 0.0673, "step": 75840 }, { "epoch": 21.33, "learning_rate": 6.37303595414363e-05, "loss": 0.0685, "step": 75870 }, { "epoch": 21.34, "learning_rate": 6.371161715553057e-05, "loss": 0.0788, "step": 75900 }, { "epoch": 21.35, "learning_rate": 6.369287476962485e-05, "loss": 0.0629, "step": 75930 }, { "epoch": 21.36, "learning_rate": 6.367413238371913e-05, "loss": 0.0732, "step": 75960 }, { "epoch": 21.36, "learning_rate": 6.365538999781338e-05, "loss": 0.0739, "step": 75990 }, { "epoch": 21.37, "learning_rate": 6.363664761190766e-05, "loss": 0.0702, "step": 76020 }, { "epoch": 21.38, "learning_rate": 6.361790522600194e-05, "loss": 0.0759, "step": 76050 }, { "epoch": 21.39, "learning_rate": 6.359916284009621e-05, "loss": 0.062, "step": 76080 }, { "epoch": 21.4, "learning_rate": 6.358042045419049e-05, "loss": 0.0747, "step": 76110 }, { "epoch": 21.41, "learning_rate": 6.356167806828476e-05, "loss": 0.0691, "step": 76140 }, { "epoch": 21.41, "learning_rate": 6.354293568237904e-05, "loss": 0.0705, "step": 76170 }, { "epoch": 21.42, "learning_rate": 6.352419329647331e-05, "loss": 0.076, "step": 76200 }, { "epoch": 21.43, "learning_rate": 6.350545091056759e-05, "loss": 0.0653, "step": 76230 }, { "epoch": 21.44, "learning_rate": 6.348670852466187e-05, "loss": 0.0774, "step": 76260 }, { "epoch": 21.45, "learning_rate": 6.346796613875614e-05, "loss": 0.0697, "step": 76290 }, { "epoch": 21.46, "learning_rate": 6.34492237528504e-05, "loss": 0.0719, "step": 76320 }, { "epoch": 21.46, "learning_rate": 6.343048136694468e-05, "loss": 0.0762, "step": 76350 }, { "epoch": 21.47, "learning_rate": 6.341173898103897e-05, "loss": 0.06, "step": 76380 }, { "epoch": 21.48, "learning_rate": 6.339299659513322e-05, "loss": 0.0742, "step": 76410 }, { "epoch": 21.49, "learning_rate": 6.33742542092275e-05, "loss": 0.0687, "step": 76440 }, { "epoch": 21.5, "learning_rate": 6.335551182332178e-05, "loss": 0.0717, "step": 76470 }, { "epoch": 21.51, "learning_rate": 6.333739418361291e-05, "loss": 0.0793, "step": 76500 }, { "epoch": 21.52, "learning_rate": 6.331865179770719e-05, "loss": 0.0649, "step": 76530 }, { "epoch": 21.52, "learning_rate": 6.329990941180146e-05, "loss": 0.0725, "step": 76560 }, { "epoch": 21.53, "learning_rate": 6.328116702589574e-05, "loss": 0.0679, "step": 76590 }, { "epoch": 21.54, "learning_rate": 6.326242463999e-05, "loss": 0.0641, "step": 76620 }, { "epoch": 21.55, "learning_rate": 6.324368225408429e-05, "loss": 0.074, "step": 76650 }, { "epoch": 21.56, "learning_rate": 6.322493986817855e-05, "loss": 0.0634, "step": 76680 }, { "epoch": 21.57, "learning_rate": 6.320619748227283e-05, "loss": 0.0753, "step": 76710 }, { "epoch": 21.57, "learning_rate": 6.31874550963671e-05, "loss": 0.0683, "step": 76740 }, { "epoch": 21.58, "learning_rate": 6.316871271046137e-05, "loss": 0.0706, "step": 76770 }, { "epoch": 21.59, "learning_rate": 6.314997032455565e-05, "loss": 0.075, "step": 76800 }, { "epoch": 21.6, "learning_rate": 6.313122793864993e-05, "loss": 0.064, "step": 76830 }, { "epoch": 21.61, "learning_rate": 6.31124855527442e-05, "loss": 0.0723, "step": 76860 }, { "epoch": 21.62, "learning_rate": 6.309374316683847e-05, "loss": 0.0713, "step": 76890 }, { "epoch": 21.62, "learning_rate": 6.307500078093275e-05, "loss": 0.0669, "step": 76920 }, { "epoch": 21.63, "learning_rate": 6.305625839502703e-05, "loss": 0.079, "step": 76950 }, { "epoch": 21.64, "learning_rate": 6.30375160091213e-05, "loss": 0.0626, "step": 76980 }, { "epoch": 21.65, "learning_rate": 6.301877362321558e-05, "loss": 0.074, "step": 77010 }, { "epoch": 21.66, "learning_rate": 6.300003123730984e-05, "loss": 0.0726, "step": 77040 }, { "epoch": 21.67, "learning_rate": 6.298128885140413e-05, "loss": 0.0727, "step": 77070 }, { "epoch": 21.68, "learning_rate": 6.296254646549839e-05, "loss": 0.0774, "step": 77100 }, { "epoch": 21.68, "learning_rate": 6.294380407959267e-05, "loss": 0.0654, "step": 77130 }, { "epoch": 21.69, "learning_rate": 6.292506169368694e-05, "loss": 0.0763, "step": 77160 }, { "epoch": 21.7, "learning_rate": 6.290631930778121e-05, "loss": 0.0702, "step": 77190 }, { "epoch": 21.71, "learning_rate": 6.288757692187549e-05, "loss": 0.0735, "step": 77220 }, { "epoch": 21.72, "learning_rate": 6.286883453596977e-05, "loss": 0.0718, "step": 77250 }, { "epoch": 21.73, "learning_rate": 6.285009215006404e-05, "loss": 0.0632, "step": 77280 }, { "epoch": 21.73, "learning_rate": 6.28313497641583e-05, "loss": 0.0814, "step": 77310 }, { "epoch": 21.74, "learning_rate": 6.281260737825259e-05, "loss": 0.068, "step": 77340 }, { "epoch": 21.75, "learning_rate": 6.279386499234687e-05, "loss": 0.0704, "step": 77370 }, { "epoch": 21.76, "learning_rate": 6.277512260644113e-05, "loss": 0.0803, "step": 77400 }, { "epoch": 21.77, "learning_rate": 6.275638022053542e-05, "loss": 0.0651, "step": 77430 }, { "epoch": 21.78, "learning_rate": 6.273763783462968e-05, "loss": 0.074, "step": 77460 }, { "epoch": 21.79, "learning_rate": 6.271889544872396e-05, "loss": 0.0719, "step": 77490 }, { "epoch": 21.79, "learning_rate": 6.270015306281823e-05, "loss": 0.0734, "step": 77520 }, { "epoch": 21.8, "learning_rate": 6.268141067691251e-05, "loss": 0.0751, "step": 77550 }, { "epoch": 21.81, "learning_rate": 6.266266829100678e-05, "loss": 0.0611, "step": 77580 }, { "epoch": 21.82, "learning_rate": 6.264392590510105e-05, "loss": 0.0735, "step": 77610 }, { "epoch": 21.83, "learning_rate": 6.262518351919533e-05, "loss": 0.0671, "step": 77640 }, { "epoch": 21.84, "learning_rate": 6.260644113328961e-05, "loss": 0.0709, "step": 77670 }, { "epoch": 21.84, "learning_rate": 6.258769874738388e-05, "loss": 0.0753, "step": 77700 }, { "epoch": 21.85, "learning_rate": 6.256895636147814e-05, "loss": 0.0609, "step": 77730 }, { "epoch": 21.86, "learning_rate": 6.255021397557242e-05, "loss": 0.0752, "step": 77760 }, { "epoch": 21.87, "learning_rate": 6.253209633586355e-05, "loss": 0.0645, "step": 77790 }, { "epoch": 21.88, "learning_rate": 6.251335394995783e-05, "loss": 0.0729, "step": 77820 }, { "epoch": 21.89, "learning_rate": 6.249461156405211e-05, "loss": 0.076, "step": 77850 }, { "epoch": 21.89, "learning_rate": 6.247586917814638e-05, "loss": 0.0614, "step": 77880 }, { "epoch": 21.9, "learning_rate": 6.245712679224065e-05, "loss": 0.0782, "step": 77910 }, { "epoch": 21.91, "learning_rate": 6.243838440633493e-05, "loss": 0.0683, "step": 77940 }, { "epoch": 21.92, "learning_rate": 6.24196420204292e-05, "loss": 0.0712, "step": 77970 }, { "epoch": 21.93, "learning_rate": 6.240089963452348e-05, "loss": 0.0798, "step": 78000 }, { "epoch": 21.94, "learning_rate": 6.238215724861776e-05, "loss": 0.0626, "step": 78030 }, { "epoch": 21.95, "learning_rate": 6.236341486271203e-05, "loss": 0.0763, "step": 78060 }, { "epoch": 21.95, "learning_rate": 6.23446724768063e-05, "loss": 0.0675, "step": 78090 }, { "epoch": 21.96, "learning_rate": 6.232593009090058e-05, "loss": 0.0664, "step": 78120 }, { "epoch": 21.97, "learning_rate": 6.230718770499486e-05, "loss": 0.0785, "step": 78150 }, { "epoch": 21.98, "learning_rate": 6.228844531908912e-05, "loss": 0.0613, "step": 78180 }, { "epoch": 21.99, "learning_rate": 6.226970293318339e-05, "loss": 0.0739, "step": 78210 }, { "epoch": 22.0, "learning_rate": 6.225096054727767e-05, "loss": 0.0643, "step": 78240 }, { "epoch": 22.0, "eval_loss": 0.11053762584924698, "eval_runtime": 632.3359, "eval_samples_per_second": 25.355, "eval_steps_per_second": 0.794, "eval_wer": 0.10436995892074843, "step": 78254 }, { "epoch": 22.0, "learning_rate": 6.223221816137195e-05, "loss": 0.0775, "step": 78270 }, { "epoch": 22.01, "learning_rate": 6.221347577546622e-05, "loss": 0.067, "step": 78300 }, { "epoch": 22.02, "learning_rate": 6.219473338956049e-05, "loss": 0.0672, "step": 78330 }, { "epoch": 22.03, "learning_rate": 6.217599100365477e-05, "loss": 0.0742, "step": 78360 }, { "epoch": 22.04, "learning_rate": 6.215724861774904e-05, "loss": 0.066, "step": 78390 }, { "epoch": 22.05, "learning_rate": 6.213850623184332e-05, "loss": 0.0683, "step": 78420 }, { "epoch": 22.06, "learning_rate": 6.21197638459376e-05, "loss": 0.0729, "step": 78450 }, { "epoch": 22.06, "learning_rate": 6.210102146003187e-05, "loss": 0.0682, "step": 78480 }, { "epoch": 22.07, "learning_rate": 6.208227907412613e-05, "loss": 0.0785, "step": 78510 }, { "epoch": 22.08, "learning_rate": 6.206353668822041e-05, "loss": 0.0648, "step": 78540 }, { "epoch": 22.09, "learning_rate": 6.20447943023147e-05, "loss": 0.07, "step": 78570 }, { "epoch": 22.1, "learning_rate": 6.202605191640896e-05, "loss": 0.0733, "step": 78600 }, { "epoch": 22.11, "learning_rate": 6.200730953050323e-05, "loss": 0.0656, "step": 78630 }, { "epoch": 22.11, "learning_rate": 6.198856714459751e-05, "loss": 0.0732, "step": 78660 }, { "epoch": 22.12, "learning_rate": 6.196982475869179e-05, "loss": 0.0634, "step": 78690 }, { "epoch": 22.13, "learning_rate": 6.195108237278606e-05, "loss": 0.0733, "step": 78720 }, { "epoch": 22.14, "learning_rate": 6.193233998688033e-05, "loss": 0.0651, "step": 78750 }, { "epoch": 22.15, "learning_rate": 6.191359760097461e-05, "loss": 0.068, "step": 78780 }, { "epoch": 22.16, "learning_rate": 6.189485521506887e-05, "loss": 0.0718, "step": 78810 }, { "epoch": 22.16, "learning_rate": 6.187611282916316e-05, "loss": 0.0614, "step": 78840 }, { "epoch": 22.17, "learning_rate": 6.185737044325744e-05, "loss": 0.0751, "step": 78870 }, { "epoch": 22.18, "learning_rate": 6.183925280354856e-05, "loss": 0.0744, "step": 78900 }, { "epoch": 22.19, "learning_rate": 6.182051041764285e-05, "loss": 0.0678, "step": 78930 }, { "epoch": 22.2, "learning_rate": 6.180176803173711e-05, "loss": 0.0754, "step": 78960 }, { "epoch": 22.21, "learning_rate": 6.178302564583138e-05, "loss": 0.0606, "step": 78990 }, { "epoch": 22.22, "learning_rate": 6.176428325992566e-05, "loss": 0.0704, "step": 79020 }, { "epoch": 22.22, "learning_rate": 6.174554087401994e-05, "loss": 0.0677, "step": 79050 }, { "epoch": 22.23, "learning_rate": 6.17267984881142e-05, "loss": 0.0684, "step": 79080 }, { "epoch": 22.24, "learning_rate": 6.170805610220848e-05, "loss": 0.0728, "step": 79110 }, { "epoch": 22.25, "learning_rate": 6.168931371630276e-05, "loss": 0.0615, "step": 79140 }, { "epoch": 22.26, "learning_rate": 6.167057133039703e-05, "loss": 0.0699, "step": 79170 }, { "epoch": 22.27, "learning_rate": 6.16518289444913e-05, "loss": 0.0734, "step": 79200 }, { "epoch": 22.27, "learning_rate": 6.163308655858557e-05, "loss": 0.0702, "step": 79230 }, { "epoch": 22.28, "learning_rate": 6.161434417267985e-05, "loss": 0.0776, "step": 79260 }, { "epoch": 22.29, "learning_rate": 6.159560178677412e-05, "loss": 0.0604, "step": 79290 }, { "epoch": 22.3, "learning_rate": 6.15768594008684e-05, "loss": 0.0685, "step": 79320 }, { "epoch": 22.31, "learning_rate": 6.155811701496268e-05, "loss": 0.0684, "step": 79350 }, { "epoch": 22.32, "learning_rate": 6.153937462905695e-05, "loss": 0.0694, "step": 79380 }, { "epoch": 22.32, "learning_rate": 6.152063224315122e-05, "loss": 0.0777, "step": 79410 }, { "epoch": 22.33, "learning_rate": 6.15018898572455e-05, "loss": 0.0644, "step": 79440 }, { "epoch": 22.34, "learning_rate": 6.148314747133978e-05, "loss": 0.0739, "step": 79470 }, { "epoch": 22.35, "learning_rate": 6.146440508543403e-05, "loss": 0.0732, "step": 79500 }, { "epoch": 22.36, "learning_rate": 6.144566269952832e-05, "loss": 0.0716, "step": 79530 }, { "epoch": 22.37, "learning_rate": 6.14269203136226e-05, "loss": 0.0746, "step": 79560 }, { "epoch": 22.38, "learning_rate": 6.140817792771686e-05, "loss": 0.0616, "step": 79590 }, { "epoch": 22.38, "learning_rate": 6.138943554181114e-05, "loss": 0.0698, "step": 79620 }, { "epoch": 22.39, "learning_rate": 6.137069315590541e-05, "loss": 0.0703, "step": 79650 }, { "epoch": 22.4, "learning_rate": 6.135195076999969e-05, "loss": 0.0673, "step": 79680 }, { "epoch": 22.41, "learning_rate": 6.133320838409396e-05, "loss": 0.0764, "step": 79710 }, { "epoch": 22.42, "learning_rate": 6.131446599818824e-05, "loss": 0.0598, "step": 79740 }, { "epoch": 22.43, "learning_rate": 6.129572361228252e-05, "loss": 0.066, "step": 79770 }, { "epoch": 22.43, "learning_rate": 6.127698122637679e-05, "loss": 0.07, "step": 79800 }, { "epoch": 22.44, "learning_rate": 6.125823884047106e-05, "loss": 0.0671, "step": 79830 }, { "epoch": 22.45, "learning_rate": 6.123949645456534e-05, "loss": 0.0717, "step": 79860 }, { "epoch": 22.46, "learning_rate": 6.122075406865962e-05, "loss": 0.0608, "step": 79890 }, { "epoch": 22.47, "learning_rate": 6.120201168275387e-05, "loss": 0.0703, "step": 79920 }, { "epoch": 22.48, "learning_rate": 6.118326929684815e-05, "loss": 0.0671, "step": 79950 }, { "epoch": 22.49, "learning_rate": 6.116452691094243e-05, "loss": 0.0684, "step": 79980 }, { "epoch": 22.49, "learning_rate": 6.11457845250367e-05, "loss": 0.0739, "step": 80010 }, { "epoch": 22.5, "learning_rate": 6.112704213913098e-05, "loss": 0.0601, "step": 80040 }, { "epoch": 22.51, "learning_rate": 6.110829975322525e-05, "loss": 0.0709, "step": 80070 }, { "epoch": 22.52, "learning_rate": 6.108955736731953e-05, "loss": 0.0708, "step": 80100 }, { "epoch": 22.53, "learning_rate": 6.10708149814138e-05, "loss": 0.067, "step": 80130 }, { "epoch": 22.54, "learning_rate": 6.105207259550808e-05, "loss": 0.0721, "step": 80160 }, { "epoch": 22.54, "learning_rate": 6.1033330209602354e-05, "loss": 0.0629, "step": 80190 }, { "epoch": 22.55, "learning_rate": 6.101458782369662e-05, "loss": 0.073, "step": 80220 }, { "epoch": 22.56, "learning_rate": 6.09958454377909e-05, "loss": 0.0669, "step": 80250 }, { "epoch": 22.57, "learning_rate": 6.097710305188518e-05, "loss": 0.0667, "step": 80280 }, { "epoch": 22.58, "learning_rate": 6.095836066597945e-05, "loss": 0.0723, "step": 80310 }, { "epoch": 22.59, "learning_rate": 6.093961828007372e-05, "loss": 0.0626, "step": 80340 }, { "epoch": 22.59, "learning_rate": 6.092087589416799e-05, "loss": 0.0693, "step": 80370 }, { "epoch": 22.6, "learning_rate": 6.0902133508262274e-05, "loss": 0.0697, "step": 80400 }, { "epoch": 22.61, "learning_rate": 6.088339112235655e-05, "loss": 0.063, "step": 80430 }, { "epoch": 22.62, "learning_rate": 6.086464873645082e-05, "loss": 0.0771, "step": 80460 }, { "epoch": 22.63, "learning_rate": 6.084590635054509e-05, "loss": 0.0635, "step": 80490 }, { "epoch": 22.64, "learning_rate": 6.0827163964639364e-05, "loss": 0.0707, "step": 80520 }, { "epoch": 22.65, "learning_rate": 6.0808421578733645e-05, "loss": 0.0681, "step": 80550 }, { "epoch": 22.65, "learning_rate": 6.078967919282792e-05, "loss": 0.0636, "step": 80580 }, { "epoch": 22.66, "learning_rate": 6.077093680692219e-05, "loss": 0.0723, "step": 80610 }, { "epoch": 22.67, "learning_rate": 6.075219442101646e-05, "loss": 0.059, "step": 80640 }, { "epoch": 22.68, "learning_rate": 6.073345203511074e-05, "loss": 0.0718, "step": 80670 }, { "epoch": 22.69, "learning_rate": 6.0714709649205016e-05, "loss": 0.0687, "step": 80700 }, { "epoch": 22.7, "learning_rate": 6.069596726329929e-05, "loss": 0.064, "step": 80730 }, { "epoch": 22.7, "learning_rate": 6.067722487739356e-05, "loss": 0.0753, "step": 80760 }, { "epoch": 22.71, "learning_rate": 6.065848249148783e-05, "loss": 0.067, "step": 80790 }, { "epoch": 22.72, "learning_rate": 6.063974010558211e-05, "loss": 0.072, "step": 80820 }, { "epoch": 22.73, "learning_rate": 6.0620997719676386e-05, "loss": 0.0687, "step": 80850 }, { "epoch": 22.74, "learning_rate": 6.060225533377066e-05, "loss": 0.0664, "step": 80880 }, { "epoch": 22.75, "learning_rate": 6.058351294786493e-05, "loss": 0.0791, "step": 80910 }, { "epoch": 22.76, "learning_rate": 6.05647705619592e-05, "loss": 0.0604, "step": 80940 }, { "epoch": 22.76, "learning_rate": 6.054602817605348e-05, "loss": 0.0726, "step": 80970 }, { "epoch": 22.77, "learning_rate": 6.052728579014776e-05, "loss": 0.068, "step": 81000 }, { "epoch": 22.78, "learning_rate": 6.0508543404242025e-05, "loss": 0.0691, "step": 81030 }, { "epoch": 22.79, "learning_rate": 6.04898010183363e-05, "loss": 0.0768, "step": 81060 }, { "epoch": 22.8, "learning_rate": 6.047105863243058e-05, "loss": 0.0681, "step": 81090 }, { "epoch": 22.81, "learning_rate": 6.0452316246524854e-05, "loss": 0.0712, "step": 81120 }, { "epoch": 22.81, "learning_rate": 6.043357386061913e-05, "loss": 0.0706, "step": 81150 }, { "epoch": 22.82, "learning_rate": 6.0414831474713396e-05, "loss": 0.0649, "step": 81180 }, { "epoch": 22.83, "learning_rate": 6.039608908880767e-05, "loss": 0.0739, "step": 81210 }, { "epoch": 22.84, "learning_rate": 6.037734670290195e-05, "loss": 0.0649, "step": 81240 }, { "epoch": 22.85, "learning_rate": 6.0358604316996225e-05, "loss": 0.0732, "step": 81270 }, { "epoch": 22.86, "learning_rate": 6.03398619310905e-05, "loss": 0.0731, "step": 81300 }, { "epoch": 22.86, "learning_rate": 6.032111954518477e-05, "loss": 0.0668, "step": 81330 }, { "epoch": 22.87, "learning_rate": 6.030237715927904e-05, "loss": 0.0761, "step": 81360 }, { "epoch": 22.88, "learning_rate": 6.028363477337332e-05, "loss": 0.0663, "step": 81390 }, { "epoch": 22.89, "learning_rate": 6.0264892387467596e-05, "loss": 0.0739, "step": 81420 }, { "epoch": 22.9, "learning_rate": 6.0246150001561864e-05, "loss": 0.0685, "step": 81450 }, { "epoch": 22.91, "learning_rate": 6.022740761565614e-05, "loss": 0.0705, "step": 81480 }, { "epoch": 22.92, "learning_rate": 6.020866522975042e-05, "loss": 0.0717, "step": 81510 }, { "epoch": 22.92, "learning_rate": 6.018992284384469e-05, "loss": 0.0645, "step": 81540 }, { "epoch": 22.93, "learning_rate": 6.017118045793897e-05, "loss": 0.0729, "step": 81570 }, { "epoch": 22.94, "learning_rate": 6.0152438072033234e-05, "loss": 0.0691, "step": 81600 }, { "epoch": 22.95, "learning_rate": 6.013369568612751e-05, "loss": 0.0706, "step": 81630 }, { "epoch": 22.96, "learning_rate": 6.011495330022179e-05, "loss": 0.0751, "step": 81660 }, { "epoch": 22.97, "learning_rate": 6.0096210914316064e-05, "loss": 0.0633, "step": 81690 }, { "epoch": 22.97, "learning_rate": 6.007746852841034e-05, "loss": 0.0755, "step": 81720 }, { "epoch": 22.98, "learning_rate": 6.0058726142504605e-05, "loss": 0.0714, "step": 81750 }, { "epoch": 22.99, "learning_rate": 6.0039983756598886e-05, "loss": 0.0712, "step": 81780 }, { "epoch": 23.0, "learning_rate": 6.002124137069316e-05, "loss": 0.0764, "step": 81810 }, { "epoch": 23.0, "eval_loss": 0.10718846321105957, "eval_runtime": 629.1357, "eval_samples_per_second": 25.484, "eval_steps_per_second": 0.798, "eval_wer": 0.10416524504251225, "step": 81811 }, { "epoch": 23.01, "learning_rate": 6.0002498984787435e-05, "loss": 0.0609, "step": 81840 }, { "epoch": 23.02, "learning_rate": 5.99837565988817e-05, "loss": 0.0743, "step": 81870 }, { "epoch": 23.03, "learning_rate": 5.9965014212975976e-05, "loss": 0.0652, "step": 81900 }, { "epoch": 23.03, "learning_rate": 5.994627182707026e-05, "loss": 0.0694, "step": 81930 }, { "epoch": 23.04, "learning_rate": 5.992752944116453e-05, "loss": 0.0686, "step": 81960 }, { "epoch": 23.05, "learning_rate": 5.9908787055258806e-05, "loss": 0.0652, "step": 81990 }, { "epoch": 23.06, "learning_rate": 5.989004466935307e-05, "loss": 0.0692, "step": 82020 }, { "epoch": 23.07, "learning_rate": 5.987130228344735e-05, "loss": 0.0626, "step": 82050 }, { "epoch": 23.08, "learning_rate": 5.985255989754163e-05, "loss": 0.0718, "step": 82080 }, { "epoch": 23.08, "learning_rate": 5.98338175116359e-05, "loss": 0.0717, "step": 82110 }, { "epoch": 23.09, "learning_rate": 5.981507512573018e-05, "loss": 0.0649, "step": 82140 }, { "epoch": 23.1, "learning_rate": 5.9796332739824444e-05, "loss": 0.0733, "step": 82170 }, { "epoch": 23.11, "learning_rate": 5.9777590353918725e-05, "loss": 0.0636, "step": 82200 }, { "epoch": 23.12, "learning_rate": 5.9758847968013e-05, "loss": 0.0661, "step": 82230 }, { "epoch": 23.13, "learning_rate": 5.9740105582107273e-05, "loss": 0.0759, "step": 82260 }, { "epoch": 23.13, "learning_rate": 5.972136319620154e-05, "loss": 0.0637, "step": 82290 }, { "epoch": 23.14, "learning_rate": 5.9702620810295815e-05, "loss": 0.0702, "step": 82320 }, { "epoch": 23.15, "learning_rate": 5.9683878424390096e-05, "loss": 0.0607, "step": 82350 }, { "epoch": 23.16, "learning_rate": 5.966513603848437e-05, "loss": 0.0675, "step": 82380 }, { "epoch": 23.17, "learning_rate": 5.9646393652578644e-05, "loss": 0.0678, "step": 82410 }, { "epoch": 23.18, "learning_rate": 5.962765126667291e-05, "loss": 0.0628, "step": 82440 }, { "epoch": 23.19, "learning_rate": 5.9608908880767186e-05, "loss": 0.0696, "step": 82470 }, { "epoch": 23.19, "learning_rate": 5.959016649486147e-05, "loss": 0.06, "step": 82500 }, { "epoch": 23.2, "learning_rate": 5.957142410895574e-05, "loss": 0.0669, "step": 82530 }, { "epoch": 23.21, "learning_rate": 5.955268172305002e-05, "loss": 0.0763, "step": 82560 }, { "epoch": 23.22, "learning_rate": 5.953393933714428e-05, "loss": 0.0613, "step": 82590 }, { "epoch": 23.23, "learning_rate": 5.9515196951238564e-05, "loss": 0.0752, "step": 82620 }, { "epoch": 23.24, "learning_rate": 5.949645456533284e-05, "loss": 0.0613, "step": 82650 }, { "epoch": 23.24, "learning_rate": 5.947771217942711e-05, "loss": 0.0709, "step": 82680 }, { "epoch": 23.25, "learning_rate": 5.945896979352138e-05, "loss": 0.0708, "step": 82710 }, { "epoch": 23.26, "learning_rate": 5.9440227407615654e-05, "loss": 0.0616, "step": 82740 }, { "epoch": 23.27, "learning_rate": 5.9421485021709935e-05, "loss": 0.0695, "step": 82770 }, { "epoch": 23.28, "learning_rate": 5.940274263580421e-05, "loss": 0.0621, "step": 82800 }, { "epoch": 23.29, "learning_rate": 5.938400024989848e-05, "loss": 0.0664, "step": 82830 }, { "epoch": 23.29, "learning_rate": 5.936525786399275e-05, "loss": 0.0682, "step": 82860 }, { "epoch": 23.3, "learning_rate": 5.9346515478087025e-05, "loss": 0.0601, "step": 82890 }, { "epoch": 23.31, "learning_rate": 5.9327773092181306e-05, "loss": 0.0691, "step": 82920 }, { "epoch": 23.32, "learning_rate": 5.930903070627558e-05, "loss": 0.062, "step": 82950 }, { "epoch": 23.33, "learning_rate": 5.929028832036986e-05, "loss": 0.067, "step": 82980 }, { "epoch": 23.34, "learning_rate": 5.927154593446412e-05, "loss": 0.07, "step": 83010 }, { "epoch": 23.35, "learning_rate": 5.92528035485584e-05, "loss": 0.0639, "step": 83040 }, { "epoch": 23.35, "learning_rate": 5.9234061162652677e-05, "loss": 0.0749, "step": 83070 }, { "epoch": 23.36, "learning_rate": 5.921531877674695e-05, "loss": 0.0656, "step": 83100 }, { "epoch": 23.37, "learning_rate": 5.919657639084122e-05, "loss": 0.075, "step": 83130 }, { "epoch": 23.38, "learning_rate": 5.917783400493549e-05, "loss": 0.0749, "step": 83160 }, { "epoch": 23.39, "learning_rate": 5.915909161902977e-05, "loss": 0.0669, "step": 83190 }, { "epoch": 23.4, "learning_rate": 5.914034923312405e-05, "loss": 0.0713, "step": 83220 }, { "epoch": 23.4, "learning_rate": 5.912160684721832e-05, "loss": 0.0618, "step": 83250 }, { "epoch": 23.41, "learning_rate": 5.910286446131259e-05, "loss": 0.0689, "step": 83280 }, { "epoch": 23.42, "learning_rate": 5.908412207540687e-05, "loss": 0.0702, "step": 83310 }, { "epoch": 23.43, "learning_rate": 5.9065379689501144e-05, "loss": 0.0641, "step": 83340 }, { "epoch": 23.44, "learning_rate": 5.904663730359542e-05, "loss": 0.0687, "step": 83370 }, { "epoch": 23.45, "learning_rate": 5.90278949176897e-05, "loss": 0.0619, "step": 83400 }, { "epoch": 23.46, "learning_rate": 5.900915253178396e-05, "loss": 0.0723, "step": 83430 }, { "epoch": 23.46, "learning_rate": 5.899041014587824e-05, "loss": 0.0712, "step": 83460 }, { "epoch": 23.47, "learning_rate": 5.8971667759972515e-05, "loss": 0.0631, "step": 83490 }, { "epoch": 23.48, "learning_rate": 5.895292537406679e-05, "loss": 0.0713, "step": 83520 }, { "epoch": 23.49, "learning_rate": 5.893418298816106e-05, "loss": 0.0622, "step": 83550 }, { "epoch": 23.5, "learning_rate": 5.891544060225533e-05, "loss": 0.0719, "step": 83580 }, { "epoch": 23.51, "learning_rate": 5.889669821634961e-05, "loss": 0.0734, "step": 83610 }, { "epoch": 23.51, "learning_rate": 5.8877955830443886e-05, "loss": 0.0612, "step": 83640 }, { "epoch": 23.52, "learning_rate": 5.885921344453816e-05, "loss": 0.0734, "step": 83670 }, { "epoch": 23.53, "learning_rate": 5.884047105863243e-05, "loss": 0.0608, "step": 83700 }, { "epoch": 23.54, "learning_rate": 5.882172867272671e-05, "loss": 0.0667, "step": 83730 }, { "epoch": 23.55, "learning_rate": 5.880298628682098e-05, "loss": 0.071, "step": 83760 }, { "epoch": 23.56, "learning_rate": 5.878424390091526e-05, "loss": 0.0616, "step": 83790 }, { "epoch": 23.56, "learning_rate": 5.876550151500954e-05, "loss": 0.0768, "step": 83820 }, { "epoch": 23.57, "learning_rate": 5.87467591291038e-05, "loss": 0.0648, "step": 83850 }, { "epoch": 23.58, "learning_rate": 5.872801674319808e-05, "loss": 0.0689, "step": 83880 }, { "epoch": 23.59, "learning_rate": 5.8709274357292354e-05, "loss": 0.0712, "step": 83910 }, { "epoch": 23.6, "learning_rate": 5.869053197138663e-05, "loss": 0.0642, "step": 83940 }, { "epoch": 23.61, "learning_rate": 5.8671789585480896e-05, "loss": 0.0776, "step": 83970 }, { "epoch": 23.62, "learning_rate": 5.865304719957517e-05, "loss": 0.0607, "step": 84000 }, { "epoch": 23.62, "learning_rate": 5.863430481366945e-05, "loss": 0.0679, "step": 84030 }, { "epoch": 23.63, "learning_rate": 5.8615562427763725e-05, "loss": 0.07, "step": 84060 }, { "epoch": 23.64, "learning_rate": 5.8596820041858006e-05, "loss": 0.0656, "step": 84090 }, { "epoch": 23.65, "learning_rate": 5.8578077655952267e-05, "loss": 0.0717, "step": 84120 }, { "epoch": 23.66, "learning_rate": 5.855933527004655e-05, "loss": 0.0632, "step": 84150 }, { "epoch": 23.67, "learning_rate": 5.854059288414082e-05, "loss": 0.0705, "step": 84180 }, { "epoch": 23.67, "learning_rate": 5.8521850498235096e-05, "loss": 0.0703, "step": 84210 }, { "epoch": 23.68, "learning_rate": 5.850310811232938e-05, "loss": 0.0623, "step": 84240 }, { "epoch": 23.69, "learning_rate": 5.848436572642364e-05, "loss": 0.0747, "step": 84270 }, { "epoch": 23.7, "learning_rate": 5.846562334051792e-05, "loss": 0.063, "step": 84300 }, { "epoch": 23.71, "learning_rate": 5.844688095461219e-05, "loss": 0.0739, "step": 84330 }, { "epoch": 23.72, "learning_rate": 5.842813856870647e-05, "loss": 0.0656, "step": 84360 }, { "epoch": 23.72, "learning_rate": 5.8409396182800734e-05, "loss": 0.0604, "step": 84390 }, { "epoch": 23.73, "learning_rate": 5.8390653796895015e-05, "loss": 0.0721, "step": 84420 }, { "epoch": 23.74, "learning_rate": 5.837191141098929e-05, "loss": 0.0658, "step": 84450 }, { "epoch": 23.75, "learning_rate": 5.8353169025083564e-05, "loss": 0.065, "step": 84480 }, { "epoch": 23.76, "learning_rate": 5.8334426639177845e-05, "loss": 0.0705, "step": 84510 }, { "epoch": 23.77, "learning_rate": 5.8315684253272105e-05, "loss": 0.0614, "step": 84540 }, { "epoch": 23.78, "learning_rate": 5.8296941867366386e-05, "loss": 0.0742, "step": 84570 }, { "epoch": 23.78, "learning_rate": 5.827819948146066e-05, "loss": 0.0656, "step": 84600 }, { "epoch": 23.79, "learning_rate": 5.8259457095554935e-05, "loss": 0.0648, "step": 84630 }, { "epoch": 23.8, "learning_rate": 5.82407147096492e-05, "loss": 0.074, "step": 84660 }, { "epoch": 23.81, "learning_rate": 5.8221972323743476e-05, "loss": 0.0629, "step": 84690 }, { "epoch": 23.82, "learning_rate": 5.820322993783776e-05, "loss": 0.073, "step": 84720 }, { "epoch": 23.83, "learning_rate": 5.818448755193203e-05, "loss": 0.062, "step": 84750 }, { "epoch": 23.83, "learning_rate": 5.8165745166026305e-05, "loss": 0.0652, "step": 84780 }, { "epoch": 23.84, "learning_rate": 5.814700278012057e-05, "loss": 0.0726, "step": 84810 }, { "epoch": 23.85, "learning_rate": 5.8128260394214854e-05, "loss": 0.0597, "step": 84840 }, { "epoch": 23.86, "learning_rate": 5.810951800830913e-05, "loss": 0.0739, "step": 84870 }, { "epoch": 23.87, "learning_rate": 5.80907756224034e-05, "loss": 0.0656, "step": 84900 }, { "epoch": 23.88, "learning_rate": 5.807203323649768e-05, "loss": 0.0699, "step": 84930 }, { "epoch": 23.89, "learning_rate": 5.8053290850591944e-05, "loss": 0.0676, "step": 84960 }, { "epoch": 23.89, "learning_rate": 5.8034548464686225e-05, "loss": 0.0635, "step": 84990 }, { "epoch": 23.9, "learning_rate": 5.80158060787805e-05, "loss": 0.0709, "step": 85020 }, { "epoch": 23.91, "learning_rate": 5.799706369287477e-05, "loss": 0.0632, "step": 85050 }, { "epoch": 23.92, "learning_rate": 5.797832130696904e-05, "loss": 0.0737, "step": 85080 }, { "epoch": 23.93, "learning_rate": 5.7959578921063315e-05, "loss": 0.0754, "step": 85110 }, { "epoch": 23.94, "learning_rate": 5.7940836535157596e-05, "loss": 0.063, "step": 85140 }, { "epoch": 23.94, "learning_rate": 5.792209414925187e-05, "loss": 0.0731, "step": 85170 }, { "epoch": 23.95, "learning_rate": 5.7903351763346144e-05, "loss": 0.0618, "step": 85200 }, { "epoch": 23.96, "learning_rate": 5.788460937744041e-05, "loss": 0.0697, "step": 85230 }, { "epoch": 23.97, "learning_rate": 5.786586699153469e-05, "loss": 0.069, "step": 85260 }, { "epoch": 23.98, "learning_rate": 5.784712460562897e-05, "loss": 0.063, "step": 85290 }, { "epoch": 23.99, "learning_rate": 5.782838221972324e-05, "loss": 0.072, "step": 85320 }, { "epoch": 23.99, "learning_rate": 5.780963983381752e-05, "loss": 0.0605, "step": 85350 }, { "epoch": 24.0, "eval_loss": 0.1094522774219513, "eval_runtime": 630.878, "eval_samples_per_second": 25.414, "eval_steps_per_second": 0.796, "eval_wer": 0.10262989095574086, "step": 85368 }, { "epoch": 24.0, "learning_rate": 5.779089744791178e-05, "loss": 0.0716, "step": 85380 }, { "epoch": 24.01, "learning_rate": 5.7772155062006063e-05, "loss": 0.0651, "step": 85410 }, { "epoch": 24.02, "learning_rate": 5.775341267610034e-05, "loss": 0.064, "step": 85440 }, { "epoch": 24.03, "learning_rate": 5.773467029019461e-05, "loss": 0.0738, "step": 85470 }, { "epoch": 24.04, "learning_rate": 5.771592790428888e-05, "loss": 0.0568, "step": 85500 }, { "epoch": 24.05, "learning_rate": 5.7697185518383153e-05, "loss": 0.0681, "step": 85530 }, { "epoch": 24.05, "learning_rate": 5.7678443132477434e-05, "loss": 0.063, "step": 85560 }, { "epoch": 24.06, "learning_rate": 5.765970074657171e-05, "loss": 0.0678, "step": 85590 }, { "epoch": 24.07, "learning_rate": 5.764095836066599e-05, "loss": 0.0677, "step": 85620 }, { "epoch": 24.08, "learning_rate": 5.762221597476025e-05, "loss": 0.062, "step": 85650 }, { "epoch": 24.09, "learning_rate": 5.760347358885453e-05, "loss": 0.0704, "step": 85680 }, { "epoch": 24.1, "learning_rate": 5.7584731202948805e-05, "loss": 0.0625, "step": 85710 }, { "epoch": 24.1, "learning_rate": 5.756598881704308e-05, "loss": 0.0695, "step": 85740 }, { "epoch": 24.11, "learning_rate": 5.754724643113736e-05, "loss": 0.0734, "step": 85770 }, { "epoch": 24.12, "learning_rate": 5.752850404523162e-05, "loss": 0.0571, "step": 85800 }, { "epoch": 24.13, "learning_rate": 5.75097616593259e-05, "loss": 0.0693, "step": 85830 }, { "epoch": 24.14, "learning_rate": 5.7491019273420176e-05, "loss": 0.06, "step": 85860 }, { "epoch": 24.15, "learning_rate": 5.747227688751445e-05, "loss": 0.0696, "step": 85890 }, { "epoch": 24.16, "learning_rate": 5.745353450160872e-05, "loss": 0.074, "step": 85920 }, { "epoch": 24.16, "learning_rate": 5.7434792115703e-05, "loss": 0.0605, "step": 85950 }, { "epoch": 24.17, "learning_rate": 5.741604972979727e-05, "loss": 0.0721, "step": 85980 }, { "epoch": 24.18, "learning_rate": 5.739730734389155e-05, "loss": 0.0674, "step": 86010 }, { "epoch": 24.19, "learning_rate": 5.737856495798583e-05, "loss": 0.0705, "step": 86040 }, { "epoch": 24.2, "learning_rate": 5.735982257208009e-05, "loss": 0.0727, "step": 86070 }, { "epoch": 24.21, "learning_rate": 5.734108018617437e-05, "loss": 0.0602, "step": 86100 }, { "epoch": 24.21, "learning_rate": 5.7322337800268644e-05, "loss": 0.0741, "step": 86130 }, { "epoch": 24.22, "learning_rate": 5.730359541436292e-05, "loss": 0.0636, "step": 86160 }, { "epoch": 24.23, "learning_rate": 5.72848530284572e-05, "loss": 0.0623, "step": 86190 }, { "epoch": 24.24, "learning_rate": 5.726611064255146e-05, "loss": 0.0734, "step": 86220 }, { "epoch": 24.25, "learning_rate": 5.724736825664574e-05, "loss": 0.0579, "step": 86250 }, { "epoch": 24.26, "learning_rate": 5.7228625870740015e-05, "loss": 0.0707, "step": 86280 }, { "epoch": 24.26, "learning_rate": 5.720988348483429e-05, "loss": 0.0649, "step": 86310 }, { "epoch": 24.27, "learning_rate": 5.719114109892856e-05, "loss": 0.0698, "step": 86340 }, { "epoch": 24.28, "learning_rate": 5.717239871302284e-05, "loss": 0.0752, "step": 86370 }, { "epoch": 24.29, "learning_rate": 5.715365632711711e-05, "loss": 0.0606, "step": 86400 }, { "epoch": 24.3, "learning_rate": 5.7134913941211386e-05, "loss": 0.0729, "step": 86430 }, { "epoch": 24.31, "learning_rate": 5.711617155530567e-05, "loss": 0.0614, "step": 86460 }, { "epoch": 24.32, "learning_rate": 5.709742916939993e-05, "loss": 0.0644, "step": 86490 }, { "epoch": 24.32, "learning_rate": 5.707868678349421e-05, "loss": 0.074, "step": 86520 }, { "epoch": 24.33, "learning_rate": 5.705994439758848e-05, "loss": 0.0584, "step": 86550 }, { "epoch": 24.34, "learning_rate": 5.704182675787961e-05, "loss": 0.0685, "step": 86580 }, { "epoch": 24.35, "learning_rate": 5.702308437197389e-05, "loss": 0.0673, "step": 86610 }, { "epoch": 24.36, "learning_rate": 5.7004341986068165e-05, "loss": 0.0714, "step": 86640 }, { "epoch": 24.37, "learning_rate": 5.698559960016243e-05, "loss": 0.0712, "step": 86670 }, { "epoch": 24.37, "learning_rate": 5.696685721425671e-05, "loss": 0.0583, "step": 86700 }, { "epoch": 24.38, "learning_rate": 5.694811482835099e-05, "loss": 0.0729, "step": 86730 }, { "epoch": 24.39, "learning_rate": 5.692937244244526e-05, "loss": 0.0615, "step": 86760 }, { "epoch": 24.4, "learning_rate": 5.6910630056539536e-05, "loss": 0.0648, "step": 86790 }, { "epoch": 24.41, "learning_rate": 5.6891887670633804e-05, "loss": 0.0729, "step": 86820 }, { "epoch": 24.42, "learning_rate": 5.687314528472808e-05, "loss": 0.0605, "step": 86850 }, { "epoch": 24.43, "learning_rate": 5.685440289882236e-05, "loss": 0.0729, "step": 86880 }, { "epoch": 24.43, "learning_rate": 5.683566051291663e-05, "loss": 0.0623, "step": 86910 }, { "epoch": 24.44, "learning_rate": 5.681691812701091e-05, "loss": 0.0662, "step": 86940 }, { "epoch": 24.45, "learning_rate": 5.6798175741105175e-05, "loss": 0.0737, "step": 86970 }, { "epoch": 24.46, "learning_rate": 5.677943335519945e-05, "loss": 0.0603, "step": 87000 }, { "epoch": 24.47, "learning_rate": 5.676069096929373e-05, "loss": 0.0676, "step": 87030 }, { "epoch": 24.48, "learning_rate": 5.6741948583388004e-05, "loss": 0.0618, "step": 87060 }, { "epoch": 24.48, "learning_rate": 5.672320619748227e-05, "loss": 0.065, "step": 87090 }, { "epoch": 24.49, "learning_rate": 5.6704463811576546e-05, "loss": 0.0732, "step": 87120 }, { "epoch": 24.5, "learning_rate": 5.6685721425670827e-05, "loss": 0.0606, "step": 87150 }, { "epoch": 24.51, "learning_rate": 5.66669790397651e-05, "loss": 0.0741, "step": 87180 }, { "epoch": 24.52, "learning_rate": 5.6648236653859375e-05, "loss": 0.0638, "step": 87210 }, { "epoch": 24.53, "learning_rate": 5.662949426795364e-05, "loss": 0.0631, "step": 87240 }, { "epoch": 24.53, "learning_rate": 5.6610751882047917e-05, "loss": 0.0698, "step": 87270 }, { "epoch": 24.54, "learning_rate": 5.65920094961422e-05, "loss": 0.06, "step": 87300 }, { "epoch": 24.55, "learning_rate": 5.657326711023647e-05, "loss": 0.0706, "step": 87330 }, { "epoch": 24.56, "learning_rate": 5.6554524724330746e-05, "loss": 0.0634, "step": 87360 }, { "epoch": 24.57, "learning_rate": 5.653578233842501e-05, "loss": 0.0666, "step": 87390 }, { "epoch": 24.58, "learning_rate": 5.651703995251929e-05, "loss": 0.0749, "step": 87420 }, { "epoch": 24.59, "learning_rate": 5.649829756661357e-05, "loss": 0.0614, "step": 87450 }, { "epoch": 24.59, "learning_rate": 5.647955518070784e-05, "loss": 0.0708, "step": 87480 }, { "epoch": 24.6, "learning_rate": 5.646081279480211e-05, "loss": 0.0624, "step": 87510 }, { "epoch": 24.61, "learning_rate": 5.6442070408896384e-05, "loss": 0.0672, "step": 87540 }, { "epoch": 24.62, "learning_rate": 5.6423328022990665e-05, "loss": 0.0718, "step": 87570 }, { "epoch": 24.63, "learning_rate": 5.640458563708494e-05, "loss": 0.059, "step": 87600 }, { "epoch": 24.64, "learning_rate": 5.6385843251179214e-05, "loss": 0.0733, "step": 87630 }, { "epoch": 24.64, "learning_rate": 5.636710086527348e-05, "loss": 0.0607, "step": 87660 }, { "epoch": 24.65, "learning_rate": 5.634898322556462e-05, "loss": 0.0657, "step": 87690 }, { "epoch": 24.66, "learning_rate": 5.633024083965889e-05, "loss": 0.0707, "step": 87720 }, { "epoch": 24.67, "learning_rate": 5.6311498453753164e-05, "loss": 0.0602, "step": 87750 }, { "epoch": 24.68, "learning_rate": 5.629275606784744e-05, "loss": 0.0665, "step": 87780 }, { "epoch": 24.69, "learning_rate": 5.627401368194172e-05, "loss": 0.065, "step": 87810 }, { "epoch": 24.69, "learning_rate": 5.6255271296035986e-05, "loss": 0.0652, "step": 87840 }, { "epoch": 24.7, "learning_rate": 5.623652891013026e-05, "loss": 0.0701, "step": 87870 }, { "epoch": 24.71, "learning_rate": 5.6217786524224535e-05, "loss": 0.0571, "step": 87900 }, { "epoch": 24.72, "learning_rate": 5.6199044138318816e-05, "loss": 0.0692, "step": 87930 }, { "epoch": 24.73, "learning_rate": 5.618030175241309e-05, "loss": 0.0617, "step": 87960 }, { "epoch": 24.74, "learning_rate": 5.616155936650736e-05, "loss": 0.0684, "step": 87990 }, { "epoch": 24.75, "learning_rate": 5.614281698060163e-05, "loss": 0.0758, "step": 88020 }, { "epoch": 24.75, "learning_rate": 5.6124074594695906e-05, "loss": 0.0627, "step": 88050 }, { "epoch": 24.76, "learning_rate": 5.6105332208790186e-05, "loss": 0.07, "step": 88080 }, { "epoch": 24.77, "learning_rate": 5.608658982288446e-05, "loss": 0.0656, "step": 88110 }, { "epoch": 24.78, "learning_rate": 5.606784743697873e-05, "loss": 0.0706, "step": 88140 }, { "epoch": 24.79, "learning_rate": 5.6049105051073e-05, "loss": 0.0702, "step": 88170 }, { "epoch": 24.8, "learning_rate": 5.6030362665167276e-05, "loss": 0.0591, "step": 88200 }, { "epoch": 24.8, "learning_rate": 5.601162027926156e-05, "loss": 0.0686, "step": 88230 }, { "epoch": 24.81, "learning_rate": 5.5992877893355825e-05, "loss": 0.0655, "step": 88260 }, { "epoch": 24.82, "learning_rate": 5.59741355074501e-05, "loss": 0.0697, "step": 88290 }, { "epoch": 24.83, "learning_rate": 5.595539312154437e-05, "loss": 0.0739, "step": 88320 }, { "epoch": 24.84, "learning_rate": 5.5936650735638654e-05, "loss": 0.0583, "step": 88350 }, { "epoch": 24.85, "learning_rate": 5.591790834973293e-05, "loss": 0.0707, "step": 88380 }, { "epoch": 24.86, "learning_rate": 5.5899165963827196e-05, "loss": 0.0634, "step": 88410 }, { "epoch": 24.86, "learning_rate": 5.588042357792147e-05, "loss": 0.0661, "step": 88440 }, { "epoch": 24.87, "learning_rate": 5.5861681192015744e-05, "loss": 0.0743, "step": 88470 }, { "epoch": 24.88, "learning_rate": 5.5842938806110025e-05, "loss": 0.0581, "step": 88500 }, { "epoch": 24.89, "learning_rate": 5.58241964202043e-05, "loss": 0.0681, "step": 88530 }, { "epoch": 24.9, "learning_rate": 5.580545403429857e-05, "loss": 0.0646, "step": 88560 }, { "epoch": 24.91, "learning_rate": 5.578671164839284e-05, "loss": 0.0675, "step": 88590 }, { "epoch": 24.91, "learning_rate": 5.576796926248712e-05, "loss": 0.0753, "step": 88620 }, { "epoch": 24.92, "learning_rate": 5.5749226876581396e-05, "loss": 0.0611, "step": 88650 }, { "epoch": 24.93, "learning_rate": 5.5730484490675664e-05, "loss": 0.0717, "step": 88680 }, { "epoch": 24.94, "learning_rate": 5.571174210476994e-05, "loss": 0.0637, "step": 88710 }, { "epoch": 24.95, "learning_rate": 5.569299971886421e-05, "loss": 0.0665, "step": 88740 }, { "epoch": 24.96, "learning_rate": 5.567425733295849e-05, "loss": 0.0753, "step": 88770 }, { "epoch": 24.96, "learning_rate": 5.565551494705277e-05, "loss": 0.0588, "step": 88800 }, { "epoch": 24.97, "learning_rate": 5.5636772561147034e-05, "loss": 0.0679, "step": 88830 }, { "epoch": 24.98, "learning_rate": 5.561803017524131e-05, "loss": 0.0613, "step": 88860 }, { "epoch": 24.99, "learning_rate": 5.559928778933558e-05, "loss": 0.0701, "step": 88890 }, { "epoch": 25.0, "learning_rate": 5.5580545403429864e-05, "loss": 0.0722, "step": 88920 }, { "epoch": 25.0, "eval_loss": 0.1143936961889267, "eval_runtime": 628.7306, "eval_samples_per_second": 25.501, "eval_steps_per_second": 0.798, "eval_wer": 0.10660816398946406, "step": 88925 }, { "epoch": 25.01, "learning_rate": 5.556180301752414e-05, "loss": 0.0631, "step": 88950 }, { "epoch": 25.02, "learning_rate": 5.5543060631618405e-05, "loss": 0.07, "step": 88980 }, { "epoch": 25.02, "learning_rate": 5.552431824571268e-05, "loss": 0.0542, "step": 89010 }, { "epoch": 25.03, "learning_rate": 5.550557585980696e-05, "loss": 0.0706, "step": 89040 }, { "epoch": 25.04, "learning_rate": 5.5486833473901235e-05, "loss": 0.0644, "step": 89070 }, { "epoch": 25.05, "learning_rate": 5.54680910879955e-05, "loss": 0.0628, "step": 89100 }, { "epoch": 25.06, "learning_rate": 5.5449348702089776e-05, "loss": 0.0723, "step": 89130 }, { "epoch": 25.07, "learning_rate": 5.543060631618405e-05, "loss": 0.0625, "step": 89160 }, { "epoch": 25.07, "learning_rate": 5.541186393027833e-05, "loss": 0.0683, "step": 89190 }, { "epoch": 25.08, "learning_rate": 5.5393121544372606e-05, "loss": 0.0675, "step": 89220 }, { "epoch": 25.09, "learning_rate": 5.537437915846687e-05, "loss": 0.0657, "step": 89250 }, { "epoch": 25.1, "learning_rate": 5.535563677256115e-05, "loss": 0.0654, "step": 89280 }, { "epoch": 25.11, "learning_rate": 5.533689438665542e-05, "loss": 0.0587, "step": 89310 }, { "epoch": 25.12, "learning_rate": 5.53181520007497e-05, "loss": 0.0687, "step": 89340 }, { "epoch": 25.13, "learning_rate": 5.529940961484398e-05, "loss": 0.063, "step": 89370 }, { "epoch": 25.13, "learning_rate": 5.5280667228938244e-05, "loss": 0.0588, "step": 89400 }, { "epoch": 25.14, "learning_rate": 5.526192484303252e-05, "loss": 0.0698, "step": 89430 }, { "epoch": 25.15, "learning_rate": 5.52431824571268e-05, "loss": 0.0578, "step": 89460 }, { "epoch": 25.16, "learning_rate": 5.522506481741793e-05, "loss": 0.0683, "step": 89490 }, { "epoch": 25.17, "learning_rate": 5.52063224315122e-05, "loss": 0.0622, "step": 89520 }, { "epoch": 25.18, "learning_rate": 5.518758004560648e-05, "loss": 0.0672, "step": 89550 }, { "epoch": 25.18, "learning_rate": 5.516883765970074e-05, "loss": 0.0685, "step": 89580 }, { "epoch": 25.19, "learning_rate": 5.5150095273795023e-05, "loss": 0.057, "step": 89610 }, { "epoch": 25.2, "learning_rate": 5.51313528878893e-05, "loss": 0.071, "step": 89640 }, { "epoch": 25.21, "learning_rate": 5.511261050198357e-05, "loss": 0.0644, "step": 89670 }, { "epoch": 25.22, "learning_rate": 5.509386811607785e-05, "loss": 0.0595, "step": 89700 }, { "epoch": 25.23, "learning_rate": 5.507512573017212e-05, "loss": 0.0692, "step": 89730 }, { "epoch": 25.23, "learning_rate": 5.5056383344266394e-05, "loss": 0.0561, "step": 89760 }, { "epoch": 25.24, "learning_rate": 5.503764095836067e-05, "loss": 0.0681, "step": 89790 }, { "epoch": 25.25, "learning_rate": 5.501889857245495e-05, "loss": 0.06, "step": 89820 }, { "epoch": 25.26, "learning_rate": 5.500015618654921e-05, "loss": 0.0626, "step": 89850 }, { "epoch": 25.27, "learning_rate": 5.498141380064349e-05, "loss": 0.0717, "step": 89880 }, { "epoch": 25.28, "learning_rate": 5.4962671414737765e-05, "loss": 0.0613, "step": 89910 }, { "epoch": 25.29, "learning_rate": 5.494392902883204e-05, "loss": 0.0667, "step": 89940 }, { "epoch": 25.29, "learning_rate": 5.492518664292632e-05, "loss": 0.0636, "step": 89970 }, { "epoch": 25.3, "learning_rate": 5.490644425702058e-05, "loss": 0.0655, "step": 90000 }, { "epoch": 25.31, "learning_rate": 5.488770187111486e-05, "loss": 0.0711, "step": 90030 }, { "epoch": 25.32, "learning_rate": 5.4868959485209136e-05, "loss": 0.056, "step": 90060 }, { "epoch": 25.33, "learning_rate": 5.485021709930341e-05, "loss": 0.0722, "step": 90090 }, { "epoch": 25.34, "learning_rate": 5.483147471339769e-05, "loss": 0.0665, "step": 90120 }, { "epoch": 25.34, "learning_rate": 5.481273232749196e-05, "loss": 0.0634, "step": 90150 }, { "epoch": 25.35, "learning_rate": 5.479398994158623e-05, "loss": 0.0706, "step": 90180 }, { "epoch": 25.36, "learning_rate": 5.477524755568051e-05, "loss": 0.0586, "step": 90210 }, { "epoch": 25.37, "learning_rate": 5.475650516977479e-05, "loss": 0.0655, "step": 90240 }, { "epoch": 25.38, "learning_rate": 5.473776278386905e-05, "loss": 0.0638, "step": 90270 }, { "epoch": 25.39, "learning_rate": 5.471902039796333e-05, "loss": 0.0637, "step": 90300 }, { "epoch": 25.39, "learning_rate": 5.4700278012057604e-05, "loss": 0.0698, "step": 90330 }, { "epoch": 25.4, "learning_rate": 5.468153562615188e-05, "loss": 0.0572, "step": 90360 }, { "epoch": 25.41, "learning_rate": 5.466279324024616e-05, "loss": 0.0693, "step": 90390 }, { "epoch": 25.42, "learning_rate": 5.464405085434042e-05, "loss": 0.062, "step": 90420 }, { "epoch": 25.43, "learning_rate": 5.46253084684347e-05, "loss": 0.0624, "step": 90450 }, { "epoch": 25.44, "learning_rate": 5.4606566082528975e-05, "loss": 0.0695, "step": 90480 }, { "epoch": 25.45, "learning_rate": 5.4587823696623256e-05, "loss": 0.0575, "step": 90510 }, { "epoch": 25.45, "learning_rate": 5.456908131071753e-05, "loss": 0.0671, "step": 90540 }, { "epoch": 25.46, "learning_rate": 5.45503389248118e-05, "loss": 0.0662, "step": 90570 }, { "epoch": 25.47, "learning_rate": 5.453159653890607e-05, "loss": 0.0626, "step": 90600 }, { "epoch": 25.48, "learning_rate": 5.4512854153000346e-05, "loss": 0.0715, "step": 90630 }, { "epoch": 25.49, "learning_rate": 5.449411176709463e-05, "loss": 0.0581, "step": 90660 }, { "epoch": 25.5, "learning_rate": 5.447536938118889e-05, "loss": 0.0669, "step": 90690 }, { "epoch": 25.5, "learning_rate": 5.445662699528317e-05, "loss": 0.0708, "step": 90720 }, { "epoch": 25.51, "learning_rate": 5.443788460937744e-05, "loss": 0.0649, "step": 90750 }, { "epoch": 25.52, "learning_rate": 5.441914222347172e-05, "loss": 0.0704, "step": 90780 }, { "epoch": 25.53, "learning_rate": 5.4400399837566e-05, "loss": 0.0619, "step": 90810 }, { "epoch": 25.54, "learning_rate": 5.438165745166026e-05, "loss": 0.0708, "step": 90840 }, { "epoch": 25.55, "learning_rate": 5.436291506575454e-05, "loss": 0.0616, "step": 90870 }, { "epoch": 25.56, "learning_rate": 5.4344172679848814e-05, "loss": 0.0651, "step": 90900 }, { "epoch": 25.56, "learning_rate": 5.4325430293943095e-05, "loss": 0.069, "step": 90930 }, { "epoch": 25.57, "learning_rate": 5.4306687908037355e-05, "loss": 0.0606, "step": 90960 }, { "epoch": 25.58, "learning_rate": 5.4287945522131636e-05, "loss": 0.0689, "step": 90990 }, { "epoch": 25.59, "learning_rate": 5.426920313622591e-05, "loss": 0.0645, "step": 91020 }, { "epoch": 25.6, "learning_rate": 5.4250460750320185e-05, "loss": 0.0606, "step": 91050 }, { "epoch": 25.61, "learning_rate": 5.4231718364414466e-05, "loss": 0.0699, "step": 91080 }, { "epoch": 25.61, "learning_rate": 5.4212975978508726e-05, "loss": 0.0595, "step": 91110 }, { "epoch": 25.62, "learning_rate": 5.419423359260301e-05, "loss": 0.0687, "step": 91140 }, { "epoch": 25.63, "learning_rate": 5.417549120669728e-05, "loss": 0.0632, "step": 91170 }, { "epoch": 25.64, "learning_rate": 5.4156748820791556e-05, "loss": 0.0632, "step": 91200 }, { "epoch": 25.65, "learning_rate": 5.4138006434885837e-05, "loss": 0.072, "step": 91230 }, { "epoch": 25.66, "learning_rate": 5.4119264048980104e-05, "loss": 0.0603, "step": 91260 }, { "epoch": 25.66, "learning_rate": 5.410052166307438e-05, "loss": 0.0695, "step": 91290 }, { "epoch": 25.67, "learning_rate": 5.408177927716865e-05, "loss": 0.0663, "step": 91320 }, { "epoch": 25.68, "learning_rate": 5.406303689126293e-05, "loss": 0.0639, "step": 91350 }, { "epoch": 25.69, "learning_rate": 5.4044294505357194e-05, "loss": 0.0713, "step": 91380 }, { "epoch": 25.7, "learning_rate": 5.4025552119451475e-05, "loss": 0.063, "step": 91410 }, { "epoch": 25.71, "learning_rate": 5.400680973354575e-05, "loss": 0.0682, "step": 91440 }, { "epoch": 25.72, "learning_rate": 5.398806734764002e-05, "loss": 0.0637, "step": 91470 }, { "epoch": 25.72, "learning_rate": 5.3969324961734304e-05, "loss": 0.0654, "step": 91500 }, { "epoch": 25.73, "learning_rate": 5.3950582575828565e-05, "loss": 0.0693, "step": 91530 }, { "epoch": 25.74, "learning_rate": 5.3931840189922846e-05, "loss": 0.0592, "step": 91560 }, { "epoch": 25.75, "learning_rate": 5.391309780401712e-05, "loss": 0.0687, "step": 91590 }, { "epoch": 25.76, "learning_rate": 5.3894355418111394e-05, "loss": 0.0625, "step": 91620 }, { "epoch": 25.77, "learning_rate": 5.3875613032205675e-05, "loss": 0.0636, "step": 91650 }, { "epoch": 25.77, "learning_rate": 5.385687064629994e-05, "loss": 0.0687, "step": 91680 }, { "epoch": 25.78, "learning_rate": 5.383812826039422e-05, "loss": 0.0618, "step": 91710 }, { "epoch": 25.79, "learning_rate": 5.381938587448849e-05, "loss": 0.0699, "step": 91740 }, { "epoch": 25.8, "learning_rate": 5.380064348858277e-05, "loss": 0.0626, "step": 91770 }, { "epoch": 25.81, "learning_rate": 5.378190110267703e-05, "loss": 0.0649, "step": 91800 }, { "epoch": 25.82, "learning_rate": 5.3763158716771314e-05, "loss": 0.0729, "step": 91830 }, { "epoch": 25.83, "learning_rate": 5.374441633086559e-05, "loss": 0.0576, "step": 91860 }, { "epoch": 25.83, "learning_rate": 5.372567394495986e-05, "loss": 0.0639, "step": 91890 }, { "epoch": 25.84, "learning_rate": 5.370693155905414e-05, "loss": 0.0648, "step": 91920 }, { "epoch": 25.85, "learning_rate": 5.3688189173148404e-05, "loss": 0.0661, "step": 91950 }, { "epoch": 25.86, "learning_rate": 5.3669446787242684e-05, "loss": 0.07, "step": 91980 }, { "epoch": 25.87, "learning_rate": 5.365070440133696e-05, "loss": 0.0577, "step": 92010 }, { "epoch": 25.88, "learning_rate": 5.363196201543124e-05, "loss": 0.0656, "step": 92040 }, { "epoch": 25.88, "learning_rate": 5.3613219629525514e-05, "loss": 0.0624, "step": 92070 }, { "epoch": 25.89, "learning_rate": 5.359447724361978e-05, "loss": 0.0605, "step": 92100 }, { "epoch": 25.9, "learning_rate": 5.3575734857714055e-05, "loss": 0.0716, "step": 92130 }, { "epoch": 25.91, "learning_rate": 5.355699247180833e-05, "loss": 0.0552, "step": 92160 }, { "epoch": 25.92, "learning_rate": 5.353825008590261e-05, "loss": 0.0679, "step": 92190 }, { "epoch": 25.93, "learning_rate": 5.351950769999687e-05, "loss": 0.065, "step": 92220 }, { "epoch": 25.93, "learning_rate": 5.350076531409115e-05, "loss": 0.0645, "step": 92250 }, { "epoch": 25.94, "learning_rate": 5.3482022928185426e-05, "loss": 0.0723, "step": 92280 }, { "epoch": 25.95, "learning_rate": 5.34632805422797e-05, "loss": 0.0594, "step": 92310 }, { "epoch": 25.96, "learning_rate": 5.344453815637398e-05, "loss": 0.069, "step": 92340 }, { "epoch": 25.97, "learning_rate": 5.342579577046824e-05, "loss": 0.0617, "step": 92370 }, { "epoch": 25.98, "learning_rate": 5.340705338456252e-05, "loss": 0.0655, "step": 92400 }, { "epoch": 25.99, "learning_rate": 5.33883109986568e-05, "loss": 0.0662, "step": 92430 }, { "epoch": 25.99, "learning_rate": 5.336956861275108e-05, "loss": 0.0597, "step": 92460 }, { "epoch": 26.0, "eval_loss": 0.10869389772415161, "eval_runtime": 630.2477, "eval_samples_per_second": 25.439, "eval_steps_per_second": 0.797, "eval_wer": 0.10220681560738608, "step": 92482 }, { "epoch": 26.0, "learning_rate": 5.335082622684535e-05, "loss": 0.0729, "step": 92490 }, { "epoch": 26.01, "learning_rate": 5.333208384093962e-05, "loss": 0.0565, "step": 92520 }, { "epoch": 26.02, "learning_rate": 5.3313341455033894e-05, "loss": 0.0647, "step": 92550 }, { "epoch": 26.03, "learning_rate": 5.329459906912817e-05, "loss": 0.0654, "step": 92580 }, { "epoch": 26.04, "learning_rate": 5.327585668322245e-05, "loss": 0.0605, "step": 92610 }, { "epoch": 26.04, "learning_rate": 5.325711429731671e-05, "loss": 0.068, "step": 92640 }, { "epoch": 26.05, "learning_rate": 5.323837191141099e-05, "loss": 0.062, "step": 92670 }, { "epoch": 26.06, "learning_rate": 5.3219629525505265e-05, "loss": 0.0692, "step": 92700 }, { "epoch": 26.07, "learning_rate": 5.320088713959954e-05, "loss": 0.0614, "step": 92730 }, { "epoch": 26.08, "learning_rate": 5.318214475369382e-05, "loss": 0.0604, "step": 92760 }, { "epoch": 26.09, "learning_rate": 5.316340236778809e-05, "loss": 0.0641, "step": 92790 }, { "epoch": 26.1, "learning_rate": 5.314465998188236e-05, "loss": 0.0565, "step": 92820 }, { "epoch": 26.1, "learning_rate": 5.3125917595976636e-05, "loss": 0.066, "step": 92850 }, { "epoch": 26.11, "learning_rate": 5.310717521007092e-05, "loss": 0.0658, "step": 92880 }, { "epoch": 26.12, "learning_rate": 5.308843282416519e-05, "loss": 0.0601, "step": 92910 }, { "epoch": 26.13, "learning_rate": 5.306969043825946e-05, "loss": 0.0706, "step": 92940 }, { "epoch": 26.14, "learning_rate": 5.305094805235373e-05, "loss": 0.0562, "step": 92970 }, { "epoch": 26.15, "learning_rate": 5.303220566644801e-05, "loss": 0.0639, "step": 93000 }, { "epoch": 26.15, "learning_rate": 5.301346328054229e-05, "loss": 0.0657, "step": 93030 }, { "epoch": 26.16, "learning_rate": 5.299472089463655e-05, "loss": 0.0587, "step": 93060 }, { "epoch": 26.17, "learning_rate": 5.297597850873083e-05, "loss": 0.0669, "step": 93090 }, { "epoch": 26.18, "learning_rate": 5.2957236122825104e-05, "loss": 0.0595, "step": 93120 }, { "epoch": 26.19, "learning_rate": 5.293849373691938e-05, "loss": 0.0666, "step": 93150 }, { "epoch": 26.2, "learning_rate": 5.291975135101366e-05, "loss": 0.0663, "step": 93180 }, { "epoch": 26.2, "learning_rate": 5.2901008965107926e-05, "loss": 0.0608, "step": 93210 }, { "epoch": 26.21, "learning_rate": 5.28822665792022e-05, "loss": 0.0675, "step": 93240 }, { "epoch": 26.22, "learning_rate": 5.2863524193296475e-05, "loss": 0.0614, "step": 93270 }, { "epoch": 26.23, "learning_rate": 5.2844781807390756e-05, "loss": 0.0622, "step": 93300 }, { "epoch": 26.24, "learning_rate": 5.282603942148503e-05, "loss": 0.0633, "step": 93330 }, { "epoch": 26.25, "learning_rate": 5.28072970355793e-05, "loss": 0.0621, "step": 93360 }, { "epoch": 26.26, "learning_rate": 5.278855464967357e-05, "loss": 0.0665, "step": 93390 }, { "epoch": 26.26, "learning_rate": 5.2769812263767846e-05, "loss": 0.0584, "step": 93420 }, { "epoch": 26.27, "learning_rate": 5.275106987786213e-05, "loss": 0.0636, "step": 93450 }, { "epoch": 26.28, "learning_rate": 5.273232749195639e-05, "loss": 0.0667, "step": 93480 }, { "epoch": 26.29, "learning_rate": 5.271358510605067e-05, "loss": 0.0599, "step": 93510 }, { "epoch": 26.3, "learning_rate": 5.269484272014494e-05, "loss": 0.0681, "step": 93540 }, { "epoch": 26.31, "learning_rate": 5.267610033423922e-05, "loss": 0.0574, "step": 93570 }, { "epoch": 26.31, "learning_rate": 5.26573579483335e-05, "loss": 0.0631, "step": 93600 }, { "epoch": 26.32, "learning_rate": 5.2638615562427765e-05, "loss": 0.0651, "step": 93630 }, { "epoch": 26.33, "learning_rate": 5.261987317652204e-05, "loss": 0.0595, "step": 93660 }, { "epoch": 26.34, "learning_rate": 5.260113079061631e-05, "loss": 0.0676, "step": 93690 }, { "epoch": 26.35, "learning_rate": 5.2582388404710594e-05, "loss": 0.0608, "step": 93720 }, { "epoch": 26.36, "learning_rate": 5.256364601880487e-05, "loss": 0.0653, "step": 93750 }, { "epoch": 26.36, "learning_rate": 5.2544903632899136e-05, "loss": 0.0653, "step": 93780 }, { "epoch": 26.37, "learning_rate": 5.252616124699341e-05, "loss": 0.0629, "step": 93810 }, { "epoch": 26.38, "learning_rate": 5.2507418861087684e-05, "loss": 0.0695, "step": 93840 }, { "epoch": 26.39, "learning_rate": 5.2488676475181965e-05, "loss": 0.0593, "step": 93870 }, { "epoch": 26.4, "learning_rate": 5.2469934089276226e-05, "loss": 0.065, "step": 93900 }, { "epoch": 26.41, "learning_rate": 5.245119170337051e-05, "loss": 0.0616, "step": 93930 }, { "epoch": 26.42, "learning_rate": 5.243244931746478e-05, "loss": 0.0582, "step": 93960 }, { "epoch": 26.42, "learning_rate": 5.241370693155906e-05, "loss": 0.0676, "step": 93990 }, { "epoch": 26.43, "learning_rate": 5.2394964545653336e-05, "loss": 0.0589, "step": 94020 }, { "epoch": 26.44, "learning_rate": 5.2376222159747604e-05, "loss": 0.0667, "step": 94050 }, { "epoch": 26.45, "learning_rate": 5.235747977384188e-05, "loss": 0.0653, "step": 94080 }, { "epoch": 26.46, "learning_rate": 5.233873738793615e-05, "loss": 0.0577, "step": 94110 }, { "epoch": 26.47, "learning_rate": 5.231999500203043e-05, "loss": 0.0691, "step": 94140 }, { "epoch": 26.47, "learning_rate": 5.230125261612471e-05, "loss": 0.0584, "step": 94170 }, { "epoch": 26.48, "learning_rate": 5.2282510230218975e-05, "loss": 0.065, "step": 94200 }, { "epoch": 26.49, "learning_rate": 5.226376784431325e-05, "loss": 0.0644, "step": 94230 }, { "epoch": 26.5, "learning_rate": 5.224502545840752e-05, "loss": 0.0591, "step": 94260 }, { "epoch": 26.51, "learning_rate": 5.2226283072501804e-05, "loss": 0.0649, "step": 94290 }, { "epoch": 26.52, "learning_rate": 5.220754068659607e-05, "loss": 0.0591, "step": 94320 }, { "epoch": 26.53, "learning_rate": 5.2188798300690346e-05, "loss": 0.0653, "step": 94350 }, { "epoch": 26.53, "learning_rate": 5.217005591478462e-05, "loss": 0.0668, "step": 94380 }, { "epoch": 26.54, "learning_rate": 5.21513135288789e-05, "loss": 0.0586, "step": 94410 }, { "epoch": 26.55, "learning_rate": 5.2132571142973175e-05, "loss": 0.0694, "step": 94440 }, { "epoch": 26.56, "learning_rate": 5.211382875706744e-05, "loss": 0.0607, "step": 94470 }, { "epoch": 26.57, "learning_rate": 5.2095086371161717e-05, "loss": 0.0662, "step": 94500 }, { "epoch": 26.58, "learning_rate": 5.207634398525599e-05, "loss": 0.0668, "step": 94530 }, { "epoch": 26.58, "learning_rate": 5.205760159935027e-05, "loss": 0.0608, "step": 94560 }, { "epoch": 26.59, "learning_rate": 5.203885921344453e-05, "loss": 0.0673, "step": 94590 }, { "epoch": 26.6, "learning_rate": 5.202011682753881e-05, "loss": 0.0627, "step": 94620 }, { "epoch": 26.61, "learning_rate": 5.200137444163309e-05, "loss": 0.0657, "step": 94650 }, { "epoch": 26.62, "learning_rate": 5.198263205572736e-05, "loss": 0.0628, "step": 94680 }, { "epoch": 26.63, "learning_rate": 5.196388966982164e-05, "loss": 0.0574, "step": 94710 }, { "epoch": 26.63, "learning_rate": 5.194514728391591e-05, "loss": 0.0683, "step": 94740 }, { "epoch": 26.64, "learning_rate": 5.1926404898010184e-05, "loss": 0.0574, "step": 94770 }, { "epoch": 26.65, "learning_rate": 5.190766251210446e-05, "loss": 0.0633, "step": 94800 }, { "epoch": 26.66, "learning_rate": 5.188892012619874e-05, "loss": 0.0629, "step": 94830 }, { "epoch": 26.67, "learning_rate": 5.1870177740293014e-05, "loss": 0.0647, "step": 94860 }, { "epoch": 26.68, "learning_rate": 5.185143535438728e-05, "loss": 0.0656, "step": 94890 }, { "epoch": 26.69, "learning_rate": 5.1832692968481555e-05, "loss": 0.0545, "step": 94920 }, { "epoch": 26.69, "learning_rate": 5.181395058257583e-05, "loss": 0.0653, "step": 94950 }, { "epoch": 26.7, "learning_rate": 5.179520819667011e-05, "loss": 0.0662, "step": 94980 }, { "epoch": 26.71, "learning_rate": 5.177646581076437e-05, "loss": 0.0585, "step": 95010 }, { "epoch": 26.72, "learning_rate": 5.175772342485865e-05, "loss": 0.0705, "step": 95040 }, { "epoch": 26.73, "learning_rate": 5.1738981038952926e-05, "loss": 0.0596, "step": 95070 }, { "epoch": 26.74, "learning_rate": 5.172023865304721e-05, "loss": 0.0637, "step": 95100 }, { "epoch": 26.74, "learning_rate": 5.170149626714148e-05, "loss": 0.0634, "step": 95130 }, { "epoch": 26.75, "learning_rate": 5.168275388123575e-05, "loss": 0.0633, "step": 95160 }, { "epoch": 26.76, "learning_rate": 5.166401149533002e-05, "loss": 0.0679, "step": 95190 }, { "epoch": 26.77, "learning_rate": 5.16452691094243e-05, "loss": 0.058, "step": 95220 }, { "epoch": 26.78, "learning_rate": 5.162652672351858e-05, "loss": 0.0693, "step": 95250 }, { "epoch": 26.79, "learning_rate": 5.160778433761285e-05, "loss": 0.0654, "step": 95280 }, { "epoch": 26.79, "learning_rate": 5.158904195170712e-05, "loss": 0.0623, "step": 95310 }, { "epoch": 26.8, "learning_rate": 5.1570299565801394e-05, "loss": 0.0671, "step": 95340 }, { "epoch": 26.81, "learning_rate": 5.155155717989567e-05, "loss": 0.0601, "step": 95370 }, { "epoch": 26.82, "learning_rate": 5.153281479398995e-05, "loss": 0.0634, "step": 95400 }, { "epoch": 26.83, "learning_rate": 5.151407240808421e-05, "loss": 0.0642, "step": 95430 }, { "epoch": 26.84, "learning_rate": 5.149533002217849e-05, "loss": 0.0602, "step": 95460 }, { "epoch": 26.85, "learning_rate": 5.1476587636272765e-05, "loss": 0.0716, "step": 95490 }, { "epoch": 26.85, "learning_rate": 5.1457845250367046e-05, "loss": 0.0635, "step": 95520 }, { "epoch": 26.86, "learning_rate": 5.143972761065817e-05, "loss": 0.0642, "step": 95550 }, { "epoch": 26.87, "learning_rate": 5.142098522475245e-05, "loss": 0.0648, "step": 95580 }, { "epoch": 26.88, "learning_rate": 5.140224283884673e-05, "loss": 0.0621, "step": 95610 }, { "epoch": 26.89, "learning_rate": 5.138350045294099e-05, "loss": 0.0653, "step": 95640 }, { "epoch": 26.9, "learning_rate": 5.136475806703527e-05, "loss": 0.0552, "step": 95670 }, { "epoch": 26.9, "learning_rate": 5.1346015681129544e-05, "loss": 0.0671, "step": 95700 }, { "epoch": 26.91, "learning_rate": 5.132727329522382e-05, "loss": 0.0613, "step": 95730 }, { "epoch": 26.92, "learning_rate": 5.1308530909318086e-05, "loss": 0.0615, "step": 95760 }, { "epoch": 26.93, "learning_rate": 5.128978852341236e-05, "loss": 0.0678, "step": 95790 }, { "epoch": 26.94, "learning_rate": 5.127104613750664e-05, "loss": 0.0587, "step": 95820 }, { "epoch": 26.95, "learning_rate": 5.1252303751600915e-05, "loss": 0.0637, "step": 95850 }, { "epoch": 26.96, "learning_rate": 5.1233561365695196e-05, "loss": 0.0616, "step": 95880 }, { "epoch": 26.96, "learning_rate": 5.121481897978946e-05, "loss": 0.0634, "step": 95910 }, { "epoch": 26.97, "learning_rate": 5.119607659388374e-05, "loss": 0.0672, "step": 95940 }, { "epoch": 26.98, "learning_rate": 5.117733420797801e-05, "loss": 0.0604, "step": 95970 }, { "epoch": 26.99, "learning_rate": 5.1158591822072286e-05, "loss": 0.0658, "step": 96000 }, { "epoch": 27.0, "learning_rate": 5.113984943616657e-05, "loss": 0.062, "step": 96030 }, { "epoch": 27.0, "eval_loss": 0.10732191056013107, "eval_runtime": 630.3808, "eval_samples_per_second": 25.434, "eval_steps_per_second": 0.796, "eval_wer": 0.10270495271109413, "step": 96039 }, { "epoch": 27.01, "learning_rate": 5.112110705026083e-05, "loss": 0.0595, "step": 96060 }, { "epoch": 27.01, "learning_rate": 5.110236466435511e-05, "loss": 0.0678, "step": 96090 }, { "epoch": 27.02, "learning_rate": 5.108362227844938e-05, "loss": 0.0525, "step": 96120 }, { "epoch": 27.03, "learning_rate": 5.106487989254366e-05, "loss": 0.0699, "step": 96150 }, { "epoch": 27.04, "learning_rate": 5.1046137506637924e-05, "loss": 0.0593, "step": 96180 }, { "epoch": 27.05, "learning_rate": 5.1027395120732205e-05, "loss": 0.0636, "step": 96210 }, { "epoch": 27.06, "learning_rate": 5.100865273482648e-05, "loss": 0.0704, "step": 96240 }, { "epoch": 27.06, "learning_rate": 5.0989910348920754e-05, "loss": 0.0575, "step": 96270 }, { "epoch": 27.07, "learning_rate": 5.0971167963015035e-05, "loss": 0.0617, "step": 96300 }, { "epoch": 27.08, "learning_rate": 5.0952425577109295e-05, "loss": 0.0576, "step": 96330 }, { "epoch": 27.09, "learning_rate": 5.0933683191203576e-05, "loss": 0.0571, "step": 96360 }, { "epoch": 27.1, "learning_rate": 5.091494080529785e-05, "loss": 0.0673, "step": 96390 }, { "epoch": 27.11, "learning_rate": 5.0896198419392125e-05, "loss": 0.0561, "step": 96420 }, { "epoch": 27.12, "learning_rate": 5.0877456033486406e-05, "loss": 0.0685, "step": 96450 }, { "epoch": 27.12, "learning_rate": 5.0858713647580666e-05, "loss": 0.0611, "step": 96480 }, { "epoch": 27.13, "learning_rate": 5.083997126167495e-05, "loss": 0.0629, "step": 96510 }, { "epoch": 27.14, "learning_rate": 5.082122887576922e-05, "loss": 0.0714, "step": 96540 }, { "epoch": 27.15, "learning_rate": 5.0802486489863496e-05, "loss": 0.0578, "step": 96570 }, { "epoch": 27.16, "learning_rate": 5.078374410395776e-05, "loss": 0.0619, "step": 96600 }, { "epoch": 27.17, "learning_rate": 5.0765001718052044e-05, "loss": 0.0582, "step": 96630 }, { "epoch": 27.17, "learning_rate": 5.074625933214632e-05, "loss": 0.0638, "step": 96660 }, { "epoch": 27.18, "learning_rate": 5.072751694624059e-05, "loss": 0.0711, "step": 96690 }, { "epoch": 27.19, "learning_rate": 5.0708774560334873e-05, "loss": 0.0598, "step": 96720 }, { "epoch": 27.2, "learning_rate": 5.0690032174429134e-05, "loss": 0.0692, "step": 96750 }, { "epoch": 27.21, "learning_rate": 5.0671289788523415e-05, "loss": 0.0596, "step": 96780 }, { "epoch": 27.22, "learning_rate": 5.065254740261769e-05, "loss": 0.0656, "step": 96810 }, { "epoch": 27.23, "learning_rate": 5.0633805016711963e-05, "loss": 0.0685, "step": 96840 }, { "epoch": 27.23, "learning_rate": 5.0615062630806244e-05, "loss": 0.0562, "step": 96870 }, { "epoch": 27.24, "learning_rate": 5.0596320244900505e-05, "loss": 0.065, "step": 96900 }, { "epoch": 27.25, "learning_rate": 5.0577577858994786e-05, "loss": 0.057, "step": 96930 }, { "epoch": 27.26, "learning_rate": 5.055883547308906e-05, "loss": 0.0637, "step": 96960 }, { "epoch": 27.27, "learning_rate": 5.054009308718334e-05, "loss": 0.0718, "step": 96990 }, { "epoch": 27.28, "learning_rate": 5.05213507012776e-05, "loss": 0.0564, "step": 97020 }, { "epoch": 27.28, "learning_rate": 5.050260831537188e-05, "loss": 0.0638, "step": 97050 }, { "epoch": 27.29, "learning_rate": 5.048386592946616e-05, "loss": 0.0578, "step": 97080 }, { "epoch": 27.3, "learning_rate": 5.046512354356043e-05, "loss": 0.064, "step": 97110 }, { "epoch": 27.31, "learning_rate": 5.044638115765471e-05, "loss": 0.066, "step": 97140 }, { "epoch": 27.32, "learning_rate": 5.042763877174897e-05, "loss": 0.0562, "step": 97170 }, { "epoch": 27.33, "learning_rate": 5.0408896385843254e-05, "loss": 0.0623, "step": 97200 }, { "epoch": 27.33, "learning_rate": 5.039015399993753e-05, "loss": 0.0625, "step": 97230 }, { "epoch": 27.34, "learning_rate": 5.03714116140318e-05, "loss": 0.0596, "step": 97260 }, { "epoch": 27.35, "learning_rate": 5.035266922812608e-05, "loss": 0.0703, "step": 97290 }, { "epoch": 27.36, "learning_rate": 5.0333926842220344e-05, "loss": 0.056, "step": 97320 }, { "epoch": 27.37, "learning_rate": 5.0315184456314625e-05, "loss": 0.0707, "step": 97350 }, { "epoch": 27.38, "learning_rate": 5.02964420704089e-05, "loss": 0.0571, "step": 97380 }, { "epoch": 27.39, "learning_rate": 5.027769968450318e-05, "loss": 0.0614, "step": 97410 }, { "epoch": 27.39, "learning_rate": 5.025895729859744e-05, "loss": 0.0656, "step": 97440 }, { "epoch": 27.4, "learning_rate": 5.024021491269172e-05, "loss": 0.0571, "step": 97470 }, { "epoch": 27.41, "learning_rate": 5.0221472526785996e-05, "loss": 0.0646, "step": 97500 }, { "epoch": 27.42, "learning_rate": 5.020273014088027e-05, "loss": 0.0554, "step": 97530 }, { "epoch": 27.43, "learning_rate": 5.018398775497455e-05, "loss": 0.0613, "step": 97560 }, { "epoch": 27.44, "learning_rate": 5.016524536906881e-05, "loss": 0.0668, "step": 97590 }, { "epoch": 27.44, "learning_rate": 5.014650298316309e-05, "loss": 0.0542, "step": 97620 }, { "epoch": 27.45, "learning_rate": 5.0127760597257367e-05, "loss": 0.0692, "step": 97650 }, { "epoch": 27.46, "learning_rate": 5.010901821135164e-05, "loss": 0.0579, "step": 97680 }, { "epoch": 27.47, "learning_rate": 5.009027582544592e-05, "loss": 0.0613, "step": 97710 }, { "epoch": 27.48, "learning_rate": 5.007153343954019e-05, "loss": 0.0703, "step": 97740 }, { "epoch": 27.49, "learning_rate": 5.005279105363446e-05, "loss": 0.0545, "step": 97770 }, { "epoch": 27.5, "learning_rate": 5.003404866772874e-05, "loss": 0.0627, "step": 97800 }, { "epoch": 27.5, "learning_rate": 5.001530628182302e-05, "loss": 0.0578, "step": 97830 }, { "epoch": 27.51, "learning_rate": 4.9997188642114146e-05, "loss": 0.0654, "step": 97860 }, { "epoch": 27.52, "learning_rate": 4.997844625620841e-05, "loss": 0.0674, "step": 97890 }, { "epoch": 27.53, "learning_rate": 4.9959703870302694e-05, "loss": 0.0545, "step": 97920 }, { "epoch": 27.54, "learning_rate": 4.994096148439696e-05, "loss": 0.0683, "step": 97950 }, { "epoch": 27.55, "learning_rate": 4.992221909849124e-05, "loss": 0.0593, "step": 97980 }, { "epoch": 27.55, "learning_rate": 4.990347671258551e-05, "loss": 0.0622, "step": 98010 }, { "epoch": 27.56, "learning_rate": 4.988473432667979e-05, "loss": 0.0662, "step": 98040 }, { "epoch": 27.57, "learning_rate": 4.9865991940774065e-05, "loss": 0.0581, "step": 98070 }, { "epoch": 27.58, "learning_rate": 4.984724955486833e-05, "loss": 0.0689, "step": 98100 }, { "epoch": 27.59, "learning_rate": 4.9828507168962614e-05, "loss": 0.0598, "step": 98130 }, { "epoch": 27.6, "learning_rate": 4.980976478305688e-05, "loss": 0.0653, "step": 98160 }, { "epoch": 27.6, "learning_rate": 4.979102239715116e-05, "loss": 0.0679, "step": 98190 }, { "epoch": 27.61, "learning_rate": 4.977228001124543e-05, "loss": 0.0583, "step": 98220 }, { "epoch": 27.62, "learning_rate": 4.975353762533971e-05, "loss": 0.0665, "step": 98250 }, { "epoch": 27.63, "learning_rate": 4.9734795239433985e-05, "loss": 0.0567, "step": 98280 }, { "epoch": 27.64, "learning_rate": 4.971605285352826e-05, "loss": 0.0628, "step": 98310 }, { "epoch": 27.65, "learning_rate": 4.969731046762253e-05, "loss": 0.0661, "step": 98340 }, { "epoch": 27.66, "learning_rate": 4.96785680817168e-05, "loss": 0.0534, "step": 98370 }, { "epoch": 27.66, "learning_rate": 4.965982569581108e-05, "loss": 0.0601, "step": 98400 }, { "epoch": 27.67, "learning_rate": 4.964108330990535e-05, "loss": 0.0605, "step": 98430 }, { "epoch": 27.68, "learning_rate": 4.962234092399963e-05, "loss": 0.0637, "step": 98460 }, { "epoch": 27.69, "learning_rate": 4.9603598538093904e-05, "loss": 0.0658, "step": 98490 }, { "epoch": 27.7, "learning_rate": 4.958485615218818e-05, "loss": 0.0579, "step": 98520 }, { "epoch": 27.71, "learning_rate": 4.956611376628245e-05, "loss": 0.0702, "step": 98550 }, { "epoch": 27.71, "learning_rate": 4.954737138037672e-05, "loss": 0.0553, "step": 98580 }, { "epoch": 27.72, "learning_rate": 4.9528628994471e-05, "loss": 0.0621, "step": 98610 }, { "epoch": 27.73, "learning_rate": 4.950988660856527e-05, "loss": 0.0653, "step": 98640 }, { "epoch": 27.74, "learning_rate": 4.949114422265955e-05, "loss": 0.0531, "step": 98670 }, { "epoch": 27.75, "learning_rate": 4.947240183675382e-05, "loss": 0.0667, "step": 98700 }, { "epoch": 27.76, "learning_rate": 4.94536594508481e-05, "loss": 0.0586, "step": 98730 }, { "epoch": 27.76, "learning_rate": 4.943491706494237e-05, "loss": 0.0685, "step": 98760 }, { "epoch": 27.77, "learning_rate": 4.941617467903664e-05, "loss": 0.0677, "step": 98790 }, { "epoch": 27.78, "learning_rate": 4.939743229313092e-05, "loss": 0.0566, "step": 98820 }, { "epoch": 27.79, "learning_rate": 4.937868990722519e-05, "loss": 0.0662, "step": 98850 }, { "epoch": 27.8, "learning_rate": 4.935994752131947e-05, "loss": 0.0593, "step": 98880 }, { "epoch": 27.81, "learning_rate": 4.934120513541374e-05, "loss": 0.0601, "step": 98910 }, { "epoch": 27.82, "learning_rate": 4.932246274950802e-05, "loss": 0.0646, "step": 98940 }, { "epoch": 27.82, "learning_rate": 4.930372036360229e-05, "loss": 0.0543, "step": 98970 }, { "epoch": 27.83, "learning_rate": 4.928497797769656e-05, "loss": 0.0674, "step": 99000 }, { "epoch": 27.84, "learning_rate": 4.926623559179084e-05, "loss": 0.0553, "step": 99030 }, { "epoch": 27.85, "learning_rate": 4.924749320588511e-05, "loss": 0.0593, "step": 99060 }, { "epoch": 27.86, "learning_rate": 4.922875081997939e-05, "loss": 0.0636, "step": 99090 }, { "epoch": 27.87, "learning_rate": 4.921000843407366e-05, "loss": 0.0572, "step": 99120 }, { "epoch": 27.87, "learning_rate": 4.9191266048167936e-05, "loss": 0.0644, "step": 99150 }, { "epoch": 27.88, "learning_rate": 4.917252366226221e-05, "loss": 0.0599, "step": 99180 }, { "epoch": 27.89, "learning_rate": 4.915378127635648e-05, "loss": 0.0647, "step": 99210 }, { "epoch": 27.9, "learning_rate": 4.913503889045076e-05, "loss": 0.0717, "step": 99240 }, { "epoch": 27.91, "learning_rate": 4.9116296504545026e-05, "loss": 0.0548, "step": 99270 }, { "epoch": 27.92, "learning_rate": 4.909755411863931e-05, "loss": 0.0657, "step": 99300 }, { "epoch": 27.93, "learning_rate": 4.907881173273358e-05, "loss": 0.0594, "step": 99330 }, { "epoch": 27.93, "learning_rate": 4.9060069346827855e-05, "loss": 0.0558, "step": 99360 }, { "epoch": 27.94, "learning_rate": 4.904132696092213e-05, "loss": 0.0672, "step": 99390 }, { "epoch": 27.95, "learning_rate": 4.90225845750164e-05, "loss": 0.0531, "step": 99420 }, { "epoch": 27.96, "learning_rate": 4.900384218911068e-05, "loss": 0.0662, "step": 99450 }, { "epoch": 27.97, "learning_rate": 4.8985099803204945e-05, "loss": 0.0613, "step": 99480 }, { "epoch": 27.98, "learning_rate": 4.8966357417299226e-05, "loss": 0.0614, "step": 99510 }, { "epoch": 27.98, "learning_rate": 4.89476150313935e-05, "loss": 0.0703, "step": 99540 }, { "epoch": 27.99, "learning_rate": 4.8928872645487775e-05, "loss": 0.0536, "step": 99570 }, { "epoch": 28.0, "eval_loss": 0.10675393790006638, "eval_runtime": 629.0591, "eval_samples_per_second": 25.487, "eval_steps_per_second": 0.798, "eval_wer": 0.10265036234356448, "step": 99596 }, { "epoch": 28.0, "learning_rate": 4.891013025958205e-05, "loss": 0.0698, "step": 99600 }, { "epoch": 28.01, "learning_rate": 4.889138787367632e-05, "loss": 0.0523, "step": 99630 }, { "epoch": 28.02, "learning_rate": 4.887327023396746e-05, "loss": 0.0634, "step": 99660 }, { "epoch": 28.03, "learning_rate": 4.8854527848061725e-05, "loss": 0.0593, "step": 99690 }, { "epoch": 28.03, "learning_rate": 4.8835785462156006e-05, "loss": 0.0598, "step": 99720 }, { "epoch": 28.04, "learning_rate": 4.881704307625027e-05, "loss": 0.0633, "step": 99750 }, { "epoch": 28.05, "learning_rate": 4.879830069034455e-05, "loss": 0.0548, "step": 99780 }, { "epoch": 28.06, "learning_rate": 4.877955830443882e-05, "loss": 0.0629, "step": 99810 }, { "epoch": 28.07, "learning_rate": 4.8760815918533096e-05, "loss": 0.0599, "step": 99840 }, { "epoch": 28.08, "learning_rate": 4.874207353262738e-05, "loss": 0.0584, "step": 99870 }, { "epoch": 28.09, "learning_rate": 4.8723331146721644e-05, "loss": 0.0631, "step": 99900 }, { "epoch": 28.09, "learning_rate": 4.8704588760815925e-05, "loss": 0.0546, "step": 99930 }, { "epoch": 28.1, "learning_rate": 4.868584637491019e-05, "loss": 0.0645, "step": 99960 }, { "epoch": 28.11, "learning_rate": 4.866710398900447e-05, "loss": 0.062, "step": 99990 }, { "epoch": 28.12, "learning_rate": 4.864836160309874e-05, "loss": 0.0613, "step": 100020 }, { "epoch": 28.13, "learning_rate": 4.8629619217193015e-05, "loss": 0.0665, "step": 100050 }, { "epoch": 28.14, "learning_rate": 4.8610876831287296e-05, "loss": 0.0534, "step": 100080 }, { "epoch": 28.14, "learning_rate": 4.8592134445381563e-05, "loss": 0.0639, "step": 100110 }, { "epoch": 28.15, "learning_rate": 4.8573392059475844e-05, "loss": 0.0589, "step": 100140 }, { "epoch": 28.16, "learning_rate": 4.855464967357011e-05, "loss": 0.0624, "step": 100170 }, { "epoch": 28.17, "learning_rate": 4.853590728766439e-05, "loss": 0.0657, "step": 100200 }, { "epoch": 28.18, "learning_rate": 4.851716490175866e-05, "loss": 0.0509, "step": 100230 }, { "epoch": 28.19, "learning_rate": 4.8498422515852934e-05, "loss": 0.0644, "step": 100260 }, { "epoch": 28.2, "learning_rate": 4.8479680129947215e-05, "loss": 0.06, "step": 100290 }, { "epoch": 28.2, "learning_rate": 4.846093774404148e-05, "loss": 0.0591, "step": 100320 }, { "epoch": 28.21, "learning_rate": 4.8442195358135764e-05, "loss": 0.0675, "step": 100350 }, { "epoch": 28.22, "learning_rate": 4.842345297223003e-05, "loss": 0.0525, "step": 100380 }, { "epoch": 28.23, "learning_rate": 4.840471058632431e-05, "loss": 0.0644, "step": 100410 }, { "epoch": 28.24, "learning_rate": 4.838596820041858e-05, "loss": 0.0593, "step": 100440 }, { "epoch": 28.25, "learning_rate": 4.8367225814512854e-05, "loss": 0.058, "step": 100470 }, { "epoch": 28.25, "learning_rate": 4.8348483428607135e-05, "loss": 0.0663, "step": 100500 }, { "epoch": 28.26, "learning_rate": 4.83297410427014e-05, "loss": 0.0543, "step": 100530 }, { "epoch": 28.27, "learning_rate": 4.831099865679568e-05, "loss": 0.0633, "step": 100560 }, { "epoch": 28.28, "learning_rate": 4.829225627088995e-05, "loss": 0.0585, "step": 100590 }, { "epoch": 28.29, "learning_rate": 4.827351388498423e-05, "loss": 0.0588, "step": 100620 }, { "epoch": 28.3, "learning_rate": 4.82547714990785e-05, "loss": 0.0684, "step": 100650 }, { "epoch": 28.3, "learning_rate": 4.823602911317277e-05, "loss": 0.0536, "step": 100680 }, { "epoch": 28.31, "learning_rate": 4.8217286727267054e-05, "loss": 0.0623, "step": 100710 }, { "epoch": 28.32, "learning_rate": 4.819854434136132e-05, "loss": 0.0586, "step": 100740 }, { "epoch": 28.33, "learning_rate": 4.81798019554556e-05, "loss": 0.0595, "step": 100770 }, { "epoch": 28.34, "learning_rate": 4.816105956954987e-05, "loss": 0.0641, "step": 100800 }, { "epoch": 28.35, "learning_rate": 4.814231718364415e-05, "loss": 0.0561, "step": 100830 }, { "epoch": 28.36, "learning_rate": 4.812357479773842e-05, "loss": 0.0643, "step": 100860 }, { "epoch": 28.36, "learning_rate": 4.810483241183269e-05, "loss": 0.0583, "step": 100890 }, { "epoch": 28.37, "learning_rate": 4.808609002592697e-05, "loss": 0.0575, "step": 100920 }, { "epoch": 28.38, "learning_rate": 4.806734764002124e-05, "loss": 0.0683, "step": 100950 }, { "epoch": 28.39, "learning_rate": 4.804860525411552e-05, "loss": 0.055, "step": 100980 }, { "epoch": 28.4, "learning_rate": 4.802986286820979e-05, "loss": 0.0626, "step": 101010 }, { "epoch": 28.41, "learning_rate": 4.801112048230407e-05, "loss": 0.0627, "step": 101040 }, { "epoch": 28.41, "learning_rate": 4.799237809639834e-05, "loss": 0.0636, "step": 101070 }, { "epoch": 28.42, "learning_rate": 4.797363571049261e-05, "loss": 0.0699, "step": 101100 }, { "epoch": 28.43, "learning_rate": 4.795489332458689e-05, "loss": 0.0535, "step": 101130 }, { "epoch": 28.44, "learning_rate": 4.793615093868116e-05, "loss": 0.0668, "step": 101160 }, { "epoch": 28.45, "learning_rate": 4.791740855277544e-05, "loss": 0.0601, "step": 101190 }, { "epoch": 28.46, "learning_rate": 4.789866616686971e-05, "loss": 0.0602, "step": 101220 }, { "epoch": 28.46, "learning_rate": 4.787992378096399e-05, "loss": 0.0672, "step": 101250 }, { "epoch": 28.47, "learning_rate": 4.786118139505826e-05, "loss": 0.0522, "step": 101280 }, { "epoch": 28.48, "learning_rate": 4.784243900915253e-05, "loss": 0.0665, "step": 101310 }, { "epoch": 28.49, "learning_rate": 4.782369662324681e-05, "loss": 0.0615, "step": 101340 }, { "epoch": 28.5, "learning_rate": 4.780495423734108e-05, "loss": 0.0564, "step": 101370 }, { "epoch": 28.51, "learning_rate": 4.778621185143536e-05, "loss": 0.0673, "step": 101400 }, { "epoch": 28.52, "learning_rate": 4.776746946552963e-05, "loss": 0.0568, "step": 101430 }, { "epoch": 28.52, "learning_rate": 4.774872707962391e-05, "loss": 0.0644, "step": 101460 }, { "epoch": 28.53, "learning_rate": 4.7729984693718176e-05, "loss": 0.0634, "step": 101490 }, { "epoch": 28.54, "learning_rate": 4.771124230781245e-05, "loss": 0.0609, "step": 101520 }, { "epoch": 28.55, "learning_rate": 4.769249992190673e-05, "loss": 0.0657, "step": 101550 }, { "epoch": 28.56, "learning_rate": 4.7673757536001e-05, "loss": 0.0544, "step": 101580 }, { "epoch": 28.57, "learning_rate": 4.765501515009528e-05, "loss": 0.0652, "step": 101610 }, { "epoch": 28.57, "learning_rate": 4.763627276418955e-05, "loss": 0.0578, "step": 101640 }, { "epoch": 28.58, "learning_rate": 4.761753037828383e-05, "loss": 0.0578, "step": 101670 }, { "epoch": 28.59, "learning_rate": 4.7598787992378096e-05, "loss": 0.0694, "step": 101700 }, { "epoch": 28.6, "learning_rate": 4.7580045606472377e-05, "loss": 0.055, "step": 101730 }, { "epoch": 28.61, "learning_rate": 4.756130322056665e-05, "loss": 0.0609, "step": 101760 }, { "epoch": 28.62, "learning_rate": 4.754256083466092e-05, "loss": 0.0563, "step": 101790 }, { "epoch": 28.63, "learning_rate": 4.75238184487552e-05, "loss": 0.0589, "step": 101820 }, { "epoch": 28.63, "learning_rate": 4.7505076062849466e-05, "loss": 0.0667, "step": 101850 }, { "epoch": 28.64, "learning_rate": 4.748633367694375e-05, "loss": 0.0564, "step": 101880 }, { "epoch": 28.65, "learning_rate": 4.7467591291038015e-05, "loss": 0.0707, "step": 101910 }, { "epoch": 28.66, "learning_rate": 4.7448848905132296e-05, "loss": 0.0598, "step": 101940 }, { "epoch": 28.67, "learning_rate": 4.743010651922657e-05, "loss": 0.0608, "step": 101970 }, { "epoch": 28.68, "learning_rate": 4.741136413332084e-05, "loss": 0.0687, "step": 102000 }, { "epoch": 28.68, "learning_rate": 4.739262174741512e-05, "loss": 0.0543, "step": 102030 }, { "epoch": 28.69, "learning_rate": 4.7373879361509386e-05, "loss": 0.0624, "step": 102060 }, { "epoch": 28.7, "learning_rate": 4.735513697560367e-05, "loss": 0.0582, "step": 102090 }, { "epoch": 28.71, "learning_rate": 4.7336394589697934e-05, "loss": 0.0604, "step": 102120 }, { "epoch": 28.72, "learning_rate": 4.7317652203792215e-05, "loss": 0.0683, "step": 102150 }, { "epoch": 28.73, "learning_rate": 4.729890981788648e-05, "loss": 0.0564, "step": 102180 }, { "epoch": 28.73, "learning_rate": 4.728016743198076e-05, "loss": 0.0656, "step": 102210 }, { "epoch": 28.74, "learning_rate": 4.726142504607504e-05, "loss": 0.0597, "step": 102240 }, { "epoch": 28.75, "learning_rate": 4.7242682660169305e-05, "loss": 0.0596, "step": 102270 }, { "epoch": 28.76, "learning_rate": 4.7223940274263586e-05, "loss": 0.0658, "step": 102300 }, { "epoch": 28.77, "learning_rate": 4.7205197888357854e-05, "loss": 0.0557, "step": 102330 }, { "epoch": 28.78, "learning_rate": 4.7186455502452135e-05, "loss": 0.0663, "step": 102360 }, { "epoch": 28.79, "learning_rate": 4.71677131165464e-05, "loss": 0.061, "step": 102390 }, { "epoch": 28.79, "learning_rate": 4.7148970730640676e-05, "loss": 0.0598, "step": 102420 }, { "epoch": 28.8, "learning_rate": 4.713022834473496e-05, "loss": 0.0665, "step": 102450 }, { "epoch": 28.81, "learning_rate": 4.7111485958829224e-05, "loss": 0.0547, "step": 102480 }, { "epoch": 28.82, "learning_rate": 4.7092743572923505e-05, "loss": 0.0642, "step": 102510 }, { "epoch": 28.83, "learning_rate": 4.707400118701777e-05, "loss": 0.0581, "step": 102540 }, { "epoch": 28.84, "learning_rate": 4.7055258801112054e-05, "loss": 0.06, "step": 102570 }, { "epoch": 28.84, "learning_rate": 4.703651641520632e-05, "loss": 0.0661, "step": 102600 }, { "epoch": 28.85, "learning_rate": 4.7017774029300595e-05, "loss": 0.0549, "step": 102630 }, { "epoch": 28.86, "learning_rate": 4.6999031643394876e-05, "loss": 0.0674, "step": 102660 }, { "epoch": 28.87, "learning_rate": 4.6980289257489144e-05, "loss": 0.0559, "step": 102690 }, { "epoch": 28.88, "learning_rate": 4.6961546871583425e-05, "loss": 0.0606, "step": 102720 }, { "epoch": 28.89, "learning_rate": 4.694280448567769e-05, "loss": 0.0657, "step": 102750 }, { "epoch": 28.9, "learning_rate": 4.692406209977197e-05, "loss": 0.0546, "step": 102780 }, { "epoch": 28.9, "learning_rate": 4.690531971386624e-05, "loss": 0.0619, "step": 102810 }, { "epoch": 28.91, "learning_rate": 4.6886577327960515e-05, "loss": 0.0607, "step": 102840 }, { "epoch": 28.92, "learning_rate": 4.6867834942054796e-05, "loss": 0.0588, "step": 102870 }, { "epoch": 28.93, "learning_rate": 4.684909255614906e-05, "loss": 0.067, "step": 102900 }, { "epoch": 28.94, "learning_rate": 4.6830350170243344e-05, "loss": 0.0537, "step": 102930 }, { "epoch": 28.95, "learning_rate": 4.681160778433761e-05, "loss": 0.0688, "step": 102960 }, { "epoch": 28.95, "learning_rate": 4.679286539843189e-05, "loss": 0.0612, "step": 102990 }, { "epoch": 28.96, "learning_rate": 4.677412301252616e-05, "loss": 0.0559, "step": 103020 }, { "epoch": 28.97, "learning_rate": 4.6755380626620434e-05, "loss": 0.0692, "step": 103050 }, { "epoch": 28.98, "learning_rate": 4.6736638240714715e-05, "loss": 0.0534, "step": 103080 }, { "epoch": 28.99, "learning_rate": 4.671789585480898e-05, "loss": 0.0663, "step": 103110 }, { "epoch": 29.0, "learning_rate": 4.6699153468903263e-05, "loss": 0.0616, "step": 103140 }, { "epoch": 29.0, "eval_loss": 0.10966203361749649, "eval_runtime": 631.5692, "eval_samples_per_second": 25.386, "eval_steps_per_second": 0.795, "eval_wer": 0.10370805071445144, "step": 103153 }, { "epoch": 29.0, "learning_rate": 4.668103582919439e-05, "loss": 0.0653, "step": 103170 }, { "epoch": 29.01, "learning_rate": 4.6662293443288665e-05, "loss": 0.0621, "step": 103200 }, { "epoch": 29.02, "learning_rate": 4.664355105738294e-05, "loss": 0.0575, "step": 103230 }, { "epoch": 29.03, "learning_rate": 4.6624808671477213e-05, "loss": 0.0644, "step": 103260 }, { "epoch": 29.04, "learning_rate": 4.660606628557149e-05, "loss": 0.0525, "step": 103290 }, { "epoch": 29.05, "learning_rate": 4.658732389966576e-05, "loss": 0.059, "step": 103320 }, { "epoch": 29.06, "learning_rate": 4.6568581513760036e-05, "loss": 0.0604, "step": 103350 }, { "epoch": 29.06, "learning_rate": 4.654983912785431e-05, "loss": 0.0559, "step": 103380 }, { "epoch": 29.07, "learning_rate": 4.6531096741948584e-05, "loss": 0.0654, "step": 103410 }, { "epoch": 29.08, "learning_rate": 4.651235435604286e-05, "loss": 0.0553, "step": 103440 }, { "epoch": 29.09, "learning_rate": 4.649361197013713e-05, "loss": 0.0629, "step": 103470 }, { "epoch": 29.1, "learning_rate": 4.647486958423141e-05, "loss": 0.0578, "step": 103500 }, { "epoch": 29.11, "learning_rate": 4.645612719832568e-05, "loss": 0.0536, "step": 103530 }, { "epoch": 29.11, "learning_rate": 4.6437384812419955e-05, "loss": 0.0646, "step": 103560 }, { "epoch": 29.12, "learning_rate": 4.641864242651423e-05, "loss": 0.0535, "step": 103590 }, { "epoch": 29.13, "learning_rate": 4.639990004060851e-05, "loss": 0.0641, "step": 103620 }, { "epoch": 29.14, "learning_rate": 4.638115765470278e-05, "loss": 0.0643, "step": 103650 }, { "epoch": 29.15, "learning_rate": 4.636241526879705e-05, "loss": 0.0572, "step": 103680 }, { "epoch": 29.16, "learning_rate": 4.6343672882891326e-05, "loss": 0.0626, "step": 103710 }, { "epoch": 29.17, "learning_rate": 4.63249304969856e-05, "loss": 0.0576, "step": 103740 }, { "epoch": 29.17, "learning_rate": 4.6306188111079875e-05, "loss": 0.0621, "step": 103770 }, { "epoch": 29.18, "learning_rate": 4.628744572517415e-05, "loss": 0.0613, "step": 103800 }, { "epoch": 29.19, "learning_rate": 4.626870333926843e-05, "loss": 0.0578, "step": 103830 }, { "epoch": 29.2, "learning_rate": 4.62499609533627e-05, "loss": 0.0657, "step": 103860 }, { "epoch": 29.21, "learning_rate": 4.623121856745697e-05, "loss": 0.0561, "step": 103890 }, { "epoch": 29.22, "learning_rate": 4.6212476181551246e-05, "loss": 0.0651, "step": 103920 }, { "epoch": 29.22, "learning_rate": 4.619373379564552e-05, "loss": 0.059, "step": 103950 }, { "epoch": 29.23, "learning_rate": 4.6174991409739794e-05, "loss": 0.0567, "step": 103980 }, { "epoch": 29.24, "learning_rate": 4.615624902383407e-05, "loss": 0.0647, "step": 104010 }, { "epoch": 29.25, "learning_rate": 4.613750663792835e-05, "loss": 0.0572, "step": 104040 }, { "epoch": 29.26, "learning_rate": 4.611876425202262e-05, "loss": 0.0647, "step": 104070 }, { "epoch": 29.27, "learning_rate": 4.610002186611689e-05, "loss": 0.0622, "step": 104100 }, { "epoch": 29.27, "learning_rate": 4.6081279480211165e-05, "loss": 0.0561, "step": 104130 }, { "epoch": 29.28, "learning_rate": 4.606253709430544e-05, "loss": 0.0621, "step": 104160 }, { "epoch": 29.29, "learning_rate": 4.604379470839971e-05, "loss": 0.0559, "step": 104190 }, { "epoch": 29.3, "learning_rate": 4.602505232249399e-05, "loss": 0.0634, "step": 104220 }, { "epoch": 29.31, "learning_rate": 4.600630993658827e-05, "loss": 0.0583, "step": 104250 }, { "epoch": 29.32, "learning_rate": 4.5987567550682536e-05, "loss": 0.0524, "step": 104280 }, { "epoch": 29.33, "learning_rate": 4.596882516477681e-05, "loss": 0.0619, "step": 104310 }, { "epoch": 29.33, "learning_rate": 4.5950082778871084e-05, "loss": 0.0549, "step": 104340 }, { "epoch": 29.34, "learning_rate": 4.593134039296536e-05, "loss": 0.0624, "step": 104370 }, { "epoch": 29.35, "learning_rate": 4.591259800705963e-05, "loss": 0.061, "step": 104400 }, { "epoch": 29.36, "learning_rate": 4.589385562115391e-05, "loss": 0.0562, "step": 104430 }, { "epoch": 29.37, "learning_rate": 4.587511323524819e-05, "loss": 0.0619, "step": 104460 }, { "epoch": 29.38, "learning_rate": 4.5856370849342455e-05, "loss": 0.0508, "step": 104490 }, { "epoch": 29.38, "learning_rate": 4.583762846343673e-05, "loss": 0.0607, "step": 104520 }, { "epoch": 29.39, "learning_rate": 4.5818886077531004e-05, "loss": 0.0599, "step": 104550 }, { "epoch": 29.4, "learning_rate": 4.580014369162528e-05, "loss": 0.0568, "step": 104580 }, { "epoch": 29.41, "learning_rate": 4.578140130571955e-05, "loss": 0.0653, "step": 104610 }, { "epoch": 29.42, "learning_rate": 4.5762658919813826e-05, "loss": 0.0528, "step": 104640 }, { "epoch": 29.43, "learning_rate": 4.574391653390811e-05, "loss": 0.063, "step": 104670 }, { "epoch": 29.43, "learning_rate": 4.5725174148002375e-05, "loss": 0.0613, "step": 104700 }, { "epoch": 29.44, "learning_rate": 4.570643176209665e-05, "loss": 0.0601, "step": 104730 }, { "epoch": 29.45, "learning_rate": 4.568768937619092e-05, "loss": 0.0635, "step": 104760 }, { "epoch": 29.46, "learning_rate": 4.56689469902852e-05, "loss": 0.0555, "step": 104790 }, { "epoch": 29.47, "learning_rate": 4.565020460437947e-05, "loss": 0.0605, "step": 104820 }, { "epoch": 29.48, "learning_rate": 4.5631462218473746e-05, "loss": 0.0655, "step": 104850 }, { "epoch": 29.49, "learning_rate": 4.5612719832568027e-05, "loss": 0.0575, "step": 104880 }, { "epoch": 29.49, "learning_rate": 4.5593977446662294e-05, "loss": 0.0635, "step": 104910 }, { "epoch": 29.5, "learning_rate": 4.557523506075657e-05, "loss": 0.0515, "step": 104940 }, { "epoch": 29.51, "learning_rate": 4.555649267485084e-05, "loss": 0.0598, "step": 104970 }, { "epoch": 29.52, "learning_rate": 4.5537750288945117e-05, "loss": 0.0622, "step": 105000 }, { "epoch": 29.53, "learning_rate": 4.551900790303939e-05, "loss": 0.0523, "step": 105030 }, { "epoch": 29.54, "learning_rate": 4.5500265517133665e-05, "loss": 0.0659, "step": 105060 }, { "epoch": 29.54, "learning_rate": 4.5481523131227946e-05, "loss": 0.0532, "step": 105090 }, { "epoch": 29.55, "learning_rate": 4.546278074532221e-05, "loss": 0.0613, "step": 105120 }, { "epoch": 29.56, "learning_rate": 4.5444038359416494e-05, "loss": 0.058, "step": 105150 }, { "epoch": 29.57, "learning_rate": 4.542529597351076e-05, "loss": 0.0591, "step": 105180 }, { "epoch": 29.58, "learning_rate": 4.5406553587605036e-05, "loss": 0.0648, "step": 105210 }, { "epoch": 29.59, "learning_rate": 4.538781120169931e-05, "loss": 0.0531, "step": 105240 }, { "epoch": 29.6, "learning_rate": 4.5369068815793584e-05, "loss": 0.0633, "step": 105270 }, { "epoch": 29.6, "learning_rate": 4.5350326429887865e-05, "loss": 0.0593, "step": 105300 }, { "epoch": 29.61, "learning_rate": 4.533158404398213e-05, "loss": 0.0569, "step": 105330 }, { "epoch": 29.62, "learning_rate": 4.5312841658076414e-05, "loss": 0.0636, "step": 105360 }, { "epoch": 29.63, "learning_rate": 4.529409927217068e-05, "loss": 0.0574, "step": 105390 }, { "epoch": 29.64, "learning_rate": 4.5275356886264955e-05, "loss": 0.0657, "step": 105420 }, { "epoch": 29.65, "learning_rate": 4.525661450035923e-05, "loss": 0.0593, "step": 105450 }, { "epoch": 29.65, "learning_rate": 4.5237872114453504e-05, "loss": 0.0597, "step": 105480 }, { "epoch": 29.66, "learning_rate": 4.5219129728547785e-05, "loss": 0.0639, "step": 105510 }, { "epoch": 29.67, "learning_rate": 4.520038734264205e-05, "loss": 0.0552, "step": 105540 }, { "epoch": 29.68, "learning_rate": 4.518164495673633e-05, "loss": 0.0602, "step": 105570 }, { "epoch": 29.69, "learning_rate": 4.51629025708306e-05, "loss": 0.0595, "step": 105600 }, { "epoch": 29.7, "learning_rate": 4.5144160184924875e-05, "loss": 0.0563, "step": 105630 }, { "epoch": 29.7, "learning_rate": 4.512541779901915e-05, "loss": 0.0638, "step": 105660 }, { "epoch": 29.71, "learning_rate": 4.510667541311342e-05, "loss": 0.056, "step": 105690 }, { "epoch": 29.72, "learning_rate": 4.5087933027207704e-05, "loss": 0.0606, "step": 105720 }, { "epoch": 29.73, "learning_rate": 4.506919064130197e-05, "loss": 0.0598, "step": 105750 }, { "epoch": 29.74, "learning_rate": 4.505044825539625e-05, "loss": 0.0564, "step": 105780 }, { "epoch": 29.75, "learning_rate": 4.503170586949052e-05, "loss": 0.0631, "step": 105810 }, { "epoch": 29.76, "learning_rate": 4.5012963483584794e-05, "loss": 0.0554, "step": 105840 }, { "epoch": 29.76, "learning_rate": 4.499422109767907e-05, "loss": 0.063, "step": 105870 }, { "epoch": 29.77, "learning_rate": 4.497547871177334e-05, "loss": 0.0598, "step": 105900 }, { "epoch": 29.78, "learning_rate": 4.495673632586762e-05, "loss": 0.0588, "step": 105930 }, { "epoch": 29.79, "learning_rate": 4.493799393996189e-05, "loss": 0.0649, "step": 105960 }, { "epoch": 29.8, "learning_rate": 4.491925155405617e-05, "loss": 0.0536, "step": 105990 }, { "epoch": 29.81, "learning_rate": 4.490050916815044e-05, "loss": 0.0595, "step": 106020 }, { "epoch": 29.81, "learning_rate": 4.488176678224471e-05, "loss": 0.0591, "step": 106050 }, { "epoch": 29.82, "learning_rate": 4.486302439633899e-05, "loss": 0.0582, "step": 106080 }, { "epoch": 29.83, "learning_rate": 4.484428201043326e-05, "loss": 0.066, "step": 106110 }, { "epoch": 29.84, "learning_rate": 4.482553962452754e-05, "loss": 0.0534, "step": 106140 }, { "epoch": 29.85, "learning_rate": 4.480679723862181e-05, "loss": 0.0644, "step": 106170 }, { "epoch": 29.86, "learning_rate": 4.478805485271609e-05, "loss": 0.0613, "step": 106200 }, { "epoch": 29.86, "learning_rate": 4.476931246681036e-05, "loss": 0.058, "step": 106230 }, { "epoch": 29.87, "learning_rate": 4.475057008090463e-05, "loss": 0.0638, "step": 106260 }, { "epoch": 29.88, "learning_rate": 4.473182769499891e-05, "loss": 0.0548, "step": 106290 }, { "epoch": 29.89, "learning_rate": 4.471308530909318e-05, "loss": 0.0614, "step": 106320 }, { "epoch": 29.9, "learning_rate": 4.469434292318746e-05, "loss": 0.0605, "step": 106350 }, { "epoch": 29.91, "learning_rate": 4.467560053728173e-05, "loss": 0.0577, "step": 106380 }, { "epoch": 29.92, "learning_rate": 4.465685815137601e-05, "loss": 0.0665, "step": 106410 }, { "epoch": 29.92, "learning_rate": 4.463811576547028e-05, "loss": 0.0554, "step": 106440 }, { "epoch": 29.93, "learning_rate": 4.461937337956455e-05, "loss": 0.0607, "step": 106470 }, { "epoch": 29.94, "learning_rate": 4.4600630993658826e-05, "loss": 0.0595, "step": 106500 }, { "epoch": 29.95, "learning_rate": 4.45818886077531e-05, "loss": 0.0545, "step": 106530 }, { "epoch": 29.96, "learning_rate": 4.4563146221847374e-05, "loss": 0.0625, "step": 106560 }, { "epoch": 29.97, "learning_rate": 4.454440383594165e-05, "loss": 0.0519, "step": 106590 }, { "epoch": 29.97, "learning_rate": 4.452566145003593e-05, "loss": 0.0671, "step": 106620 }, { "epoch": 29.98, "learning_rate": 4.45069190641302e-05, "loss": 0.0617, "step": 106650 }, { "epoch": 29.99, "learning_rate": 4.448817667822448e-05, "loss": 0.0578, "step": 106680 }, { "epoch": 30.0, "learning_rate": 4.4469434292318745e-05, "loss": 0.0642, "step": 106710 }, { "epoch": 30.0, "eval_loss": 0.11168166995048523, "eval_runtime": 629.3759, "eval_samples_per_second": 25.474, "eval_steps_per_second": 0.798, "eval_wer": 0.1020089255250911, "step": 106710 }, { "epoch": 30.01, "learning_rate": 4.445069190641302e-05, "loss": 0.0513, "step": 106740 }, { "epoch": 30.02, "learning_rate": 4.4431949520507294e-05, "loss": 0.0647, "step": 106770 }, { "epoch": 30.03, "learning_rate": 4.441320713460157e-05, "loss": 0.0548, "step": 106800 }, { "epoch": 30.03, "learning_rate": 4.439446474869585e-05, "loss": 0.0575, "step": 106830 }, { "epoch": 30.04, "learning_rate": 4.4375722362790116e-05, "loss": 0.0621, "step": 106860 }, { "epoch": 30.05, "learning_rate": 4.43569799768844e-05, "loss": 0.0499, "step": 106890 }, { "epoch": 30.06, "learning_rate": 4.4338237590978665e-05, "loss": 0.063, "step": 106920 }, { "epoch": 30.07, "learning_rate": 4.431949520507294e-05, "loss": 0.0558, "step": 106950 }, { "epoch": 30.08, "learning_rate": 4.430075281916721e-05, "loss": 0.0579, "step": 106980 }, { "epoch": 30.08, "learning_rate": 4.428201043326149e-05, "loss": 0.0643, "step": 107010 }, { "epoch": 30.09, "learning_rate": 4.426326804735577e-05, "loss": 0.0532, "step": 107040 }, { "epoch": 30.1, "learning_rate": 4.4244525661450036e-05, "loss": 0.0659, "step": 107070 }, { "epoch": 30.11, "learning_rate": 4.422578327554432e-05, "loss": 0.0552, "step": 107100 }, { "epoch": 30.12, "learning_rate": 4.4207040889638584e-05, "loss": 0.0597, "step": 107130 }, { "epoch": 30.13, "learning_rate": 4.418892324992972e-05, "loss": 0.0622, "step": 107160 }, { "epoch": 30.13, "learning_rate": 4.417018086402399e-05, "loss": 0.0526, "step": 107190 }, { "epoch": 30.14, "learning_rate": 4.415143847811827e-05, "loss": 0.0628, "step": 107220 }, { "epoch": 30.15, "learning_rate": 4.413269609221254e-05, "loss": 0.0547, "step": 107250 }, { "epoch": 30.16, "learning_rate": 4.4113953706306815e-05, "loss": 0.0574, "step": 107280 }, { "epoch": 30.17, "learning_rate": 4.409521132040109e-05, "loss": 0.0626, "step": 107310 }, { "epoch": 30.18, "learning_rate": 4.4076468934495363e-05, "loss": 0.0507, "step": 107340 }, { "epoch": 30.19, "learning_rate": 4.405772654858964e-05, "loss": 0.0583, "step": 107370 }, { "epoch": 30.19, "learning_rate": 4.403898416268391e-05, "loss": 0.0527, "step": 107400 }, { "epoch": 30.2, "learning_rate": 4.4020241776778186e-05, "loss": 0.0566, "step": 107430 }, { "epoch": 30.21, "learning_rate": 4.400149939087246e-05, "loss": 0.0619, "step": 107460 }, { "epoch": 30.22, "learning_rate": 4.3982757004966734e-05, "loss": 0.0497, "step": 107490 }, { "epoch": 30.23, "learning_rate": 4.396401461906101e-05, "loss": 0.065, "step": 107520 }, { "epoch": 30.24, "learning_rate": 4.394527223315528e-05, "loss": 0.0545, "step": 107550 }, { "epoch": 30.24, "learning_rate": 4.392652984724956e-05, "loss": 0.0627, "step": 107580 }, { "epoch": 30.25, "learning_rate": 4.390778746134383e-05, "loss": 0.0619, "step": 107610 }, { "epoch": 30.26, "learning_rate": 4.3889045075438105e-05, "loss": 0.0507, "step": 107640 }, { "epoch": 30.27, "learning_rate": 4.387030268953238e-05, "loss": 0.065, "step": 107670 }, { "epoch": 30.28, "learning_rate": 4.3851560303626654e-05, "loss": 0.0539, "step": 107700 }, { "epoch": 30.29, "learning_rate": 4.383281791772093e-05, "loss": 0.0633, "step": 107730 }, { "epoch": 30.3, "learning_rate": 4.38140755318152e-05, "loss": 0.0643, "step": 107760 }, { "epoch": 30.3, "learning_rate": 4.3795333145909476e-05, "loss": 0.0504, "step": 107790 }, { "epoch": 30.31, "learning_rate": 4.377659076000375e-05, "loss": 0.067, "step": 107820 }, { "epoch": 30.32, "learning_rate": 4.3757848374098025e-05, "loss": 0.0535, "step": 107850 }, { "epoch": 30.33, "learning_rate": 4.37391059881923e-05, "loss": 0.0572, "step": 107880 }, { "epoch": 30.34, "learning_rate": 4.372036360228657e-05, "loss": 0.0637, "step": 107910 }, { "epoch": 30.35, "learning_rate": 4.370162121638085e-05, "loss": 0.0524, "step": 107940 }, { "epoch": 30.35, "learning_rate": 4.368287883047512e-05, "loss": 0.0625, "step": 107970 }, { "epoch": 30.36, "learning_rate": 4.3664136444569396e-05, "loss": 0.0557, "step": 108000 }, { "epoch": 30.37, "learning_rate": 4.364539405866367e-05, "loss": 0.0586, "step": 108030 }, { "epoch": 30.38, "learning_rate": 4.3626651672757944e-05, "loss": 0.0632, "step": 108060 }, { "epoch": 30.39, "learning_rate": 4.360790928685222e-05, "loss": 0.0544, "step": 108090 }, { "epoch": 30.4, "learning_rate": 4.358916690094649e-05, "loss": 0.0607, "step": 108120 }, { "epoch": 30.4, "learning_rate": 4.3570424515040767e-05, "loss": 0.0562, "step": 108150 }, { "epoch": 30.41, "learning_rate": 4.355168212913504e-05, "loss": 0.0607, "step": 108180 }, { "epoch": 30.42, "learning_rate": 4.3532939743229315e-05, "loss": 0.0623, "step": 108210 }, { "epoch": 30.43, "learning_rate": 4.351419735732359e-05, "loss": 0.0517, "step": 108240 }, { "epoch": 30.44, "learning_rate": 4.349545497141786e-05, "loss": 0.0678, "step": 108270 }, { "epoch": 30.45, "learning_rate": 4.347671258551214e-05, "loss": 0.0573, "step": 108300 }, { "epoch": 30.46, "learning_rate": 4.345797019960641e-05, "loss": 0.0569, "step": 108330 }, { "epoch": 30.46, "learning_rate": 4.3439227813700686e-05, "loss": 0.0641, "step": 108360 }, { "epoch": 30.47, "learning_rate": 4.342048542779496e-05, "loss": 0.0539, "step": 108390 }, { "epoch": 30.48, "learning_rate": 4.3401743041889234e-05, "loss": 0.0618, "step": 108420 }, { "epoch": 30.49, "learning_rate": 4.338300065598351e-05, "loss": 0.0507, "step": 108450 }, { "epoch": 30.5, "learning_rate": 4.336425827007778e-05, "loss": 0.0559, "step": 108480 }, { "epoch": 30.51, "learning_rate": 4.334551588417206e-05, "loss": 0.061, "step": 108510 }, { "epoch": 30.51, "learning_rate": 4.332677349826633e-05, "loss": 0.055, "step": 108540 }, { "epoch": 30.52, "learning_rate": 4.3308031112360605e-05, "loss": 0.062, "step": 108570 }, { "epoch": 30.53, "learning_rate": 4.328928872645488e-05, "loss": 0.0527, "step": 108600 }, { "epoch": 30.54, "learning_rate": 4.3270546340549154e-05, "loss": 0.0614, "step": 108630 }, { "epoch": 30.55, "learning_rate": 4.325180395464343e-05, "loss": 0.0638, "step": 108660 }, { "epoch": 30.56, "learning_rate": 4.32330615687377e-05, "loss": 0.0509, "step": 108690 }, { "epoch": 30.57, "learning_rate": 4.3214319182831976e-05, "loss": 0.0633, "step": 108720 }, { "epoch": 30.57, "learning_rate": 4.319557679692625e-05, "loss": 0.0517, "step": 108750 }, { "epoch": 30.58, "learning_rate": 4.3176834411020525e-05, "loss": 0.0611, "step": 108780 }, { "epoch": 30.59, "learning_rate": 4.31580920251148e-05, "loss": 0.0646, "step": 108810 }, { "epoch": 30.6, "learning_rate": 4.313934963920907e-05, "loss": 0.0532, "step": 108840 }, { "epoch": 30.61, "learning_rate": 4.312060725330335e-05, "loss": 0.0609, "step": 108870 }, { "epoch": 30.62, "learning_rate": 4.310186486739762e-05, "loss": 0.0505, "step": 108900 }, { "epoch": 30.62, "learning_rate": 4.3083122481491896e-05, "loss": 0.0562, "step": 108930 }, { "epoch": 30.63, "learning_rate": 4.306438009558617e-05, "loss": 0.0602, "step": 108960 }, { "epoch": 30.64, "learning_rate": 4.3045637709680444e-05, "loss": 0.0536, "step": 108990 }, { "epoch": 30.65, "learning_rate": 4.302689532377472e-05, "loss": 0.0654, "step": 109020 }, { "epoch": 30.66, "learning_rate": 4.300815293786899e-05, "loss": 0.0553, "step": 109050 }, { "epoch": 30.67, "learning_rate": 4.2989410551963266e-05, "loss": 0.0605, "step": 109080 }, { "epoch": 30.67, "learning_rate": 4.297066816605754e-05, "loss": 0.0613, "step": 109110 }, { "epoch": 30.68, "learning_rate": 4.2951925780151815e-05, "loss": 0.0518, "step": 109140 }, { "epoch": 30.69, "learning_rate": 4.293318339424609e-05, "loss": 0.0615, "step": 109170 }, { "epoch": 30.7, "learning_rate": 4.291444100834036e-05, "loss": 0.0538, "step": 109200 }, { "epoch": 30.71, "learning_rate": 4.289569862243464e-05, "loss": 0.0599, "step": 109230 }, { "epoch": 30.72, "learning_rate": 4.287695623652891e-05, "loss": 0.0649, "step": 109260 }, { "epoch": 30.73, "learning_rate": 4.2858838596820046e-05, "loss": 0.0548, "step": 109290 }, { "epoch": 30.73, "learning_rate": 4.284009621091431e-05, "loss": 0.0622, "step": 109320 }, { "epoch": 30.74, "learning_rate": 4.2821353825008594e-05, "loss": 0.0531, "step": 109350 }, { "epoch": 30.75, "learning_rate": 4.280261143910287e-05, "loss": 0.0582, "step": 109380 }, { "epoch": 30.76, "learning_rate": 4.278386905319714e-05, "loss": 0.0657, "step": 109410 }, { "epoch": 30.77, "learning_rate": 4.276512666729142e-05, "loss": 0.0511, "step": 109440 }, { "epoch": 30.78, "learning_rate": 4.2746384281385684e-05, "loss": 0.0618, "step": 109470 }, { "epoch": 30.78, "learning_rate": 4.2727641895479965e-05, "loss": 0.0524, "step": 109500 }, { "epoch": 30.79, "learning_rate": 4.270889950957423e-05, "loss": 0.0595, "step": 109530 }, { "epoch": 30.8, "learning_rate": 4.2690157123668514e-05, "loss": 0.062, "step": 109560 }, { "epoch": 30.81, "learning_rate": 4.267141473776279e-05, "loss": 0.0522, "step": 109590 }, { "epoch": 30.82, "learning_rate": 4.265267235185706e-05, "loss": 0.0611, "step": 109620 }, { "epoch": 30.83, "learning_rate": 4.2633929965951336e-05, "loss": 0.0543, "step": 109650 }, { "epoch": 30.83, "learning_rate": 4.2615187580045604e-05, "loss": 0.0619, "step": 109680 }, { "epoch": 30.84, "learning_rate": 4.2596445194139884e-05, "loss": 0.064, "step": 109710 }, { "epoch": 30.85, "learning_rate": 4.257770280823415e-05, "loss": 0.0533, "step": 109740 }, { "epoch": 30.86, "learning_rate": 4.255896042232843e-05, "loss": 0.0599, "step": 109770 }, { "epoch": 30.87, "learning_rate": 4.254021803642271e-05, "loss": 0.0586, "step": 109800 }, { "epoch": 30.88, "learning_rate": 4.252147565051698e-05, "loss": 0.063, "step": 109830 }, { "epoch": 30.89, "learning_rate": 4.2502733264611255e-05, "loss": 0.0623, "step": 109860 }, { "epoch": 30.89, "learning_rate": 4.248399087870553e-05, "loss": 0.0551, "step": 109890 }, { "epoch": 30.9, "learning_rate": 4.2465248492799804e-05, "loss": 0.062, "step": 109920 }, { "epoch": 30.91, "learning_rate": 4.244650610689407e-05, "loss": 0.055, "step": 109950 }, { "epoch": 30.92, "learning_rate": 4.242776372098835e-05, "loss": 0.0566, "step": 109980 }, { "epoch": 30.93, "learning_rate": 4.2409021335082626e-05, "loss": 0.0622, "step": 110010 }, { "epoch": 30.94, "learning_rate": 4.23902789491769e-05, "loss": 0.0494, "step": 110040 }, { "epoch": 30.94, "learning_rate": 4.2371536563271175e-05, "loss": 0.0608, "step": 110070 }, { "epoch": 30.95, "learning_rate": 4.235279417736545e-05, "loss": 0.0536, "step": 110100 }, { "epoch": 30.96, "learning_rate": 4.233405179145972e-05, "loss": 0.059, "step": 110130 }, { "epoch": 30.97, "learning_rate": 4.231530940555399e-05, "loss": 0.0642, "step": 110160 }, { "epoch": 30.98, "learning_rate": 4.229656701964827e-05, "loss": 0.0514, "step": 110190 }, { "epoch": 30.99, "learning_rate": 4.2277824633742546e-05, "loss": 0.0651, "step": 110220 }, { "epoch": 31.0, "learning_rate": 4.225908224783682e-05, "loss": 0.0555, "step": 110250 }, { "epoch": 31.0, "eval_loss": 0.11092609167098999, "eval_runtime": 629.5598, "eval_samples_per_second": 25.467, "eval_steps_per_second": 0.797, "eval_wer": 0.09900645531096038, "step": 110267 }, { "epoch": 31.0, "learning_rate": 4.2240339861931094e-05, "loss": 0.0594, "step": 110280 }, { "epoch": 31.01, "learning_rate": 4.222159747602537e-05, "loss": 0.0534, "step": 110310 }, { "epoch": 31.02, "learning_rate": 4.220285509011964e-05, "loss": 0.0538, "step": 110340 }, { "epoch": 31.03, "learning_rate": 4.218411270421391e-05, "loss": 0.0627, "step": 110370 }, { "epoch": 31.04, "learning_rate": 4.216537031830819e-05, "loss": 0.0524, "step": 110400 }, { "epoch": 31.05, "learning_rate": 4.2146627932402465e-05, "loss": 0.0592, "step": 110430 }, { "epoch": 31.05, "learning_rate": 4.212788554649674e-05, "loss": 0.0546, "step": 110460 }, { "epoch": 31.06, "learning_rate": 4.2109143160591013e-05, "loss": 0.0599, "step": 110490 }, { "epoch": 31.07, "learning_rate": 4.209040077468529e-05, "loss": 0.0606, "step": 110520 }, { "epoch": 31.08, "learning_rate": 4.207165838877956e-05, "loss": 0.0518, "step": 110550 }, { "epoch": 31.09, "learning_rate": 4.205291600287383e-05, "loss": 0.0596, "step": 110580 }, { "epoch": 31.1, "learning_rate": 4.203417361696811e-05, "loss": 0.0544, "step": 110610 }, { "epoch": 31.1, "learning_rate": 4.2015431231062384e-05, "loss": 0.057, "step": 110640 }, { "epoch": 31.11, "learning_rate": 4.199668884515666e-05, "loss": 0.0612, "step": 110670 }, { "epoch": 31.12, "learning_rate": 4.197794645925093e-05, "loss": 0.0543, "step": 110700 }, { "epoch": 31.13, "learning_rate": 4.195920407334521e-05, "loss": 0.0575, "step": 110730 }, { "epoch": 31.14, "learning_rate": 4.194046168743948e-05, "loss": 0.0601, "step": 110760 }, { "epoch": 31.15, "learning_rate": 4.192171930153375e-05, "loss": 0.0552, "step": 110790 }, { "epoch": 31.16, "learning_rate": 4.190297691562803e-05, "loss": 0.0655, "step": 110820 }, { "epoch": 31.16, "learning_rate": 4.1884234529722304e-05, "loss": 0.0502, "step": 110850 }, { "epoch": 31.17, "learning_rate": 4.186549214381658e-05, "loss": 0.0594, "step": 110880 }, { "epoch": 31.18, "learning_rate": 4.184674975791085e-05, "loss": 0.0557, "step": 110910 }, { "epoch": 31.19, "learning_rate": 4.1828007372005126e-05, "loss": 0.0574, "step": 110940 }, { "epoch": 31.2, "learning_rate": 4.18092649860994e-05, "loss": 0.0623, "step": 110970 }, { "epoch": 31.21, "learning_rate": 4.179052260019367e-05, "loss": 0.0511, "step": 111000 }, { "epoch": 31.21, "learning_rate": 4.177178021428795e-05, "loss": 0.0575, "step": 111030 }, { "epoch": 31.22, "learning_rate": 4.175303782838222e-05, "loss": 0.0584, "step": 111060 }, { "epoch": 31.23, "learning_rate": 4.17342954424765e-05, "loss": 0.0609, "step": 111090 }, { "epoch": 31.24, "learning_rate": 4.171555305657077e-05, "loss": 0.0667, "step": 111120 }, { "epoch": 31.25, "learning_rate": 4.1696810670665046e-05, "loss": 0.054, "step": 111150 }, { "epoch": 31.26, "learning_rate": 4.167806828475932e-05, "loss": 0.0587, "step": 111180 }, { "epoch": 31.27, "learning_rate": 4.165932589885359e-05, "loss": 0.0544, "step": 111210 }, { "epoch": 31.27, "learning_rate": 4.164058351294787e-05, "loss": 0.0553, "step": 111240 }, { "epoch": 31.28, "learning_rate": 4.162184112704214e-05, "loss": 0.0634, "step": 111270 }, { "epoch": 31.29, "learning_rate": 4.1603098741136417e-05, "loss": 0.0524, "step": 111300 }, { "epoch": 31.3, "learning_rate": 4.1584981101427544e-05, "loss": 0.0599, "step": 111330 }, { "epoch": 31.31, "learning_rate": 4.156623871552182e-05, "loss": 0.0543, "step": 111360 }, { "epoch": 31.32, "learning_rate": 4.15474963296161e-05, "loss": 0.0556, "step": 111390 }, { "epoch": 31.32, "learning_rate": 4.1528753943710367e-05, "loss": 0.0608, "step": 111420 }, { "epoch": 31.33, "learning_rate": 4.151001155780465e-05, "loss": 0.0509, "step": 111450 }, { "epoch": 31.34, "learning_rate": 4.1491269171898915e-05, "loss": 0.0619, "step": 111480 }, { "epoch": 31.35, "learning_rate": 4.1472526785993196e-05, "loss": 0.0556, "step": 111510 }, { "epoch": 31.36, "learning_rate": 4.145378440008746e-05, "loss": 0.0605, "step": 111540 }, { "epoch": 31.37, "learning_rate": 4.143504201418174e-05, "loss": 0.0625, "step": 111570 }, { "epoch": 31.37, "learning_rate": 4.141629962827602e-05, "loss": 0.0461, "step": 111600 }, { "epoch": 31.38, "learning_rate": 4.1397557242370286e-05, "loss": 0.0624, "step": 111630 }, { "epoch": 31.39, "learning_rate": 4.137881485646457e-05, "loss": 0.0548, "step": 111660 }, { "epoch": 31.4, "learning_rate": 4.1360072470558834e-05, "loss": 0.0564, "step": 111690 }, { "epoch": 31.41, "learning_rate": 4.1341330084653115e-05, "loss": 0.0626, "step": 111720 }, { "epoch": 31.42, "learning_rate": 4.132258769874738e-05, "loss": 0.0492, "step": 111750 }, { "epoch": 31.43, "learning_rate": 4.130384531284166e-05, "loss": 0.0601, "step": 111780 }, { "epoch": 31.43, "learning_rate": 4.128510292693594e-05, "loss": 0.0549, "step": 111810 }, { "epoch": 31.44, "learning_rate": 4.1266360541030205e-05, "loss": 0.057, "step": 111840 }, { "epoch": 31.45, "learning_rate": 4.1247618155124486e-05, "loss": 0.0615, "step": 111870 }, { "epoch": 31.46, "learning_rate": 4.1228875769218754e-05, "loss": 0.0492, "step": 111900 }, { "epoch": 31.47, "learning_rate": 4.1210133383313035e-05, "loss": 0.0618, "step": 111930 }, { "epoch": 31.48, "learning_rate": 4.11913909974073e-05, "loss": 0.058, "step": 111960 }, { "epoch": 31.48, "learning_rate": 4.117264861150158e-05, "loss": 0.0602, "step": 111990 }, { "epoch": 31.49, "learning_rate": 4.115390622559586e-05, "loss": 0.0634, "step": 112020 }, { "epoch": 31.5, "learning_rate": 4.1135163839690125e-05, "loss": 0.0531, "step": 112050 }, { "epoch": 31.51, "learning_rate": 4.1116421453784406e-05, "loss": 0.0623, "step": 112080 }, { "epoch": 31.52, "learning_rate": 4.109767906787867e-05, "loss": 0.0517, "step": 112110 }, { "epoch": 31.53, "learning_rate": 4.1078936681972954e-05, "loss": 0.0595, "step": 112140 }, { "epoch": 31.53, "learning_rate": 4.106019429606722e-05, "loss": 0.0601, "step": 112170 }, { "epoch": 31.54, "learning_rate": 4.10414519101615e-05, "loss": 0.0529, "step": 112200 }, { "epoch": 31.55, "learning_rate": 4.1022709524255777e-05, "loss": 0.0597, "step": 112230 }, { "epoch": 31.56, "learning_rate": 4.1003967138350044e-05, "loss": 0.0574, "step": 112260 }, { "epoch": 31.57, "learning_rate": 4.0985224752444325e-05, "loss": 0.0561, "step": 112290 }, { "epoch": 31.58, "learning_rate": 4.096648236653859e-05, "loss": 0.06, "step": 112320 }, { "epoch": 31.59, "learning_rate": 4.094773998063287e-05, "loss": 0.0509, "step": 112350 }, { "epoch": 31.59, "learning_rate": 4.092899759472714e-05, "loss": 0.0608, "step": 112380 }, { "epoch": 31.6, "learning_rate": 4.091025520882142e-05, "loss": 0.0557, "step": 112410 }, { "epoch": 31.61, "learning_rate": 4.0891512822915696e-05, "loss": 0.0584, "step": 112440 }, { "epoch": 31.62, "learning_rate": 4.087277043700996e-05, "loss": 0.0645, "step": 112470 }, { "epoch": 31.63, "learning_rate": 4.0854028051104244e-05, "loss": 0.0511, "step": 112500 }, { "epoch": 31.64, "learning_rate": 4.083528566519851e-05, "loss": 0.0581, "step": 112530 }, { "epoch": 31.64, "learning_rate": 4.081654327929279e-05, "loss": 0.057, "step": 112560 }, { "epoch": 31.65, "learning_rate": 4.079780089338706e-05, "loss": 0.0572, "step": 112590 }, { "epoch": 31.66, "learning_rate": 4.077905850748134e-05, "loss": 0.0644, "step": 112620 }, { "epoch": 31.67, "learning_rate": 4.0760316121575615e-05, "loss": 0.0508, "step": 112650 }, { "epoch": 31.68, "learning_rate": 4.074157373566988e-05, "loss": 0.0602, "step": 112680 }, { "epoch": 31.69, "learning_rate": 4.0722831349764164e-05, "loss": 0.0519, "step": 112710 }, { "epoch": 31.7, "learning_rate": 4.070408896385843e-05, "loss": 0.0558, "step": 112740 }, { "epoch": 31.7, "learning_rate": 4.068534657795271e-05, "loss": 0.0621, "step": 112770 }, { "epoch": 31.71, "learning_rate": 4.066660419204698e-05, "loss": 0.0505, "step": 112800 }, { "epoch": 31.72, "learning_rate": 4.064786180614126e-05, "loss": 0.0608, "step": 112830 }, { "epoch": 31.73, "learning_rate": 4.062911942023553e-05, "loss": 0.0554, "step": 112860 }, { "epoch": 31.74, "learning_rate": 4.06103770343298e-05, "loss": 0.0563, "step": 112890 }, { "epoch": 31.75, "learning_rate": 4.059163464842408e-05, "loss": 0.0666, "step": 112920 }, { "epoch": 31.75, "learning_rate": 4.057289226251835e-05, "loss": 0.0532, "step": 112950 }, { "epoch": 31.76, "learning_rate": 4.055414987661263e-05, "loss": 0.0572, "step": 112980 }, { "epoch": 31.77, "learning_rate": 4.05354074907069e-05, "loss": 0.0549, "step": 113010 }, { "epoch": 31.78, "learning_rate": 4.051666510480118e-05, "loss": 0.0577, "step": 113040 }, { "epoch": 31.79, "learning_rate": 4.049792271889545e-05, "loss": 0.0664, "step": 113070 }, { "epoch": 31.8, "learning_rate": 4.047918033298972e-05, "loss": 0.0488, "step": 113100 }, { "epoch": 31.8, "learning_rate": 4.0460437947084e-05, "loss": 0.0587, "step": 113130 }, { "epoch": 31.81, "learning_rate": 4.044169556117827e-05, "loss": 0.0551, "step": 113160 }, { "epoch": 31.82, "learning_rate": 4.042295317527255e-05, "loss": 0.0531, "step": 113190 }, { "epoch": 31.83, "learning_rate": 4.040421078936682e-05, "loss": 0.0628, "step": 113220 }, { "epoch": 31.84, "learning_rate": 4.03854684034611e-05, "loss": 0.052, "step": 113250 }, { "epoch": 31.85, "learning_rate": 4.0366726017555366e-05, "loss": 0.0608, "step": 113280 }, { "epoch": 31.86, "learning_rate": 4.034798363164965e-05, "loss": 0.0536, "step": 113310 }, { "epoch": 31.86, "learning_rate": 4.032924124574392e-05, "loss": 0.0582, "step": 113340 }, { "epoch": 31.87, "learning_rate": 4.031049885983819e-05, "loss": 0.0613, "step": 113370 }, { "epoch": 31.88, "learning_rate": 4.029175647393247e-05, "loss": 0.0509, "step": 113400 }, { "epoch": 31.89, "learning_rate": 4.027301408802674e-05, "loss": 0.0626, "step": 113430 }, { "epoch": 31.9, "learning_rate": 4.025427170212102e-05, "loss": 0.053, "step": 113460 }, { "epoch": 31.91, "learning_rate": 4.0235529316215286e-05, "loss": 0.054, "step": 113490 }, { "epoch": 31.91, "learning_rate": 4.021678693030957e-05, "loss": 0.0595, "step": 113520 }, { "epoch": 31.92, "learning_rate": 4.019804454440384e-05, "loss": 0.051, "step": 113550 }, { "epoch": 31.93, "learning_rate": 4.017930215849811e-05, "loss": 0.0603, "step": 113580 }, { "epoch": 31.94, "learning_rate": 4.016055977259239e-05, "loss": 0.055, "step": 113610 }, { "epoch": 31.95, "learning_rate": 4.014181738668666e-05, "loss": 0.0546, "step": 113640 }, { "epoch": 31.96, "learning_rate": 4.012307500078094e-05, "loss": 0.0595, "step": 113670 }, { "epoch": 31.97, "learning_rate": 4.0104332614875205e-05, "loss": 0.0509, "step": 113700 }, { "epoch": 31.97, "learning_rate": 4.0085590228969486e-05, "loss": 0.0595, "step": 113730 }, { "epoch": 31.98, "learning_rate": 4.006684784306376e-05, "loss": 0.0563, "step": 113760 }, { "epoch": 31.99, "learning_rate": 4.004810545715803e-05, "loss": 0.0582, "step": 113790 }, { "epoch": 32.0, "learning_rate": 4.002936307125231e-05, "loss": 0.0632, "step": 113820 }, { "epoch": 32.0, "eval_loss": 0.11038082838058472, "eval_runtime": 633.2401, "eval_samples_per_second": 25.319, "eval_steps_per_second": 0.793, "eval_wer": 0.09773722926589604, "step": 113824 }, { "epoch": 32.01, "learning_rate": 4.0010620685346576e-05, "loss": 0.0504, "step": 113850 }, { "epoch": 32.02, "learning_rate": 3.999187829944086e-05, "loss": 0.0617, "step": 113880 }, { "epoch": 32.02, "learning_rate": 3.9973135913535124e-05, "loss": 0.0508, "step": 113910 }, { "epoch": 32.03, "learning_rate": 3.9954393527629405e-05, "loss": 0.0602, "step": 113940 }, { "epoch": 32.04, "learning_rate": 3.993627588792053e-05, "loss": 0.0588, "step": 113970 }, { "epoch": 32.05, "learning_rate": 3.991753350201481e-05, "loss": 0.0533, "step": 114000 }, { "epoch": 32.06, "learning_rate": 3.989879111610908e-05, "loss": 0.0574, "step": 114030 }, { "epoch": 32.07, "learning_rate": 3.9880048730203355e-05, "loss": 0.0511, "step": 114060 }, { "epoch": 32.07, "learning_rate": 3.9861306344297636e-05, "loss": 0.0627, "step": 114090 }, { "epoch": 32.08, "learning_rate": 3.9842563958391904e-05, "loss": 0.0528, "step": 114120 }, { "epoch": 32.09, "learning_rate": 3.982382157248618e-05, "loss": 0.0575, "step": 114150 }, { "epoch": 32.1, "learning_rate": 3.980507918658045e-05, "loss": 0.0627, "step": 114180 }, { "epoch": 32.11, "learning_rate": 3.9786336800674726e-05, "loss": 0.0525, "step": 114210 }, { "epoch": 32.12, "learning_rate": 3.9767594414769e-05, "loss": 0.0617, "step": 114240 }, { "epoch": 32.13, "learning_rate": 3.9748852028863275e-05, "loss": 0.0543, "step": 114270 }, { "epoch": 32.13, "learning_rate": 3.9730109642957556e-05, "loss": 0.052, "step": 114300 }, { "epoch": 32.14, "learning_rate": 3.971199200324868e-05, "loss": 0.0661, "step": 114330 }, { "epoch": 32.15, "learning_rate": 3.969324961734295e-05, "loss": 0.0487, "step": 114360 }, { "epoch": 32.16, "learning_rate": 3.967450723143723e-05, "loss": 0.0601, "step": 114390 }, { "epoch": 32.17, "learning_rate": 3.9655764845531506e-05, "loss": 0.0603, "step": 114420 }, { "epoch": 32.18, "learning_rate": 3.963702245962578e-05, "loss": 0.0572, "step": 114450 }, { "epoch": 32.18, "learning_rate": 3.9618280073720054e-05, "loss": 0.0645, "step": 114480 }, { "epoch": 32.19, "learning_rate": 3.959953768781433e-05, "loss": 0.0547, "step": 114510 }, { "epoch": 32.2, "learning_rate": 3.95807953019086e-05, "loss": 0.0625, "step": 114540 }, { "epoch": 32.21, "learning_rate": 3.956205291600287e-05, "loss": 0.0578, "step": 114570 }, { "epoch": 32.22, "learning_rate": 3.954331053009715e-05, "loss": 0.0556, "step": 114600 }, { "epoch": 32.23, "learning_rate": 3.9524568144191425e-05, "loss": 0.0583, "step": 114630 }, { "epoch": 32.23, "learning_rate": 3.95058257582857e-05, "loss": 0.0506, "step": 114660 }, { "epoch": 32.24, "learning_rate": 3.9487083372379973e-05, "loss": 0.0577, "step": 114690 }, { "epoch": 32.25, "learning_rate": 3.946834098647425e-05, "loss": 0.053, "step": 114720 }, { "epoch": 32.26, "learning_rate": 3.944959860056852e-05, "loss": 0.0532, "step": 114750 }, { "epoch": 32.27, "learning_rate": 3.943085621466279e-05, "loss": 0.0612, "step": 114780 }, { "epoch": 32.28, "learning_rate": 3.941211382875707e-05, "loss": 0.0496, "step": 114810 }, { "epoch": 32.29, "learning_rate": 3.9393371442851344e-05, "loss": 0.0563, "step": 114840 }, { "epoch": 32.29, "learning_rate": 3.937462905694562e-05, "loss": 0.0581, "step": 114870 }, { "epoch": 32.3, "learning_rate": 3.935588667103989e-05, "loss": 0.0554, "step": 114900 }, { "epoch": 32.31, "learning_rate": 3.933714428513417e-05, "loss": 0.06, "step": 114930 }, { "epoch": 32.32, "learning_rate": 3.931840189922844e-05, "loss": 0.0559, "step": 114960 }, { "epoch": 32.33, "learning_rate": 3.929965951332271e-05, "loss": 0.0615, "step": 114990 }, { "epoch": 32.34, "learning_rate": 3.928091712741699e-05, "loss": 0.0545, "step": 115020 }, { "epoch": 32.34, "learning_rate": 3.9262174741511264e-05, "loss": 0.0539, "step": 115050 }, { "epoch": 32.35, "learning_rate": 3.924343235560554e-05, "loss": 0.0599, "step": 115080 }, { "epoch": 32.36, "learning_rate": 3.922468996969981e-05, "loss": 0.0564, "step": 115110 }, { "epoch": 32.37, "learning_rate": 3.9205947583794086e-05, "loss": 0.0606, "step": 115140 }, { "epoch": 32.38, "learning_rate": 3.918720519788836e-05, "loss": 0.0537, "step": 115170 }, { "epoch": 32.39, "learning_rate": 3.9168462811982635e-05, "loss": 0.0543, "step": 115200 }, { "epoch": 32.4, "learning_rate": 3.914972042607691e-05, "loss": 0.0571, "step": 115230 }, { "epoch": 32.4, "learning_rate": 3.913097804017118e-05, "loss": 0.0523, "step": 115260 }, { "epoch": 32.41, "learning_rate": 3.911223565426546e-05, "loss": 0.0582, "step": 115290 }, { "epoch": 32.42, "learning_rate": 3.909349326835973e-05, "loss": 0.0581, "step": 115320 }, { "epoch": 32.43, "learning_rate": 3.9074750882454006e-05, "loss": 0.0543, "step": 115350 }, { "epoch": 32.44, "learning_rate": 3.905600849654828e-05, "loss": 0.0595, "step": 115380 }, { "epoch": 32.45, "learning_rate": 3.9037266110642554e-05, "loss": 0.0531, "step": 115410 }, { "epoch": 32.45, "learning_rate": 3.901852372473683e-05, "loss": 0.0582, "step": 115440 }, { "epoch": 32.46, "learning_rate": 3.89997813388311e-05, "loss": 0.0541, "step": 115470 }, { "epoch": 32.47, "learning_rate": 3.8981038952925377e-05, "loss": 0.0542, "step": 115500 }, { "epoch": 32.48, "learning_rate": 3.896229656701965e-05, "loss": 0.0615, "step": 115530 }, { "epoch": 32.49, "learning_rate": 3.8943554181113925e-05, "loss": 0.049, "step": 115560 }, { "epoch": 32.5, "learning_rate": 3.89248117952082e-05, "loss": 0.0594, "step": 115590 }, { "epoch": 32.5, "learning_rate": 3.890606940930247e-05, "loss": 0.0563, "step": 115620 }, { "epoch": 32.51, "learning_rate": 3.888732702339675e-05, "loss": 0.0565, "step": 115650 }, { "epoch": 32.52, "learning_rate": 3.886858463749102e-05, "loss": 0.0573, "step": 115680 }, { "epoch": 32.53, "learning_rate": 3.8849842251585296e-05, "loss": 0.0513, "step": 115710 }, { "epoch": 32.54, "learning_rate": 3.883109986567957e-05, "loss": 0.0586, "step": 115740 }, { "epoch": 32.55, "learning_rate": 3.8812357479773844e-05, "loss": 0.054, "step": 115770 }, { "epoch": 32.56, "learning_rate": 3.879361509386812e-05, "loss": 0.0551, "step": 115800 }, { "epoch": 32.56, "learning_rate": 3.877487270796239e-05, "loss": 0.055, "step": 115830 }, { "epoch": 32.57, "learning_rate": 3.875613032205667e-05, "loss": 0.0527, "step": 115860 }, { "epoch": 32.58, "learning_rate": 3.873738793615094e-05, "loss": 0.0583, "step": 115890 }, { "epoch": 32.59, "learning_rate": 3.8718645550245215e-05, "loss": 0.0554, "step": 115920 }, { "epoch": 32.6, "learning_rate": 3.869990316433949e-05, "loss": 0.0517, "step": 115950 }, { "epoch": 32.61, "learning_rate": 3.8681160778433764e-05, "loss": 0.0564, "step": 115980 }, { "epoch": 32.61, "learning_rate": 3.866241839252804e-05, "loss": 0.0497, "step": 116010 }, { "epoch": 32.62, "learning_rate": 3.864367600662231e-05, "loss": 0.0574, "step": 116040 }, { "epoch": 32.63, "learning_rate": 3.8624933620716586e-05, "loss": 0.0567, "step": 116070 }, { "epoch": 32.64, "learning_rate": 3.860619123481086e-05, "loss": 0.0532, "step": 116100 }, { "epoch": 32.65, "learning_rate": 3.8587448848905135e-05, "loss": 0.0578, "step": 116130 }, { "epoch": 32.66, "learning_rate": 3.856870646299941e-05, "loss": 0.0517, "step": 116160 }, { "epoch": 32.67, "learning_rate": 3.854996407709368e-05, "loss": 0.0601, "step": 116190 }, { "epoch": 32.67, "learning_rate": 3.853122169118796e-05, "loss": 0.0559, "step": 116220 }, { "epoch": 32.68, "learning_rate": 3.851247930528223e-05, "loss": 0.0551, "step": 116250 }, { "epoch": 32.69, "learning_rate": 3.8493736919376506e-05, "loss": 0.0584, "step": 116280 }, { "epoch": 32.7, "learning_rate": 3.847499453347078e-05, "loss": 0.0491, "step": 116310 }, { "epoch": 32.71, "learning_rate": 3.8456252147565054e-05, "loss": 0.0582, "step": 116340 }, { "epoch": 32.72, "learning_rate": 3.843750976165933e-05, "loss": 0.0589, "step": 116370 }, { "epoch": 32.72, "learning_rate": 3.84187673757536e-05, "loss": 0.051, "step": 116400 }, { "epoch": 32.73, "learning_rate": 3.8400024989847876e-05, "loss": 0.0578, "step": 116430 }, { "epoch": 32.74, "learning_rate": 3.838128260394215e-05, "loss": 0.0514, "step": 116460 }, { "epoch": 32.75, "learning_rate": 3.8362540218036425e-05, "loss": 0.0612, "step": 116490 }, { "epoch": 32.76, "learning_rate": 3.83437978321307e-05, "loss": 0.0564, "step": 116520 }, { "epoch": 32.77, "learning_rate": 3.832505544622497e-05, "loss": 0.0524, "step": 116550 }, { "epoch": 32.77, "learning_rate": 3.830631306031925e-05, "loss": 0.057, "step": 116580 }, { "epoch": 32.78, "learning_rate": 3.828757067441352e-05, "loss": 0.0519, "step": 116610 }, { "epoch": 32.79, "learning_rate": 3.8268828288507796e-05, "loss": 0.0581, "step": 116640 }, { "epoch": 32.8, "learning_rate": 3.825008590260207e-05, "loss": 0.0558, "step": 116670 }, { "epoch": 32.81, "learning_rate": 3.8231343516696344e-05, "loss": 0.051, "step": 116700 }, { "epoch": 32.82, "learning_rate": 3.821260113079062e-05, "loss": 0.0598, "step": 116730 }, { "epoch": 32.83, "learning_rate": 3.819385874488489e-05, "loss": 0.0492, "step": 116760 }, { "epoch": 32.83, "learning_rate": 3.817511635897917e-05, "loss": 0.0579, "step": 116790 }, { "epoch": 32.84, "learning_rate": 3.815637397307344e-05, "loss": 0.0546, "step": 116820 }, { "epoch": 32.85, "learning_rate": 3.8137631587167715e-05, "loss": 0.0526, "step": 116850 }, { "epoch": 32.86, "learning_rate": 3.811888920126199e-05, "loss": 0.0613, "step": 116880 }, { "epoch": 32.87, "learning_rate": 3.8100146815356264e-05, "loss": 0.0539, "step": 116910 }, { "epoch": 32.88, "learning_rate": 3.808140442945054e-05, "loss": 0.0537, "step": 116940 }, { "epoch": 32.88, "learning_rate": 3.806266204354481e-05, "loss": 0.0543, "step": 116970 }, { "epoch": 32.89, "learning_rate": 3.8043919657639086e-05, "loss": 0.0539, "step": 117000 }, { "epoch": 32.9, "learning_rate": 3.802517727173336e-05, "loss": 0.0607, "step": 117030 }, { "epoch": 32.91, "learning_rate": 3.8006434885827634e-05, "loss": 0.0501, "step": 117060 }, { "epoch": 32.92, "learning_rate": 3.798831724611877e-05, "loss": 0.0597, "step": 117090 }, { "epoch": 32.93, "learning_rate": 3.796957486021304e-05, "loss": 0.0578, "step": 117120 }, { "epoch": 32.93, "learning_rate": 3.795083247430731e-05, "loss": 0.0534, "step": 117150 }, { "epoch": 32.94, "learning_rate": 3.793209008840159e-05, "loss": 0.063, "step": 117180 }, { "epoch": 32.95, "learning_rate": 3.791334770249586e-05, "loss": 0.0546, "step": 117210 }, { "epoch": 32.96, "learning_rate": 3.789460531659014e-05, "loss": 0.0554, "step": 117240 }, { "epoch": 32.97, "learning_rate": 3.7875862930684414e-05, "loss": 0.0541, "step": 117270 }, { "epoch": 32.98, "learning_rate": 3.785712054477869e-05, "loss": 0.0536, "step": 117300 }, { "epoch": 32.99, "learning_rate": 3.783837815887296e-05, "loss": 0.0595, "step": 117330 }, { "epoch": 32.99, "learning_rate": 3.781963577296723e-05, "loss": 0.0482, "step": 117360 }, { "epoch": 33.0, "eval_loss": 0.1107897162437439, "eval_runtime": 635.0944, "eval_samples_per_second": 25.245, "eval_steps_per_second": 0.79, "eval_wer": 0.09579244742265228, "step": 117381 }, { "epoch": 33.0, "learning_rate": 3.780089338706151e-05, "loss": 0.0576, "step": 117390 }, { "epoch": 33.01, "learning_rate": 3.778215100115578e-05, "loss": 0.0484, "step": 117420 }, { "epoch": 33.02, "learning_rate": 3.776340861525006e-05, "loss": 0.0556, "step": 117450 }, { "epoch": 33.03, "learning_rate": 3.774466622934433e-05, "loss": 0.0565, "step": 117480 }, { "epoch": 33.04, "learning_rate": 3.772592384343861e-05, "loss": 0.0475, "step": 117510 }, { "epoch": 33.04, "learning_rate": 3.770718145753288e-05, "loss": 0.0623, "step": 117540 }, { "epoch": 33.05, "learning_rate": 3.768843907162715e-05, "loss": 0.052, "step": 117570 }, { "epoch": 33.06, "learning_rate": 3.766969668572143e-05, "loss": 0.0606, "step": 117600 }, { "epoch": 33.07, "learning_rate": 3.76509542998157e-05, "loss": 0.0558, "step": 117630 }, { "epoch": 33.08, "learning_rate": 3.763221191390998e-05, "loss": 0.0525, "step": 117660 }, { "epoch": 33.09, "learning_rate": 3.761346952800425e-05, "loss": 0.0605, "step": 117690 }, { "epoch": 33.1, "learning_rate": 3.759472714209853e-05, "loss": 0.0482, "step": 117720 }, { "epoch": 33.1, "learning_rate": 3.75759847561928e-05, "loss": 0.0554, "step": 117750 }, { "epoch": 33.11, "learning_rate": 3.755724237028707e-05, "loss": 0.0519, "step": 117780 }, { "epoch": 33.12, "learning_rate": 3.753849998438135e-05, "loss": 0.0496, "step": 117810 }, { "epoch": 33.13, "learning_rate": 3.751975759847562e-05, "loss": 0.0607, "step": 117840 }, { "epoch": 33.14, "learning_rate": 3.75010152125699e-05, "loss": 0.0513, "step": 117870 }, { "epoch": 33.15, "learning_rate": 3.748227282666417e-05, "loss": 0.056, "step": 117900 }, { "epoch": 33.15, "learning_rate": 3.7463530440758446e-05, "loss": 0.0586, "step": 117930 }, { "epoch": 33.16, "learning_rate": 3.744478805485272e-05, "loss": 0.0506, "step": 117960 }, { "epoch": 33.17, "learning_rate": 3.742604566894699e-05, "loss": 0.059, "step": 117990 }, { "epoch": 33.18, "learning_rate": 3.740730328304127e-05, "loss": 0.055, "step": 118020 }, { "epoch": 33.19, "learning_rate": 3.7388560897135536e-05, "loss": 0.0578, "step": 118050 }, { "epoch": 33.2, "learning_rate": 3.736981851122982e-05, "loss": 0.0612, "step": 118080 }, { "epoch": 33.2, "learning_rate": 3.735107612532409e-05, "loss": 0.0525, "step": 118110 }, { "epoch": 33.21, "learning_rate": 3.7332333739418365e-05, "loss": 0.0556, "step": 118140 }, { "epoch": 33.22, "learning_rate": 3.731359135351264e-05, "loss": 0.0512, "step": 118170 }, { "epoch": 33.23, "learning_rate": 3.729484896760691e-05, "loss": 0.0612, "step": 118200 }, { "epoch": 33.24, "learning_rate": 3.727610658170119e-05, "loss": 0.0602, "step": 118230 }, { "epoch": 33.25, "learning_rate": 3.7257364195795455e-05, "loss": 0.0498, "step": 118260 }, { "epoch": 33.26, "learning_rate": 3.7238621809889736e-05, "loss": 0.0594, "step": 118290 }, { "epoch": 33.26, "learning_rate": 3.721987942398401e-05, "loss": 0.051, "step": 118320 }, { "epoch": 33.27, "learning_rate": 3.7201137038078285e-05, "loss": 0.0534, "step": 118350 }, { "epoch": 33.28, "learning_rate": 3.718239465217256e-05, "loss": 0.0567, "step": 118380 }, { "epoch": 33.29, "learning_rate": 3.7163652266266826e-05, "loss": 0.0535, "step": 118410 }, { "epoch": 33.3, "learning_rate": 3.714490988036111e-05, "loss": 0.0621, "step": 118440 }, { "epoch": 33.31, "learning_rate": 3.7126167494455375e-05, "loss": 0.0524, "step": 118470 }, { "epoch": 33.31, "learning_rate": 3.7107425108549656e-05, "loss": 0.0539, "step": 118500 }, { "epoch": 33.32, "learning_rate": 3.708868272264393e-05, "loss": 0.058, "step": 118530 }, { "epoch": 33.33, "learning_rate": 3.7069940336738204e-05, "loss": 0.0535, "step": 118560 }, { "epoch": 33.34, "learning_rate": 3.705119795083248e-05, "loss": 0.0625, "step": 118590 }, { "epoch": 33.35, "learning_rate": 3.703245556492675e-05, "loss": 0.0491, "step": 118620 }, { "epoch": 33.36, "learning_rate": 3.7013713179021027e-05, "loss": 0.0542, "step": 118650 }, { "epoch": 33.37, "learning_rate": 3.6994970793115294e-05, "loss": 0.06, "step": 118680 }, { "epoch": 33.37, "learning_rate": 3.6976228407209575e-05, "loss": 0.0484, "step": 118710 }, { "epoch": 33.38, "learning_rate": 3.695748602130385e-05, "loss": 0.0597, "step": 118740 }, { "epoch": 33.39, "learning_rate": 3.693874363539812e-05, "loss": 0.0514, "step": 118770 }, { "epoch": 33.4, "learning_rate": 3.69200012494924e-05, "loss": 0.0573, "step": 118800 }, { "epoch": 33.41, "learning_rate": 3.690125886358667e-05, "loss": 0.0574, "step": 118830 }, { "epoch": 33.42, "learning_rate": 3.6882516477680946e-05, "loss": 0.0553, "step": 118860 }, { "epoch": 33.42, "learning_rate": 3.686377409177521e-05, "loss": 0.0586, "step": 118890 }, { "epoch": 33.43, "learning_rate": 3.6845031705869494e-05, "loss": 0.0507, "step": 118920 }, { "epoch": 33.44, "learning_rate": 3.682628931996376e-05, "loss": 0.0559, "step": 118950 }, { "epoch": 33.45, "learning_rate": 3.680754693405804e-05, "loss": 0.0596, "step": 118980 }, { "epoch": 33.46, "learning_rate": 3.678880454815232e-05, "loss": 0.051, "step": 119010 }, { "epoch": 33.47, "learning_rate": 3.677006216224659e-05, "loss": 0.0614, "step": 119040 }, { "epoch": 33.47, "learning_rate": 3.6751319776340865e-05, "loss": 0.0499, "step": 119070 }, { "epoch": 33.48, "learning_rate": 3.673257739043513e-05, "loss": 0.0544, "step": 119100 }, { "epoch": 33.49, "learning_rate": 3.6713835004529414e-05, "loss": 0.0557, "step": 119130 }, { "epoch": 33.5, "learning_rate": 3.669509261862368e-05, "loss": 0.0507, "step": 119160 }, { "epoch": 33.51, "learning_rate": 3.667635023271796e-05, "loss": 0.058, "step": 119190 }, { "epoch": 33.52, "learning_rate": 3.6657607846812236e-05, "loss": 0.0533, "step": 119220 }, { "epoch": 33.53, "learning_rate": 3.663886546090651e-05, "loss": 0.0547, "step": 119250 }, { "epoch": 33.53, "learning_rate": 3.6620123075000785e-05, "loss": 0.0555, "step": 119280 }, { "epoch": 33.54, "learning_rate": 3.660138068909505e-05, "loss": 0.0506, "step": 119310 }, { "epoch": 33.55, "learning_rate": 3.658263830318933e-05, "loss": 0.0586, "step": 119340 }, { "epoch": 33.56, "learning_rate": 3.65638959172836e-05, "loss": 0.0534, "step": 119370 }, { "epoch": 33.57, "learning_rate": 3.654515353137788e-05, "loss": 0.0563, "step": 119400 }, { "epoch": 33.58, "learning_rate": 3.6526411145472156e-05, "loss": 0.0581, "step": 119430 }, { "epoch": 33.58, "learning_rate": 3.650766875956643e-05, "loss": 0.052, "step": 119460 }, { "epoch": 33.59, "learning_rate": 3.6488926373660704e-05, "loss": 0.0591, "step": 119490 }, { "epoch": 33.6, "learning_rate": 3.647018398775497e-05, "loss": 0.0501, "step": 119520 }, { "epoch": 33.61, "learning_rate": 3.645144160184925e-05, "loss": 0.0555, "step": 119550 }, { "epoch": 33.62, "learning_rate": 3.643269921594352e-05, "loss": 0.0541, "step": 119580 }, { "epoch": 33.63, "learning_rate": 3.64139568300378e-05, "loss": 0.0505, "step": 119610 }, { "epoch": 33.63, "learning_rate": 3.6395214444132075e-05, "loss": 0.058, "step": 119640 }, { "epoch": 33.64, "learning_rate": 3.637647205822635e-05, "loss": 0.0494, "step": 119670 }, { "epoch": 33.65, "learning_rate": 3.635772967232062e-05, "loss": 0.0568, "step": 119700 }, { "epoch": 33.66, "learning_rate": 3.633898728641489e-05, "loss": 0.0581, "step": 119730 }, { "epoch": 33.67, "learning_rate": 3.632024490050917e-05, "loss": 0.0507, "step": 119760 }, { "epoch": 33.68, "learning_rate": 3.630150251460344e-05, "loss": 0.0595, "step": 119790 }, { "epoch": 33.69, "learning_rate": 3.628276012869772e-05, "loss": 0.0476, "step": 119820 }, { "epoch": 33.69, "learning_rate": 3.626464248898885e-05, "loss": 0.0534, "step": 119850 }, { "epoch": 33.7, "learning_rate": 3.624590010308312e-05, "loss": 0.0571, "step": 119880 }, { "epoch": 33.71, "learning_rate": 3.6227157717177396e-05, "loss": 0.0502, "step": 119910 }, { "epoch": 33.72, "learning_rate": 3.620841533127167e-05, "loss": 0.059, "step": 119940 }, { "epoch": 33.73, "learning_rate": 3.618967294536595e-05, "loss": 0.0532, "step": 119970 }, { "epoch": 33.74, "learning_rate": 3.617093055946022e-05, "loss": 0.055, "step": 120000 }, { "epoch": 33.74, "learning_rate": 3.61521881735545e-05, "loss": 0.0539, "step": 120030 }, { "epoch": 33.75, "learning_rate": 3.613344578764877e-05, "loss": 0.0505, "step": 120060 }, { "epoch": 33.76, "learning_rate": 3.611470340174304e-05, "loss": 0.0575, "step": 120090 }, { "epoch": 33.77, "learning_rate": 3.6095961015837315e-05, "loss": 0.0489, "step": 120120 }, { "epoch": 33.78, "learning_rate": 3.607721862993159e-05, "loss": 0.0555, "step": 120150 }, { "epoch": 33.79, "learning_rate": 3.605847624402587e-05, "loss": 0.0545, "step": 120180 }, { "epoch": 33.8, "learning_rate": 3.603973385812014e-05, "loss": 0.0513, "step": 120210 }, { "epoch": 33.8, "learning_rate": 3.602099147221442e-05, "loss": 0.0551, "step": 120240 }, { "epoch": 33.81, "learning_rate": 3.6002249086308686e-05, "loss": 0.0509, "step": 120270 }, { "epoch": 33.82, "learning_rate": 3.598350670040296e-05, "loss": 0.0545, "step": 120300 }, { "epoch": 33.83, "learning_rate": 3.5964764314497234e-05, "loss": 0.0566, "step": 120330 }, { "epoch": 33.84, "learning_rate": 3.594602192859151e-05, "loss": 0.0523, "step": 120360 }, { "epoch": 33.85, "learning_rate": 3.592727954268579e-05, "loss": 0.0609, "step": 120390 }, { "epoch": 33.85, "learning_rate": 3.590853715678006e-05, "loss": 0.0493, "step": 120420 }, { "epoch": 33.86, "learning_rate": 3.588979477087434e-05, "loss": 0.0535, "step": 120450 }, { "epoch": 33.87, "learning_rate": 3.5871052384968605e-05, "loss": 0.055, "step": 120480 }, { "epoch": 33.88, "learning_rate": 3.585230999906288e-05, "loss": 0.0506, "step": 120510 }, { "epoch": 33.89, "learning_rate": 3.5833567613157154e-05, "loss": 0.0584, "step": 120540 }, { "epoch": 33.9, "learning_rate": 3.581482522725143e-05, "loss": 0.0548, "step": 120570 }, { "epoch": 33.9, "learning_rate": 3.579608284134571e-05, "loss": 0.0544, "step": 120600 }, { "epoch": 33.91, "learning_rate": 3.5777340455439976e-05, "loss": 0.0563, "step": 120630 }, { "epoch": 33.92, "learning_rate": 3.575859806953426e-05, "loss": 0.0506, "step": 120660 }, { "epoch": 33.93, "learning_rate": 3.5739855683628525e-05, "loss": 0.058, "step": 120690 }, { "epoch": 33.94, "learning_rate": 3.5721113297722806e-05, "loss": 0.052, "step": 120720 }, { "epoch": 33.95, "learning_rate": 3.570237091181707e-05, "loss": 0.0533, "step": 120750 }, { "epoch": 33.96, "learning_rate": 3.568362852591135e-05, "loss": 0.0572, "step": 120780 }, { "epoch": 33.96, "learning_rate": 3.566488614000563e-05, "loss": 0.051, "step": 120810 }, { "epoch": 33.97, "learning_rate": 3.5646143754099896e-05, "loss": 0.057, "step": 120840 }, { "epoch": 33.98, "learning_rate": 3.562740136819418e-05, "loss": 0.0518, "step": 120870 }, { "epoch": 33.99, "learning_rate": 3.5608658982288444e-05, "loss": 0.0561, "step": 120900 }, { "epoch": 34.0, "learning_rate": 3.5589916596382725e-05, "loss": 0.0601, "step": 120930 }, { "epoch": 34.0, "eval_loss": 0.10950275510549545, "eval_runtime": 635.2492, "eval_samples_per_second": 25.239, "eval_steps_per_second": 0.79, "eval_wer": 0.09571738566729901, "step": 120938 }, { "epoch": 34.01, "learning_rate": 3.557117421047699e-05, "loss": 0.0525, "step": 120960 }, { "epoch": 34.01, "learning_rate": 3.555243182457127e-05, "loss": 0.0614, "step": 120990 }, { "epoch": 34.02, "learning_rate": 3.553368943866555e-05, "loss": 0.0447, "step": 121020 }, { "epoch": 34.03, "learning_rate": 3.5514947052759815e-05, "loss": 0.0569, "step": 121050 }, { "epoch": 34.04, "learning_rate": 3.5496204666854096e-05, "loss": 0.0538, "step": 121080 }, { "epoch": 34.05, "learning_rate": 3.5477462280948363e-05, "loss": 0.0549, "step": 121110 }, { "epoch": 34.06, "learning_rate": 3.5458719895042644e-05, "loss": 0.0593, "step": 121140 }, { "epoch": 34.07, "learning_rate": 3.543997750913691e-05, "loss": 0.0482, "step": 121170 }, { "epoch": 34.07, "learning_rate": 3.5421235123231186e-05, "loss": 0.0544, "step": 121200 }, { "epoch": 34.08, "learning_rate": 3.540249273732547e-05, "loss": 0.0528, "step": 121230 }, { "epoch": 34.09, "learning_rate": 3.5384375097616594e-05, "loss": 0.0516, "step": 121260 }, { "epoch": 34.1, "learning_rate": 3.536563271171087e-05, "loss": 0.0591, "step": 121290 }, { "epoch": 34.11, "learning_rate": 3.534689032580514e-05, "loss": 0.0459, "step": 121320 }, { "epoch": 34.12, "learning_rate": 3.532814793989942e-05, "loss": 0.0567, "step": 121350 }, { "epoch": 34.12, "learning_rate": 3.530940555399369e-05, "loss": 0.0522, "step": 121380 }, { "epoch": 34.13, "learning_rate": 3.5290663168087965e-05, "loss": 0.0501, "step": 121410 }, { "epoch": 34.14, "learning_rate": 3.527192078218224e-05, "loss": 0.0632, "step": 121440 }, { "epoch": 34.15, "learning_rate": 3.5253178396276514e-05, "loss": 0.0473, "step": 121470 }, { "epoch": 34.16, "learning_rate": 3.523443601037079e-05, "loss": 0.0553, "step": 121500 }, { "epoch": 34.17, "learning_rate": 3.521569362446506e-05, "loss": 0.0531, "step": 121530 }, { "epoch": 34.17, "learning_rate": 3.5196951238559336e-05, "loss": 0.0493, "step": 121560 }, { "epoch": 34.18, "learning_rate": 3.517820885265361e-05, "loss": 0.0607, "step": 121590 }, { "epoch": 34.19, "learning_rate": 3.5159466466747885e-05, "loss": 0.0467, "step": 121620 }, { "epoch": 34.2, "learning_rate": 3.514072408084216e-05, "loss": 0.0601, "step": 121650 }, { "epoch": 34.21, "learning_rate": 3.512198169493643e-05, "loss": 0.0513, "step": 121680 }, { "epoch": 34.22, "learning_rate": 3.510323930903071e-05, "loss": 0.0575, "step": 121710 }, { "epoch": 34.23, "learning_rate": 3.508449692312498e-05, "loss": 0.0582, "step": 121740 }, { "epoch": 34.23, "learning_rate": 3.5065754537219256e-05, "loss": 0.049, "step": 121770 }, { "epoch": 34.24, "learning_rate": 3.504701215131353e-05, "loss": 0.0564, "step": 121800 }, { "epoch": 34.25, "learning_rate": 3.5028269765407804e-05, "loss": 0.0527, "step": 121830 }, { "epoch": 34.26, "learning_rate": 3.500952737950208e-05, "loss": 0.0562, "step": 121860 }, { "epoch": 34.27, "learning_rate": 3.499078499359635e-05, "loss": 0.0583, "step": 121890 }, { "epoch": 34.28, "learning_rate": 3.4972042607690627e-05, "loss": 0.0485, "step": 121920 }, { "epoch": 34.28, "learning_rate": 3.49533002217849e-05, "loss": 0.0616, "step": 121950 }, { "epoch": 34.29, "learning_rate": 3.4934557835879175e-05, "loss": 0.0513, "step": 121980 }, { "epoch": 34.3, "learning_rate": 3.491581544997345e-05, "loss": 0.0533, "step": 122010 }, { "epoch": 34.31, "learning_rate": 3.489707306406772e-05, "loss": 0.0566, "step": 122040 }, { "epoch": 34.32, "learning_rate": 3.4878330678162e-05, "loss": 0.0512, "step": 122070 }, { "epoch": 34.33, "learning_rate": 3.485958829225627e-05, "loss": 0.0535, "step": 122100 }, { "epoch": 34.34, "learning_rate": 3.4840845906350546e-05, "loss": 0.0539, "step": 122130 }, { "epoch": 34.34, "learning_rate": 3.482210352044482e-05, "loss": 0.0538, "step": 122160 }, { "epoch": 34.35, "learning_rate": 3.4803361134539094e-05, "loss": 0.06, "step": 122190 }, { "epoch": 34.36, "learning_rate": 3.478461874863337e-05, "loss": 0.0489, "step": 122220 }, { "epoch": 34.37, "learning_rate": 3.476587636272764e-05, "loss": 0.0573, "step": 122250 }, { "epoch": 34.38, "learning_rate": 3.474713397682192e-05, "loss": 0.0505, "step": 122280 }, { "epoch": 34.39, "learning_rate": 3.472839159091619e-05, "loss": 0.0542, "step": 122310 }, { "epoch": 34.39, "learning_rate": 3.4709649205010465e-05, "loss": 0.0562, "step": 122340 }, { "epoch": 34.4, "learning_rate": 3.469090681910474e-05, "loss": 0.0482, "step": 122370 }, { "epoch": 34.41, "learning_rate": 3.4672164433199014e-05, "loss": 0.0562, "step": 122400 }, { "epoch": 34.42, "learning_rate": 3.465342204729329e-05, "loss": 0.0532, "step": 122430 }, { "epoch": 34.43, "learning_rate": 3.463467966138756e-05, "loss": 0.0506, "step": 122460 }, { "epoch": 34.44, "learning_rate": 3.4615937275481836e-05, "loss": 0.057, "step": 122490 }, { "epoch": 34.44, "learning_rate": 3.459719488957611e-05, "loss": 0.0466, "step": 122520 }, { "epoch": 34.45, "learning_rate": 3.4578452503670385e-05, "loss": 0.0542, "step": 122550 }, { "epoch": 34.46, "learning_rate": 3.455971011776466e-05, "loss": 0.0504, "step": 122580 }, { "epoch": 34.47, "learning_rate": 3.454096773185894e-05, "loss": 0.0561, "step": 122610 }, { "epoch": 34.48, "learning_rate": 3.452222534595321e-05, "loss": 0.0599, "step": 122640 }, { "epoch": 34.49, "learning_rate": 3.450348296004748e-05, "loss": 0.0469, "step": 122670 }, { "epoch": 34.5, "learning_rate": 3.4484740574141756e-05, "loss": 0.0622, "step": 122700 }, { "epoch": 34.5, "learning_rate": 3.446599818823603e-05, "loss": 0.0502, "step": 122730 }, { "epoch": 34.51, "learning_rate": 3.4447255802330304e-05, "loss": 0.0536, "step": 122760 }, { "epoch": 34.52, "learning_rate": 3.442851341642458e-05, "loss": 0.0596, "step": 122790 }, { "epoch": 34.53, "learning_rate": 3.440977103051886e-05, "loss": 0.0467, "step": 122820 }, { "epoch": 34.54, "learning_rate": 3.4391028644613127e-05, "loss": 0.0559, "step": 122850 }, { "epoch": 34.55, "learning_rate": 3.43722862587074e-05, "loss": 0.0514, "step": 122880 }, { "epoch": 34.55, "learning_rate": 3.4353543872801675e-05, "loss": 0.0558, "step": 122910 }, { "epoch": 34.56, "learning_rate": 3.433480148689595e-05, "loss": 0.0592, "step": 122940 }, { "epoch": 34.57, "learning_rate": 3.431605910099022e-05, "loss": 0.0479, "step": 122970 }, { "epoch": 34.58, "learning_rate": 3.42973167150845e-05, "loss": 0.0578, "step": 123000 }, { "epoch": 34.59, "learning_rate": 3.427857432917878e-05, "loss": 0.0474, "step": 123030 }, { "epoch": 34.6, "learning_rate": 3.4259831943273046e-05, "loss": 0.0556, "step": 123060 }, { "epoch": 34.6, "learning_rate": 3.424108955736732e-05, "loss": 0.058, "step": 123090 }, { "epoch": 34.61, "learning_rate": 3.4222347171461594e-05, "loss": 0.0469, "step": 123120 }, { "epoch": 34.62, "learning_rate": 3.420360478555587e-05, "loss": 0.0545, "step": 123150 }, { "epoch": 34.63, "learning_rate": 3.418486239965014e-05, "loss": 0.0528, "step": 123180 }, { "epoch": 34.64, "learning_rate": 3.416612001374442e-05, "loss": 0.0531, "step": 123210 }, { "epoch": 34.65, "learning_rate": 3.41473776278387e-05, "loss": 0.0593, "step": 123240 }, { "epoch": 34.66, "learning_rate": 3.4128635241932965e-05, "loss": 0.0467, "step": 123270 }, { "epoch": 34.66, "learning_rate": 3.410989285602724e-05, "loss": 0.0529, "step": 123300 }, { "epoch": 34.67, "learning_rate": 3.4091150470121514e-05, "loss": 0.0527, "step": 123330 }, { "epoch": 34.68, "learning_rate": 3.407240808421579e-05, "loss": 0.0528, "step": 123360 }, { "epoch": 34.69, "learning_rate": 3.405366569831006e-05, "loss": 0.0558, "step": 123390 }, { "epoch": 34.7, "learning_rate": 3.4034923312404336e-05, "loss": 0.0483, "step": 123420 }, { "epoch": 34.71, "learning_rate": 3.401618092649862e-05, "loss": 0.0568, "step": 123450 }, { "epoch": 34.71, "learning_rate": 3.3997438540592885e-05, "loss": 0.0524, "step": 123480 }, { "epoch": 34.72, "learning_rate": 3.397869615468716e-05, "loss": 0.0526, "step": 123510 }, { "epoch": 34.73, "learning_rate": 3.395995376878143e-05, "loss": 0.0546, "step": 123540 }, { "epoch": 34.74, "learning_rate": 3.394121138287571e-05, "loss": 0.0473, "step": 123570 }, { "epoch": 34.75, "learning_rate": 3.392246899696998e-05, "loss": 0.0563, "step": 123600 }, { "epoch": 34.76, "learning_rate": 3.3903726611064255e-05, "loss": 0.0476, "step": 123630 }, { "epoch": 34.77, "learning_rate": 3.3884984225158536e-05, "loss": 0.0573, "step": 123660 }, { "epoch": 34.77, "learning_rate": 3.3866241839252804e-05, "loss": 0.0584, "step": 123690 }, { "epoch": 34.78, "learning_rate": 3.384749945334708e-05, "loss": 0.0471, "step": 123720 }, { "epoch": 34.79, "learning_rate": 3.382875706744135e-05, "loss": 0.0556, "step": 123750 }, { "epoch": 34.8, "learning_rate": 3.3810014681535626e-05, "loss": 0.0508, "step": 123780 }, { "epoch": 34.81, "learning_rate": 3.37912722956299e-05, "loss": 0.0536, "step": 123810 }, { "epoch": 34.82, "learning_rate": 3.3772529909724175e-05, "loss": 0.054, "step": 123840 }, { "epoch": 34.82, "learning_rate": 3.3753787523818456e-05, "loss": 0.0491, "step": 123870 }, { "epoch": 34.83, "learning_rate": 3.373504513791272e-05, "loss": 0.0532, "step": 123900 }, { "epoch": 34.84, "learning_rate": 3.3716302752007e-05, "loss": 0.0492, "step": 123930 }, { "epoch": 34.85, "learning_rate": 3.369756036610127e-05, "loss": 0.0552, "step": 123960 }, { "epoch": 34.86, "learning_rate": 3.3678817980195546e-05, "loss": 0.0559, "step": 123990 }, { "epoch": 34.87, "learning_rate": 3.366007559428982e-05, "loss": 0.0514, "step": 124020 }, { "epoch": 34.87, "learning_rate": 3.3641333208384094e-05, "loss": 0.0558, "step": 124050 }, { "epoch": 34.88, "learning_rate": 3.362259082247837e-05, "loss": 0.0529, "step": 124080 }, { "epoch": 34.89, "learning_rate": 3.360384843657264e-05, "loss": 0.0521, "step": 124110 }, { "epoch": 34.9, "learning_rate": 3.3585106050666923e-05, "loss": 0.0606, "step": 124140 }, { "epoch": 34.91, "learning_rate": 3.356636366476119e-05, "loss": 0.0464, "step": 124170 }, { "epoch": 34.92, "learning_rate": 3.3547621278855465e-05, "loss": 0.0572, "step": 124200 }, { "epoch": 34.93, "learning_rate": 3.352887889294974e-05, "loss": 0.0559, "step": 124230 }, { "epoch": 34.93, "learning_rate": 3.3510136507044013e-05, "loss": 0.0524, "step": 124260 }, { "epoch": 34.94, "learning_rate": 3.349139412113829e-05, "loss": 0.0585, "step": 124290 }, { "epoch": 34.95, "learning_rate": 3.347265173523256e-05, "loss": 0.0487, "step": 124320 }, { "epoch": 34.96, "learning_rate": 3.345390934932684e-05, "loss": 0.0549, "step": 124350 }, { "epoch": 34.97, "learning_rate": 3.343516696342111e-05, "loss": 0.0525, "step": 124380 }, { "epoch": 34.98, "learning_rate": 3.3416424577515384e-05, "loss": 0.0541, "step": 124410 }, { "epoch": 34.98, "learning_rate": 3.339768219160966e-05, "loss": 0.0587, "step": 124440 }, { "epoch": 34.99, "learning_rate": 3.337893980570393e-05, "loss": 0.0508, "step": 124470 }, { "epoch": 35.0, "eval_loss": 0.10791715979576111, "eval_runtime": 635.3837, "eval_samples_per_second": 25.234, "eval_steps_per_second": 0.79, "eval_wer": 0.09728685873377642, "step": 124495 }, { "epoch": 35.0, "learning_rate": 3.336019741979821e-05, "loss": 0.0613, "step": 124500 }, { "epoch": 35.01, "learning_rate": 3.334145503389248e-05, "loss": 0.0491, "step": 124530 }, { "epoch": 35.02, "learning_rate": 3.332271264798676e-05, "loss": 0.0526, "step": 124560 }, { "epoch": 35.03, "learning_rate": 3.330397026208103e-05, "loss": 0.0505, "step": 124590 }, { "epoch": 35.04, "learning_rate": 3.3285227876175304e-05, "loss": 0.0519, "step": 124620 }, { "epoch": 35.04, "learning_rate": 3.326648549026958e-05, "loss": 0.0557, "step": 124650 }, { "epoch": 35.05, "learning_rate": 3.324774310436385e-05, "loss": 0.0465, "step": 124680 }, { "epoch": 35.06, "learning_rate": 3.3229000718458126e-05, "loss": 0.0514, "step": 124710 }, { "epoch": 35.07, "learning_rate": 3.32102583325524e-05, "loss": 0.0523, "step": 124740 }, { "epoch": 35.08, "learning_rate": 3.319151594664668e-05, "loss": 0.05, "step": 124770 }, { "epoch": 35.09, "learning_rate": 3.317277356074095e-05, "loss": 0.0573, "step": 124800 }, { "epoch": 35.09, "learning_rate": 3.315403117483522e-05, "loss": 0.048, "step": 124830 }, { "epoch": 35.1, "learning_rate": 3.31352887889295e-05, "loss": 0.0539, "step": 124860 }, { "epoch": 35.11, "learning_rate": 3.311654640302377e-05, "loss": 0.0501, "step": 124890 }, { "epoch": 35.12, "learning_rate": 3.3097804017118046e-05, "loss": 0.0518, "step": 124920 }, { "epoch": 35.13, "learning_rate": 3.307906163121232e-05, "loss": 0.0587, "step": 124950 }, { "epoch": 35.14, "learning_rate": 3.30603192453066e-05, "loss": 0.0495, "step": 124980 }, { "epoch": 35.14, "learning_rate": 3.304157685940087e-05, "loss": 0.054, "step": 125010 }, { "epoch": 35.15, "learning_rate": 3.302283447349514e-05, "loss": 0.0556, "step": 125040 }, { "epoch": 35.16, "learning_rate": 3.300409208758942e-05, "loss": 0.0485, "step": 125070 }, { "epoch": 35.17, "learning_rate": 3.298534970168369e-05, "loss": 0.056, "step": 125100 }, { "epoch": 35.18, "learning_rate": 3.2966607315777965e-05, "loss": 0.0501, "step": 125130 }, { "epoch": 35.19, "learning_rate": 3.294786492987224e-05, "loss": 0.0544, "step": 125160 }, { "epoch": 35.2, "learning_rate": 3.292912254396652e-05, "loss": 0.0548, "step": 125190 }, { "epoch": 35.2, "learning_rate": 3.291038015806079e-05, "loss": 0.0523, "step": 125220 }, { "epoch": 35.21, "learning_rate": 3.289163777215506e-05, "loss": 0.0596, "step": 125250 }, { "epoch": 35.22, "learning_rate": 3.2872895386249336e-05, "loss": 0.0477, "step": 125280 }, { "epoch": 35.23, "learning_rate": 3.285415300034361e-05, "loss": 0.0563, "step": 125310 }, { "epoch": 35.24, "learning_rate": 3.2835410614437884e-05, "loss": 0.0558, "step": 125340 }, { "epoch": 35.25, "learning_rate": 3.281666822853216e-05, "loss": 0.051, "step": 125370 }, { "epoch": 35.25, "learning_rate": 3.279792584262644e-05, "loss": 0.0586, "step": 125400 }, { "epoch": 35.26, "learning_rate": 3.277918345672071e-05, "loss": 0.0507, "step": 125430 }, { "epoch": 35.27, "learning_rate": 3.276106581701184e-05, "loss": 0.0542, "step": 125460 }, { "epoch": 35.28, "learning_rate": 3.2742323431106115e-05, "loss": 0.0501, "step": 125490 }, { "epoch": 35.29, "learning_rate": 3.272358104520039e-05, "loss": 0.0515, "step": 125520 }, { "epoch": 35.3, "learning_rate": 3.2704838659294664e-05, "loss": 0.0591, "step": 125550 }, { "epoch": 35.3, "learning_rate": 3.268609627338894e-05, "loss": 0.0469, "step": 125580 }, { "epoch": 35.31, "learning_rate": 3.266735388748321e-05, "loss": 0.0545, "step": 125610 }, { "epoch": 35.32, "learning_rate": 3.2648611501577486e-05, "loss": 0.051, "step": 125640 }, { "epoch": 35.33, "learning_rate": 3.262986911567176e-05, "loss": 0.048, "step": 125670 }, { "epoch": 35.34, "learning_rate": 3.2611126729766035e-05, "loss": 0.0577, "step": 125700 }, { "epoch": 35.35, "learning_rate": 3.259238434386031e-05, "loss": 0.0468, "step": 125730 }, { "epoch": 35.36, "learning_rate": 3.257364195795458e-05, "loss": 0.0567, "step": 125760 }, { "epoch": 35.36, "learning_rate": 3.255489957204886e-05, "loss": 0.0479, "step": 125790 }, { "epoch": 35.37, "learning_rate": 3.253615718614313e-05, "loss": 0.0543, "step": 125820 }, { "epoch": 35.38, "learning_rate": 3.2517414800237406e-05, "loss": 0.0594, "step": 125850 }, { "epoch": 35.39, "learning_rate": 3.249867241433168e-05, "loss": 0.0472, "step": 125880 }, { "epoch": 35.4, "learning_rate": 3.2479930028425954e-05, "loss": 0.0585, "step": 125910 }, { "epoch": 35.41, "learning_rate": 3.246118764252023e-05, "loss": 0.0516, "step": 125940 }, { "epoch": 35.41, "learning_rate": 3.24424452566145e-05, "loss": 0.0497, "step": 125970 }, { "epoch": 35.42, "learning_rate": 3.2423702870708777e-05, "loss": 0.0578, "step": 126000 }, { "epoch": 35.43, "learning_rate": 3.240496048480305e-05, "loss": 0.049, "step": 126030 }, { "epoch": 35.44, "learning_rate": 3.2386218098897325e-05, "loss": 0.0557, "step": 126060 }, { "epoch": 35.45, "learning_rate": 3.23674757129916e-05, "loss": 0.0499, "step": 126090 }, { "epoch": 35.46, "learning_rate": 3.234873332708587e-05, "loss": 0.0504, "step": 126120 }, { "epoch": 35.47, "learning_rate": 3.232999094118015e-05, "loss": 0.0612, "step": 126150 }, { "epoch": 35.47, "learning_rate": 3.231124855527442e-05, "loss": 0.0474, "step": 126180 }, { "epoch": 35.48, "learning_rate": 3.2292506169368696e-05, "loss": 0.0541, "step": 126210 }, { "epoch": 35.49, "learning_rate": 3.227376378346297e-05, "loss": 0.0512, "step": 126240 }, { "epoch": 35.5, "learning_rate": 3.2255021397557244e-05, "loss": 0.0511, "step": 126270 }, { "epoch": 35.51, "learning_rate": 3.223627901165152e-05, "loss": 0.0544, "step": 126300 }, { "epoch": 35.52, "learning_rate": 3.221753662574579e-05, "loss": 0.0462, "step": 126330 }, { "epoch": 35.52, "learning_rate": 3.219879423984007e-05, "loss": 0.0594, "step": 126360 }, { "epoch": 35.53, "learning_rate": 3.218005185393434e-05, "loss": 0.0557, "step": 126390 }, { "epoch": 35.54, "learning_rate": 3.2161309468028615e-05, "loss": 0.0517, "step": 126420 }, { "epoch": 35.55, "learning_rate": 3.214256708212289e-05, "loss": 0.0592, "step": 126450 }, { "epoch": 35.56, "learning_rate": 3.2123824696217164e-05, "loss": 0.0457, "step": 126480 }, { "epoch": 35.57, "learning_rate": 3.210508231031144e-05, "loss": 0.054, "step": 126510 }, { "epoch": 35.57, "learning_rate": 3.208633992440571e-05, "loss": 0.0495, "step": 126540 }, { "epoch": 35.58, "learning_rate": 3.2067597538499986e-05, "loss": 0.0472, "step": 126570 }, { "epoch": 35.59, "learning_rate": 3.204885515259426e-05, "loss": 0.0593, "step": 126600 }, { "epoch": 35.6, "learning_rate": 3.2030112766688535e-05, "loss": 0.0498, "step": 126630 }, { "epoch": 35.61, "learning_rate": 3.201137038078281e-05, "loss": 0.0544, "step": 126660 }, { "epoch": 35.62, "learning_rate": 3.199262799487708e-05, "loss": 0.051, "step": 126690 }, { "epoch": 35.63, "learning_rate": 3.197388560897136e-05, "loss": 0.0507, "step": 126720 }, { "epoch": 35.63, "learning_rate": 3.195514322306563e-05, "loss": 0.0566, "step": 126750 }, { "epoch": 35.64, "learning_rate": 3.1936400837159906e-05, "loss": 0.048, "step": 126780 }, { "epoch": 35.65, "learning_rate": 3.191765845125418e-05, "loss": 0.0525, "step": 126810 }, { "epoch": 35.66, "learning_rate": 3.1898916065348454e-05, "loss": 0.0537, "step": 126840 }, { "epoch": 35.67, "learning_rate": 3.188017367944273e-05, "loss": 0.0509, "step": 126870 }, { "epoch": 35.68, "learning_rate": 3.1861431293537e-05, "loss": 0.059, "step": 126900 }, { "epoch": 35.68, "learning_rate": 3.1842688907631276e-05, "loss": 0.0465, "step": 126930 }, { "epoch": 35.69, "learning_rate": 3.182394652172555e-05, "loss": 0.0535, "step": 126960 }, { "epoch": 35.7, "learning_rate": 3.1805204135819825e-05, "loss": 0.0535, "step": 126990 }, { "epoch": 35.71, "learning_rate": 3.17864617499141e-05, "loss": 0.052, "step": 127020 }, { "epoch": 35.72, "learning_rate": 3.176771936400837e-05, "loss": 0.0586, "step": 127050 }, { "epoch": 35.73, "learning_rate": 3.174897697810265e-05, "loss": 0.0485, "step": 127080 }, { "epoch": 35.74, "learning_rate": 3.173023459219692e-05, "loss": 0.0526, "step": 127110 }, { "epoch": 35.74, "learning_rate": 3.1711492206291196e-05, "loss": 0.0541, "step": 127140 }, { "epoch": 35.75, "learning_rate": 3.169274982038547e-05, "loss": 0.0537, "step": 127170 }, { "epoch": 35.76, "learning_rate": 3.1674007434479744e-05, "loss": 0.0619, "step": 127200 }, { "epoch": 35.77, "learning_rate": 3.165526504857402e-05, "loss": 0.0483, "step": 127230 }, { "epoch": 35.78, "learning_rate": 3.163652266266829e-05, "loss": 0.0515, "step": 127260 }, { "epoch": 35.79, "learning_rate": 3.161778027676257e-05, "loss": 0.0516, "step": 127290 }, { "epoch": 35.79, "learning_rate": 3.159903789085684e-05, "loss": 0.0503, "step": 127320 }, { "epoch": 35.8, "learning_rate": 3.1580295504951115e-05, "loss": 0.0573, "step": 127350 }, { "epoch": 35.81, "learning_rate": 3.156155311904539e-05, "loss": 0.0476, "step": 127380 }, { "epoch": 35.82, "learning_rate": 3.1542810733139664e-05, "loss": 0.0542, "step": 127410 }, { "epoch": 35.83, "learning_rate": 3.152406834723394e-05, "loss": 0.0506, "step": 127440 }, { "epoch": 35.84, "learning_rate": 3.150532596132821e-05, "loss": 0.0494, "step": 127470 }, { "epoch": 35.84, "learning_rate": 3.1486583575422486e-05, "loss": 0.0598, "step": 127500 }, { "epoch": 35.85, "learning_rate": 3.146784118951676e-05, "loss": 0.0495, "step": 127530 }, { "epoch": 35.86, "learning_rate": 3.1449098803611034e-05, "loss": 0.0522, "step": 127560 }, { "epoch": 35.87, "learning_rate": 3.143035641770531e-05, "loss": 0.0537, "step": 127590 }, { "epoch": 35.88, "learning_rate": 3.141161403179958e-05, "loss": 0.0524, "step": 127620 }, { "epoch": 35.89, "learning_rate": 3.139287164589386e-05, "loss": 0.0604, "step": 127650 }, { "epoch": 35.9, "learning_rate": 3.137412925998813e-05, "loss": 0.0468, "step": 127680 }, { "epoch": 35.9, "learning_rate": 3.1355386874082405e-05, "loss": 0.058, "step": 127710 }, { "epoch": 35.91, "learning_rate": 3.133664448817668e-05, "loss": 0.053, "step": 127740 }, { "epoch": 35.92, "learning_rate": 3.1317902102270954e-05, "loss": 0.0507, "step": 127770 }, { "epoch": 35.93, "learning_rate": 3.129915971636523e-05, "loss": 0.0529, "step": 127800 }, { "epoch": 35.94, "learning_rate": 3.12804173304595e-05, "loss": 0.046, "step": 127830 }, { "epoch": 35.95, "learning_rate": 3.1261674944553776e-05, "loss": 0.0518, "step": 127860 }, { "epoch": 35.95, "learning_rate": 3.124293255864805e-05, "loss": 0.0546, "step": 127890 }, { "epoch": 35.96, "learning_rate": 3.1224190172742325e-05, "loss": 0.0536, "step": 127920 }, { "epoch": 35.97, "learning_rate": 3.12054477868366e-05, "loss": 0.0564, "step": 127950 }, { "epoch": 35.98, "learning_rate": 3.118670540093087e-05, "loss": 0.0501, "step": 127980 }, { "epoch": 35.99, "learning_rate": 3.116796301502515e-05, "loss": 0.0528, "step": 128010 }, { "epoch": 36.0, "learning_rate": 3.114922062911942e-05, "loss": 0.0526, "step": 128040 }, { "epoch": 36.0, "eval_loss": 0.10677393525838852, "eval_runtime": 635.8282, "eval_samples_per_second": 25.216, "eval_steps_per_second": 0.79, "eval_wer": 0.09673413126253873, "step": 128052 }, { "epoch": 36.01, "learning_rate": 3.1130478243213696e-05, "loss": 0.0513, "step": 128070 }, { "epoch": 36.01, "learning_rate": 3.111173585730797e-05, "loss": 0.0532, "step": 128100 }, { "epoch": 36.02, "learning_rate": 3.1092993471402244e-05, "loss": 0.0461, "step": 128130 }, { "epoch": 36.03, "learning_rate": 3.107425108549652e-05, "loss": 0.0604, "step": 128160 }, { "epoch": 36.04, "learning_rate": 3.105550869959079e-05, "loss": 0.0484, "step": 128190 }, { "epoch": 36.05, "learning_rate": 3.103676631368507e-05, "loss": 0.0542, "step": 128220 }, { "epoch": 36.06, "learning_rate": 3.101802392777934e-05, "loss": 0.0546, "step": 128250 }, { "epoch": 36.06, "learning_rate": 3.0999281541873615e-05, "loss": 0.0495, "step": 128280 }, { "epoch": 36.07, "learning_rate": 3.098053915596789e-05, "loss": 0.0558, "step": 128310 }, { "epoch": 36.08, "learning_rate": 3.0961796770062163e-05, "loss": 0.0449, "step": 128340 }, { "epoch": 36.09, "learning_rate": 3.094305438415644e-05, "loss": 0.0524, "step": 128370 }, { "epoch": 36.1, "learning_rate": 3.092431199825071e-05, "loss": 0.0563, "step": 128400 }, { "epoch": 36.11, "learning_rate": 3.0905569612344986e-05, "loss": 0.0479, "step": 128430 }, { "epoch": 36.11, "learning_rate": 3.088682722643926e-05, "loss": 0.0533, "step": 128460 }, { "epoch": 36.12, "learning_rate": 3.0868084840533534e-05, "loss": 0.0508, "step": 128490 }, { "epoch": 36.13, "learning_rate": 3.084934245462781e-05, "loss": 0.0524, "step": 128520 }, { "epoch": 36.14, "learning_rate": 3.083060006872208e-05, "loss": 0.051, "step": 128550 }, { "epoch": 36.15, "learning_rate": 3.081185768281636e-05, "loss": 0.0497, "step": 128580 }, { "epoch": 36.16, "learning_rate": 3.079311529691063e-05, "loss": 0.0569, "step": 128610 }, { "epoch": 36.17, "learning_rate": 3.0774372911004905e-05, "loss": 0.0478, "step": 128640 }, { "epoch": 36.17, "learning_rate": 3.075563052509918e-05, "loss": 0.0478, "step": 128670 }, { "epoch": 36.18, "learning_rate": 3.0736888139193454e-05, "loss": 0.0542, "step": 128700 }, { "epoch": 36.19, "learning_rate": 3.071814575328773e-05, "loss": 0.0496, "step": 128730 }, { "epoch": 36.2, "learning_rate": 3.0699403367382e-05, "loss": 0.0602, "step": 128760 }, { "epoch": 36.21, "learning_rate": 3.0680660981476276e-05, "loss": 0.049, "step": 128790 }, { "epoch": 36.22, "learning_rate": 3.066191859557055e-05, "loss": 0.0547, "step": 128820 }, { "epoch": 36.22, "learning_rate": 3.0643176209664825e-05, "loss": 0.0498, "step": 128850 }, { "epoch": 36.23, "learning_rate": 3.06244338237591e-05, "loss": 0.0482, "step": 128880 }, { "epoch": 36.24, "learning_rate": 3.060569143785337e-05, "loss": 0.0574, "step": 128910 }, { "epoch": 36.25, "learning_rate": 3.058694905194765e-05, "loss": 0.047, "step": 128940 }, { "epoch": 36.26, "learning_rate": 3.056820666604192e-05, "loss": 0.0539, "step": 128970 }, { "epoch": 36.27, "learning_rate": 3.0549464280136196e-05, "loss": 0.0493, "step": 129000 }, { "epoch": 36.27, "learning_rate": 3.053072189423047e-05, "loss": 0.0476, "step": 129030 }, { "epoch": 36.28, "learning_rate": 3.0511979508324744e-05, "loss": 0.0553, "step": 129060 }, { "epoch": 36.29, "learning_rate": 3.0493237122419015e-05, "loss": 0.0472, "step": 129090 }, { "epoch": 36.3, "learning_rate": 3.0474494736513292e-05, "loss": 0.0503, "step": 129120 }, { "epoch": 36.31, "learning_rate": 3.045575235060757e-05, "loss": 0.0538, "step": 129150 }, { "epoch": 36.32, "learning_rate": 3.043700996470184e-05, "loss": 0.0469, "step": 129180 }, { "epoch": 36.33, "learning_rate": 3.041826757879612e-05, "loss": 0.056, "step": 129210 }, { "epoch": 36.33, "learning_rate": 3.039952519289039e-05, "loss": 0.0484, "step": 129240 }, { "epoch": 36.34, "learning_rate": 3.0380782806984663e-05, "loss": 0.0519, "step": 129270 }, { "epoch": 36.35, "learning_rate": 3.0362040421078934e-05, "loss": 0.0566, "step": 129300 }, { "epoch": 36.36, "learning_rate": 3.0343298035173212e-05, "loss": 0.0472, "step": 129330 }, { "epoch": 36.37, "learning_rate": 3.032455564926749e-05, "loss": 0.057, "step": 129360 }, { "epoch": 36.38, "learning_rate": 3.030581326336176e-05, "loss": 0.0478, "step": 129390 }, { "epoch": 36.38, "learning_rate": 3.0287070877456038e-05, "loss": 0.0531, "step": 129420 }, { "epoch": 36.39, "learning_rate": 3.0268953237747165e-05, "loss": 0.055, "step": 129450 }, { "epoch": 36.4, "learning_rate": 3.0250210851841443e-05, "loss": 0.0496, "step": 129480 }, { "epoch": 36.41, "learning_rate": 3.0231468465935713e-05, "loss": 0.0548, "step": 129510 }, { "epoch": 36.42, "learning_rate": 3.021272608002999e-05, "loss": 0.0471, "step": 129540 }, { "epoch": 36.43, "learning_rate": 3.0193983694124262e-05, "loss": 0.0549, "step": 129570 }, { "epoch": 36.44, "learning_rate": 3.017524130821854e-05, "loss": 0.0539, "step": 129600 }, { "epoch": 36.44, "learning_rate": 3.015649892231281e-05, "loss": 0.0463, "step": 129630 }, { "epoch": 36.45, "learning_rate": 3.0137756536407084e-05, "loss": 0.0532, "step": 129660 }, { "epoch": 36.46, "learning_rate": 3.0119014150501362e-05, "loss": 0.0468, "step": 129690 }, { "epoch": 36.47, "learning_rate": 3.0100271764595633e-05, "loss": 0.0515, "step": 129720 }, { "epoch": 36.48, "learning_rate": 3.008152937868991e-05, "loss": 0.0571, "step": 129750 }, { "epoch": 36.49, "learning_rate": 3.006278699278418e-05, "loss": 0.0492, "step": 129780 }, { "epoch": 36.49, "learning_rate": 3.004404460687846e-05, "loss": 0.0551, "step": 129810 }, { "epoch": 36.5, "learning_rate": 3.002530222097273e-05, "loss": 0.0451, "step": 129840 }, { "epoch": 36.51, "learning_rate": 3.0006559835067004e-05, "loss": 0.0528, "step": 129870 }, { "epoch": 36.52, "learning_rate": 2.998781744916128e-05, "loss": 0.0566, "step": 129900 }, { "epoch": 36.53, "learning_rate": 2.9969075063255552e-05, "loss": 0.0464, "step": 129930 }, { "epoch": 36.54, "learning_rate": 2.995033267734983e-05, "loss": 0.0537, "step": 129960 }, { "epoch": 36.54, "learning_rate": 2.99315902914441e-05, "loss": 0.0489, "step": 129990 }, { "epoch": 36.55, "learning_rate": 2.9912847905538378e-05, "loss": 0.0522, "step": 130020 }, { "epoch": 36.56, "learning_rate": 2.989410551963265e-05, "loss": 0.0513, "step": 130050 }, { "epoch": 36.57, "learning_rate": 2.9875363133726923e-05, "loss": 0.0464, "step": 130080 }, { "epoch": 36.58, "learning_rate": 2.98566207478212e-05, "loss": 0.0558, "step": 130110 }, { "epoch": 36.59, "learning_rate": 2.983787836191547e-05, "loss": 0.0463, "step": 130140 }, { "epoch": 36.6, "learning_rate": 2.981913597600975e-05, "loss": 0.0536, "step": 130170 }, { "epoch": 36.6, "learning_rate": 2.980039359010402e-05, "loss": 0.0517, "step": 130200 }, { "epoch": 36.61, "learning_rate": 2.9781651204198297e-05, "loss": 0.049, "step": 130230 }, { "epoch": 36.62, "learning_rate": 2.9762908818292568e-05, "loss": 0.0582, "step": 130260 }, { "epoch": 36.63, "learning_rate": 2.9744166432386842e-05, "loss": 0.0475, "step": 130290 }, { "epoch": 36.64, "learning_rate": 2.972542404648112e-05, "loss": 0.0558, "step": 130320 }, { "epoch": 36.65, "learning_rate": 2.970668166057539e-05, "loss": 0.0496, "step": 130350 }, { "epoch": 36.65, "learning_rate": 2.968793927466967e-05, "loss": 0.0515, "step": 130380 }, { "epoch": 36.66, "learning_rate": 2.966919688876394e-05, "loss": 0.0581, "step": 130410 }, { "epoch": 36.67, "learning_rate": 2.9650454502858217e-05, "loss": 0.048, "step": 130440 }, { "epoch": 36.68, "learning_rate": 2.9631712116952488e-05, "loss": 0.0519, "step": 130470 }, { "epoch": 36.69, "learning_rate": 2.9612969731046765e-05, "loss": 0.048, "step": 130500 }, { "epoch": 36.7, "learning_rate": 2.959422734514104e-05, "loss": 0.0496, "step": 130530 }, { "epoch": 36.7, "learning_rate": 2.957548495923531e-05, "loss": 0.0532, "step": 130560 }, { "epoch": 36.71, "learning_rate": 2.9556742573329588e-05, "loss": 0.0505, "step": 130590 }, { "epoch": 36.72, "learning_rate": 2.953800018742386e-05, "loss": 0.0524, "step": 130620 }, { "epoch": 36.73, "learning_rate": 2.9519257801518136e-05, "loss": 0.052, "step": 130650 }, { "epoch": 36.74, "learning_rate": 2.9500515415612407e-05, "loss": 0.0498, "step": 130680 }, { "epoch": 36.75, "learning_rate": 2.9481773029706685e-05, "loss": 0.0565, "step": 130710 }, { "epoch": 36.76, "learning_rate": 2.946303064380096e-05, "loss": 0.0473, "step": 130740 }, { "epoch": 36.76, "learning_rate": 2.944428825789523e-05, "loss": 0.0503, "step": 130770 }, { "epoch": 36.77, "learning_rate": 2.9425545871989507e-05, "loss": 0.0535, "step": 130800 }, { "epoch": 36.78, "learning_rate": 2.9406803486083778e-05, "loss": 0.0491, "step": 130830 }, { "epoch": 36.79, "learning_rate": 2.9388061100178055e-05, "loss": 0.0521, "step": 130860 }, { "epoch": 36.8, "learning_rate": 2.9369318714272326e-05, "loss": 0.0443, "step": 130890 }, { "epoch": 36.81, "learning_rate": 2.9350576328366604e-05, "loss": 0.0538, "step": 130920 }, { "epoch": 36.81, "learning_rate": 2.9331833942460878e-05, "loss": 0.0522, "step": 130950 }, { "epoch": 36.82, "learning_rate": 2.931309155655515e-05, "loss": 0.0501, "step": 130980 }, { "epoch": 36.83, "learning_rate": 2.9294349170649426e-05, "loss": 0.0568, "step": 131010 }, { "epoch": 36.84, "learning_rate": 2.9275606784743697e-05, "loss": 0.0475, "step": 131040 }, { "epoch": 36.85, "learning_rate": 2.9256864398837975e-05, "loss": 0.0505, "step": 131070 }, { "epoch": 36.86, "learning_rate": 2.9238746759129106e-05, "loss": 0.0537, "step": 131100 }, { "epoch": 36.87, "learning_rate": 2.922000437322338e-05, "loss": 0.0494, "step": 131130 }, { "epoch": 36.87, "learning_rate": 2.920126198731765e-05, "loss": 0.0543, "step": 131160 }, { "epoch": 36.88, "learning_rate": 2.9182519601411928e-05, "loss": 0.0461, "step": 131190 }, { "epoch": 36.89, "learning_rate": 2.91637772155062e-05, "loss": 0.0523, "step": 131220 }, { "epoch": 36.9, "learning_rate": 2.9145034829600477e-05, "loss": 0.0496, "step": 131250 }, { "epoch": 36.91, "learning_rate": 2.9126292443694754e-05, "loss": 0.0478, "step": 131280 }, { "epoch": 36.92, "learning_rate": 2.9107550057789025e-05, "loss": 0.054, "step": 131310 }, { "epoch": 36.92, "learning_rate": 2.90888076718833e-05, "loss": 0.0467, "step": 131340 }, { "epoch": 36.93, "learning_rate": 2.907006528597757e-05, "loss": 0.0542, "step": 131370 }, { "epoch": 36.94, "learning_rate": 2.9051322900071848e-05, "loss": 0.0543, "step": 131400 }, { "epoch": 36.95, "learning_rate": 2.903258051416612e-05, "loss": 0.0491, "step": 131430 }, { "epoch": 36.96, "learning_rate": 2.9013838128260396e-05, "loss": 0.0573, "step": 131460 }, { "epoch": 36.97, "learning_rate": 2.8995095742354673e-05, "loss": 0.0478, "step": 131490 }, { "epoch": 36.97, "learning_rate": 2.8976353356448944e-05, "loss": 0.0549, "step": 131520 }, { "epoch": 36.98, "learning_rate": 2.895761097054322e-05, "loss": 0.0558, "step": 131550 }, { "epoch": 36.99, "learning_rate": 2.893886858463749e-05, "loss": 0.0487, "step": 131580 }, { "epoch": 37.0, "eval_loss": 0.10814538598060608, "eval_runtime": 637.0458, "eval_samples_per_second": 25.168, "eval_steps_per_second": 0.788, "eval_wer": 0.09662495052747942, "step": 131609 }, { "epoch": 37.0, "learning_rate": 2.8920126198731767e-05, "loss": 0.0589, "step": 131610 }, { "epoch": 37.01, "learning_rate": 2.8901383812826038e-05, "loss": 0.0479, "step": 131640 }, { "epoch": 37.02, "learning_rate": 2.8882641426920315e-05, "loss": 0.0533, "step": 131670 }, { "epoch": 37.03, "learning_rate": 2.8863899041014593e-05, "loss": 0.0463, "step": 131700 }, { "epoch": 37.03, "learning_rate": 2.8845156655108864e-05, "loss": 0.048, "step": 131730 }, { "epoch": 37.04, "learning_rate": 2.8826414269203138e-05, "loss": 0.0577, "step": 131760 }, { "epoch": 37.05, "learning_rate": 2.880767188329741e-05, "loss": 0.0447, "step": 131790 }, { "epoch": 37.06, "learning_rate": 2.8788929497391686e-05, "loss": 0.0561, "step": 131820 }, { "epoch": 37.07, "learning_rate": 2.8770187111485957e-05, "loss": 0.0476, "step": 131850 }, { "epoch": 37.08, "learning_rate": 2.8751444725580235e-05, "loss": 0.0488, "step": 131880 }, { "epoch": 37.08, "learning_rate": 2.8732702339674512e-05, "loss": 0.0553, "step": 131910 }, { "epoch": 37.09, "learning_rate": 2.8713959953768783e-05, "loss": 0.0465, "step": 131940 }, { "epoch": 37.1, "learning_rate": 2.8695217567863057e-05, "loss": 0.054, "step": 131970 }, { "epoch": 37.11, "learning_rate": 2.8676475181957328e-05, "loss": 0.0475, "step": 132000 }, { "epoch": 37.12, "learning_rate": 2.8657732796051606e-05, "loss": 0.0514, "step": 132030 }, { "epoch": 37.13, "learning_rate": 2.8638990410145876e-05, "loss": 0.0529, "step": 132060 }, { "epoch": 37.14, "learning_rate": 2.8620248024240154e-05, "loss": 0.0458, "step": 132090 }, { "epoch": 37.14, "learning_rate": 2.860150563833443e-05, "loss": 0.0527, "step": 132120 }, { "epoch": 37.15, "learning_rate": 2.8582763252428702e-05, "loss": 0.0462, "step": 132150 }, { "epoch": 37.16, "learning_rate": 2.8564020866522976e-05, "loss": 0.0492, "step": 132180 }, { "epoch": 37.17, "learning_rate": 2.854527848061725e-05, "loss": 0.0535, "step": 132210 }, { "epoch": 37.18, "learning_rate": 2.8526536094711525e-05, "loss": 0.047, "step": 132240 }, { "epoch": 37.19, "learning_rate": 2.8507793708805796e-05, "loss": 0.0499, "step": 132270 }, { "epoch": 37.19, "learning_rate": 2.8489051322900073e-05, "loss": 0.0492, "step": 132300 }, { "epoch": 37.2, "learning_rate": 2.847030893699435e-05, "loss": 0.0496, "step": 132330 }, { "epoch": 37.21, "learning_rate": 2.845156655108862e-05, "loss": 0.053, "step": 132360 }, { "epoch": 37.22, "learning_rate": 2.8432824165182896e-05, "loss": 0.0445, "step": 132390 }, { "epoch": 37.23, "learning_rate": 2.841408177927717e-05, "loss": 0.054, "step": 132420 }, { "epoch": 37.24, "learning_rate": 2.8395339393371444e-05, "loss": 0.0484, "step": 132450 }, { "epoch": 37.24, "learning_rate": 2.8376597007465715e-05, "loss": 0.0499, "step": 132480 }, { "epoch": 37.25, "learning_rate": 2.8357854621559993e-05, "loss": 0.0586, "step": 132510 }, { "epoch": 37.26, "learning_rate": 2.833911223565427e-05, "loss": 0.0434, "step": 132540 }, { "epoch": 37.27, "learning_rate": 2.832036984974854e-05, "loss": 0.0539, "step": 132570 }, { "epoch": 37.28, "learning_rate": 2.830162746384282e-05, "loss": 0.0495, "step": 132600 }, { "epoch": 37.29, "learning_rate": 2.828288507793709e-05, "loss": 0.0525, "step": 132630 }, { "epoch": 37.3, "learning_rate": 2.8264142692031364e-05, "loss": 0.0548, "step": 132660 }, { "epoch": 37.3, "learning_rate": 2.8245400306125634e-05, "loss": 0.0429, "step": 132690 }, { "epoch": 37.31, "learning_rate": 2.8226657920219912e-05, "loss": 0.0552, "step": 132720 }, { "epoch": 37.32, "learning_rate": 2.820791553431419e-05, "loss": 0.0485, "step": 132750 }, { "epoch": 37.33, "learning_rate": 2.818917314840846e-05, "loss": 0.0488, "step": 132780 }, { "epoch": 37.34, "learning_rate": 2.8170430762502738e-05, "loss": 0.0592, "step": 132810 }, { "epoch": 37.35, "learning_rate": 2.815168837659701e-05, "loss": 0.0448, "step": 132840 }, { "epoch": 37.35, "learning_rate": 2.8132945990691283e-05, "loss": 0.0562, "step": 132870 }, { "epoch": 37.36, "learning_rate": 2.8114203604785554e-05, "loss": 0.0467, "step": 132900 }, { "epoch": 37.37, "learning_rate": 2.809546121887983e-05, "loss": 0.0519, "step": 132930 }, { "epoch": 37.38, "learning_rate": 2.807671883297411e-05, "loss": 0.0532, "step": 132960 }, { "epoch": 37.39, "learning_rate": 2.805797644706838e-05, "loss": 0.0442, "step": 132990 }, { "epoch": 37.4, "learning_rate": 2.8039234061162657e-05, "loss": 0.052, "step": 133020 }, { "epoch": 37.41, "learning_rate": 2.8020491675256928e-05, "loss": 0.0474, "step": 133050 }, { "epoch": 37.41, "learning_rate": 2.8001749289351202e-05, "loss": 0.0509, "step": 133080 }, { "epoch": 37.42, "learning_rate": 2.7983006903445473e-05, "loss": 0.0553, "step": 133110 }, { "epoch": 37.43, "learning_rate": 2.796426451753975e-05, "loss": 0.0439, "step": 133140 }, { "epoch": 37.44, "learning_rate": 2.794614687783088e-05, "loss": 0.0561, "step": 133170 }, { "epoch": 37.45, "learning_rate": 2.792740449192516e-05, "loss": 0.0503, "step": 133200 }, { "epoch": 37.46, "learning_rate": 2.790866210601943e-05, "loss": 0.0514, "step": 133230 }, { "epoch": 37.46, "learning_rate": 2.7889919720113704e-05, "loss": 0.0523, "step": 133260 }, { "epoch": 37.47, "learning_rate": 2.787117733420798e-05, "loss": 0.044, "step": 133290 }, { "epoch": 37.48, "learning_rate": 2.7852434948302252e-05, "loss": 0.052, "step": 133320 }, { "epoch": 37.49, "learning_rate": 2.783369256239653e-05, "loss": 0.0482, "step": 133350 }, { "epoch": 37.5, "learning_rate": 2.78149501764908e-05, "loss": 0.0521, "step": 133380 }, { "epoch": 37.51, "learning_rate": 2.7796207790585078e-05, "loss": 0.054, "step": 133410 }, { "epoch": 37.51, "learning_rate": 2.777746540467935e-05, "loss": 0.0438, "step": 133440 }, { "epoch": 37.52, "learning_rate": 2.7758723018773623e-05, "loss": 0.055, "step": 133470 }, { "epoch": 37.53, "learning_rate": 2.77399806328679e-05, "loss": 0.0471, "step": 133500 }, { "epoch": 37.54, "learning_rate": 2.772123824696217e-05, "loss": 0.0511, "step": 133530 }, { "epoch": 37.55, "learning_rate": 2.770249586105645e-05, "loss": 0.0517, "step": 133560 }, { "epoch": 37.56, "learning_rate": 2.768375347515072e-05, "loss": 0.0432, "step": 133590 }, { "epoch": 37.57, "learning_rate": 2.7665011089244998e-05, "loss": 0.0514, "step": 133620 }, { "epoch": 37.57, "learning_rate": 2.764626870333927e-05, "loss": 0.0469, "step": 133650 }, { "epoch": 37.58, "learning_rate": 2.7627526317433543e-05, "loss": 0.0526, "step": 133680 }, { "epoch": 37.59, "learning_rate": 2.760878393152782e-05, "loss": 0.0558, "step": 133710 }, { "epoch": 37.6, "learning_rate": 2.759004154562209e-05, "loss": 0.0444, "step": 133740 }, { "epoch": 37.61, "learning_rate": 2.757129915971637e-05, "loss": 0.0545, "step": 133770 }, { "epoch": 37.62, "learning_rate": 2.755255677381064e-05, "loss": 0.0502, "step": 133800 }, { "epoch": 37.62, "learning_rate": 2.7533814387904917e-05, "loss": 0.0506, "step": 133830 }, { "epoch": 37.63, "learning_rate": 2.7515072001999188e-05, "loss": 0.0556, "step": 133860 }, { "epoch": 37.64, "learning_rate": 2.7496329616093462e-05, "loss": 0.0459, "step": 133890 }, { "epoch": 37.65, "learning_rate": 2.747758723018774e-05, "loss": 0.0527, "step": 133920 }, { "epoch": 37.66, "learning_rate": 2.745884484428201e-05, "loss": 0.0477, "step": 133950 }, { "epoch": 37.67, "learning_rate": 2.7440102458376288e-05, "loss": 0.0496, "step": 133980 }, { "epoch": 37.67, "learning_rate": 2.742136007247056e-05, "loss": 0.0527, "step": 134010 }, { "epoch": 37.68, "learning_rate": 2.7402617686564836e-05, "loss": 0.0431, "step": 134040 }, { "epoch": 37.69, "learning_rate": 2.7383875300659107e-05, "loss": 0.0526, "step": 134070 }, { "epoch": 37.7, "learning_rate": 2.7365132914753385e-05, "loss": 0.0458, "step": 134100 }, { "epoch": 37.71, "learning_rate": 2.734639052884766e-05, "loss": 0.052, "step": 134130 }, { "epoch": 37.72, "learning_rate": 2.732764814294193e-05, "loss": 0.0559, "step": 134160 }, { "epoch": 37.73, "learning_rate": 2.7308905757036207e-05, "loss": 0.045, "step": 134190 }, { "epoch": 37.73, "learning_rate": 2.7290163371130478e-05, "loss": 0.0549, "step": 134220 }, { "epoch": 37.74, "learning_rate": 2.7271420985224756e-05, "loss": 0.0464, "step": 134250 }, { "epoch": 37.75, "learning_rate": 2.7252678599319026e-05, "loss": 0.054, "step": 134280 }, { "epoch": 37.76, "learning_rate": 2.7233936213413304e-05, "loss": 0.0567, "step": 134310 }, { "epoch": 37.77, "learning_rate": 2.7215193827507578e-05, "loss": 0.0458, "step": 134340 }, { "epoch": 37.78, "learning_rate": 2.719645144160185e-05, "loss": 0.0567, "step": 134370 }, { "epoch": 37.78, "learning_rate": 2.7177709055696127e-05, "loss": 0.0451, "step": 134400 }, { "epoch": 37.79, "learning_rate": 2.7158966669790397e-05, "loss": 0.0499, "step": 134430 }, { "epoch": 37.8, "learning_rate": 2.7140224283884675e-05, "loss": 0.0555, "step": 134460 }, { "epoch": 37.81, "learning_rate": 2.7121481897978946e-05, "loss": 0.0448, "step": 134490 }, { "epoch": 37.82, "learning_rate": 2.7102739512073223e-05, "loss": 0.0525, "step": 134520 }, { "epoch": 37.83, "learning_rate": 2.7083997126167498e-05, "loss": 0.0479, "step": 134550 }, { "epoch": 37.84, "learning_rate": 2.706525474026177e-05, "loss": 0.0523, "step": 134580 }, { "epoch": 37.84, "learning_rate": 2.7046512354356046e-05, "loss": 0.0534, "step": 134610 }, { "epoch": 37.85, "learning_rate": 2.7027769968450317e-05, "loss": 0.0463, "step": 134640 }, { "epoch": 37.86, "learning_rate": 2.7009027582544594e-05, "loss": 0.054, "step": 134670 }, { "epoch": 37.87, "learning_rate": 2.6990285196638865e-05, "loss": 0.0463, "step": 134700 }, { "epoch": 37.88, "learning_rate": 2.6971542810733143e-05, "loss": 0.0491, "step": 134730 }, { "epoch": 37.89, "learning_rate": 2.6952800424827413e-05, "loss": 0.0543, "step": 134760 }, { "epoch": 37.89, "learning_rate": 2.6934058038921688e-05, "loss": 0.043, "step": 134790 }, { "epoch": 37.9, "learning_rate": 2.6915315653015965e-05, "loss": 0.0539, "step": 134820 }, { "epoch": 37.91, "learning_rate": 2.6896573267110236e-05, "loss": 0.0457, "step": 134850 }, { "epoch": 37.92, "learning_rate": 2.6877830881204514e-05, "loss": 0.054, "step": 134880 }, { "epoch": 37.93, "learning_rate": 2.6859088495298784e-05, "loss": 0.053, "step": 134910 }, { "epoch": 37.94, "learning_rate": 2.6840346109393062e-05, "loss": 0.0456, "step": 134940 }, { "epoch": 37.94, "learning_rate": 2.6821603723487333e-05, "loss": 0.0602, "step": 134970 }, { "epoch": 37.95, "learning_rate": 2.6802861337581607e-05, "loss": 0.0468, "step": 135000 }, { "epoch": 37.96, "learning_rate": 2.6784118951675885e-05, "loss": 0.0524, "step": 135030 }, { "epoch": 37.97, "learning_rate": 2.6765376565770155e-05, "loss": 0.0577, "step": 135060 }, { "epoch": 37.98, "learning_rate": 2.6746634179864433e-05, "loss": 0.0447, "step": 135090 }, { "epoch": 37.99, "learning_rate": 2.6727891793958704e-05, "loss": 0.0546, "step": 135120 }, { "epoch": 38.0, "learning_rate": 2.670914940805298e-05, "loss": 0.0495, "step": 135150 }, { "epoch": 38.0, "eval_loss": 0.1098802462220192, "eval_runtime": 637.127, "eval_samples_per_second": 25.165, "eval_steps_per_second": 0.788, "eval_wer": 0.09562867632006332, "step": 135166 }, { "epoch": 38.0, "learning_rate": 2.6690407022147252e-05, "loss": 0.052, "step": 135180 }, { "epoch": 38.01, "learning_rate": 2.6671664636241526e-05, "loss": 0.049, "step": 135210 }, { "epoch": 38.02, "learning_rate": 2.6652922250335804e-05, "loss": 0.0482, "step": 135240 }, { "epoch": 38.03, "learning_rate": 2.6634179864430075e-05, "loss": 0.0553, "step": 135270 }, { "epoch": 38.04, "learning_rate": 2.6615437478524352e-05, "loss": 0.0441, "step": 135300 }, { "epoch": 38.05, "learning_rate": 2.6596695092618623e-05, "loss": 0.0528, "step": 135330 }, { "epoch": 38.05, "learning_rate": 2.65779527067129e-05, "loss": 0.051, "step": 135360 }, { "epoch": 38.06, "learning_rate": 2.655921032080717e-05, "loss": 0.052, "step": 135390 }, { "epoch": 38.07, "learning_rate": 2.6540467934901446e-05, "loss": 0.0558, "step": 135420 }, { "epoch": 38.08, "learning_rate": 2.6521725548995723e-05, "loss": 0.0429, "step": 135450 }, { "epoch": 38.09, "learning_rate": 2.6502983163089994e-05, "loss": 0.0495, "step": 135480 }, { "epoch": 38.1, "learning_rate": 2.648424077718427e-05, "loss": 0.0512, "step": 135510 }, { "epoch": 38.11, "learning_rate": 2.6465498391278542e-05, "loss": 0.0514, "step": 135540 }, { "epoch": 38.11, "learning_rate": 2.644675600537282e-05, "loss": 0.0523, "step": 135570 }, { "epoch": 38.12, "learning_rate": 2.642801361946709e-05, "loss": 0.0454, "step": 135600 }, { "epoch": 38.13, "learning_rate": 2.640927123356137e-05, "loss": 0.0533, "step": 135630 }, { "epoch": 38.14, "learning_rate": 2.6390528847655643e-05, "loss": 0.0502, "step": 135660 }, { "epoch": 38.15, "learning_rate": 2.6371786461749913e-05, "loss": 0.0519, "step": 135690 }, { "epoch": 38.16, "learning_rate": 2.635304407584419e-05, "loss": 0.0581, "step": 135720 }, { "epoch": 38.16, "learning_rate": 2.6334301689938462e-05, "loss": 0.046, "step": 135750 }, { "epoch": 38.17, "learning_rate": 2.631555930403274e-05, "loss": 0.0523, "step": 135780 }, { "epoch": 38.18, "learning_rate": 2.629681691812701e-05, "loss": 0.0493, "step": 135810 }, { "epoch": 38.19, "learning_rate": 2.6278074532221288e-05, "loss": 0.049, "step": 135840 }, { "epoch": 38.2, "learning_rate": 2.6259332146315562e-05, "loss": 0.0556, "step": 135870 }, { "epoch": 38.21, "learning_rate": 2.6240589760409833e-05, "loss": 0.0444, "step": 135900 }, { "epoch": 38.21, "learning_rate": 2.622184737450411e-05, "loss": 0.0517, "step": 135930 }, { "epoch": 38.22, "learning_rate": 2.620310498859838e-05, "loss": 0.047, "step": 135960 }, { "epoch": 38.23, "learning_rate": 2.618436260269266e-05, "loss": 0.051, "step": 135990 }, { "epoch": 38.24, "learning_rate": 2.616562021678693e-05, "loss": 0.0575, "step": 136020 }, { "epoch": 38.25, "learning_rate": 2.6146877830881207e-05, "loss": 0.0442, "step": 136050 }, { "epoch": 38.26, "learning_rate": 2.612813544497548e-05, "loss": 0.0539, "step": 136080 }, { "epoch": 38.27, "learning_rate": 2.6109393059069752e-05, "loss": 0.0468, "step": 136110 }, { "epoch": 38.27, "learning_rate": 2.609065067316403e-05, "loss": 0.0506, "step": 136140 }, { "epoch": 38.28, "learning_rate": 2.60719082872583e-05, "loss": 0.0533, "step": 136170 }, { "epoch": 38.29, "learning_rate": 2.6053165901352578e-05, "loss": 0.0438, "step": 136200 }, { "epoch": 38.3, "learning_rate": 2.603442351544685e-05, "loss": 0.052, "step": 136230 }, { "epoch": 38.31, "learning_rate": 2.6015681129541126e-05, "loss": 0.048, "step": 136260 }, { "epoch": 38.32, "learning_rate": 2.59969387436354e-05, "loss": 0.0481, "step": 136290 }, { "epoch": 38.32, "learning_rate": 2.597819635772967e-05, "loss": 0.0495, "step": 136320 }, { "epoch": 38.33, "learning_rate": 2.595945397182395e-05, "loss": 0.0414, "step": 136350 }, { "epoch": 38.34, "learning_rate": 2.594071158591822e-05, "loss": 0.0542, "step": 136380 }, { "epoch": 38.35, "learning_rate": 2.5921969200012497e-05, "loss": 0.0479, "step": 136410 }, { "epoch": 38.36, "learning_rate": 2.5903226814106768e-05, "loss": 0.0471, "step": 136440 }, { "epoch": 38.37, "learning_rate": 2.5884484428201046e-05, "loss": 0.0562, "step": 136470 }, { "epoch": 38.37, "learning_rate": 2.586574204229532e-05, "loss": 0.0458, "step": 136500 }, { "epoch": 38.38, "learning_rate": 2.584699965638959e-05, "loss": 0.054, "step": 136530 }, { "epoch": 38.39, "learning_rate": 2.582825727048387e-05, "loss": 0.0503, "step": 136560 }, { "epoch": 38.4, "learning_rate": 2.580951488457814e-05, "loss": 0.0487, "step": 136590 }, { "epoch": 38.41, "learning_rate": 2.5790772498672417e-05, "loss": 0.051, "step": 136620 }, { "epoch": 38.42, "learning_rate": 2.5772030112766688e-05, "loss": 0.0447, "step": 136650 }, { "epoch": 38.43, "learning_rate": 2.5753287726860965e-05, "loss": 0.056, "step": 136680 }, { "epoch": 38.43, "learning_rate": 2.573454534095524e-05, "loss": 0.051, "step": 136710 }, { "epoch": 38.44, "learning_rate": 2.571580295504951e-05, "loss": 0.0496, "step": 136740 }, { "epoch": 38.45, "learning_rate": 2.5697060569143788e-05, "loss": 0.0507, "step": 136770 }, { "epoch": 38.46, "learning_rate": 2.567831818323806e-05, "loss": 0.044, "step": 136800 }, { "epoch": 38.47, "learning_rate": 2.5659575797332336e-05, "loss": 0.0494, "step": 136830 }, { "epoch": 38.48, "learning_rate": 2.5640833411426607e-05, "loss": 0.0449, "step": 136860 }, { "epoch": 38.48, "learning_rate": 2.5622091025520884e-05, "loss": 0.0472, "step": 136890 }, { "epoch": 38.49, "learning_rate": 2.560334863961516e-05, "loss": 0.0534, "step": 136920 }, { "epoch": 38.5, "learning_rate": 2.558460625370943e-05, "loss": 0.0444, "step": 136950 }, { "epoch": 38.51, "learning_rate": 2.5565863867803707e-05, "loss": 0.0541, "step": 136980 }, { "epoch": 38.52, "learning_rate": 2.5547121481897978e-05, "loss": 0.0465, "step": 137010 }, { "epoch": 38.53, "learning_rate": 2.5528379095992255e-05, "loss": 0.05, "step": 137040 }, { "epoch": 38.54, "learning_rate": 2.5509636710086526e-05, "loss": 0.0532, "step": 137070 }, { "epoch": 38.54, "learning_rate": 2.5490894324180804e-05, "loss": 0.0436, "step": 137100 }, { "epoch": 38.55, "learning_rate": 2.5472151938275078e-05, "loss": 0.0514, "step": 137130 }, { "epoch": 38.56, "learning_rate": 2.5453409552369352e-05, "loss": 0.0508, "step": 137160 }, { "epoch": 38.57, "learning_rate": 2.5434667166463626e-05, "loss": 0.0493, "step": 137190 }, { "epoch": 38.58, "learning_rate": 2.5415924780557897e-05, "loss": 0.05, "step": 137220 }, { "epoch": 38.59, "learning_rate": 2.5397182394652175e-05, "loss": 0.0418, "step": 137250 }, { "epoch": 38.59, "learning_rate": 2.5378440008746446e-05, "loss": 0.0512, "step": 137280 }, { "epoch": 38.6, "learning_rate": 2.5359697622840723e-05, "loss": 0.0473, "step": 137310 }, { "epoch": 38.61, "learning_rate": 2.5340955236934997e-05, "loss": 0.0474, "step": 137340 }, { "epoch": 38.62, "learning_rate": 2.532221285102927e-05, "loss": 0.0537, "step": 137370 }, { "epoch": 38.63, "learning_rate": 2.5303470465123546e-05, "loss": 0.0508, "step": 137400 }, { "epoch": 38.64, "learning_rate": 2.5284728079217816e-05, "loss": 0.0531, "step": 137430 }, { "epoch": 38.64, "learning_rate": 2.5265985693312094e-05, "loss": 0.049, "step": 137460 }, { "epoch": 38.65, "learning_rate": 2.5247243307406365e-05, "loss": 0.0497, "step": 137490 }, { "epoch": 38.66, "learning_rate": 2.5228500921500642e-05, "loss": 0.0526, "step": 137520 }, { "epoch": 38.67, "learning_rate": 2.520975853559492e-05, "loss": 0.0469, "step": 137550 }, { "epoch": 38.68, "learning_rate": 2.519101614968919e-05, "loss": 0.0548, "step": 137580 }, { "epoch": 38.69, "learning_rate": 2.5172273763783465e-05, "loss": 0.048, "step": 137610 }, { "epoch": 38.7, "learning_rate": 2.5153531377877736e-05, "loss": 0.0488, "step": 137640 }, { "epoch": 38.7, "learning_rate": 2.5134788991972013e-05, "loss": 0.0507, "step": 137670 }, { "epoch": 38.71, "learning_rate": 2.5116046606066284e-05, "loss": 0.0436, "step": 137700 }, { "epoch": 38.72, "learning_rate": 2.5097304220160562e-05, "loss": 0.05, "step": 137730 }, { "epoch": 38.73, "learning_rate": 2.507856183425484e-05, "loss": 0.0472, "step": 137760 }, { "epoch": 38.74, "learning_rate": 2.505981944834911e-05, "loss": 0.0484, "step": 137790 }, { "epoch": 38.75, "learning_rate": 2.5041077062443384e-05, "loss": 0.0549, "step": 137820 }, { "epoch": 38.75, "learning_rate": 2.5022334676537655e-05, "loss": 0.0427, "step": 137850 }, { "epoch": 38.76, "learning_rate": 2.5003592290631933e-05, "loss": 0.049, "step": 137880 }, { "epoch": 38.77, "learning_rate": 2.4984849904726207e-05, "loss": 0.0511, "step": 137910 }, { "epoch": 38.78, "learning_rate": 2.496610751882048e-05, "loss": 0.0531, "step": 137940 }, { "epoch": 38.79, "learning_rate": 2.4947365132914755e-05, "loss": 0.0552, "step": 137970 }, { "epoch": 38.8, "learning_rate": 2.492862274700903e-05, "loss": 0.0423, "step": 138000 }, { "epoch": 38.81, "learning_rate": 2.4909880361103304e-05, "loss": 0.0531, "step": 138030 }, { "epoch": 38.81, "learning_rate": 2.4891137975197574e-05, "loss": 0.0495, "step": 138060 }, { "epoch": 38.82, "learning_rate": 2.4872395589291852e-05, "loss": 0.0525, "step": 138090 }, { "epoch": 38.83, "learning_rate": 2.4853653203386126e-05, "loss": 0.0569, "step": 138120 }, { "epoch": 38.84, "learning_rate": 2.48349108174804e-05, "loss": 0.0427, "step": 138150 }, { "epoch": 38.85, "learning_rate": 2.4816168431574675e-05, "loss": 0.0517, "step": 138180 }, { "epoch": 38.86, "learning_rate": 2.479742604566895e-05, "loss": 0.0502, "step": 138210 }, { "epoch": 38.86, "learning_rate": 2.4778683659763223e-05, "loss": 0.0503, "step": 138240 }, { "epoch": 38.87, "learning_rate": 2.4759941273857494e-05, "loss": 0.0548, "step": 138270 }, { "epoch": 38.88, "learning_rate": 2.474119888795177e-05, "loss": 0.0434, "step": 138300 }, { "epoch": 38.89, "learning_rate": 2.4722456502046046e-05, "loss": 0.0521, "step": 138330 }, { "epoch": 38.9, "learning_rate": 2.470371411614032e-05, "loss": 0.0496, "step": 138360 }, { "epoch": 38.91, "learning_rate": 2.4684971730234594e-05, "loss": 0.0475, "step": 138390 }, { "epoch": 38.91, "learning_rate": 2.4666229344328868e-05, "loss": 0.0546, "step": 138420 }, { "epoch": 38.92, "learning_rate": 2.4647486958423142e-05, "loss": 0.0424, "step": 138450 }, { "epoch": 38.93, "learning_rate": 2.4628744572517417e-05, "loss": 0.049, "step": 138480 }, { "epoch": 38.94, "learning_rate": 2.461000218661169e-05, "loss": 0.0477, "step": 138510 }, { "epoch": 38.95, "learning_rate": 2.4591259800705965e-05, "loss": 0.049, "step": 138540 }, { "epoch": 38.96, "learning_rate": 2.457251741480024e-05, "loss": 0.0525, "step": 138570 }, { "epoch": 38.97, "learning_rate": 2.4553775028894513e-05, "loss": 0.0475, "step": 138600 }, { "epoch": 38.97, "learning_rate": 2.4535032642988787e-05, "loss": 0.0506, "step": 138630 }, { "epoch": 38.98, "learning_rate": 2.451629025708306e-05, "loss": 0.0492, "step": 138660 }, { "epoch": 38.99, "learning_rate": 2.4497547871177336e-05, "loss": 0.0504, "step": 138690 }, { "epoch": 39.0, "learning_rate": 2.447880548527161e-05, "loss": 0.0528, "step": 138720 }, { "epoch": 39.0, "eval_loss": 0.10912308096885681, "eval_runtime": 638.8233, "eval_samples_per_second": 25.098, "eval_steps_per_second": 0.786, "eval_wer": 0.09225772112510748, "step": 138723 }, { "epoch": 39.01, "learning_rate": 2.4460063099365884e-05, "loss": 0.0436, "step": 138750 }, { "epoch": 39.02, "learning_rate": 2.444132071346016e-05, "loss": 0.0513, "step": 138780 }, { "epoch": 39.02, "learning_rate": 2.4422578327554433e-05, "loss": 0.0455, "step": 138810 }, { "epoch": 39.03, "learning_rate": 2.4403835941648707e-05, "loss": 0.0498, "step": 138840 }, { "epoch": 39.04, "learning_rate": 2.438509355574298e-05, "loss": 0.0536, "step": 138870 }, { "epoch": 39.05, "learning_rate": 2.4366351169837255e-05, "loss": 0.0494, "step": 138900 }, { "epoch": 39.06, "learning_rate": 2.434760878393153e-05, "loss": 0.0533, "step": 138930 }, { "epoch": 39.07, "learning_rate": 2.4328866398025804e-05, "loss": 0.0448, "step": 138960 }, { "epoch": 39.08, "learning_rate": 2.4310124012120078e-05, "loss": 0.0487, "step": 138990 }, { "epoch": 39.08, "learning_rate": 2.4291381626214352e-05, "loss": 0.0519, "step": 139020 }, { "epoch": 39.09, "learning_rate": 2.4272639240308626e-05, "loss": 0.0456, "step": 139050 }, { "epoch": 39.1, "learning_rate": 2.42538968544029e-05, "loss": 0.0544, "step": 139080 }, { "epoch": 39.11, "learning_rate": 2.4235154468497175e-05, "loss": 0.0442, "step": 139110 }, { "epoch": 39.12, "learning_rate": 2.4216412082591445e-05, "loss": 0.0504, "step": 139140 }, { "epoch": 39.13, "learning_rate": 2.4197669696685723e-05, "loss": 0.0515, "step": 139170 }, { "epoch": 39.13, "learning_rate": 2.4178927310779997e-05, "loss": 0.048, "step": 139200 }, { "epoch": 39.14, "learning_rate": 2.4160809671071128e-05, "loss": 0.0524, "step": 139230 }, { "epoch": 39.15, "learning_rate": 2.4142067285165405e-05, "loss": 0.0433, "step": 139260 }, { "epoch": 39.16, "learning_rate": 2.4123324899259676e-05, "loss": 0.0522, "step": 139290 }, { "epoch": 39.17, "learning_rate": 2.410458251335395e-05, "loss": 0.0488, "step": 139320 }, { "epoch": 39.18, "learning_rate": 2.4085840127448225e-05, "loss": 0.0492, "step": 139350 }, { "epoch": 39.18, "learning_rate": 2.40670977415425e-05, "loss": 0.0539, "step": 139380 }, { "epoch": 39.19, "learning_rate": 2.4048355355636773e-05, "loss": 0.0471, "step": 139410 }, { "epoch": 39.2, "learning_rate": 2.4029612969731047e-05, "loss": 0.0495, "step": 139440 }, { "epoch": 39.21, "learning_rate": 2.4010870583825325e-05, "loss": 0.0476, "step": 139470 }, { "epoch": 39.22, "learning_rate": 2.3992128197919596e-05, "loss": 0.0442, "step": 139500 }, { "epoch": 39.23, "learning_rate": 2.3974010558210726e-05, "loss": 0.056, "step": 139530 }, { "epoch": 39.24, "learning_rate": 2.3955268172305e-05, "loss": 0.0435, "step": 139560 }, { "epoch": 39.24, "learning_rate": 2.3936525786399278e-05, "loss": 0.0481, "step": 139590 }, { "epoch": 39.25, "learning_rate": 2.3917783400493552e-05, "loss": 0.0475, "step": 139620 }, { "epoch": 39.26, "learning_rate": 2.3899041014587827e-05, "loss": 0.046, "step": 139650 }, { "epoch": 39.27, "learning_rate": 2.3880298628682097e-05, "loss": 0.0509, "step": 139680 }, { "epoch": 39.28, "learning_rate": 2.386155624277637e-05, "loss": 0.0425, "step": 139710 }, { "epoch": 39.29, "learning_rate": 2.3842813856870646e-05, "loss": 0.0489, "step": 139740 }, { "epoch": 39.29, "learning_rate": 2.382407147096492e-05, "loss": 0.0473, "step": 139770 }, { "epoch": 39.3, "learning_rate": 2.3805329085059198e-05, "loss": 0.0466, "step": 139800 }, { "epoch": 39.31, "learning_rate": 2.3786586699153472e-05, "loss": 0.0507, "step": 139830 }, { "epoch": 39.32, "learning_rate": 2.3767844313247746e-05, "loss": 0.0441, "step": 139860 }, { "epoch": 39.33, "learning_rate": 2.374910192734202e-05, "loss": 0.0471, "step": 139890 }, { "epoch": 39.34, "learning_rate": 2.373035954143629e-05, "loss": 0.0481, "step": 139920 }, { "epoch": 39.34, "learning_rate": 2.3711617155530565e-05, "loss": 0.0456, "step": 139950 }, { "epoch": 39.35, "learning_rate": 2.369287476962484e-05, "loss": 0.051, "step": 139980 }, { "epoch": 39.36, "learning_rate": 2.3674757129915974e-05, "loss": 0.0442, "step": 140010 }, { "epoch": 39.37, "learning_rate": 2.3656014744010248e-05, "loss": 0.0502, "step": 140040 }, { "epoch": 39.38, "learning_rate": 2.3637272358104522e-05, "loss": 0.0486, "step": 140070 }, { "epoch": 39.39, "learning_rate": 2.3618529972198793e-05, "loss": 0.0443, "step": 140100 }, { "epoch": 39.4, "learning_rate": 2.359978758629307e-05, "loss": 0.0518, "step": 140130 }, { "epoch": 39.4, "learning_rate": 2.3581045200387344e-05, "loss": 0.0425, "step": 140160 }, { "epoch": 39.41, "learning_rate": 2.356230281448162e-05, "loss": 0.0484, "step": 140190 }, { "epoch": 39.42, "learning_rate": 2.3543560428575893e-05, "loss": 0.0488, "step": 140220 }, { "epoch": 39.43, "learning_rate": 2.3524818042670167e-05, "loss": 0.0442, "step": 140250 }, { "epoch": 39.44, "learning_rate": 2.350607565676444e-05, "loss": 0.0506, "step": 140280 }, { "epoch": 39.45, "learning_rate": 2.3487333270858712e-05, "loss": 0.0439, "step": 140310 }, { "epoch": 39.45, "learning_rate": 2.346859088495299e-05, "loss": 0.0493, "step": 140340 }, { "epoch": 39.46, "learning_rate": 2.3449848499047264e-05, "loss": 0.0473, "step": 140370 }, { "epoch": 39.47, "learning_rate": 2.3431106113141538e-05, "loss": 0.0457, "step": 140400 }, { "epoch": 39.48, "learning_rate": 2.3412363727235812e-05, "loss": 0.0582, "step": 140430 }, { "epoch": 39.49, "learning_rate": 2.3393621341330086e-05, "loss": 0.0452, "step": 140460 }, { "epoch": 39.5, "learning_rate": 2.337487895542436e-05, "loss": 0.0515, "step": 140490 }, { "epoch": 39.51, "learning_rate": 2.335613656951863e-05, "loss": 0.0503, "step": 140520 }, { "epoch": 39.51, "learning_rate": 2.333739418361291e-05, "loss": 0.0451, "step": 140550 }, { "epoch": 39.52, "learning_rate": 2.3318651797707183e-05, "loss": 0.0513, "step": 140580 }, { "epoch": 39.53, "learning_rate": 2.3299909411801457e-05, "loss": 0.0424, "step": 140610 }, { "epoch": 39.54, "learning_rate": 2.328116702589573e-05, "loss": 0.0492, "step": 140640 }, { "epoch": 39.55, "learning_rate": 2.3262424639990006e-05, "loss": 0.0483, "step": 140670 }, { "epoch": 39.56, "learning_rate": 2.324368225408428e-05, "loss": 0.0481, "step": 140700 }, { "epoch": 39.56, "learning_rate": 2.322493986817855e-05, "loss": 0.0511, "step": 140730 }, { "epoch": 39.57, "learning_rate": 2.3206197482272828e-05, "loss": 0.0433, "step": 140760 }, { "epoch": 39.58, "learning_rate": 2.3187455096367102e-05, "loss": 0.0507, "step": 140790 }, { "epoch": 39.59, "learning_rate": 2.3168712710461377e-05, "loss": 0.0484, "step": 140820 }, { "epoch": 39.6, "learning_rate": 2.314997032455565e-05, "loss": 0.0444, "step": 140850 }, { "epoch": 39.61, "learning_rate": 2.3131227938649925e-05, "loss": 0.0502, "step": 140880 }, { "epoch": 39.61, "learning_rate": 2.31124855527442e-05, "loss": 0.0455, "step": 140910 }, { "epoch": 39.62, "learning_rate": 2.3093743166838473e-05, "loss": 0.0492, "step": 140940 }, { "epoch": 39.63, "learning_rate": 2.3075000780932748e-05, "loss": 0.0495, "step": 140970 }, { "epoch": 39.64, "learning_rate": 2.3056258395027022e-05, "loss": 0.0457, "step": 141000 }, { "epoch": 39.65, "learning_rate": 2.3037516009121296e-05, "loss": 0.0528, "step": 141030 }, { "epoch": 39.66, "learning_rate": 2.301877362321557e-05, "loss": 0.0445, "step": 141060 }, { "epoch": 39.67, "learning_rate": 2.3000031237309844e-05, "loss": 0.0516, "step": 141090 }, { "epoch": 39.67, "learning_rate": 2.298128885140412e-05, "loss": 0.0505, "step": 141120 }, { "epoch": 39.68, "learning_rate": 2.2962546465498393e-05, "loss": 0.0474, "step": 141150 }, { "epoch": 39.69, "learning_rate": 2.2943804079592667e-05, "loss": 0.053, "step": 141180 }, { "epoch": 39.7, "learning_rate": 2.292506169368694e-05, "loss": 0.0444, "step": 141210 }, { "epoch": 39.71, "learning_rate": 2.2906319307781215e-05, "loss": 0.0514, "step": 141240 }, { "epoch": 39.72, "learning_rate": 2.288757692187549e-05, "loss": 0.0473, "step": 141270 }, { "epoch": 39.72, "learning_rate": 2.2868834535969764e-05, "loss": 0.0458, "step": 141300 }, { "epoch": 39.73, "learning_rate": 2.2850092150064038e-05, "loss": 0.0488, "step": 141330 }, { "epoch": 39.74, "learning_rate": 2.2831349764158312e-05, "loss": 0.0445, "step": 141360 }, { "epoch": 39.75, "learning_rate": 2.2812607378252586e-05, "loss": 0.0499, "step": 141390 }, { "epoch": 39.76, "learning_rate": 2.279386499234686e-05, "loss": 0.0468, "step": 141420 }, { "epoch": 39.77, "learning_rate": 2.2775122606441135e-05, "loss": 0.0469, "step": 141450 }, { "epoch": 39.77, "learning_rate": 2.275638022053541e-05, "loss": 0.051, "step": 141480 }, { "epoch": 39.78, "learning_rate": 2.2737637834629683e-05, "loss": 0.0447, "step": 141510 }, { "epoch": 39.79, "learning_rate": 2.2718895448723957e-05, "loss": 0.0507, "step": 141540 }, { "epoch": 39.8, "learning_rate": 2.270015306281823e-05, "loss": 0.0491, "step": 141570 }, { "epoch": 39.81, "learning_rate": 2.2681410676912506e-05, "loss": 0.0457, "step": 141600 }, { "epoch": 39.82, "learning_rate": 2.266266829100678e-05, "loss": 0.0533, "step": 141630 }, { "epoch": 39.83, "learning_rate": 2.2643925905101054e-05, "loss": 0.0461, "step": 141660 }, { "epoch": 39.83, "learning_rate": 2.2625183519195328e-05, "loss": 0.0498, "step": 141690 }, { "epoch": 39.84, "learning_rate": 2.2606441133289602e-05, "loss": 0.0464, "step": 141720 }, { "epoch": 39.85, "learning_rate": 2.2587698747383877e-05, "loss": 0.0485, "step": 141750 }, { "epoch": 39.86, "learning_rate": 2.256895636147815e-05, "loss": 0.0518, "step": 141780 }, { "epoch": 39.87, "learning_rate": 2.2550213975572425e-05, "loss": 0.0455, "step": 141810 }, { "epoch": 39.88, "learning_rate": 2.25314715896667e-05, "loss": 0.0485, "step": 141840 }, { "epoch": 39.88, "learning_rate": 2.2512729203760973e-05, "loss": 0.0484, "step": 141870 }, { "epoch": 39.89, "learning_rate": 2.2493986817855248e-05, "loss": 0.0443, "step": 141900 }, { "epoch": 39.9, "learning_rate": 2.2475244431949522e-05, "loss": 0.0533, "step": 141930 }, { "epoch": 39.91, "learning_rate": 2.2456502046043796e-05, "loss": 0.0425, "step": 141960 }, { "epoch": 39.92, "learning_rate": 2.243775966013807e-05, "loss": 0.0512, "step": 141990 }, { "epoch": 39.93, "learning_rate": 2.2419017274232344e-05, "loss": 0.048, "step": 142020 }, { "epoch": 39.94, "learning_rate": 2.240027488832662e-05, "loss": 0.0449, "step": 142050 }, { "epoch": 39.94, "learning_rate": 2.2381532502420893e-05, "loss": 0.0504, "step": 142080 }, { "epoch": 39.95, "learning_rate": 2.2362790116515167e-05, "loss": 0.046, "step": 142110 }, { "epoch": 39.96, "learning_rate": 2.234404773060944e-05, "loss": 0.0503, "step": 142140 }, { "epoch": 39.97, "learning_rate": 2.2325305344703715e-05, "loss": 0.048, "step": 142170 }, { "epoch": 39.98, "learning_rate": 2.230656295879799e-05, "loss": 0.0443, "step": 142200 }, { "epoch": 39.99, "learning_rate": 2.2287820572892264e-05, "loss": 0.0524, "step": 142230 }, { "epoch": 39.99, "learning_rate": 2.2269078186986538e-05, "loss": 0.0439, "step": 142260 }, { "epoch": 40.0, "eval_loss": 0.11113700270652771, "eval_runtime": 639.3379, "eval_samples_per_second": 25.078, "eval_steps_per_second": 0.785, "eval_wer": 0.09283774378011, "step": 142280 }, { "epoch": 40.0, "learning_rate": 2.2250335801080812e-05, "loss": 0.0503, "step": 142290 }, { "epoch": 40.01, "learning_rate": 2.2231593415175086e-05, "loss": 0.0457, "step": 142320 }, { "epoch": 40.02, "learning_rate": 2.221285102926936e-05, "loss": 0.0462, "step": 142350 }, { "epoch": 40.03, "learning_rate": 2.2194108643363635e-05, "loss": 0.0556, "step": 142380 }, { "epoch": 40.04, "learning_rate": 2.217536625745791e-05, "loss": 0.0438, "step": 142410 }, { "epoch": 40.04, "learning_rate": 2.2156623871552183e-05, "loss": 0.0529, "step": 142440 }, { "epoch": 40.05, "learning_rate": 2.2137881485646457e-05, "loss": 0.0455, "step": 142470 }, { "epoch": 40.06, "learning_rate": 2.211913909974073e-05, "loss": 0.0481, "step": 142500 }, { "epoch": 40.07, "learning_rate": 2.2100396713835006e-05, "loss": 0.0507, "step": 142530 }, { "epoch": 40.08, "learning_rate": 2.208165432792928e-05, "loss": 0.0408, "step": 142560 }, { "epoch": 40.09, "learning_rate": 2.2062911942023554e-05, "loss": 0.0499, "step": 142590 }, { "epoch": 40.1, "learning_rate": 2.2044169556117828e-05, "loss": 0.047, "step": 142620 }, { "epoch": 40.1, "learning_rate": 2.2025427170212102e-05, "loss": 0.0508, "step": 142650 }, { "epoch": 40.11, "learning_rate": 2.2006684784306376e-05, "loss": 0.0545, "step": 142680 }, { "epoch": 40.12, "learning_rate": 2.198794239840065e-05, "loss": 0.0441, "step": 142710 }, { "epoch": 40.13, "learning_rate": 2.1969200012494925e-05, "loss": 0.0481, "step": 142740 }, { "epoch": 40.14, "learning_rate": 2.19504576265892e-05, "loss": 0.0413, "step": 142770 }, { "epoch": 40.15, "learning_rate": 2.1931715240683473e-05, "loss": 0.0474, "step": 142800 }, { "epoch": 40.15, "learning_rate": 2.1912972854777747e-05, "loss": 0.0528, "step": 142830 }, { "epoch": 40.16, "learning_rate": 2.189423046887202e-05, "loss": 0.0418, "step": 142860 }, { "epoch": 40.17, "learning_rate": 2.1875488082966296e-05, "loss": 0.052, "step": 142890 }, { "epoch": 40.18, "learning_rate": 2.185674569706057e-05, "loss": 0.046, "step": 142920 }, { "epoch": 40.19, "learning_rate": 2.1838003311154844e-05, "loss": 0.051, "step": 142950 }, { "epoch": 40.2, "learning_rate": 2.181926092524912e-05, "loss": 0.0523, "step": 142980 }, { "epoch": 40.21, "learning_rate": 2.1800518539343393e-05, "loss": 0.0429, "step": 143010 }, { "epoch": 40.21, "learning_rate": 2.1781776153437667e-05, "loss": 0.0557, "step": 143040 }, { "epoch": 40.22, "learning_rate": 2.176303376753194e-05, "loss": 0.0443, "step": 143070 }, { "epoch": 40.23, "learning_rate": 2.1744291381626215e-05, "loss": 0.0497, "step": 143100 }, { "epoch": 40.24, "learning_rate": 2.172554899572049e-05, "loss": 0.0501, "step": 143130 }, { "epoch": 40.25, "learning_rate": 2.1706806609814764e-05, "loss": 0.0427, "step": 143160 }, { "epoch": 40.26, "learning_rate": 2.1688064223909038e-05, "loss": 0.0508, "step": 143190 }, { "epoch": 40.26, "learning_rate": 2.1669321838003312e-05, "loss": 0.0432, "step": 143220 }, { "epoch": 40.27, "learning_rate": 2.1650579452097586e-05, "loss": 0.0461, "step": 143250 }, { "epoch": 40.28, "learning_rate": 2.163183706619186e-05, "loss": 0.0521, "step": 143280 }, { "epoch": 40.29, "learning_rate": 2.1613094680286134e-05, "loss": 0.0412, "step": 143310 }, { "epoch": 40.3, "learning_rate": 2.159435229438041e-05, "loss": 0.0514, "step": 143340 }, { "epoch": 40.31, "learning_rate": 2.1575609908474683e-05, "loss": 0.0456, "step": 143370 }, { "epoch": 40.31, "learning_rate": 2.1556867522568957e-05, "loss": 0.0478, "step": 143400 }, { "epoch": 40.32, "learning_rate": 2.153812513666323e-05, "loss": 0.0549, "step": 143430 }, { "epoch": 40.33, "learning_rate": 2.1519382750757505e-05, "loss": 0.0435, "step": 143460 }, { "epoch": 40.34, "learning_rate": 2.150064036485178e-05, "loss": 0.0512, "step": 143490 }, { "epoch": 40.35, "learning_rate": 2.1481897978946054e-05, "loss": 0.0442, "step": 143520 }, { "epoch": 40.36, "learning_rate": 2.1463155593040328e-05, "loss": 0.0485, "step": 143550 }, { "epoch": 40.37, "learning_rate": 2.1444413207134602e-05, "loss": 0.0531, "step": 143580 }, { "epoch": 40.37, "learning_rate": 2.1425670821228876e-05, "loss": 0.0427, "step": 143610 }, { "epoch": 40.38, "learning_rate": 2.140692843532315e-05, "loss": 0.0512, "step": 143640 }, { "epoch": 40.39, "learning_rate": 2.1388186049417425e-05, "loss": 0.0457, "step": 143670 }, { "epoch": 40.4, "learning_rate": 2.13694436635117e-05, "loss": 0.0507, "step": 143700 }, { "epoch": 40.41, "learning_rate": 2.1350701277605973e-05, "loss": 0.0557, "step": 143730 }, { "epoch": 40.42, "learning_rate": 2.1331958891700247e-05, "loss": 0.0413, "step": 143760 }, { "epoch": 40.42, "learning_rate": 2.131321650579452e-05, "loss": 0.0532, "step": 143790 }, { "epoch": 40.43, "learning_rate": 2.1294474119888796e-05, "loss": 0.0416, "step": 143820 }, { "epoch": 40.44, "learning_rate": 2.127573173398307e-05, "loss": 0.0473, "step": 143850 }, { "epoch": 40.45, "learning_rate": 2.1256989348077344e-05, "loss": 0.0498, "step": 143880 }, { "epoch": 40.46, "learning_rate": 2.1238246962171618e-05, "loss": 0.0436, "step": 143910 }, { "epoch": 40.47, "learning_rate": 2.1219504576265892e-05, "loss": 0.0515, "step": 143940 }, { "epoch": 40.48, "learning_rate": 2.1200762190360167e-05, "loss": 0.0457, "step": 143970 }, { "epoch": 40.48, "learning_rate": 2.118201980445444e-05, "loss": 0.0488, "step": 144000 }, { "epoch": 40.49, "learning_rate": 2.1163277418548715e-05, "loss": 0.0554, "step": 144030 }, { "epoch": 40.5, "learning_rate": 2.114453503264299e-05, "loss": 0.0446, "step": 144060 }, { "epoch": 40.51, "learning_rate": 2.1125792646737263e-05, "loss": 0.0502, "step": 144090 }, { "epoch": 40.52, "learning_rate": 2.1107050260831538e-05, "loss": 0.044, "step": 144120 }, { "epoch": 40.53, "learning_rate": 2.1088307874925812e-05, "loss": 0.0516, "step": 144150 }, { "epoch": 40.53, "learning_rate": 2.106956548902009e-05, "loss": 0.051, "step": 144180 }, { "epoch": 40.54, "learning_rate": 2.105082310311436e-05, "loss": 0.0438, "step": 144210 }, { "epoch": 40.55, "learning_rate": 2.1032080717208634e-05, "loss": 0.0522, "step": 144240 }, { "epoch": 40.56, "learning_rate": 2.101333833130291e-05, "loss": 0.0459, "step": 144270 }, { "epoch": 40.57, "learning_rate": 2.0995220691594043e-05, "loss": 0.0482, "step": 144300 }, { "epoch": 40.58, "learning_rate": 2.0976478305688317e-05, "loss": 0.0515, "step": 144330 }, { "epoch": 40.58, "learning_rate": 2.095773591978259e-05, "loss": 0.0426, "step": 144360 }, { "epoch": 40.59, "learning_rate": 2.0938993533876862e-05, "loss": 0.0516, "step": 144390 }, { "epoch": 40.6, "learning_rate": 2.0920251147971136e-05, "loss": 0.0457, "step": 144420 }, { "epoch": 40.61, "learning_rate": 2.090150876206541e-05, "loss": 0.0468, "step": 144450 }, { "epoch": 40.62, "learning_rate": 2.0882766376159685e-05, "loss": 0.0532, "step": 144480 }, { "epoch": 40.63, "learning_rate": 2.0864023990253962e-05, "loss": 0.0425, "step": 144510 }, { "epoch": 40.64, "learning_rate": 2.0845281604348236e-05, "loss": 0.0508, "step": 144540 }, { "epoch": 40.64, "learning_rate": 2.082653921844251e-05, "loss": 0.0456, "step": 144570 }, { "epoch": 40.65, "learning_rate": 2.080779683253678e-05, "loss": 0.0467, "step": 144600 }, { "epoch": 40.66, "learning_rate": 2.0789054446631055e-05, "loss": 0.0505, "step": 144630 }, { "epoch": 40.67, "learning_rate": 2.077031206072533e-05, "loss": 0.0424, "step": 144660 }, { "epoch": 40.68, "learning_rate": 2.0751569674819604e-05, "loss": 0.0491, "step": 144690 }, { "epoch": 40.69, "learning_rate": 2.073282728891388e-05, "loss": 0.0431, "step": 144720 }, { "epoch": 40.69, "learning_rate": 2.0714084903008156e-05, "loss": 0.0458, "step": 144750 }, { "epoch": 40.7, "learning_rate": 2.069534251710243e-05, "loss": 0.0513, "step": 144780 }, { "epoch": 40.71, "learning_rate": 2.06766001311967e-05, "loss": 0.041, "step": 144810 }, { "epoch": 40.72, "learning_rate": 2.0657857745290975e-05, "loss": 0.0546, "step": 144840 }, { "epoch": 40.73, "learning_rate": 2.063911535938525e-05, "loss": 0.0447, "step": 144870 }, { "epoch": 40.74, "learning_rate": 2.0620372973479523e-05, "loss": 0.0511, "step": 144900 }, { "epoch": 40.74, "learning_rate": 2.06016305875738e-05, "loss": 0.0482, "step": 144930 }, { "epoch": 40.75, "learning_rate": 2.0582888201668075e-05, "loss": 0.0414, "step": 144960 }, { "epoch": 40.76, "learning_rate": 2.056414581576235e-05, "loss": 0.0523, "step": 144990 }, { "epoch": 40.77, "learning_rate": 2.0545403429856623e-05, "loss": 0.0448, "step": 145020 }, { "epoch": 40.78, "learning_rate": 2.0526661043950894e-05, "loss": 0.0475, "step": 145050 }, { "epoch": 40.79, "learning_rate": 2.050791865804517e-05, "loss": 0.054, "step": 145080 }, { "epoch": 40.8, "learning_rate": 2.0489176272139443e-05, "loss": 0.0422, "step": 145110 }, { "epoch": 40.8, "learning_rate": 2.047043388623372e-05, "loss": 0.0482, "step": 145140 }, { "epoch": 40.81, "learning_rate": 2.0451691500327994e-05, "loss": 0.0455, "step": 145170 }, { "epoch": 40.82, "learning_rate": 2.043294911442227e-05, "loss": 0.0511, "step": 145200 }, { "epoch": 40.83, "learning_rate": 2.0414206728516543e-05, "loss": 0.0521, "step": 145230 }, { "epoch": 40.84, "learning_rate": 2.0395464342610814e-05, "loss": 0.0433, "step": 145260 }, { "epoch": 40.85, "learning_rate": 2.0376721956705088e-05, "loss": 0.0507, "step": 145290 }, { "epoch": 40.85, "learning_rate": 2.0357979570799362e-05, "loss": 0.0464, "step": 145320 }, { "epoch": 40.86, "learning_rate": 2.033923718489364e-05, "loss": 0.0489, "step": 145350 }, { "epoch": 40.87, "learning_rate": 2.0320494798987914e-05, "loss": 0.0514, "step": 145380 }, { "epoch": 40.88, "learning_rate": 2.0301752413082188e-05, "loss": 0.0415, "step": 145410 }, { "epoch": 40.89, "learning_rate": 2.0283010027176462e-05, "loss": 0.0503, "step": 145440 }, { "epoch": 40.9, "learning_rate": 2.0264267641270733e-05, "loss": 0.0423, "step": 145470 }, { "epoch": 40.91, "learning_rate": 2.0245525255365007e-05, "loss": 0.046, "step": 145500 }, { "epoch": 40.91, "learning_rate": 2.022678286945928e-05, "loss": 0.0506, "step": 145530 }, { "epoch": 40.92, "learning_rate": 2.020804048355356e-05, "loss": 0.0412, "step": 145560 }, { "epoch": 40.93, "learning_rate": 2.0189298097647833e-05, "loss": 0.0478, "step": 145590 }, { "epoch": 40.94, "learning_rate": 2.0170555711742107e-05, "loss": 0.0421, "step": 145620 }, { "epoch": 40.95, "learning_rate": 2.015181332583638e-05, "loss": 0.0475, "step": 145650 }, { "epoch": 40.96, "learning_rate": 2.0133070939930652e-05, "loss": 0.0545, "step": 145680 }, { "epoch": 40.96, "learning_rate": 2.0114328554024926e-05, "loss": 0.0397, "step": 145710 }, { "epoch": 40.97, "learning_rate": 2.00955861681192e-05, "loss": 0.0521, "step": 145740 }, { "epoch": 40.98, "learning_rate": 2.0076843782213478e-05, "loss": 0.0468, "step": 145770 }, { "epoch": 40.99, "learning_rate": 2.0058101396307752e-05, "loss": 0.0452, "step": 145800 }, { "epoch": 41.0, "learning_rate": 2.0039359010402027e-05, "loss": 0.0467, "step": 145830 }, { "epoch": 41.0, "eval_loss": 0.11312602460384369, "eval_runtime": 638.4663, "eval_samples_per_second": 25.112, "eval_steps_per_second": 0.786, "eval_wer": 0.0942707409277633, "step": 145837 }, { "epoch": 41.01, "learning_rate": 2.00206166244963e-05, "loss": 0.0413, "step": 145860 }, { "epoch": 41.01, "learning_rate": 2.0001874238590575e-05, "loss": 0.0531, "step": 145890 }, { "epoch": 41.02, "learning_rate": 1.9983131852684846e-05, "loss": 0.0386, "step": 145920 }, { "epoch": 41.03, "learning_rate": 1.996438946677912e-05, "loss": 0.052, "step": 145950 }, { "epoch": 41.04, "learning_rate": 1.9945647080873397e-05, "loss": 0.045, "step": 145980 }, { "epoch": 41.05, "learning_rate": 1.992690469496767e-05, "loss": 0.0489, "step": 146010 }, { "epoch": 41.06, "learning_rate": 1.9908162309061946e-05, "loss": 0.0522, "step": 146040 }, { "epoch": 41.07, "learning_rate": 1.988941992315622e-05, "loss": 0.0404, "step": 146070 }, { "epoch": 41.07, "learning_rate": 1.9870677537250494e-05, "loss": 0.0487, "step": 146100 }, { "epoch": 41.08, "learning_rate": 1.9851935151344765e-05, "loss": 0.0445, "step": 146130 }, { "epoch": 41.09, "learning_rate": 1.983319276543904e-05, "loss": 0.0485, "step": 146160 }, { "epoch": 41.1, "learning_rate": 1.9814450379533313e-05, "loss": 0.0515, "step": 146190 }, { "epoch": 41.11, "learning_rate": 1.979570799362759e-05, "loss": 0.0427, "step": 146220 }, { "epoch": 41.12, "learning_rate": 1.9776965607721865e-05, "loss": 0.0506, "step": 146250 }, { "epoch": 41.12, "learning_rate": 1.975822322181614e-05, "loss": 0.0434, "step": 146280 }, { "epoch": 41.13, "learning_rate": 1.9739480835910414e-05, "loss": 0.0502, "step": 146310 }, { "epoch": 41.14, "learning_rate": 1.9720738450004684e-05, "loss": 0.0519, "step": 146340 }, { "epoch": 41.15, "learning_rate": 1.970199606409896e-05, "loss": 0.0417, "step": 146370 }, { "epoch": 41.16, "learning_rate": 1.9683253678193233e-05, "loss": 0.0464, "step": 146400 }, { "epoch": 41.17, "learning_rate": 1.966451129228751e-05, "loss": 0.0434, "step": 146430 }, { "epoch": 41.18, "learning_rate": 1.9645768906381785e-05, "loss": 0.0471, "step": 146460 }, { "epoch": 41.18, "learning_rate": 1.962702652047606e-05, "loss": 0.0537, "step": 146490 }, { "epoch": 41.19, "learning_rate": 1.9608284134570333e-05, "loss": 0.0401, "step": 146520 }, { "epoch": 41.2, "learning_rate": 1.9590166494861464e-05, "loss": 0.0486, "step": 146550 }, { "epoch": 41.21, "learning_rate": 1.9571424108955738e-05, "loss": 0.0462, "step": 146580 }, { "epoch": 41.22, "learning_rate": 1.9552681723050012e-05, "loss": 0.0493, "step": 146610 }, { "epoch": 41.23, "learning_rate": 1.9533939337144286e-05, "loss": 0.0523, "step": 146640 }, { "epoch": 41.23, "learning_rate": 1.951519695123856e-05, "loss": 0.0411, "step": 146670 }, { "epoch": 41.24, "learning_rate": 1.9496454565332835e-05, "loss": 0.0496, "step": 146700 }, { "epoch": 41.25, "learning_rate": 1.947771217942711e-05, "loss": 0.0441, "step": 146730 }, { "epoch": 41.26, "learning_rate": 1.9458969793521383e-05, "loss": 0.0498, "step": 146760 }, { "epoch": 41.27, "learning_rate": 1.9440227407615657e-05, "loss": 0.0515, "step": 146790 }, { "epoch": 41.28, "learning_rate": 1.942148502170993e-05, "loss": 0.0423, "step": 146820 }, { "epoch": 41.28, "learning_rate": 1.9402742635804206e-05, "loss": 0.0516, "step": 146850 }, { "epoch": 41.29, "learning_rate": 1.938400024989848e-05, "loss": 0.0434, "step": 146880 }, { "epoch": 41.3, "learning_rate": 1.9365257863992754e-05, "loss": 0.0443, "step": 146910 }, { "epoch": 41.31, "learning_rate": 1.9346515478087028e-05, "loss": 0.0485, "step": 146940 }, { "epoch": 41.32, "learning_rate": 1.9327773092181302e-05, "loss": 0.04, "step": 146970 }, { "epoch": 41.33, "learning_rate": 1.9309030706275577e-05, "loss": 0.0501, "step": 147000 }, { "epoch": 41.34, "learning_rate": 1.929028832036985e-05, "loss": 0.044, "step": 147030 }, { "epoch": 41.34, "learning_rate": 1.9271545934464125e-05, "loss": 0.0485, "step": 147060 }, { "epoch": 41.35, "learning_rate": 1.92528035485584e-05, "loss": 0.0517, "step": 147090 }, { "epoch": 41.36, "learning_rate": 1.9234061162652673e-05, "loss": 0.0399, "step": 147120 }, { "epoch": 41.37, "learning_rate": 1.9215318776746948e-05, "loss": 0.0464, "step": 147150 }, { "epoch": 41.38, "learning_rate": 1.9196576390841222e-05, "loss": 0.0431, "step": 147180 }, { "epoch": 41.39, "learning_rate": 1.9177834004935496e-05, "loss": 0.0474, "step": 147210 }, { "epoch": 41.39, "learning_rate": 1.915909161902977e-05, "loss": 0.0512, "step": 147240 }, { "epoch": 41.4, "learning_rate": 1.9140349233124044e-05, "loss": 0.0411, "step": 147270 }, { "epoch": 41.41, "learning_rate": 1.912160684721832e-05, "loss": 0.0512, "step": 147300 }, { "epoch": 41.42, "learning_rate": 1.9102864461312593e-05, "loss": 0.0447, "step": 147330 }, { "epoch": 41.43, "learning_rate": 1.9084122075406867e-05, "loss": 0.0464, "step": 147360 }, { "epoch": 41.44, "learning_rate": 1.906537968950114e-05, "loss": 0.0502, "step": 147390 }, { "epoch": 41.44, "learning_rate": 1.9046637303595415e-05, "loss": 0.0453, "step": 147420 }, { "epoch": 41.45, "learning_rate": 1.902789491768969e-05, "loss": 0.0513, "step": 147450 }, { "epoch": 41.46, "learning_rate": 1.9009152531783964e-05, "loss": 0.0459, "step": 147480 }, { "epoch": 41.47, "learning_rate": 1.8990410145878238e-05, "loss": 0.0495, "step": 147510 }, { "epoch": 41.48, "learning_rate": 1.8971667759972512e-05, "loss": 0.0525, "step": 147540 }, { "epoch": 41.49, "learning_rate": 1.8952925374066786e-05, "loss": 0.0421, "step": 147570 }, { "epoch": 41.5, "learning_rate": 1.893418298816106e-05, "loss": 0.0518, "step": 147600 }, { "epoch": 41.5, "learning_rate": 1.8915440602255335e-05, "loss": 0.0475, "step": 147630 }, { "epoch": 41.51, "learning_rate": 1.889669821634961e-05, "loss": 0.0458, "step": 147660 }, { "epoch": 41.52, "learning_rate": 1.8877955830443883e-05, "loss": 0.0468, "step": 147690 }, { "epoch": 41.53, "learning_rate": 1.8859213444538157e-05, "loss": 0.0425, "step": 147720 }, { "epoch": 41.54, "learning_rate": 1.884047105863243e-05, "loss": 0.0476, "step": 147750 }, { "epoch": 41.55, "learning_rate": 1.8821728672726706e-05, "loss": 0.0477, "step": 147780 }, { "epoch": 41.55, "learning_rate": 1.880298628682098e-05, "loss": 0.0452, "step": 147810 }, { "epoch": 41.56, "learning_rate": 1.8784243900915254e-05, "loss": 0.0555, "step": 147840 }, { "epoch": 41.57, "learning_rate": 1.8765501515009528e-05, "loss": 0.0411, "step": 147870 }, { "epoch": 41.58, "learning_rate": 1.8746759129103802e-05, "loss": 0.0509, "step": 147900 }, { "epoch": 41.59, "learning_rate": 1.8728016743198076e-05, "loss": 0.0476, "step": 147930 }, { "epoch": 41.6, "learning_rate": 1.870927435729235e-05, "loss": 0.0464, "step": 147960 }, { "epoch": 41.61, "learning_rate": 1.8690531971386625e-05, "loss": 0.0508, "step": 147990 }, { "epoch": 41.61, "learning_rate": 1.86717895854809e-05, "loss": 0.0404, "step": 148020 }, { "epoch": 41.62, "learning_rate": 1.8653047199575173e-05, "loss": 0.0501, "step": 148050 }, { "epoch": 41.63, "learning_rate": 1.8634304813669447e-05, "loss": 0.0441, "step": 148080 }, { "epoch": 41.64, "learning_rate": 1.861556242776372e-05, "loss": 0.0497, "step": 148110 }, { "epoch": 41.65, "learning_rate": 1.8596820041857996e-05, "loss": 0.0502, "step": 148140 }, { "epoch": 41.66, "learning_rate": 1.857807765595227e-05, "loss": 0.0446, "step": 148170 }, { "epoch": 41.66, "learning_rate": 1.8559335270046544e-05, "loss": 0.0494, "step": 148200 }, { "epoch": 41.67, "learning_rate": 1.854059288414082e-05, "loss": 0.046, "step": 148230 }, { "epoch": 41.68, "learning_rate": 1.8521850498235093e-05, "loss": 0.0496, "step": 148260 }, { "epoch": 41.69, "learning_rate": 1.8503108112329367e-05, "loss": 0.0507, "step": 148290 }, { "epoch": 41.7, "learning_rate": 1.848436572642364e-05, "loss": 0.0428, "step": 148320 }, { "epoch": 41.71, "learning_rate": 1.8465623340517915e-05, "loss": 0.0497, "step": 148350 }, { "epoch": 41.71, "learning_rate": 1.844688095461219e-05, "loss": 0.0442, "step": 148380 }, { "epoch": 41.72, "learning_rate": 1.8428138568706464e-05, "loss": 0.046, "step": 148410 }, { "epoch": 41.73, "learning_rate": 1.8409396182800738e-05, "loss": 0.0528, "step": 148440 }, { "epoch": 41.74, "learning_rate": 1.8390653796895012e-05, "loss": 0.0437, "step": 148470 }, { "epoch": 41.75, "learning_rate": 1.8371911410989286e-05, "loss": 0.0488, "step": 148500 }, { "epoch": 41.76, "learning_rate": 1.835316902508356e-05, "loss": 0.0432, "step": 148530 }, { "epoch": 41.77, "learning_rate": 1.8334426639177834e-05, "loss": 0.0449, "step": 148560 }, { "epoch": 41.77, "learning_rate": 1.831568425327211e-05, "loss": 0.0497, "step": 148590 }, { "epoch": 41.78, "learning_rate": 1.8296941867366383e-05, "loss": 0.0405, "step": 148620 }, { "epoch": 41.79, "learning_rate": 1.827819948146066e-05, "loss": 0.0477, "step": 148650 }, { "epoch": 41.8, "learning_rate": 1.825945709555493e-05, "loss": 0.0475, "step": 148680 }, { "epoch": 41.81, "learning_rate": 1.8240714709649205e-05, "loss": 0.0458, "step": 148710 }, { "epoch": 41.82, "learning_rate": 1.8222597069940336e-05, "loss": 0.0518, "step": 148740 }, { "epoch": 41.82, "learning_rate": 1.8203854684034614e-05, "loss": 0.0404, "step": 148770 }, { "epoch": 41.83, "learning_rate": 1.8185112298128888e-05, "loss": 0.0518, "step": 148800 }, { "epoch": 41.84, "learning_rate": 1.8166369912223162e-05, "loss": 0.0473, "step": 148830 }, { "epoch": 41.85, "learning_rate": 1.8147627526317433e-05, "loss": 0.0467, "step": 148860 }, { "epoch": 41.86, "learning_rate": 1.8128885140411707e-05, "loss": 0.0526, "step": 148890 }, { "epoch": 41.87, "learning_rate": 1.811014275450598e-05, "loss": 0.0419, "step": 148920 }, { "epoch": 41.88, "learning_rate": 1.8091400368600256e-05, "loss": 0.0469, "step": 148950 }, { "epoch": 41.88, "learning_rate": 1.8072657982694533e-05, "loss": 0.0447, "step": 148980 }, { "epoch": 41.89, "learning_rate": 1.8053915596788807e-05, "loss": 0.0468, "step": 149010 }, { "epoch": 41.9, "learning_rate": 1.803517321088308e-05, "loss": 0.0538, "step": 149040 }, { "epoch": 41.91, "learning_rate": 1.8016430824977352e-05, "loss": 0.0428, "step": 149070 }, { "epoch": 41.92, "learning_rate": 1.7997688439071627e-05, "loss": 0.0545, "step": 149100 }, { "epoch": 41.93, "learning_rate": 1.79789460531659e-05, "loss": 0.0454, "step": 149130 }, { "epoch": 41.93, "learning_rate": 1.7960203667260175e-05, "loss": 0.0485, "step": 149160 }, { "epoch": 41.94, "learning_rate": 1.7941461281354453e-05, "loss": 0.0502, "step": 149190 }, { "epoch": 41.95, "learning_rate": 1.7922718895448727e-05, "loss": 0.0414, "step": 149220 }, { "epoch": 41.96, "learning_rate": 1.7903976509543e-05, "loss": 0.0513, "step": 149250 }, { "epoch": 41.97, "learning_rate": 1.788523412363727e-05, "loss": 0.045, "step": 149280 }, { "epoch": 41.98, "learning_rate": 1.7866491737731546e-05, "loss": 0.0451, "step": 149310 }, { "epoch": 41.98, "learning_rate": 1.784774935182582e-05, "loss": 0.0508, "step": 149340 }, { "epoch": 41.99, "learning_rate": 1.7829006965920094e-05, "loss": 0.0407, "step": 149370 }, { "epoch": 42.0, "eval_loss": 0.11148813366889954, "eval_runtime": 636.4424, "eval_samples_per_second": 25.192, "eval_steps_per_second": 0.789, "eval_wer": 0.09436627407094018, "step": 149394 }, { "epoch": 42.0, "learning_rate": 1.781088932621123e-05, "loss": 0.0539, "step": 149400 }, { "epoch": 42.01, "learning_rate": 1.7792146940305503e-05, "loss": 0.0409, "step": 149430 }, { "epoch": 42.02, "learning_rate": 1.7773404554399773e-05, "loss": 0.048, "step": 149460 }, { "epoch": 42.03, "learning_rate": 1.7754662168494048e-05, "loss": 0.0473, "step": 149490 }, { "epoch": 42.04, "learning_rate": 1.7735919782588325e-05, "loss": 0.0433, "step": 149520 }, { "epoch": 42.04, "learning_rate": 1.77171773966826e-05, "loss": 0.052, "step": 149550 }, { "epoch": 42.05, "learning_rate": 1.7698435010776874e-05, "loss": 0.0433, "step": 149580 }, { "epoch": 42.06, "learning_rate": 1.7679692624871148e-05, "loss": 0.0482, "step": 149610 }, { "epoch": 42.07, "learning_rate": 1.7660950238965422e-05, "loss": 0.0459, "step": 149640 }, { "epoch": 42.08, "learning_rate": 1.7642207853059696e-05, "loss": 0.0441, "step": 149670 }, { "epoch": 42.09, "learning_rate": 1.7623465467153967e-05, "loss": 0.0496, "step": 149700 }, { "epoch": 42.09, "learning_rate": 1.7604723081248245e-05, "loss": 0.0389, "step": 149730 }, { "epoch": 42.1, "learning_rate": 1.758598069534252e-05, "loss": 0.053, "step": 149760 }, { "epoch": 42.11, "learning_rate": 1.7567238309436793e-05, "loss": 0.0473, "step": 149790 }, { "epoch": 42.12, "learning_rate": 1.7548495923531067e-05, "loss": 0.0428, "step": 149820 }, { "epoch": 42.13, "learning_rate": 1.752975353762534e-05, "loss": 0.0514, "step": 149850 }, { "epoch": 42.14, "learning_rate": 1.7511011151719616e-05, "loss": 0.0408, "step": 149880 }, { "epoch": 42.15, "learning_rate": 1.7492268765813886e-05, "loss": 0.0472, "step": 149910 }, { "epoch": 42.15, "learning_rate": 1.7473526379908164e-05, "loss": 0.0492, "step": 149940 }, { "epoch": 42.16, "learning_rate": 1.7454783994002438e-05, "loss": 0.0426, "step": 149970 }, { "epoch": 42.17, "learning_rate": 1.7436041608096712e-05, "loss": 0.0493, "step": 150000 }, { "epoch": 42.18, "learning_rate": 1.7417299222190986e-05, "loss": 0.0446, "step": 150030 }, { "epoch": 42.19, "learning_rate": 1.739855683628526e-05, "loss": 0.0493, "step": 150060 }, { "epoch": 42.2, "learning_rate": 1.7379814450379535e-05, "loss": 0.0479, "step": 150090 }, { "epoch": 42.2, "learning_rate": 1.7361072064473806e-05, "loss": 0.0453, "step": 150120 }, { "epoch": 42.21, "learning_rate": 1.7342329678568083e-05, "loss": 0.0462, "step": 150150 }, { "epoch": 42.22, "learning_rate": 1.7323587292662357e-05, "loss": 0.0405, "step": 150180 }, { "epoch": 42.23, "learning_rate": 1.730484490675663e-05, "loss": 0.0468, "step": 150210 }, { "epoch": 42.24, "learning_rate": 1.7286102520850906e-05, "loss": 0.0468, "step": 150240 }, { "epoch": 42.25, "learning_rate": 1.726736013494518e-05, "loss": 0.0441, "step": 150270 }, { "epoch": 42.25, "learning_rate": 1.7248617749039454e-05, "loss": 0.052, "step": 150300 }, { "epoch": 42.26, "learning_rate": 1.722987536313373e-05, "loss": 0.0412, "step": 150330 }, { "epoch": 42.27, "learning_rate": 1.7211132977228003e-05, "loss": 0.0487, "step": 150360 }, { "epoch": 42.28, "learning_rate": 1.7192390591322277e-05, "loss": 0.0435, "step": 150390 }, { "epoch": 42.29, "learning_rate": 1.717364820541655e-05, "loss": 0.0477, "step": 150420 }, { "epoch": 42.3, "learning_rate": 1.7154905819510825e-05, "loss": 0.0489, "step": 150450 }, { "epoch": 42.31, "learning_rate": 1.71361634336051e-05, "loss": 0.0396, "step": 150480 }, { "epoch": 42.31, "learning_rate": 1.7117421047699374e-05, "loss": 0.0493, "step": 150510 }, { "epoch": 42.32, "learning_rate": 1.7098678661793648e-05, "loss": 0.0462, "step": 150540 }, { "epoch": 42.33, "learning_rate": 1.707993627588792e-05, "loss": 0.0435, "step": 150570 }, { "epoch": 42.34, "learning_rate": 1.7061193889982196e-05, "loss": 0.0469, "step": 150600 }, { "epoch": 42.35, "learning_rate": 1.704245150407647e-05, "loss": 0.0437, "step": 150630 }, { "epoch": 42.36, "learning_rate": 1.7023709118170744e-05, "loss": 0.0497, "step": 150660 }, { "epoch": 42.36, "learning_rate": 1.700496673226502e-05, "loss": 0.046, "step": 150690 }, { "epoch": 42.37, "learning_rate": 1.6986224346359293e-05, "loss": 0.0441, "step": 150720 }, { "epoch": 42.38, "learning_rate": 1.6967481960453567e-05, "loss": 0.0489, "step": 150750 }, { "epoch": 42.39, "learning_rate": 1.6948739574547838e-05, "loss": 0.0424, "step": 150780 }, { "epoch": 42.4, "learning_rate": 1.6929997188642115e-05, "loss": 0.0485, "step": 150810 }, { "epoch": 42.41, "learning_rate": 1.691125480273639e-05, "loss": 0.0467, "step": 150840 }, { "epoch": 42.41, "learning_rate": 1.6892512416830664e-05, "loss": 0.0445, "step": 150870 }, { "epoch": 42.42, "learning_rate": 1.6873770030924938e-05, "loss": 0.0545, "step": 150900 }, { "epoch": 42.43, "learning_rate": 1.6855027645019212e-05, "loss": 0.0424, "step": 150930 }, { "epoch": 42.44, "learning_rate": 1.6836285259113486e-05, "loss": 0.0482, "step": 150960 }, { "epoch": 42.45, "learning_rate": 1.681754287320776e-05, "loss": 0.0488, "step": 150990 }, { "epoch": 42.46, "learning_rate": 1.6798800487302035e-05, "loss": 0.0445, "step": 151020 }, { "epoch": 42.47, "learning_rate": 1.678005810139631e-05, "loss": 0.0499, "step": 151050 }, { "epoch": 42.47, "learning_rate": 1.6761315715490583e-05, "loss": 0.0422, "step": 151080 }, { "epoch": 42.48, "learning_rate": 1.6742573329584857e-05, "loss": 0.0489, "step": 151110 }, { "epoch": 42.49, "learning_rate": 1.672383094367913e-05, "loss": 0.0473, "step": 151140 }, { "epoch": 42.5, "learning_rate": 1.6705088557773406e-05, "loss": 0.0437, "step": 151170 }, { "epoch": 42.51, "learning_rate": 1.668634617186768e-05, "loss": 0.051, "step": 151200 }, { "epoch": 42.52, "learning_rate": 1.6667603785961954e-05, "loss": 0.0397, "step": 151230 }, { "epoch": 42.52, "learning_rate": 1.6648861400056228e-05, "loss": 0.0487, "step": 151260 }, { "epoch": 42.53, "learning_rate": 1.6630119014150502e-05, "loss": 0.0448, "step": 151290 }, { "epoch": 42.54, "learning_rate": 1.6611376628244777e-05, "loss": 0.0438, "step": 151320 }, { "epoch": 42.55, "learning_rate": 1.659263424233905e-05, "loss": 0.0492, "step": 151350 }, { "epoch": 42.56, "learning_rate": 1.6573891856433325e-05, "loss": 0.043, "step": 151380 }, { "epoch": 42.57, "learning_rate": 1.65551494705276e-05, "loss": 0.0486, "step": 151410 }, { "epoch": 42.58, "learning_rate": 1.6536407084621873e-05, "loss": 0.0469, "step": 151440 }, { "epoch": 42.58, "learning_rate": 1.6517664698716148e-05, "loss": 0.0445, "step": 151470 }, { "epoch": 42.59, "learning_rate": 1.6498922312810422e-05, "loss": 0.0519, "step": 151500 }, { "epoch": 42.6, "learning_rate": 1.6480179926904696e-05, "loss": 0.0429, "step": 151530 }, { "epoch": 42.61, "learning_rate": 1.646206228719583e-05, "loss": 0.0501, "step": 151560 }, { "epoch": 42.62, "learning_rate": 1.64433199012901e-05, "loss": 0.0467, "step": 151590 }, { "epoch": 42.63, "learning_rate": 1.6424577515384375e-05, "loss": 0.0463, "step": 151620 }, { "epoch": 42.63, "learning_rate": 1.640583512947865e-05, "loss": 0.0507, "step": 151650 }, { "epoch": 42.64, "learning_rate": 1.6387092743572924e-05, "loss": 0.0424, "step": 151680 }, { "epoch": 42.65, "learning_rate": 1.6368350357667198e-05, "loss": 0.0499, "step": 151710 }, { "epoch": 42.66, "learning_rate": 1.6349607971761472e-05, "loss": 0.0477, "step": 151740 }, { "epoch": 42.67, "learning_rate": 1.633086558585575e-05, "loss": 0.0471, "step": 151770 }, { "epoch": 42.68, "learning_rate": 1.631212319995002e-05, "loss": 0.0508, "step": 151800 }, { "epoch": 42.68, "learning_rate": 1.6293380814044295e-05, "loss": 0.044, "step": 151830 }, { "epoch": 42.69, "learning_rate": 1.627463842813857e-05, "loss": 0.0477, "step": 151860 }, { "epoch": 42.7, "learning_rate": 1.6255896042232843e-05, "loss": 0.0462, "step": 151890 }, { "epoch": 42.71, "learning_rate": 1.6237153656327117e-05, "loss": 0.0474, "step": 151920 }, { "epoch": 42.72, "learning_rate": 1.621841127042139e-05, "loss": 0.0489, "step": 151950 }, { "epoch": 42.73, "learning_rate": 1.619966888451567e-05, "loss": 0.04, "step": 151980 }, { "epoch": 42.74, "learning_rate": 1.618092649860994e-05, "loss": 0.0465, "step": 152010 }, { "epoch": 42.74, "learning_rate": 1.6162184112704214e-05, "loss": 0.0474, "step": 152040 }, { "epoch": 42.75, "learning_rate": 1.6143441726798488e-05, "loss": 0.0441, "step": 152070 }, { "epoch": 42.76, "learning_rate": 1.6124699340892762e-05, "loss": 0.0519, "step": 152100 }, { "epoch": 42.77, "learning_rate": 1.6105956954987036e-05, "loss": 0.039, "step": 152130 }, { "epoch": 42.78, "learning_rate": 1.608721456908131e-05, "loss": 0.0451, "step": 152160 }, { "epoch": 42.79, "learning_rate": 1.6068472183175588e-05, "loss": 0.0458, "step": 152190 }, { "epoch": 42.79, "learning_rate": 1.604972979726986e-05, "loss": 0.044, "step": 152220 }, { "epoch": 42.8, "learning_rate": 1.6030987411364133e-05, "loss": 0.0516, "step": 152250 }, { "epoch": 42.81, "learning_rate": 1.6012245025458407e-05, "loss": 0.041, "step": 152280 }, { "epoch": 42.82, "learning_rate": 1.599350263955268e-05, "loss": 0.0461, "step": 152310 }, { "epoch": 42.83, "learning_rate": 1.5974760253646956e-05, "loss": 0.0438, "step": 152340 }, { "epoch": 42.84, "learning_rate": 1.595601786774123e-05, "loss": 0.0424, "step": 152370 }, { "epoch": 42.84, "learning_rate": 1.5937275481835508e-05, "loss": 0.0495, "step": 152400 }, { "epoch": 42.85, "learning_rate": 1.5918533095929782e-05, "loss": 0.0437, "step": 152430 }, { "epoch": 42.86, "learning_rate": 1.5899790710024053e-05, "loss": 0.046, "step": 152460 }, { "epoch": 42.87, "learning_rate": 1.5881048324118327e-05, "loss": 0.0459, "step": 152490 }, { "epoch": 42.88, "learning_rate": 1.58623059382126e-05, "loss": 0.044, "step": 152520 }, { "epoch": 42.89, "learning_rate": 1.5843563552306875e-05, "loss": 0.0482, "step": 152550 }, { "epoch": 42.9, "learning_rate": 1.582482116640115e-05, "loss": 0.0415, "step": 152580 }, { "epoch": 42.9, "learning_rate": 1.5806078780495427e-05, "loss": 0.0499, "step": 152610 }, { "epoch": 42.91, "learning_rate": 1.57873363945897e-05, "loss": 0.0453, "step": 152640 }, { "epoch": 42.92, "learning_rate": 1.5768594008683972e-05, "loss": 0.0447, "step": 152670 }, { "epoch": 42.93, "learning_rate": 1.5749851622778246e-05, "loss": 0.0506, "step": 152700 }, { "epoch": 42.94, "learning_rate": 1.573110923687252e-05, "loss": 0.0413, "step": 152730 }, { "epoch": 42.95, "learning_rate": 1.5712366850966794e-05, "loss": 0.0484, "step": 152760 }, { "epoch": 42.95, "learning_rate": 1.569362446506107e-05, "loss": 0.0472, "step": 152790 }, { "epoch": 42.96, "learning_rate": 1.5674882079155346e-05, "loss": 0.0463, "step": 152820 }, { "epoch": 42.97, "learning_rate": 1.565613969324962e-05, "loss": 0.0486, "step": 152850 }, { "epoch": 42.98, "learning_rate": 1.563739730734389e-05, "loss": 0.0416, "step": 152880 }, { "epoch": 42.99, "learning_rate": 1.5618654921438165e-05, "loss": 0.0505, "step": 152910 }, { "epoch": 43.0, "learning_rate": 1.559991253553244e-05, "loss": 0.046, "step": 152940 }, { "epoch": 43.0, "eval_loss": 0.11060696840286255, "eval_runtime": 639.3277, "eval_samples_per_second": 25.078, "eval_steps_per_second": 0.785, "eval_wer": 0.09347918059858339, "step": 152951 }, { "epoch": 43.01, "learning_rate": 1.5581170149626714e-05, "loss": 0.0466, "step": 152970 }, { "epoch": 43.01, "learning_rate": 1.5562427763720988e-05, "loss": 0.0497, "step": 153000 }, { "epoch": 43.02, "learning_rate": 1.5543685377815266e-05, "loss": 0.0419, "step": 153030 }, { "epoch": 43.03, "learning_rate": 1.552494299190954e-05, "loss": 0.0468, "step": 153060 }, { "epoch": 43.04, "learning_rate": 1.5506200606003814e-05, "loss": 0.0441, "step": 153090 }, { "epoch": 43.05, "learning_rate": 1.5487458220098085e-05, "loss": 0.0452, "step": 153120 }, { "epoch": 43.06, "learning_rate": 1.546871583419236e-05, "loss": 0.0439, "step": 153150 }, { "epoch": 43.06, "learning_rate": 1.5449973448286633e-05, "loss": 0.0423, "step": 153180 }, { "epoch": 43.07, "learning_rate": 1.5431231062380907e-05, "loss": 0.0489, "step": 153210 }, { "epoch": 43.08, "learning_rate": 1.541248867647518e-05, "loss": 0.0438, "step": 153240 }, { "epoch": 43.09, "learning_rate": 1.539374629056946e-05, "loss": 0.0439, "step": 153270 }, { "epoch": 43.1, "learning_rate": 1.5375003904663733e-05, "loss": 0.0492, "step": 153300 }, { "epoch": 43.11, "learning_rate": 1.5356261518758004e-05, "loss": 0.0436, "step": 153330 }, { "epoch": 43.11, "learning_rate": 1.5337519132852278e-05, "loss": 0.05, "step": 153360 }, { "epoch": 43.12, "learning_rate": 1.5318776746946552e-05, "loss": 0.042, "step": 153390 }, { "epoch": 43.13, "learning_rate": 1.5300034361040827e-05, "loss": 0.0491, "step": 153420 }, { "epoch": 43.14, "learning_rate": 1.52812919751351e-05, "loss": 0.0476, "step": 153450 }, { "epoch": 43.15, "learning_rate": 1.526254958922938e-05, "loss": 0.0406, "step": 153480 }, { "epoch": 43.16, "learning_rate": 1.5243807203323651e-05, "loss": 0.0474, "step": 153510 }, { "epoch": 43.17, "learning_rate": 1.5225064817417925e-05, "loss": 0.0413, "step": 153540 }, { "epoch": 43.17, "learning_rate": 1.52063224315122e-05, "loss": 0.0467, "step": 153570 }, { "epoch": 43.18, "learning_rate": 1.5187580045606473e-05, "loss": 0.0462, "step": 153600 }, { "epoch": 43.19, "learning_rate": 1.5168837659700746e-05, "loss": 0.0437, "step": 153630 }, { "epoch": 43.2, "learning_rate": 1.515009527379502e-05, "loss": 0.0502, "step": 153660 }, { "epoch": 43.21, "learning_rate": 1.5131352887889296e-05, "loss": 0.0437, "step": 153690 }, { "epoch": 43.22, "learning_rate": 1.511261050198357e-05, "loss": 0.0472, "step": 153720 }, { "epoch": 43.22, "learning_rate": 1.5093868116077844e-05, "loss": 0.0489, "step": 153750 }, { "epoch": 43.23, "learning_rate": 1.5075125730172119e-05, "loss": 0.0416, "step": 153780 }, { "epoch": 43.24, "learning_rate": 1.5056383344266393e-05, "loss": 0.049, "step": 153810 }, { "epoch": 43.25, "learning_rate": 1.5037640958360665e-05, "loss": 0.0433, "step": 153840 }, { "epoch": 43.26, "learning_rate": 1.501889857245494e-05, "loss": 0.0456, "step": 153870 }, { "epoch": 43.27, "learning_rate": 1.5000156186549217e-05, "loss": 0.0471, "step": 153900 }, { "epoch": 43.28, "learning_rate": 1.498141380064349e-05, "loss": 0.0421, "step": 153930 }, { "epoch": 43.28, "learning_rate": 1.4962671414737764e-05, "loss": 0.0486, "step": 153960 }, { "epoch": 43.29, "learning_rate": 1.4943929028832038e-05, "loss": 0.0429, "step": 153990 }, { "epoch": 43.3, "learning_rate": 1.4925186642926312e-05, "loss": 0.0475, "step": 154020 }, { "epoch": 43.31, "learning_rate": 1.4906444257020585e-05, "loss": 0.0498, "step": 154050 }, { "epoch": 43.32, "learning_rate": 1.4887701871114859e-05, "loss": 0.0424, "step": 154080 }, { "epoch": 43.33, "learning_rate": 1.4868959485209136e-05, "loss": 0.0492, "step": 154110 }, { "epoch": 43.33, "learning_rate": 1.4850217099303409e-05, "loss": 0.0445, "step": 154140 }, { "epoch": 43.34, "learning_rate": 1.4831474713397683e-05, "loss": 0.0498, "step": 154170 }, { "epoch": 43.35, "learning_rate": 1.4812732327491957e-05, "loss": 0.048, "step": 154200 }, { "epoch": 43.36, "learning_rate": 1.4793989941586231e-05, "loss": 0.0453, "step": 154230 }, { "epoch": 43.37, "learning_rate": 1.4775247555680504e-05, "loss": 0.0503, "step": 154260 }, { "epoch": 43.38, "learning_rate": 1.4756505169774778e-05, "loss": 0.0425, "step": 154290 }, { "epoch": 43.38, "learning_rate": 1.4737762783869056e-05, "loss": 0.0438, "step": 154320 }, { "epoch": 43.39, "learning_rate": 1.4719020397963328e-05, "loss": 0.0476, "step": 154350 }, { "epoch": 43.4, "learning_rate": 1.4700278012057602e-05, "loss": 0.0442, "step": 154380 }, { "epoch": 43.41, "learning_rate": 1.4681535626151877e-05, "loss": 0.0491, "step": 154410 }, { "epoch": 43.42, "learning_rate": 1.466279324024615e-05, "loss": 0.0404, "step": 154440 }, { "epoch": 43.43, "learning_rate": 1.4644050854340425e-05, "loss": 0.0502, "step": 154470 }, { "epoch": 43.44, "learning_rate": 1.4625308468434698e-05, "loss": 0.0447, "step": 154500 }, { "epoch": 43.44, "learning_rate": 1.4606566082528975e-05, "loss": 0.039, "step": 154530 }, { "epoch": 43.45, "learning_rate": 1.458782369662325e-05, "loss": 0.0487, "step": 154560 }, { "epoch": 43.46, "learning_rate": 1.4569081310717522e-05, "loss": 0.0406, "step": 154590 }, { "epoch": 43.47, "learning_rate": 1.4550338924811796e-05, "loss": 0.0464, "step": 154620 }, { "epoch": 43.48, "learning_rate": 1.453159653890607e-05, "loss": 0.0462, "step": 154650 }, { "epoch": 43.49, "learning_rate": 1.4512854153000344e-05, "loss": 0.0448, "step": 154680 }, { "epoch": 43.49, "learning_rate": 1.4494111767094617e-05, "loss": 0.0487, "step": 154710 }, { "epoch": 43.5, "learning_rate": 1.4475369381188894e-05, "loss": 0.041, "step": 154740 }, { "epoch": 43.51, "learning_rate": 1.4456626995283169e-05, "loss": 0.0486, "step": 154770 }, { "epoch": 43.52, "learning_rate": 1.4437884609377441e-05, "loss": 0.0459, "step": 154800 }, { "epoch": 43.53, "learning_rate": 1.4419142223471715e-05, "loss": 0.0438, "step": 154830 }, { "epoch": 43.54, "learning_rate": 1.440039983756599e-05, "loss": 0.0474, "step": 154860 }, { "epoch": 43.55, "learning_rate": 1.4381657451660264e-05, "loss": 0.0424, "step": 154890 }, { "epoch": 43.55, "learning_rate": 1.4362915065754536e-05, "loss": 0.044, "step": 154920 }, { "epoch": 43.56, "learning_rate": 1.434417267984881e-05, "loss": 0.047, "step": 154950 }, { "epoch": 43.57, "learning_rate": 1.4325430293943088e-05, "loss": 0.04, "step": 154980 }, { "epoch": 43.58, "learning_rate": 1.430668790803736e-05, "loss": 0.0476, "step": 155010 }, { "epoch": 43.59, "learning_rate": 1.4287945522131635e-05, "loss": 0.0435, "step": 155040 }, { "epoch": 43.6, "learning_rate": 1.4269203136225909e-05, "loss": 0.0465, "step": 155070 }, { "epoch": 43.6, "learning_rate": 1.4250460750320183e-05, "loss": 0.0462, "step": 155100 }, { "epoch": 43.61, "learning_rate": 1.4231718364414457e-05, "loss": 0.042, "step": 155130 }, { "epoch": 43.62, "learning_rate": 1.421297597850873e-05, "loss": 0.048, "step": 155160 }, { "epoch": 43.63, "learning_rate": 1.4194233592603007e-05, "loss": 0.0421, "step": 155190 }, { "epoch": 43.64, "learning_rate": 1.417549120669728e-05, "loss": 0.0489, "step": 155220 }, { "epoch": 43.65, "learning_rate": 1.4156748820791554e-05, "loss": 0.0486, "step": 155250 }, { "epoch": 43.65, "learning_rate": 1.4138006434885828e-05, "loss": 0.0413, "step": 155280 }, { "epoch": 43.66, "learning_rate": 1.4119264048980102e-05, "loss": 0.0502, "step": 155310 }, { "epoch": 43.67, "learning_rate": 1.4100521663074377e-05, "loss": 0.0429, "step": 155340 }, { "epoch": 43.68, "learning_rate": 1.4081779277168649e-05, "loss": 0.0465, "step": 155370 }, { "epoch": 43.69, "learning_rate": 1.4063036891262927e-05, "loss": 0.0493, "step": 155400 }, { "epoch": 43.7, "learning_rate": 1.40442945053572e-05, "loss": 0.0422, "step": 155430 }, { "epoch": 43.71, "learning_rate": 1.4025552119451473e-05, "loss": 0.0508, "step": 155460 }, { "epoch": 43.71, "learning_rate": 1.4006809733545747e-05, "loss": 0.0429, "step": 155490 }, { "epoch": 43.72, "learning_rate": 1.3988067347640022e-05, "loss": 0.0441, "step": 155520 }, { "epoch": 43.73, "learning_rate": 1.3969324961734296e-05, "loss": 0.0482, "step": 155550 }, { "epoch": 43.74, "learning_rate": 1.3950582575828568e-05, "loss": 0.0426, "step": 155580 }, { "epoch": 43.75, "learning_rate": 1.3931840189922846e-05, "loss": 0.0465, "step": 155610 }, { "epoch": 43.76, "learning_rate": 1.391309780401712e-05, "loss": 0.0429, "step": 155640 }, { "epoch": 43.76, "learning_rate": 1.3894355418111393e-05, "loss": 0.0439, "step": 155670 }, { "epoch": 43.77, "learning_rate": 1.3875613032205667e-05, "loss": 0.0464, "step": 155700 }, { "epoch": 43.78, "learning_rate": 1.3856870646299941e-05, "loss": 0.0428, "step": 155730 }, { "epoch": 43.79, "learning_rate": 1.3838128260394215e-05, "loss": 0.0453, "step": 155760 }, { "epoch": 43.8, "learning_rate": 1.3819385874488488e-05, "loss": 0.0443, "step": 155790 }, { "epoch": 43.81, "learning_rate": 1.3800643488582765e-05, "loss": 0.0434, "step": 155820 }, { "epoch": 43.81, "learning_rate": 1.378190110267704e-05, "loss": 0.0427, "step": 155850 }, { "epoch": 43.82, "learning_rate": 1.3763158716771312e-05, "loss": 0.0423, "step": 155880 }, { "epoch": 43.83, "learning_rate": 1.3744416330865586e-05, "loss": 0.0473, "step": 155910 }, { "epoch": 43.84, "learning_rate": 1.372567394495986e-05, "loss": 0.0414, "step": 155940 }, { "epoch": 43.85, "learning_rate": 1.3706931559054135e-05, "loss": 0.0451, "step": 155970 }, { "epoch": 43.86, "learning_rate": 1.3688189173148409e-05, "loss": 0.0461, "step": 156000 }, { "epoch": 43.87, "learning_rate": 1.3669446787242685e-05, "loss": 0.0423, "step": 156030 }, { "epoch": 43.87, "learning_rate": 1.3650704401336959e-05, "loss": 0.0471, "step": 156060 }, { "epoch": 43.88, "learning_rate": 1.3632586761628088e-05, "loss": 0.0435, "step": 156090 }, { "epoch": 43.89, "learning_rate": 1.3613844375722362e-05, "loss": 0.0454, "step": 156120 }, { "epoch": 43.9, "learning_rate": 1.3595101989816638e-05, "loss": 0.0468, "step": 156150 }, { "epoch": 43.91, "learning_rate": 1.3576359603910912e-05, "loss": 0.0399, "step": 156180 }, { "epoch": 43.92, "learning_rate": 1.3557617218005186e-05, "loss": 0.0487, "step": 156210 }, { "epoch": 43.92, "learning_rate": 1.353887483209946e-05, "loss": 0.0442, "step": 156240 }, { "epoch": 43.93, "learning_rate": 1.3520132446193735e-05, "loss": 0.046, "step": 156270 }, { "epoch": 43.94, "learning_rate": 1.3501390060288007e-05, "loss": 0.0476, "step": 156300 }, { "epoch": 43.95, "learning_rate": 1.3482647674382281e-05, "loss": 0.0397, "step": 156330 }, { "epoch": 43.96, "learning_rate": 1.3463905288476559e-05, "loss": 0.0529, "step": 156360 }, { "epoch": 43.97, "learning_rate": 1.3445162902570832e-05, "loss": 0.0414, "step": 156390 }, { "epoch": 43.98, "learning_rate": 1.3426420516665106e-05, "loss": 0.0452, "step": 156420 }, { "epoch": 43.98, "learning_rate": 1.340767813075938e-05, "loss": 0.0467, "step": 156450 }, { "epoch": 43.99, "learning_rate": 1.3388935744853654e-05, "loss": 0.0447, "step": 156480 }, { "epoch": 44.0, "eval_loss": 0.10826382040977478, "eval_runtime": 640.1758, "eval_samples_per_second": 25.045, "eval_steps_per_second": 0.784, "eval_wer": 0.09191653132804717, "step": 156508 }, { "epoch": 44.0, "learning_rate": 1.3370193358947927e-05, "loss": 0.0516, "step": 156510 }, { "epoch": 44.01, "learning_rate": 1.33514509730422e-05, "loss": 0.0367, "step": 156540 }, { "epoch": 44.02, "learning_rate": 1.3332708587136478e-05, "loss": 0.0511, "step": 156570 }, { "epoch": 44.03, "learning_rate": 1.3313966201230751e-05, "loss": 0.0436, "step": 156600 }, { "epoch": 44.03, "learning_rate": 1.3295223815325025e-05, "loss": 0.0452, "step": 156630 }, { "epoch": 44.04, "learning_rate": 1.32764814294193e-05, "loss": 0.0485, "step": 156660 }, { "epoch": 44.05, "learning_rate": 1.3257739043513573e-05, "loss": 0.0371, "step": 156690 }, { "epoch": 44.06, "learning_rate": 1.3238996657607846e-05, "loss": 0.0472, "step": 156720 }, { "epoch": 44.07, "learning_rate": 1.322025427170212e-05, "loss": 0.0421, "step": 156750 }, { "epoch": 44.08, "learning_rate": 1.3201511885796398e-05, "loss": 0.0452, "step": 156780 }, { "epoch": 44.08, "learning_rate": 1.318276949989067e-05, "loss": 0.049, "step": 156810 }, { "epoch": 44.09, "learning_rate": 1.3164027113984944e-05, "loss": 0.0384, "step": 156840 }, { "epoch": 44.1, "learning_rate": 1.3145284728079219e-05, "loss": 0.0447, "step": 156870 }, { "epoch": 44.11, "learning_rate": 1.3126542342173493e-05, "loss": 0.044, "step": 156900 }, { "epoch": 44.12, "learning_rate": 1.3107799956267767e-05, "loss": 0.0461, "step": 156930 }, { "epoch": 44.13, "learning_rate": 1.308905757036204e-05, "loss": 0.0471, "step": 156960 }, { "epoch": 44.14, "learning_rate": 1.3070315184456317e-05, "loss": 0.0404, "step": 156990 }, { "epoch": 44.14, "learning_rate": 1.305157279855059e-05, "loss": 0.0466, "step": 157020 }, { "epoch": 44.15, "learning_rate": 1.3032830412644864e-05, "loss": 0.0443, "step": 157050 }, { "epoch": 44.16, "learning_rate": 1.3014088026739138e-05, "loss": 0.0435, "step": 157080 }, { "epoch": 44.17, "learning_rate": 1.2995345640833412e-05, "loss": 0.0477, "step": 157110 }, { "epoch": 44.18, "learning_rate": 1.2976603254927686e-05, "loss": 0.0364, "step": 157140 }, { "epoch": 44.19, "learning_rate": 1.2957860869021959e-05, "loss": 0.049, "step": 157170 }, { "epoch": 44.19, "learning_rate": 1.2939118483116236e-05, "loss": 0.0432, "step": 157200 }, { "epoch": 44.2, "learning_rate": 1.292037609721051e-05, "loss": 0.0476, "step": 157230 }, { "epoch": 44.21, "learning_rate": 1.2901633711304783e-05, "loss": 0.051, "step": 157260 }, { "epoch": 44.22, "learning_rate": 1.2882891325399057e-05, "loss": 0.042, "step": 157290 }, { "epoch": 44.23, "learning_rate": 1.2864148939493331e-05, "loss": 0.0464, "step": 157320 }, { "epoch": 44.24, "learning_rate": 1.2845406553587606e-05, "loss": 0.0425, "step": 157350 }, { "epoch": 44.25, "learning_rate": 1.2826664167681878e-05, "loss": 0.0463, "step": 157380 }, { "epoch": 44.25, "learning_rate": 1.2807921781776156e-05, "loss": 0.0507, "step": 157410 }, { "epoch": 44.26, "learning_rate": 1.278917939587043e-05, "loss": 0.0378, "step": 157440 }, { "epoch": 44.27, "learning_rate": 1.2770437009964702e-05, "loss": 0.0477, "step": 157470 }, { "epoch": 44.28, "learning_rate": 1.2751694624058977e-05, "loss": 0.0433, "step": 157500 }, { "epoch": 44.29, "learning_rate": 1.273295223815325e-05, "loss": 0.0446, "step": 157530 }, { "epoch": 44.3, "learning_rate": 1.2714209852247525e-05, "loss": 0.0527, "step": 157560 }, { "epoch": 44.3, "learning_rate": 1.2695467466341797e-05, "loss": 0.0397, "step": 157590 }, { "epoch": 44.31, "learning_rate": 1.2676725080436072e-05, "loss": 0.0475, "step": 157620 }, { "epoch": 44.32, "learning_rate": 1.265798269453035e-05, "loss": 0.0446, "step": 157650 }, { "epoch": 44.33, "learning_rate": 1.2639240308624622e-05, "loss": 0.0479, "step": 157680 }, { "epoch": 44.34, "learning_rate": 1.2620497922718896e-05, "loss": 0.0489, "step": 157710 }, { "epoch": 44.35, "learning_rate": 1.260175553681317e-05, "loss": 0.0411, "step": 157740 }, { "epoch": 44.35, "learning_rate": 1.2583013150907444e-05, "loss": 0.0474, "step": 157770 }, { "epoch": 44.36, "learning_rate": 1.2564270765001718e-05, "loss": 0.0416, "step": 157800 }, { "epoch": 44.37, "learning_rate": 1.2545528379095991e-05, "loss": 0.0452, "step": 157830 }, { "epoch": 44.38, "learning_rate": 1.2526785993190269e-05, "loss": 0.0491, "step": 157860 }, { "epoch": 44.39, "learning_rate": 1.2508043607284543e-05, "loss": 0.0395, "step": 157890 }, { "epoch": 44.4, "learning_rate": 1.2489301221378815e-05, "loss": 0.0451, "step": 157920 }, { "epoch": 44.41, "learning_rate": 1.247055883547309e-05, "loss": 0.0436, "step": 157950 }, { "epoch": 44.41, "learning_rate": 1.2451816449567364e-05, "loss": 0.0451, "step": 157980 }, { "epoch": 44.42, "learning_rate": 1.2433074063661638e-05, "loss": 0.0506, "step": 158010 }, { "epoch": 44.43, "learning_rate": 1.2414331677755912e-05, "loss": 0.0404, "step": 158040 }, { "epoch": 44.44, "learning_rate": 1.2395589291850186e-05, "loss": 0.0471, "step": 158070 }, { "epoch": 44.45, "learning_rate": 1.237684690594446e-05, "loss": 0.0426, "step": 158100 }, { "epoch": 44.46, "learning_rate": 1.2358104520038735e-05, "loss": 0.0452, "step": 158130 }, { "epoch": 44.46, "learning_rate": 1.2339362134133009e-05, "loss": 0.0475, "step": 158160 }, { "epoch": 44.47, "learning_rate": 1.2320619748227283e-05, "loss": 0.0385, "step": 158190 }, { "epoch": 44.48, "learning_rate": 1.2301877362321559e-05, "loss": 0.05, "step": 158220 }, { "epoch": 44.49, "learning_rate": 1.2283134976415831e-05, "loss": 0.0444, "step": 158250 }, { "epoch": 44.5, "learning_rate": 1.2264392590510106e-05, "loss": 0.0439, "step": 158280 }, { "epoch": 44.51, "learning_rate": 1.224565020460438e-05, "loss": 0.0497, "step": 158310 }, { "epoch": 44.51, "learning_rate": 1.2226907818698654e-05, "loss": 0.0392, "step": 158340 }, { "epoch": 44.52, "learning_rate": 1.2208165432792928e-05, "loss": 0.0483, "step": 158370 }, { "epoch": 44.53, "learning_rate": 1.2189423046887202e-05, "loss": 0.0432, "step": 158400 }, { "epoch": 44.54, "learning_rate": 1.2170680660981478e-05, "loss": 0.0439, "step": 158430 }, { "epoch": 44.55, "learning_rate": 1.215193827507575e-05, "loss": 0.0471, "step": 158460 }, { "epoch": 44.56, "learning_rate": 1.2133195889170025e-05, "loss": 0.0387, "step": 158490 }, { "epoch": 44.57, "learning_rate": 1.2114453503264299e-05, "loss": 0.0441, "step": 158520 }, { "epoch": 44.57, "learning_rate": 1.2095711117358573e-05, "loss": 0.0428, "step": 158550 }, { "epoch": 44.58, "learning_rate": 1.2076968731452847e-05, "loss": 0.0413, "step": 158580 }, { "epoch": 44.59, "learning_rate": 1.2058226345547122e-05, "loss": 0.0464, "step": 158610 }, { "epoch": 44.6, "learning_rate": 1.2039483959641398e-05, "loss": 0.04, "step": 158640 }, { "epoch": 44.61, "learning_rate": 1.202074157373567e-05, "loss": 0.0488, "step": 158670 }, { "epoch": 44.62, "learning_rate": 1.2001999187829944e-05, "loss": 0.0424, "step": 158700 }, { "epoch": 44.62, "learning_rate": 1.1983256801924218e-05, "loss": 0.0408, "step": 158730 }, { "epoch": 44.63, "learning_rate": 1.1964514416018494e-05, "loss": 0.0476, "step": 158760 }, { "epoch": 44.64, "learning_rate": 1.1945772030112767e-05, "loss": 0.0405, "step": 158790 }, { "epoch": 44.65, "learning_rate": 1.1927029644207041e-05, "loss": 0.0491, "step": 158820 }, { "epoch": 44.66, "learning_rate": 1.1908287258301315e-05, "loss": 0.0407, "step": 158850 }, { "epoch": 44.67, "learning_rate": 1.188954487239559e-05, "loss": 0.045, "step": 158880 }, { "epoch": 44.68, "learning_rate": 1.1870802486489864e-05, "loss": 0.0477, "step": 158910 }, { "epoch": 44.68, "learning_rate": 1.1852060100584138e-05, "loss": 0.04, "step": 158940 }, { "epoch": 44.69, "learning_rate": 1.1833317714678414e-05, "loss": 0.0465, "step": 158970 }, { "epoch": 44.7, "learning_rate": 1.1814575328772686e-05, "loss": 0.0441, "step": 159000 }, { "epoch": 44.71, "learning_rate": 1.179583294286696e-05, "loss": 0.0468, "step": 159030 }, { "epoch": 44.72, "learning_rate": 1.1777090556961234e-05, "loss": 0.0484, "step": 159060 }, { "epoch": 44.73, "learning_rate": 1.175834817105551e-05, "loss": 0.0381, "step": 159090 }, { "epoch": 44.73, "learning_rate": 1.1739605785149783e-05, "loss": 0.0469, "step": 159120 }, { "epoch": 44.74, "learning_rate": 1.1720863399244057e-05, "loss": 0.043, "step": 159150 }, { "epoch": 44.75, "learning_rate": 1.1702121013338333e-05, "loss": 0.0463, "step": 159180 }, { "epoch": 44.76, "learning_rate": 1.1683378627432605e-05, "loss": 0.0472, "step": 159210 }, { "epoch": 44.77, "learning_rate": 1.166463624152688e-05, "loss": 0.0415, "step": 159240 }, { "epoch": 44.78, "learning_rate": 1.1645893855621154e-05, "loss": 0.051, "step": 159270 }, { "epoch": 44.78, "learning_rate": 1.162715146971543e-05, "loss": 0.0413, "step": 159300 }, { "epoch": 44.79, "learning_rate": 1.1608409083809702e-05, "loss": 0.0423, "step": 159330 }, { "epoch": 44.8, "learning_rate": 1.1589666697903976e-05, "loss": 0.0487, "step": 159360 }, { "epoch": 44.81, "learning_rate": 1.1570924311998252e-05, "loss": 0.0401, "step": 159390 }, { "epoch": 44.82, "learning_rate": 1.1552181926092526e-05, "loss": 0.0482, "step": 159420 }, { "epoch": 44.83, "learning_rate": 1.1533439540186799e-05, "loss": 0.0414, "step": 159450 }, { "epoch": 44.84, "learning_rate": 1.1514697154281073e-05, "loss": 0.0461, "step": 159480 }, { "epoch": 44.84, "learning_rate": 1.1496579514572206e-05, "loss": 0.0478, "step": 159510 }, { "epoch": 44.85, "learning_rate": 1.147783712866648e-05, "loss": 0.0363, "step": 159540 }, { "epoch": 44.86, "learning_rate": 1.1459094742760754e-05, "loss": 0.0434, "step": 159570 }, { "epoch": 44.87, "learning_rate": 1.1440352356855028e-05, "loss": 0.0419, "step": 159600 }, { "epoch": 44.88, "learning_rate": 1.1421609970949302e-05, "loss": 0.0468, "step": 159630 }, { "epoch": 44.89, "learning_rate": 1.1402867585043577e-05, "loss": 0.0493, "step": 159660 }, { "epoch": 44.89, "learning_rate": 1.138412519913785e-05, "loss": 0.0406, "step": 159690 }, { "epoch": 44.9, "learning_rate": 1.1365382813232125e-05, "loss": 0.0461, "step": 159720 }, { "epoch": 44.91, "learning_rate": 1.13466404273264e-05, "loss": 0.0432, "step": 159750 }, { "epoch": 44.92, "learning_rate": 1.1327898041420673e-05, "loss": 0.0423, "step": 159780 }, { "epoch": 44.93, "learning_rate": 1.1309155655514948e-05, "loss": 0.0472, "step": 159810 }, { "epoch": 44.94, "learning_rate": 1.1290413269609222e-05, "loss": 0.0405, "step": 159840 }, { "epoch": 44.95, "learning_rate": 1.1271670883703496e-05, "loss": 0.0463, "step": 159870 }, { "epoch": 44.95, "learning_rate": 1.125292849779777e-05, "loss": 0.0435, "step": 159900 }, { "epoch": 44.96, "learning_rate": 1.1234186111892044e-05, "loss": 0.045, "step": 159930 }, { "epoch": 44.97, "learning_rate": 1.1215443725986319e-05, "loss": 0.0495, "step": 159960 }, { "epoch": 44.98, "learning_rate": 1.1196701340080593e-05, "loss": 0.0389, "step": 159990 }, { "epoch": 44.99, "learning_rate": 1.1177958954174867e-05, "loss": 0.0469, "step": 160020 }, { "epoch": 45.0, "learning_rate": 1.1159216568269141e-05, "loss": 0.0434, "step": 160050 }, { "epoch": 45.0, "eval_loss": 0.10925392806529999, "eval_runtime": 640.2824, "eval_samples_per_second": 25.041, "eval_steps_per_second": 0.784, "eval_wer": 0.09092025712063107, "step": 160065 }, { "epoch": 45.0, "learning_rate": 1.1140474182363415e-05, "loss": 0.0449, "step": 160080 }, { "epoch": 45.01, "learning_rate": 1.112173179645769e-05, "loss": 0.0429, "step": 160110 }, { "epoch": 45.02, "learning_rate": 1.1102989410551964e-05, "loss": 0.0432, "step": 160140 }, { "epoch": 45.03, "learning_rate": 1.1084247024646238e-05, "loss": 0.046, "step": 160170 }, { "epoch": 45.04, "learning_rate": 1.1065504638740512e-05, "loss": 0.0404, "step": 160200 }, { "epoch": 45.05, "learning_rate": 1.1046762252834786e-05, "loss": 0.0478, "step": 160230 }, { "epoch": 45.05, "learning_rate": 1.102801986692906e-05, "loss": 0.0436, "step": 160260 }, { "epoch": 45.06, "learning_rate": 1.1009277481023335e-05, "loss": 0.042, "step": 160290 }, { "epoch": 45.07, "learning_rate": 1.0990535095117609e-05, "loss": 0.0467, "step": 160320 }, { "epoch": 45.08, "learning_rate": 1.0971792709211883e-05, "loss": 0.0386, "step": 160350 }, { "epoch": 45.09, "learning_rate": 1.0953050323306157e-05, "loss": 0.0458, "step": 160380 }, { "epoch": 45.1, "learning_rate": 1.0934307937400431e-05, "loss": 0.0434, "step": 160410 }, { "epoch": 45.11, "learning_rate": 1.0915565551494706e-05, "loss": 0.0466, "step": 160440 }, { "epoch": 45.11, "learning_rate": 1.089682316558898e-05, "loss": 0.0487, "step": 160470 }, { "epoch": 45.12, "learning_rate": 1.0878080779683254e-05, "loss": 0.0414, "step": 160500 }, { "epoch": 45.13, "learning_rate": 1.0859338393777528e-05, "loss": 0.0465, "step": 160530 }, { "epoch": 45.14, "learning_rate": 1.0840596007871802e-05, "loss": 0.0424, "step": 160560 }, { "epoch": 45.15, "learning_rate": 1.0821853621966077e-05, "loss": 0.0402, "step": 160590 }, { "epoch": 45.16, "learning_rate": 1.080311123606035e-05, "loss": 0.0508, "step": 160620 }, { "epoch": 45.16, "learning_rate": 1.0784368850154625e-05, "loss": 0.0407, "step": 160650 }, { "epoch": 45.17, "learning_rate": 1.0765626464248899e-05, "loss": 0.0431, "step": 160680 }, { "epoch": 45.18, "learning_rate": 1.0746884078343173e-05, "loss": 0.0464, "step": 160710 }, { "epoch": 45.19, "learning_rate": 1.0728141692437447e-05, "loss": 0.0424, "step": 160740 }, { "epoch": 45.2, "learning_rate": 1.0709399306531722e-05, "loss": 0.0474, "step": 160770 }, { "epoch": 45.21, "learning_rate": 1.0690656920625996e-05, "loss": 0.0391, "step": 160800 }, { "epoch": 45.22, "learning_rate": 1.067191453472027e-05, "loss": 0.045, "step": 160830 }, { "epoch": 45.22, "learning_rate": 1.0653172148814544e-05, "loss": 0.0431, "step": 160860 }, { "epoch": 45.23, "learning_rate": 1.063442976290882e-05, "loss": 0.0418, "step": 160890 }, { "epoch": 45.24, "learning_rate": 1.0615687377003093e-05, "loss": 0.0493, "step": 160920 }, { "epoch": 45.25, "learning_rate": 1.0596944991097367e-05, "loss": 0.0404, "step": 160950 }, { "epoch": 45.26, "learning_rate": 1.0578202605191641e-05, "loss": 0.0482, "step": 160980 }, { "epoch": 45.27, "learning_rate": 1.0559460219285915e-05, "loss": 0.0464, "step": 161010 }, { "epoch": 45.27, "learning_rate": 1.054071783338019e-05, "loss": 0.0415, "step": 161040 }, { "epoch": 45.28, "learning_rate": 1.0521975447474464e-05, "loss": 0.0475, "step": 161070 }, { "epoch": 45.29, "learning_rate": 1.050323306156874e-05, "loss": 0.0405, "step": 161100 }, { "epoch": 45.3, "learning_rate": 1.0484490675663012e-05, "loss": 0.0459, "step": 161130 }, { "epoch": 45.31, "learning_rate": 1.0465748289757286e-05, "loss": 0.0424, "step": 161160 }, { "epoch": 45.32, "learning_rate": 1.044700590385156e-05, "loss": 0.041, "step": 161190 }, { "epoch": 45.32, "learning_rate": 1.0428263517945836e-05, "loss": 0.0477, "step": 161220 }, { "epoch": 45.33, "learning_rate": 1.0409521132040109e-05, "loss": 0.0398, "step": 161250 }, { "epoch": 45.34, "learning_rate": 1.0390778746134383e-05, "loss": 0.045, "step": 161280 }, { "epoch": 45.35, "learning_rate": 1.0372036360228659e-05, "loss": 0.0441, "step": 161310 }, { "epoch": 45.36, "learning_rate": 1.0353293974322931e-05, "loss": 0.0416, "step": 161340 }, { "epoch": 45.37, "learning_rate": 1.0334551588417205e-05, "loss": 0.0489, "step": 161370 }, { "epoch": 45.38, "learning_rate": 1.031580920251148e-05, "loss": 0.0406, "step": 161400 }, { "epoch": 45.38, "learning_rate": 1.0297066816605756e-05, "loss": 0.0474, "step": 161430 }, { "epoch": 45.39, "learning_rate": 1.0278324430700028e-05, "loss": 0.0453, "step": 161460 }, { "epoch": 45.4, "learning_rate": 1.0259582044794302e-05, "loss": 0.0429, "step": 161490 }, { "epoch": 45.41, "learning_rate": 1.0240839658888576e-05, "loss": 0.047, "step": 161520 }, { "epoch": 45.42, "learning_rate": 1.0222097272982852e-05, "loss": 0.0382, "step": 161550 }, { "epoch": 45.43, "learning_rate": 1.0203354887077125e-05, "loss": 0.0474, "step": 161580 }, { "epoch": 45.43, "learning_rate": 1.0184612501171399e-05, "loss": 0.044, "step": 161610 }, { "epoch": 45.44, "learning_rate": 1.0165870115265675e-05, "loss": 0.0432, "step": 161640 }, { "epoch": 45.45, "learning_rate": 1.0147127729359947e-05, "loss": 0.0456, "step": 161670 }, { "epoch": 45.46, "learning_rate": 1.0128385343454222e-05, "loss": 0.0401, "step": 161700 }, { "epoch": 45.47, "learning_rate": 1.0109642957548496e-05, "loss": 0.0461, "step": 161730 }, { "epoch": 45.48, "learning_rate": 1.0090900571642772e-05, "loss": 0.0423, "step": 161760 }, { "epoch": 45.48, "learning_rate": 1.0072158185737044e-05, "loss": 0.0451, "step": 161790 }, { "epoch": 45.49, "learning_rate": 1.0053415799831318e-05, "loss": 0.0462, "step": 161820 }, { "epoch": 45.5, "learning_rate": 1.0034673413925594e-05, "loss": 0.039, "step": 161850 }, { "epoch": 45.51, "learning_rate": 1.0015931028019868e-05, "loss": 0.0444, "step": 161880 }, { "epoch": 45.52, "learning_rate": 9.997188642114141e-06, "loss": 0.0398, "step": 161910 }, { "epoch": 45.53, "learning_rate": 9.978446256208415e-06, "loss": 0.0429, "step": 161940 }, { "epoch": 45.54, "learning_rate": 9.959703870302691e-06, "loss": 0.0514, "step": 161970 }, { "epoch": 45.54, "learning_rate": 9.940961484396964e-06, "loss": 0.0396, "step": 162000 }, { "epoch": 45.55, "learning_rate": 9.922219098491238e-06, "loss": 0.0469, "step": 162030 }, { "epoch": 45.56, "learning_rate": 9.903476712585514e-06, "loss": 0.041, "step": 162060 }, { "epoch": 45.57, "learning_rate": 9.884734326679788e-06, "loss": 0.0423, "step": 162090 }, { "epoch": 45.58, "learning_rate": 9.86599194077406e-06, "loss": 0.0495, "step": 162120 }, { "epoch": 45.59, "learning_rate": 9.847249554868334e-06, "loss": 0.0397, "step": 162150 }, { "epoch": 45.59, "learning_rate": 9.82850716896261e-06, "loss": 0.0457, "step": 162180 }, { "epoch": 45.6, "learning_rate": 9.809764783056883e-06, "loss": 0.0436, "step": 162210 }, { "epoch": 45.61, "learning_rate": 9.791022397151157e-06, "loss": 0.0412, "step": 162240 }, { "epoch": 45.62, "learning_rate": 9.772280011245433e-06, "loss": 0.0484, "step": 162270 }, { "epoch": 45.63, "learning_rate": 9.753537625339707e-06, "loss": 0.0388, "step": 162300 }, { "epoch": 45.64, "learning_rate": 9.73479523943398e-06, "loss": 0.0463, "step": 162330 }, { "epoch": 45.65, "learning_rate": 9.716052853528254e-06, "loss": 0.0428, "step": 162360 }, { "epoch": 45.65, "learning_rate": 9.69731046762253e-06, "loss": 0.0428, "step": 162390 }, { "epoch": 45.66, "learning_rate": 9.67919282791366e-06, "loss": 0.0507, "step": 162420 }, { "epoch": 45.67, "learning_rate": 9.660450442007935e-06, "loss": 0.041, "step": 162450 }, { "epoch": 45.68, "learning_rate": 9.641708056102209e-06, "loss": 0.0466, "step": 162480 }, { "epoch": 45.69, "learning_rate": 9.622965670196483e-06, "loss": 0.0427, "step": 162510 }, { "epoch": 45.7, "learning_rate": 9.604223284290757e-06, "loss": 0.0395, "step": 162540 }, { "epoch": 45.7, "learning_rate": 9.585480898385031e-06, "loss": 0.0468, "step": 162570 }, { "epoch": 45.71, "learning_rate": 9.566738512479306e-06, "loss": 0.0414, "step": 162600 }, { "epoch": 45.72, "learning_rate": 9.54799612657358e-06, "loss": 0.0458, "step": 162630 }, { "epoch": 45.73, "learning_rate": 9.529253740667854e-06, "loss": 0.0457, "step": 162660 }, { "epoch": 45.74, "learning_rate": 9.510511354762128e-06, "loss": 0.0424, "step": 162690 }, { "epoch": 45.75, "learning_rate": 9.491768968856402e-06, "loss": 0.0476, "step": 162720 }, { "epoch": 45.75, "learning_rate": 9.473026582950677e-06, "loss": 0.038, "step": 162750 }, { "epoch": 45.76, "learning_rate": 9.45428419704495e-06, "loss": 0.0455, "step": 162780 }, { "epoch": 45.77, "learning_rate": 9.435541811139225e-06, "loss": 0.0425, "step": 162810 }, { "epoch": 45.78, "learning_rate": 9.4167994252335e-06, "loss": 0.0477, "step": 162840 }, { "epoch": 45.79, "learning_rate": 9.398057039327773e-06, "loss": 0.0454, "step": 162870 }, { "epoch": 45.8, "learning_rate": 9.379314653422048e-06, "loss": 0.0376, "step": 162900 }, { "epoch": 45.81, "learning_rate": 9.360572267516322e-06, "loss": 0.0446, "step": 162930 }, { "epoch": 45.81, "learning_rate": 9.341829881610596e-06, "loss": 0.0435, "step": 162960 }, { "epoch": 45.82, "learning_rate": 9.32308749570487e-06, "loss": 0.0414, "step": 162990 }, { "epoch": 45.83, "learning_rate": 9.304345109799146e-06, "loss": 0.0479, "step": 163020 }, { "epoch": 45.84, "learning_rate": 9.285602723893418e-06, "loss": 0.0406, "step": 163050 }, { "epoch": 45.85, "learning_rate": 9.266860337987693e-06, "loss": 0.0436, "step": 163080 }, { "epoch": 45.86, "learning_rate": 9.248117952081967e-06, "loss": 0.0445, "step": 163110 }, { "epoch": 45.86, "learning_rate": 9.229375566176241e-06, "loss": 0.0416, "step": 163140 }, { "epoch": 45.87, "learning_rate": 9.210633180270515e-06, "loss": 0.0463, "step": 163170 }, { "epoch": 45.88, "learning_rate": 9.19189079436479e-06, "loss": 0.0397, "step": 163200 }, { "epoch": 45.89, "learning_rate": 9.173148408459064e-06, "loss": 0.0489, "step": 163230 }, { "epoch": 45.9, "learning_rate": 9.154406022553338e-06, "loss": 0.0442, "step": 163260 }, { "epoch": 45.91, "learning_rate": 9.135663636647612e-06, "loss": 0.0416, "step": 163290 }, { "epoch": 45.91, "learning_rate": 9.116921250741886e-06, "loss": 0.0478, "step": 163320 }, { "epoch": 45.92, "learning_rate": 9.098178864836162e-06, "loss": 0.0393, "step": 163350 }, { "epoch": 45.93, "learning_rate": 9.079436478930435e-06, "loss": 0.0456, "step": 163380 }, { "epoch": 45.94, "learning_rate": 9.060694093024709e-06, "loss": 0.045, "step": 163410 }, { "epoch": 45.95, "learning_rate": 9.041951707118983e-06, "loss": 0.0438, "step": 163440 }, { "epoch": 45.96, "learning_rate": 9.023209321213257e-06, "loss": 0.0497, "step": 163470 }, { "epoch": 45.97, "learning_rate": 9.004466935307531e-06, "loss": 0.0407, "step": 163500 }, { "epoch": 45.97, "learning_rate": 8.985724549401806e-06, "loss": 0.0465, "step": 163530 }, { "epoch": 45.98, "learning_rate": 8.966982163496081e-06, "loss": 0.0413, "step": 163560 }, { "epoch": 45.99, "learning_rate": 8.948239777590354e-06, "loss": 0.0459, "step": 163590 }, { "epoch": 46.0, "learning_rate": 8.929497391684628e-06, "loss": 0.0472, "step": 163620 }, { "epoch": 46.0, "eval_loss": 0.10915178805589676, "eval_runtime": 656.9625, "eval_samples_per_second": 24.405, "eval_steps_per_second": 0.764, "eval_wer": 0.09214171659410697, "step": 163622 }, { "epoch": 46.01, "learning_rate": 8.910755005778902e-06, "loss": 0.041, "step": 163650 }, { "epoch": 46.02, "learning_rate": 8.892012619873178e-06, "loss": 0.0449, "step": 163680 }, { "epoch": 46.02, "learning_rate": 8.87327023396745e-06, "loss": 0.0407, "step": 163710 }, { "epoch": 46.03, "learning_rate": 8.854527848061725e-06, "loss": 0.0458, "step": 163740 }, { "epoch": 46.04, "learning_rate": 8.835785462156e-06, "loss": 0.0444, "step": 163770 }, { "epoch": 46.05, "learning_rate": 8.817043076250273e-06, "loss": 0.0398, "step": 163800 }, { "epoch": 46.06, "learning_rate": 8.798300690344547e-06, "loss": 0.0483, "step": 163830 }, { "epoch": 46.07, "learning_rate": 8.779558304438822e-06, "loss": 0.0402, "step": 163860 }, { "epoch": 46.08, "learning_rate": 8.760815918533098e-06, "loss": 0.0444, "step": 163890 }, { "epoch": 46.08, "learning_rate": 8.74207353262737e-06, "loss": 0.0459, "step": 163920 }, { "epoch": 46.09, "learning_rate": 8.723331146721644e-06, "loss": 0.0388, "step": 163950 }, { "epoch": 46.1, "learning_rate": 8.70458876081592e-06, "loss": 0.048, "step": 163980 }, { "epoch": 46.11, "learning_rate": 8.685846374910193e-06, "loss": 0.0393, "step": 164010 }, { "epoch": 46.12, "learning_rate": 8.667103989004467e-06, "loss": 0.0411, "step": 164040 }, { "epoch": 46.13, "learning_rate": 8.648361603098741e-06, "loss": 0.0463, "step": 164070 }, { "epoch": 46.13, "learning_rate": 8.629619217193017e-06, "loss": 0.0403, "step": 164100 }, { "epoch": 46.14, "learning_rate": 8.61087683128729e-06, "loss": 0.0463, "step": 164130 }, { "epoch": 46.15, "learning_rate": 8.592134445381564e-06, "loss": 0.0421, "step": 164160 }, { "epoch": 46.16, "learning_rate": 8.573392059475838e-06, "loss": 0.0467, "step": 164190 }, { "epoch": 46.17, "learning_rate": 8.554649673570114e-06, "loss": 0.0442, "step": 164220 }, { "epoch": 46.18, "learning_rate": 8.535907287664386e-06, "loss": 0.0402, "step": 164250 }, { "epoch": 46.18, "learning_rate": 8.51716490175866e-06, "loss": 0.046, "step": 164280 }, { "epoch": 46.19, "learning_rate": 8.498422515852936e-06, "loss": 0.0392, "step": 164310 }, { "epoch": 46.2, "learning_rate": 8.479680129947209e-06, "loss": 0.0438, "step": 164340 }, { "epoch": 46.21, "learning_rate": 8.460937744041483e-06, "loss": 0.0473, "step": 164370 }, { "epoch": 46.22, "learning_rate": 8.442195358135757e-06, "loss": 0.0431, "step": 164400 }, { "epoch": 46.23, "learning_rate": 8.423452972230033e-06, "loss": 0.0452, "step": 164430 }, { "epoch": 46.24, "learning_rate": 8.404710586324305e-06, "loss": 0.0409, "step": 164460 }, { "epoch": 46.24, "learning_rate": 8.38596820041858e-06, "loss": 0.047, "step": 164490 }, { "epoch": 46.25, "learning_rate": 8.367225814512856e-06, "loss": 0.0439, "step": 164520 }, { "epoch": 46.26, "learning_rate": 8.34848342860713e-06, "loss": 0.0421, "step": 164550 }, { "epoch": 46.27, "learning_rate": 8.329741042701402e-06, "loss": 0.0489, "step": 164580 }, { "epoch": 46.28, "learning_rate": 8.310998656795676e-06, "loss": 0.04, "step": 164610 }, { "epoch": 46.29, "learning_rate": 8.292256270889952e-06, "loss": 0.0432, "step": 164640 }, { "epoch": 46.29, "learning_rate": 8.273513884984225e-06, "loss": 0.0481, "step": 164670 }, { "epoch": 46.3, "learning_rate": 8.254771499078499e-06, "loss": 0.0428, "step": 164700 }, { "epoch": 46.31, "learning_rate": 8.236029113172775e-06, "loss": 0.0482, "step": 164730 }, { "epoch": 46.32, "learning_rate": 8.217286727267049e-06, "loss": 0.042, "step": 164760 }, { "epoch": 46.33, "learning_rate": 8.198544341361322e-06, "loss": 0.0435, "step": 164790 }, { "epoch": 46.34, "learning_rate": 8.179801955455596e-06, "loss": 0.0469, "step": 164820 }, { "epoch": 46.35, "learning_rate": 8.161059569549872e-06, "loss": 0.0398, "step": 164850 }, { "epoch": 46.35, "learning_rate": 8.142317183644146e-06, "loss": 0.048, "step": 164880 }, { "epoch": 46.36, "learning_rate": 8.123574797738418e-06, "loss": 0.0394, "step": 164910 }, { "epoch": 46.37, "learning_rate": 8.10545715802955e-06, "loss": 0.0445, "step": 164940 }, { "epoch": 46.38, "learning_rate": 8.086714772123825e-06, "loss": 0.044, "step": 164970 }, { "epoch": 46.39, "learning_rate": 8.0679723862181e-06, "loss": 0.0404, "step": 165000 }, { "epoch": 46.4, "learning_rate": 8.049230000312373e-06, "loss": 0.0454, "step": 165030 }, { "epoch": 46.4, "learning_rate": 8.030487614406648e-06, "loss": 0.0392, "step": 165060 }, { "epoch": 46.41, "learning_rate": 8.011745228500922e-06, "loss": 0.0465, "step": 165090 }, { "epoch": 46.42, "learning_rate": 7.993002842595196e-06, "loss": 0.0429, "step": 165120 }, { "epoch": 46.43, "learning_rate": 7.97426045668947e-06, "loss": 0.0394, "step": 165150 }, { "epoch": 46.44, "learning_rate": 7.955518070783744e-06, "loss": 0.0443, "step": 165180 }, { "epoch": 46.45, "learning_rate": 7.936775684878019e-06, "loss": 0.0377, "step": 165210 }, { "epoch": 46.45, "learning_rate": 7.918033298972293e-06, "loss": 0.0425, "step": 165240 }, { "epoch": 46.46, "learning_rate": 7.899290913066567e-06, "loss": 0.0444, "step": 165270 }, { "epoch": 46.47, "learning_rate": 7.880548527160841e-06, "loss": 0.0401, "step": 165300 }, { "epoch": 46.48, "learning_rate": 7.861806141255115e-06, "loss": 0.0441, "step": 165330 }, { "epoch": 46.49, "learning_rate": 7.84306375534939e-06, "loss": 0.0437, "step": 165360 }, { "epoch": 46.5, "learning_rate": 7.824321369443664e-06, "loss": 0.0452, "step": 165390 }, { "epoch": 46.51, "learning_rate": 7.805578983537938e-06, "loss": 0.0437, "step": 165420 }, { "epoch": 46.51, "learning_rate": 7.786836597632212e-06, "loss": 0.042, "step": 165450 }, { "epoch": 46.52, "learning_rate": 7.768094211726486e-06, "loss": 0.0472, "step": 165480 }, { "epoch": 46.53, "learning_rate": 7.74935182582076e-06, "loss": 0.0394, "step": 165510 }, { "epoch": 46.54, "learning_rate": 7.730609439915035e-06, "loss": 0.0463, "step": 165540 }, { "epoch": 46.55, "learning_rate": 7.711867054009309e-06, "loss": 0.0452, "step": 165570 }, { "epoch": 46.56, "learning_rate": 7.693124668103583e-06, "loss": 0.0436, "step": 165600 }, { "epoch": 46.56, "learning_rate": 7.674382282197857e-06, "loss": 0.0459, "step": 165630 }, { "epoch": 46.57, "learning_rate": 7.655639896292131e-06, "loss": 0.0417, "step": 165660 }, { "epoch": 46.58, "learning_rate": 7.636897510386407e-06, "loss": 0.0445, "step": 165690 }, { "epoch": 46.59, "learning_rate": 7.618155124480681e-06, "loss": 0.0454, "step": 165720 }, { "epoch": 46.6, "learning_rate": 7.599412738574954e-06, "loss": 0.0425, "step": 165750 }, { "epoch": 46.61, "learning_rate": 7.580670352669228e-06, "loss": 0.0469, "step": 165780 }, { "epoch": 46.62, "learning_rate": 7.561927966763503e-06, "loss": 0.0398, "step": 165810 }, { "epoch": 46.62, "learning_rate": 7.543185580857777e-06, "loss": 0.0464, "step": 165840 }, { "epoch": 46.63, "learning_rate": 7.524443194952051e-06, "loss": 0.0442, "step": 165870 }, { "epoch": 46.64, "learning_rate": 7.505700809046325e-06, "loss": 0.04, "step": 165900 }, { "epoch": 46.65, "learning_rate": 7.4869584231406e-06, "loss": 0.0485, "step": 165930 }, { "epoch": 46.66, "learning_rate": 7.468216037234873e-06, "loss": 0.043, "step": 165960 }, { "epoch": 46.67, "learning_rate": 7.4494736513291475e-06, "loss": 0.0453, "step": 165990 }, { "epoch": 46.67, "learning_rate": 7.4307312654234225e-06, "loss": 0.0435, "step": 166020 }, { "epoch": 46.68, "learning_rate": 7.411988879517697e-06, "loss": 0.039, "step": 166050 }, { "epoch": 46.69, "learning_rate": 7.39324649361197e-06, "loss": 0.0441, "step": 166080 }, { "epoch": 46.7, "learning_rate": 7.374504107706244e-06, "loss": 0.0413, "step": 166110 }, { "epoch": 46.71, "learning_rate": 7.355761721800519e-06, "loss": 0.0438, "step": 166140 }, { "epoch": 46.72, "learning_rate": 7.3370193358947935e-06, "loss": 0.0486, "step": 166170 }, { "epoch": 46.72, "learning_rate": 7.318276949989067e-06, "loss": 0.0413, "step": 166200 }, { "epoch": 46.73, "learning_rate": 7.299534564083342e-06, "loss": 0.0467, "step": 166230 }, { "epoch": 46.74, "learning_rate": 7.280792178177616e-06, "loss": 0.0401, "step": 166260 }, { "epoch": 46.75, "learning_rate": 7.262049792271889e-06, "loss": 0.0453, "step": 166290 }, { "epoch": 46.76, "learning_rate": 7.243307406366164e-06, "loss": 0.0443, "step": 166320 }, { "epoch": 46.77, "learning_rate": 7.224565020460439e-06, "loss": 0.0385, "step": 166350 }, { "epoch": 46.78, "learning_rate": 7.205822634554713e-06, "loss": 0.046, "step": 166380 }, { "epoch": 46.78, "learning_rate": 7.187080248648986e-06, "loss": 0.0381, "step": 166410 }, { "epoch": 46.79, "learning_rate": 7.168337862743261e-06, "loss": 0.0435, "step": 166440 }, { "epoch": 46.8, "learning_rate": 7.149595476837535e-06, "loss": 0.0468, "step": 166470 }, { "epoch": 46.81, "learning_rate": 7.130853090931809e-06, "loss": 0.0435, "step": 166500 }, { "epoch": 46.82, "learning_rate": 7.112110705026083e-06, "loss": 0.0523, "step": 166530 }, { "epoch": 46.83, "learning_rate": 7.093368319120358e-06, "loss": 0.0386, "step": 166560 }, { "epoch": 46.83, "learning_rate": 7.074625933214632e-06, "loss": 0.0455, "step": 166590 }, { "epoch": 46.84, "learning_rate": 7.0558835473089055e-06, "loss": 0.0438, "step": 166620 }, { "epoch": 46.85, "learning_rate": 7.037141161403181e-06, "loss": 0.0387, "step": 166650 }, { "epoch": 46.86, "learning_rate": 7.018398775497455e-06, "loss": 0.0464, "step": 166680 }, { "epoch": 46.87, "learning_rate": 6.999656389591729e-06, "loss": 0.0417, "step": 166710 }, { "epoch": 46.88, "learning_rate": 6.980914003686002e-06, "loss": 0.0456, "step": 166740 }, { "epoch": 46.88, "learning_rate": 6.962171617780277e-06, "loss": 0.0444, "step": 166770 }, { "epoch": 46.89, "learning_rate": 6.9434292318745515e-06, "loss": 0.0398, "step": 166800 }, { "epoch": 46.9, "learning_rate": 6.924686845968825e-06, "loss": 0.0457, "step": 166830 }, { "epoch": 46.91, "learning_rate": 6.905944460063099e-06, "loss": 0.039, "step": 166860 }, { "epoch": 46.92, "learning_rate": 6.887202074157374e-06, "loss": 0.0428, "step": 166890 }, { "epoch": 46.93, "learning_rate": 6.868459688251648e-06, "loss": 0.0496, "step": 166920 }, { "epoch": 46.94, "learning_rate": 6.849717302345922e-06, "loss": 0.0405, "step": 166950 }, { "epoch": 46.94, "learning_rate": 6.830974916440197e-06, "loss": 0.0467, "step": 166980 }, { "epoch": 46.95, "learning_rate": 6.812232530534471e-06, "loss": 0.0402, "step": 167010 }, { "epoch": 46.96, "learning_rate": 6.7941148908256025e-06, "loss": 0.0422, "step": 167040 }, { "epoch": 46.97, "learning_rate": 6.775372504919876e-06, "loss": 0.0447, "step": 167070 }, { "epoch": 46.98, "learning_rate": 6.756630119014151e-06, "loss": 0.0419, "step": 167100 }, { "epoch": 46.99, "learning_rate": 6.737887733108425e-06, "loss": 0.0466, "step": 167130 }, { "epoch": 46.99, "learning_rate": 6.719145347202699e-06, "loss": 0.0414, "step": 167160 }, { "epoch": 47.0, "eval_loss": 0.11058283597230911, "eval_runtime": 643.2521, "eval_samples_per_second": 24.925, "eval_steps_per_second": 0.78, "eval_wer": 0.09220313075757783, "step": 167179 }, { "epoch": 47.0, "learning_rate": 6.700402961296974e-06, "loss": 0.0464, "step": 167190 }, { "epoch": 47.01, "learning_rate": 6.681660575391248e-06, "loss": 0.0417, "step": 167220 }, { "epoch": 47.02, "learning_rate": 6.662918189485522e-06, "loss": 0.0473, "step": 167250 }, { "epoch": 47.03, "learning_rate": 6.644175803579795e-06, "loss": 0.0478, "step": 167280 }, { "epoch": 47.04, "learning_rate": 6.625433417674071e-06, "loss": 0.0377, "step": 167310 }, { "epoch": 47.05, "learning_rate": 6.606691031768344e-06, "loss": 0.0459, "step": 167340 }, { "epoch": 47.05, "learning_rate": 6.587948645862619e-06, "loss": 0.0415, "step": 167370 }, { "epoch": 47.06, "learning_rate": 6.569206259956894e-06, "loss": 0.0398, "step": 167400 }, { "epoch": 47.07, "learning_rate": 6.550463874051167e-06, "loss": 0.0488, "step": 167430 }, { "epoch": 47.08, "learning_rate": 6.531721488145441e-06, "loss": 0.0384, "step": 167460 }, { "epoch": 47.09, "learning_rate": 6.5129791022397145e-06, "loss": 0.0447, "step": 167490 }, { "epoch": 47.1, "learning_rate": 6.49423671633399e-06, "loss": 0.0396, "step": 167520 }, { "epoch": 47.1, "learning_rate": 6.475494330428264e-06, "loss": 0.0448, "step": 167550 }, { "epoch": 47.11, "learning_rate": 6.456751944522538e-06, "loss": 0.0464, "step": 167580 }, { "epoch": 47.12, "learning_rate": 6.438009558616811e-06, "loss": 0.0386, "step": 167610 }, { "epoch": 47.13, "learning_rate": 6.419267172711087e-06, "loss": 0.045, "step": 167640 }, { "epoch": 47.14, "learning_rate": 6.4005247868053605e-06, "loss": 0.0409, "step": 167670 }, { "epoch": 47.15, "learning_rate": 6.381782400899635e-06, "loss": 0.0437, "step": 167700 }, { "epoch": 47.15, "learning_rate": 6.36304001499391e-06, "loss": 0.0507, "step": 167730 }, { "epoch": 47.16, "learning_rate": 6.344297629088183e-06, "loss": 0.0384, "step": 167760 }, { "epoch": 47.17, "learning_rate": 6.325555243182457e-06, "loss": 0.0464, "step": 167790 }, { "epoch": 47.18, "learning_rate": 6.306812857276731e-06, "loss": 0.0404, "step": 167820 }, { "epoch": 47.19, "learning_rate": 6.2880704713710065e-06, "loss": 0.0443, "step": 167850 }, { "epoch": 47.2, "learning_rate": 6.26932808546528e-06, "loss": 0.0477, "step": 167880 }, { "epoch": 47.21, "learning_rate": 6.250585699559554e-06, "loss": 0.0374, "step": 167910 }, { "epoch": 47.21, "learning_rate": 6.231843313653828e-06, "loss": 0.0461, "step": 167940 }, { "epoch": 47.22, "learning_rate": 6.213100927748102e-06, "loss": 0.0431, "step": 167970 }, { "epoch": 47.23, "learning_rate": 6.194358541842377e-06, "loss": 0.0479, "step": 168000 }, { "epoch": 47.24, "learning_rate": 6.175616155936651e-06, "loss": 0.0479, "step": 168030 }, { "epoch": 47.25, "learning_rate": 6.156873770030925e-06, "loss": 0.0379, "step": 168060 }, { "epoch": 47.26, "learning_rate": 6.138131384125199e-06, "loss": 0.044, "step": 168090 }, { "epoch": 47.26, "learning_rate": 6.119388998219474e-06, "loss": 0.0413, "step": 168120 }, { "epoch": 47.27, "learning_rate": 6.1006466123137475e-06, "loss": 0.0432, "step": 168150 }, { "epoch": 47.28, "learning_rate": 6.081904226408023e-06, "loss": 0.0465, "step": 168180 }, { "epoch": 47.29, "learning_rate": 6.063161840502296e-06, "loss": 0.0373, "step": 168210 }, { "epoch": 47.3, "learning_rate": 6.044419454596571e-06, "loss": 0.0482, "step": 168240 }, { "epoch": 47.31, "learning_rate": 6.025677068690844e-06, "loss": 0.0423, "step": 168270 }, { "epoch": 47.32, "learning_rate": 6.0069346827851185e-06, "loss": 0.0453, "step": 168300 }, { "epoch": 47.32, "learning_rate": 5.988192296879393e-06, "loss": 0.0461, "step": 168330 }, { "epoch": 47.33, "learning_rate": 5.969449910973667e-06, "loss": 0.0361, "step": 168360 }, { "epoch": 47.34, "learning_rate": 5.950707525067942e-06, "loss": 0.0475, "step": 168390 }, { "epoch": 47.35, "learning_rate": 5.931965139162215e-06, "loss": 0.0415, "step": 168420 }, { "epoch": 47.36, "learning_rate": 5.91322275325649e-06, "loss": 0.0456, "step": 168450 }, { "epoch": 47.37, "learning_rate": 5.894480367350764e-06, "loss": 0.0492, "step": 168480 }, { "epoch": 47.37, "learning_rate": 5.875737981445039e-06, "loss": 0.0353, "step": 168510 }, { "epoch": 47.38, "learning_rate": 5.856995595539312e-06, "loss": 0.0436, "step": 168540 }, { "epoch": 47.39, "learning_rate": 5.838253209633587e-06, "loss": 0.0414, "step": 168570 }, { "epoch": 47.4, "learning_rate": 5.819510823727861e-06, "loss": 0.0415, "step": 168600 }, { "epoch": 47.41, "learning_rate": 5.800768437822135e-06, "loss": 0.0481, "step": 168630 }, { "epoch": 47.42, "learning_rate": 5.78202605191641e-06, "loss": 0.0374, "step": 168660 }, { "epoch": 47.42, "learning_rate": 5.763283666010683e-06, "loss": 0.0474, "step": 168690 }, { "epoch": 47.43, "learning_rate": 5.744541280104958e-06, "loss": 0.0409, "step": 168720 }, { "epoch": 47.44, "learning_rate": 5.725798894199231e-06, "loss": 0.0399, "step": 168750 }, { "epoch": 47.45, "learning_rate": 5.707056508293506e-06, "loss": 0.046, "step": 168780 }, { "epoch": 47.46, "learning_rate": 5.68831412238778e-06, "loss": 0.0394, "step": 168810 }, { "epoch": 47.47, "learning_rate": 5.669571736482055e-06, "loss": 0.045, "step": 168840 }, { "epoch": 47.48, "learning_rate": 5.650829350576329e-06, "loss": 0.043, "step": 168870 }, { "epoch": 47.48, "learning_rate": 5.632086964670602e-06, "loss": 0.041, "step": 168900 }, { "epoch": 47.49, "learning_rate": 5.613344578764877e-06, "loss": 0.0455, "step": 168930 }, { "epoch": 47.5, "learning_rate": 5.594602192859151e-06, "loss": 0.0376, "step": 168960 }, { "epoch": 47.51, "learning_rate": 5.575859806953426e-06, "loss": 0.0485, "step": 168990 }, { "epoch": 47.52, "learning_rate": 5.557117421047699e-06, "loss": 0.0398, "step": 169020 }, { "epoch": 47.53, "learning_rate": 5.538375035141974e-06, "loss": 0.0455, "step": 169050 }, { "epoch": 47.53, "learning_rate": 5.519632649236248e-06, "loss": 0.0467, "step": 169080 }, { "epoch": 47.54, "learning_rate": 5.5008902633305225e-06, "loss": 0.0384, "step": 169110 }, { "epoch": 47.55, "learning_rate": 5.482147877424797e-06, "loss": 0.0453, "step": 169140 }, { "epoch": 47.56, "learning_rate": 5.463405491519071e-06, "loss": 0.039, "step": 169170 }, { "epoch": 47.57, "learning_rate": 5.444663105613345e-06, "loss": 0.0439, "step": 169200 }, { "epoch": 47.58, "learning_rate": 5.425920719707618e-06, "loss": 0.0464, "step": 169230 }, { "epoch": 47.58, "learning_rate": 5.4071783338018934e-06, "loss": 0.036, "step": 169260 }, { "epoch": 47.59, "learning_rate": 5.388435947896167e-06, "loss": 0.0471, "step": 169290 }, { "epoch": 47.6, "learning_rate": 5.369693561990442e-06, "loss": 0.0394, "step": 169320 }, { "epoch": 47.61, "learning_rate": 5.3515759222815735e-06, "loss": 0.0413, "step": 169350 }, { "epoch": 47.62, "learning_rate": 5.332833536375848e-06, "loss": 0.0453, "step": 169380 }, { "epoch": 47.63, "learning_rate": 5.314091150470122e-06, "loss": 0.0386, "step": 169410 }, { "epoch": 47.64, "learning_rate": 5.295348764564396e-06, "loss": 0.0478, "step": 169440 }, { "epoch": 47.64, "learning_rate": 5.27660637865867e-06, "loss": 0.0398, "step": 169470 }, { "epoch": 47.65, "learning_rate": 5.2578639927529444e-06, "loss": 0.0428, "step": 169500 }, { "epoch": 47.66, "learning_rate": 5.239121606847219e-06, "loss": 0.047, "step": 169530 }, { "epoch": 47.67, "learning_rate": 5.220379220941493e-06, "loss": 0.0369, "step": 169560 }, { "epoch": 47.68, "learning_rate": 5.201636835035767e-06, "loss": 0.0455, "step": 169590 }, { "epoch": 47.69, "learning_rate": 5.182894449130041e-06, "loss": 0.0414, "step": 169620 }, { "epoch": 47.69, "learning_rate": 5.164152063224315e-06, "loss": 0.0421, "step": 169650 }, { "epoch": 47.7, "learning_rate": 5.14540967731859e-06, "loss": 0.0445, "step": 169680 }, { "epoch": 47.71, "learning_rate": 5.126667291412864e-06, "loss": 0.0384, "step": 169710 }, { "epoch": 47.72, "learning_rate": 5.107924905507138e-06, "loss": 0.0456, "step": 169740 }, { "epoch": 47.73, "learning_rate": 5.089182519601412e-06, "loss": 0.0426, "step": 169770 }, { "epoch": 47.74, "learning_rate": 5.070440133695686e-06, "loss": 0.0431, "step": 169800 }, { "epoch": 47.75, "learning_rate": 5.0516977477899605e-06, "loss": 0.0463, "step": 169830 }, { "epoch": 47.75, "learning_rate": 5.032955361884235e-06, "loss": 0.036, "step": 169860 }, { "epoch": 47.76, "learning_rate": 5.014212975978509e-06, "loss": 0.0431, "step": 169890 }, { "epoch": 47.77, "learning_rate": 4.995470590072783e-06, "loss": 0.0406, "step": 169920 }, { "epoch": 47.78, "learning_rate": 4.976728204167057e-06, "loss": 0.0439, "step": 169950 }, { "epoch": 47.79, "learning_rate": 4.9579858182613315e-06, "loss": 0.0477, "step": 169980 }, { "epoch": 47.8, "learning_rate": 4.939243432355606e-06, "loss": 0.0387, "step": 170010 }, { "epoch": 47.8, "learning_rate": 4.92050104644988e-06, "loss": 0.0463, "step": 170040 }, { "epoch": 47.81, "learning_rate": 4.901758660544154e-06, "loss": 0.0409, "step": 170070 }, { "epoch": 47.82, "learning_rate": 4.883016274638428e-06, "loss": 0.0425, "step": 170100 }, { "epoch": 47.83, "learning_rate": 4.8642738887327024e-06, "loss": 0.0483, "step": 170130 }, { "epoch": 47.84, "learning_rate": 4.845531502826977e-06, "loss": 0.0387, "step": 170160 }, { "epoch": 47.85, "learning_rate": 4.826789116921251e-06, "loss": 0.0458, "step": 170190 }, { "epoch": 47.85, "learning_rate": 4.808046731015525e-06, "loss": 0.041, "step": 170220 }, { "epoch": 47.86, "learning_rate": 4.789304345109799e-06, "loss": 0.0432, "step": 170250 }, { "epoch": 47.87, "learning_rate": 4.770561959204073e-06, "loss": 0.046, "step": 170280 }, { "epoch": 47.88, "learning_rate": 4.7518195732983484e-06, "loss": 0.0368, "step": 170310 }, { "epoch": 47.89, "learning_rate": 4.733077187392622e-06, "loss": 0.0445, "step": 170340 }, { "epoch": 47.9, "learning_rate": 4.714334801486897e-06, "loss": 0.0409, "step": 170370 }, { "epoch": 47.91, "learning_rate": 4.69559241558117e-06, "loss": 0.0428, "step": 170400 }, { "epoch": 47.91, "learning_rate": 4.676850029675444e-06, "loss": 0.0487, "step": 170430 }, { "epoch": 47.92, "learning_rate": 4.6581076437697185e-06, "loss": 0.0376, "step": 170460 }, { "epoch": 47.93, "learning_rate": 4.639365257863993e-06, "loss": 0.0466, "step": 170490 }, { "epoch": 47.94, "learning_rate": 4.620622871958267e-06, "loss": 0.0386, "step": 170520 }, { "epoch": 47.95, "learning_rate": 4.601880486052541e-06, "loss": 0.0408, "step": 170550 }, { "epoch": 47.96, "learning_rate": 4.583138100146816e-06, "loss": 0.0453, "step": 170580 }, { "epoch": 47.96, "learning_rate": 4.5643957142410895e-06, "loss": 0.0374, "step": 170610 }, { "epoch": 47.97, "learning_rate": 4.5456533283353645e-06, "loss": 0.0468, "step": 170640 }, { "epoch": 47.98, "learning_rate": 4.526910942429638e-06, "loss": 0.0421, "step": 170670 }, { "epoch": 47.99, "learning_rate": 4.508168556523912e-06, "loss": 0.043, "step": 170700 }, { "epoch": 48.0, "learning_rate": 4.490050916815044e-06, "loss": 0.0501, "step": 170730 }, { "epoch": 48.0, "eval_loss": 0.10937908291816711, "eval_runtime": 643.5663, "eval_samples_per_second": 24.913, "eval_steps_per_second": 0.78, "eval_wer": 0.09180052679704666, "step": 170736 }, { "epoch": 48.01, "learning_rate": 4.471308530909318e-06, "loss": 0.0404, "step": 170760 }, { "epoch": 48.02, "learning_rate": 4.452566145003593e-06, "loss": 0.0433, "step": 170790 }, { "epoch": 48.02, "learning_rate": 4.433823759097866e-06, "loss": 0.0372, "step": 170820 }, { "epoch": 48.03, "learning_rate": 4.415081373192141e-06, "loss": 0.0425, "step": 170850 }, { "epoch": 48.04, "learning_rate": 4.396338987286415e-06, "loss": 0.0418, "step": 170880 }, { "epoch": 48.05, "learning_rate": 4.37759660138069e-06, "loss": 0.0448, "step": 170910 }, { "epoch": 48.06, "learning_rate": 4.358854215474963e-06, "loss": 0.0454, "step": 170940 }, { "epoch": 48.07, "learning_rate": 4.340111829569238e-06, "loss": 0.0397, "step": 170970 }, { "epoch": 48.07, "learning_rate": 4.3213694436635114e-06, "loss": 0.0473, "step": 171000 }, { "epoch": 48.08, "learning_rate": 4.3026270577577865e-06, "loss": 0.0426, "step": 171030 }, { "epoch": 48.09, "learning_rate": 4.283884671852061e-06, "loss": 0.045, "step": 171060 }, { "epoch": 48.1, "learning_rate": 4.265142285946334e-06, "loss": 0.0452, "step": 171090 }, { "epoch": 48.11, "learning_rate": 4.246399900040609e-06, "loss": 0.0401, "step": 171120 }, { "epoch": 48.12, "learning_rate": 4.227657514134882e-06, "loss": 0.0424, "step": 171150 }, { "epoch": 48.12, "learning_rate": 4.2089151282291574e-06, "loss": 0.0393, "step": 171180 }, { "epoch": 48.13, "learning_rate": 4.190172742323431e-06, "loss": 0.0406, "step": 171210 }, { "epoch": 48.14, "learning_rate": 4.171430356417706e-06, "loss": 0.0445, "step": 171240 }, { "epoch": 48.15, "learning_rate": 4.15268797051198e-06, "loss": 0.039, "step": 171270 }, { "epoch": 48.16, "learning_rate": 4.133945584606254e-06, "loss": 0.0456, "step": 171300 }, { "epoch": 48.17, "learning_rate": 4.115203198700528e-06, "loss": 0.0429, "step": 171330 }, { "epoch": 48.18, "learning_rate": 4.096460812794803e-06, "loss": 0.0413, "step": 171360 }, { "epoch": 48.18, "learning_rate": 4.077718426889077e-06, "loss": 0.0466, "step": 171390 }, { "epoch": 48.19, "learning_rate": 4.05897604098335e-06, "loss": 0.0402, "step": 171420 }, { "epoch": 48.2, "learning_rate": 4.040233655077625e-06, "loss": 0.0428, "step": 171450 }, { "epoch": 48.21, "learning_rate": 4.0214912691718985e-06, "loss": 0.042, "step": 171480 }, { "epoch": 48.22, "learning_rate": 4.0027488832661735e-06, "loss": 0.0388, "step": 171510 }, { "epoch": 48.23, "learning_rate": 3.984006497360448e-06, "loss": 0.048, "step": 171540 }, { "epoch": 48.23, "learning_rate": 3.965264111454722e-06, "loss": 0.0399, "step": 171570 }, { "epoch": 48.24, "learning_rate": 3.946521725548996e-06, "loss": 0.0477, "step": 171600 }, { "epoch": 48.25, "learning_rate": 3.92777933964327e-06, "loss": 0.0384, "step": 171630 }, { "epoch": 48.26, "learning_rate": 3.9090369537375445e-06, "loss": 0.0415, "step": 171660 }, { "epoch": 48.27, "learning_rate": 3.890294567831818e-06, "loss": 0.0421, "step": 171690 }, { "epoch": 48.28, "learning_rate": 3.871552181926093e-06, "loss": 0.041, "step": 171720 }, { "epoch": 48.29, "learning_rate": 3.852809796020366e-06, "loss": 0.0445, "step": 171750 }, { "epoch": 48.29, "learning_rate": 3.834067410114641e-06, "loss": 0.0414, "step": 171780 }, { "epoch": 48.3, "learning_rate": 3.8153250242089154e-06, "loss": 0.0386, "step": 171810 }, { "epoch": 48.31, "learning_rate": 3.796582638303189e-06, "loss": 0.0455, "step": 171840 }, { "epoch": 48.32, "learning_rate": 3.777840252397464e-06, "loss": 0.0372, "step": 171870 }, { "epoch": 48.33, "learning_rate": 3.7590978664917376e-06, "loss": 0.043, "step": 171900 }, { "epoch": 48.34, "learning_rate": 3.740355480586012e-06, "loss": 0.042, "step": 171930 }, { "epoch": 48.34, "learning_rate": 3.721613094680286e-06, "loss": 0.0422, "step": 171960 }, { "epoch": 48.35, "learning_rate": 3.7028707087745606e-06, "loss": 0.045, "step": 171990 }, { "epoch": 48.36, "learning_rate": 3.684128322868835e-06, "loss": 0.0401, "step": 172020 }, { "epoch": 48.37, "learning_rate": 3.665385936963109e-06, "loss": 0.0422, "step": 172050 }, { "epoch": 48.38, "learning_rate": 3.646643551057383e-06, "loss": 0.0401, "step": 172080 }, { "epoch": 48.39, "learning_rate": 3.6279011651516573e-06, "loss": 0.0428, "step": 172110 }, { "epoch": 48.39, "learning_rate": 3.6091587792459315e-06, "loss": 0.0469, "step": 172140 }, { "epoch": 48.4, "learning_rate": 3.5904163933402053e-06, "loss": 0.0406, "step": 172170 }, { "epoch": 48.41, "learning_rate": 3.57167400743448e-06, "loss": 0.0427, "step": 172200 }, { "epoch": 48.42, "learning_rate": 3.5529316215287537e-06, "loss": 0.0421, "step": 172230 }, { "epoch": 48.43, "learning_rate": 3.5341892356230283e-06, "loss": 0.0402, "step": 172260 }, { "epoch": 48.44, "learning_rate": 3.515446849717303e-06, "loss": 0.0505, "step": 172290 }, { "epoch": 48.45, "learning_rate": 3.4967044638115767e-06, "loss": 0.0371, "step": 172320 }, { "epoch": 48.45, "learning_rate": 3.4779620779058513e-06, "loss": 0.0437, "step": 172350 }, { "epoch": 48.46, "learning_rate": 3.459219692000125e-06, "loss": 0.0422, "step": 172380 }, { "epoch": 48.47, "learning_rate": 3.4404773060943993e-06, "loss": 0.0442, "step": 172410 }, { "epoch": 48.48, "learning_rate": 3.421734920188673e-06, "loss": 0.0437, "step": 172440 }, { "epoch": 48.49, "learning_rate": 3.4029925342829476e-06, "loss": 0.0351, "step": 172470 }, { "epoch": 48.5, "learning_rate": 3.3842501483772223e-06, "loss": 0.0466, "step": 172500 }, { "epoch": 48.5, "learning_rate": 3.365507762471496e-06, "loss": 0.0441, "step": 172530 }, { "epoch": 48.51, "learning_rate": 3.3467653765657706e-06, "loss": 0.0428, "step": 172560 }, { "epoch": 48.52, "learning_rate": 3.3280229906600444e-06, "loss": 0.0438, "step": 172590 }, { "epoch": 48.53, "learning_rate": 3.309280604754319e-06, "loss": 0.0371, "step": 172620 }, { "epoch": 48.54, "learning_rate": 3.2905382188485928e-06, "loss": 0.0445, "step": 172650 }, { "epoch": 48.55, "learning_rate": 3.271795832942867e-06, "loss": 0.041, "step": 172680 }, { "epoch": 48.55, "learning_rate": 3.253053447037141e-06, "loss": 0.0432, "step": 172710 }, { "epoch": 48.56, "learning_rate": 3.2343110611314154e-06, "loss": 0.045, "step": 172740 }, { "epoch": 48.57, "learning_rate": 3.21556867522569e-06, "loss": 0.0358, "step": 172770 }, { "epoch": 48.58, "learning_rate": 3.1968262893199637e-06, "loss": 0.0449, "step": 172800 }, { "epoch": 48.59, "learning_rate": 3.1780839034142383e-06, "loss": 0.0411, "step": 172830 }, { "epoch": 48.6, "learning_rate": 3.159341517508512e-06, "loss": 0.0416, "step": 172860 }, { "epoch": 48.61, "learning_rate": 3.1405991316027867e-06, "loss": 0.0448, "step": 172890 }, { "epoch": 48.61, "learning_rate": 3.121856745697061e-06, "loss": 0.0381, "step": 172920 }, { "epoch": 48.62, "learning_rate": 3.103114359791335e-06, "loss": 0.0445, "step": 172950 }, { "epoch": 48.63, "learning_rate": 3.0843719738856093e-06, "loss": 0.0413, "step": 172980 }, { "epoch": 48.64, "learning_rate": 3.065629587979883e-06, "loss": 0.0426, "step": 173010 }, { "epoch": 48.65, "learning_rate": 3.0468872020741573e-06, "loss": 0.0466, "step": 173040 }, { "epoch": 48.66, "learning_rate": 3.0281448161684315e-06, "loss": 0.0397, "step": 173070 }, { "epoch": 48.66, "learning_rate": 3.009402430262706e-06, "loss": 0.0432, "step": 173100 }, { "epoch": 48.67, "learning_rate": 2.9906600443569803e-06, "loss": 0.0419, "step": 173130 }, { "epoch": 48.68, "learning_rate": 2.9719176584512544e-06, "loss": 0.0421, "step": 173160 }, { "epoch": 48.69, "learning_rate": 2.9531752725455286e-06, "loss": 0.0457, "step": 173190 }, { "epoch": 48.7, "learning_rate": 2.934432886639803e-06, "loss": 0.0388, "step": 173220 }, { "epoch": 48.71, "learning_rate": 2.915690500734077e-06, "loss": 0.0451, "step": 173250 }, { "epoch": 48.72, "learning_rate": 2.896948114828351e-06, "loss": 0.0412, "step": 173280 }, { "epoch": 48.72, "learning_rate": 2.878205728922625e-06, "loss": 0.0411, "step": 173310 }, { "epoch": 48.73, "learning_rate": 2.860088089213757e-06, "loss": 0.0485, "step": 173340 }, { "epoch": 48.74, "learning_rate": 2.8413457033080313e-06, "loss": 0.0404, "step": 173370 }, { "epoch": 48.75, "learning_rate": 2.8226033174023054e-06, "loss": 0.0442, "step": 173400 }, { "epoch": 48.76, "learning_rate": 2.8038609314965796e-06, "loss": 0.0409, "step": 173430 }, { "epoch": 48.77, "learning_rate": 2.785118545590854e-06, "loss": 0.0418, "step": 173460 }, { "epoch": 48.77, "learning_rate": 2.766376159685128e-06, "loss": 0.045, "step": 173490 }, { "epoch": 48.78, "learning_rate": 2.747633773779402e-06, "loss": 0.0374, "step": 173520 }, { "epoch": 48.79, "learning_rate": 2.7288913878736764e-06, "loss": 0.0434, "step": 173550 }, { "epoch": 48.8, "learning_rate": 2.7101490019679506e-06, "loss": 0.0414, "step": 173580 }, { "epoch": 48.81, "learning_rate": 2.6914066160622248e-06, "loss": 0.0424, "step": 173610 }, { "epoch": 48.82, "learning_rate": 2.672664230156499e-06, "loss": 0.0449, "step": 173640 }, { "epoch": 48.82, "learning_rate": 2.653921844250773e-06, "loss": 0.0411, "step": 173670 }, { "epoch": 48.83, "learning_rate": 2.6351794583450474e-06, "loss": 0.0442, "step": 173700 }, { "epoch": 48.84, "learning_rate": 2.6164370724393215e-06, "loss": 0.045, "step": 173730 }, { "epoch": 48.85, "learning_rate": 2.5976946865335957e-06, "loss": 0.0415, "step": 173760 }, { "epoch": 48.86, "learning_rate": 2.57895230062787e-06, "loss": 0.045, "step": 173790 }, { "epoch": 48.87, "learning_rate": 2.560209914722144e-06, "loss": 0.037, "step": 173820 }, { "epoch": 48.88, "learning_rate": 2.5414675288164187e-06, "loss": 0.0469, "step": 173850 }, { "epoch": 48.88, "learning_rate": 2.522725142910693e-06, "loss": 0.0386, "step": 173880 }, { "epoch": 48.89, "learning_rate": 2.503982757004967e-06, "loss": 0.0422, "step": 173910 }, { "epoch": 48.9, "learning_rate": 2.485240371099241e-06, "loss": 0.0428, "step": 173940 }, { "epoch": 48.91, "learning_rate": 2.466497985193515e-06, "loss": 0.0381, "step": 173970 }, { "epoch": 48.92, "learning_rate": 2.4477555992877893e-06, "loss": 0.0446, "step": 174000 }, { "epoch": 48.93, "learning_rate": 2.4290132133820634e-06, "loss": 0.0403, "step": 174030 }, { "epoch": 48.93, "learning_rate": 2.4102708274763376e-06, "loss": 0.0417, "step": 174060 }, { "epoch": 48.94, "learning_rate": 2.3915284415706123e-06, "loss": 0.0428, "step": 174090 }, { "epoch": 48.95, "learning_rate": 2.3727860556648864e-06, "loss": 0.0367, "step": 174120 }, { "epoch": 48.96, "learning_rate": 2.3540436697591606e-06, "loss": 0.0465, "step": 174150 }, { "epoch": 48.97, "learning_rate": 2.335301283853435e-06, "loss": 0.0397, "step": 174180 }, { "epoch": 48.98, "learning_rate": 2.316558897947709e-06, "loss": 0.0429, "step": 174210 }, { "epoch": 48.98, "learning_rate": 2.2978165120419828e-06, "loss": 0.0472, "step": 174240 }, { "epoch": 48.99, "learning_rate": 2.279074126136257e-06, "loss": 0.0388, "step": 174270 }, { "epoch": 49.0, "eval_loss": 0.10990184545516968, "eval_runtime": 658.3127, "eval_samples_per_second": 24.355, "eval_steps_per_second": 0.763, "eval_wer": 0.09180735059298786, "step": 174293 }, { "epoch": 49.0, "learning_rate": 2.260331740230531e-06, "loss": 0.0459, "step": 174300 }, { "epoch": 49.01, "learning_rate": 2.2415893543248058e-06, "loss": 0.0399, "step": 174330 }, { "epoch": 49.02, "learning_rate": 2.22284696841908e-06, "loss": 0.0474, "step": 174360 }, { "epoch": 49.03, "learning_rate": 2.204104582513354e-06, "loss": 0.04, "step": 174390 }, { "epoch": 49.04, "learning_rate": 2.1853621966076283e-06, "loss": 0.0368, "step": 174420 }, { "epoch": 49.04, "learning_rate": 2.1666198107019025e-06, "loss": 0.0473, "step": 174450 }, { "epoch": 49.05, "learning_rate": 2.1478774247961767e-06, "loss": 0.0403, "step": 174480 }, { "epoch": 49.06, "learning_rate": 2.129135038890451e-06, "loss": 0.0454, "step": 174510 }, { "epoch": 49.07, "learning_rate": 2.1103926529847247e-06, "loss": 0.0436, "step": 174540 }, { "epoch": 49.08, "learning_rate": 2.0916502670789993e-06, "loss": 0.0431, "step": 174570 }, { "epoch": 49.09, "learning_rate": 2.0729078811732735e-06, "loss": 0.0444, "step": 174600 }, { "epoch": 49.09, "learning_rate": 2.0541654952675477e-06, "loss": 0.0378, "step": 174630 }, { "epoch": 49.1, "learning_rate": 2.035423109361822e-06, "loss": 0.0445, "step": 174660 }, { "epoch": 49.11, "learning_rate": 2.016680723456096e-06, "loss": 0.0444, "step": 174690 }, { "epoch": 49.12, "learning_rate": 1.9979383375503703e-06, "loss": 0.0386, "step": 174720 }, { "epoch": 49.13, "learning_rate": 1.9791959516446444e-06, "loss": 0.0432, "step": 174750 }, { "epoch": 49.14, "learning_rate": 1.9604535657389186e-06, "loss": 0.0397, "step": 174780 }, { "epoch": 49.15, "learning_rate": 1.941711179833193e-06, "loss": 0.0444, "step": 174810 }, { "epoch": 49.15, "learning_rate": 1.922968793927467e-06, "loss": 0.0438, "step": 174840 }, { "epoch": 49.16, "learning_rate": 1.9042264080217414e-06, "loss": 0.0414, "step": 174870 }, { "epoch": 49.17, "learning_rate": 1.8854840221160154e-06, "loss": 0.0455, "step": 174900 }, { "epoch": 49.18, "learning_rate": 1.8667416362102896e-06, "loss": 0.041, "step": 174930 }, { "epoch": 49.19, "learning_rate": 1.8479992503045638e-06, "loss": 0.0422, "step": 174960 }, { "epoch": 49.2, "learning_rate": 1.829256864398838e-06, "loss": 0.0407, "step": 174990 }, { "epoch": 49.2, "learning_rate": 1.8105144784931122e-06, "loss": 0.0414, "step": 175020 }, { "epoch": 49.21, "learning_rate": 1.7917720925873866e-06, "loss": 0.0444, "step": 175050 }, { "epoch": 49.22, "learning_rate": 1.7730297066816608e-06, "loss": 0.0374, "step": 175080 }, { "epoch": 49.23, "learning_rate": 1.7549120669727924e-06, "loss": 0.0429, "step": 175110 }, { "epoch": 49.24, "learning_rate": 1.7361696810670666e-06, "loss": 0.0431, "step": 175140 }, { "epoch": 49.25, "learning_rate": 1.7174272951613408e-06, "loss": 0.0397, "step": 175170 }, { "epoch": 49.25, "learning_rate": 1.698684909255615e-06, "loss": 0.0468, "step": 175200 }, { "epoch": 49.26, "learning_rate": 1.6799425233498892e-06, "loss": 0.0415, "step": 175230 }, { "epoch": 49.27, "learning_rate": 1.6612001374441632e-06, "loss": 0.0408, "step": 175260 }, { "epoch": 49.28, "learning_rate": 1.6424577515384378e-06, "loss": 0.0416, "step": 175290 }, { "epoch": 49.29, "learning_rate": 1.623715365632712e-06, "loss": 0.0403, "step": 175320 }, { "epoch": 49.3, "learning_rate": 1.6049729797269862e-06, "loss": 0.0445, "step": 175350 }, { "epoch": 49.31, "learning_rate": 1.5862305938212601e-06, "loss": 0.0398, "step": 175380 }, { "epoch": 49.31, "learning_rate": 1.5674882079155343e-06, "loss": 0.0413, "step": 175410 }, { "epoch": 49.32, "learning_rate": 1.5487458220098085e-06, "loss": 0.0442, "step": 175440 }, { "epoch": 49.33, "learning_rate": 1.530003436104083e-06, "loss": 0.0434, "step": 175470 }, { "epoch": 49.34, "learning_rate": 1.5112610501983571e-06, "loss": 0.0455, "step": 175500 }, { "epoch": 49.35, "learning_rate": 1.492518664292631e-06, "loss": 0.043, "step": 175530 }, { "epoch": 49.36, "learning_rate": 1.4737762783869053e-06, "loss": 0.0459, "step": 175560 }, { "epoch": 49.36, "learning_rate": 1.4550338924811797e-06, "loss": 0.044, "step": 175590 }, { "epoch": 49.37, "learning_rate": 1.4362915065754539e-06, "loss": 0.0394, "step": 175620 }, { "epoch": 49.38, "learning_rate": 1.417549120669728e-06, "loss": 0.0448, "step": 175650 }, { "epoch": 49.39, "learning_rate": 1.3988067347640023e-06, "loss": 0.0382, "step": 175680 }, { "epoch": 49.4, "learning_rate": 1.3800643488582764e-06, "loss": 0.0433, "step": 175710 }, { "epoch": 49.41, "learning_rate": 1.3613219629525506e-06, "loss": 0.0419, "step": 175740 }, { "epoch": 49.42, "learning_rate": 1.3425795770468248e-06, "loss": 0.039, "step": 175770 }, { "epoch": 49.42, "learning_rate": 1.323837191141099e-06, "loss": 0.0439, "step": 175800 }, { "epoch": 49.43, "learning_rate": 1.3050948052353732e-06, "loss": 0.0371, "step": 175830 }, { "epoch": 49.44, "learning_rate": 1.2863524193296474e-06, "loss": 0.0452, "step": 175860 }, { "epoch": 49.45, "learning_rate": 1.2676100334239216e-06, "loss": 0.0405, "step": 175890 }, { "epoch": 49.46, "learning_rate": 1.2488676475181958e-06, "loss": 0.0368, "step": 175920 }, { "epoch": 49.47, "learning_rate": 1.23012526161247e-06, "loss": 0.0468, "step": 175950 }, { "epoch": 49.47, "learning_rate": 1.2113828757067442e-06, "loss": 0.037, "step": 175980 }, { "epoch": 49.48, "learning_rate": 1.1926404898010184e-06, "loss": 0.0452, "step": 176010 }, { "epoch": 49.49, "learning_rate": 1.1738981038952925e-06, "loss": 0.0404, "step": 176040 }, { "epoch": 49.5, "learning_rate": 1.1551557179895667e-06, "loss": 0.0385, "step": 176070 }, { "epoch": 49.51, "learning_rate": 1.1364133320838411e-06, "loss": 0.0507, "step": 176100 }, { "epoch": 49.52, "learning_rate": 1.1176709461781151e-06, "loss": 0.0376, "step": 176130 }, { "epoch": 49.52, "learning_rate": 1.0989285602723893e-06, "loss": 0.0447, "step": 176160 }, { "epoch": 49.53, "learning_rate": 1.0801861743666635e-06, "loss": 0.0436, "step": 176190 }, { "epoch": 49.54, "learning_rate": 1.061443788460938e-06, "loss": 0.041, "step": 176220 }, { "epoch": 49.55, "learning_rate": 1.042701402555212e-06, "loss": 0.0448, "step": 176250 }, { "epoch": 49.56, "learning_rate": 1.023959016649486e-06, "loss": 0.0374, "step": 176280 }, { "epoch": 49.57, "learning_rate": 1.0052166307437603e-06, "loss": 0.0445, "step": 176310 }, { "epoch": 49.58, "learning_rate": 9.864742448380347e-07, "loss": 0.0399, "step": 176340 }, { "epoch": 49.58, "learning_rate": 9.677318589323089e-07, "loss": 0.0396, "step": 176370 }, { "epoch": 49.59, "learning_rate": 9.489894730265829e-07, "loss": 0.045, "step": 176400 }, { "epoch": 49.6, "learning_rate": 9.302470871208571e-07, "loss": 0.0401, "step": 176430 }, { "epoch": 49.61, "learning_rate": 9.115047012151314e-07, "loss": 0.0454, "step": 176460 }, { "epoch": 49.62, "learning_rate": 8.927623153094056e-07, "loss": 0.0412, "step": 176490 }, { "epoch": 49.63, "learning_rate": 8.740199294036798e-07, "loss": 0.0376, "step": 176520 }, { "epoch": 49.63, "learning_rate": 8.552775434979539e-07, "loss": 0.0451, "step": 176550 }, { "epoch": 49.64, "learning_rate": 8.365351575922283e-07, "loss": 0.0402, "step": 176580 }, { "epoch": 49.65, "learning_rate": 8.177927716865024e-07, "loss": 0.0433, "step": 176610 }, { "epoch": 49.66, "learning_rate": 7.990503857807766e-07, "loss": 0.0432, "step": 176640 }, { "epoch": 49.67, "learning_rate": 7.803079998750509e-07, "loss": 0.0424, "step": 176670 }, { "epoch": 49.68, "learning_rate": 7.61565613969325e-07, "loss": 0.0455, "step": 176700 }, { "epoch": 49.69, "learning_rate": 7.428232280635992e-07, "loss": 0.0404, "step": 176730 }, { "epoch": 49.69, "learning_rate": 7.240808421578733e-07, "loss": 0.0441, "step": 176760 }, { "epoch": 49.7, "learning_rate": 7.053384562521476e-07, "loss": 0.0422, "step": 176790 }, { "epoch": 49.71, "learning_rate": 6.865960703464218e-07, "loss": 0.0423, "step": 176820 }, { "epoch": 49.72, "learning_rate": 6.67853684440696e-07, "loss": 0.0415, "step": 176850 }, { "epoch": 49.73, "learning_rate": 6.491112985349702e-07, "loss": 0.0378, "step": 176880 }, { "epoch": 49.74, "learning_rate": 6.303689126292444e-07, "loss": 0.0427, "step": 176910 }, { "epoch": 49.74, "learning_rate": 6.116265267235186e-07, "loss": 0.0437, "step": 176940 }, { "epoch": 49.75, "learning_rate": 5.928841408177928e-07, "loss": 0.0383, "step": 176970 }, { "epoch": 49.76, "learning_rate": 5.74141754912067e-07, "loss": 0.0465, "step": 177000 }, { "epoch": 49.77, "learning_rate": 5.553993690063413e-07, "loss": 0.0377, "step": 177030 }, { "epoch": 49.78, "learning_rate": 5.366569831006153e-07, "loss": 0.0432, "step": 177060 }, { "epoch": 49.79, "learning_rate": 5.179145971948896e-07, "loss": 0.0445, "step": 177090 }, { "epoch": 49.79, "learning_rate": 4.991722112891638e-07, "loss": 0.0394, "step": 177120 }, { "epoch": 49.8, "learning_rate": 4.80429825383438e-07, "loss": 0.047, "step": 177150 }, { "epoch": 49.81, "learning_rate": 4.6168743947771216e-07, "loss": 0.0407, "step": 177180 }, { "epoch": 49.82, "learning_rate": 4.429450535719864e-07, "loss": 0.0439, "step": 177210 }, { "epoch": 49.83, "learning_rate": 4.242026676662606e-07, "loss": 0.0396, "step": 177240 }, { "epoch": 49.84, "learning_rate": 4.0546028176053484e-07, "loss": 0.0395, "step": 177270 }, { "epoch": 49.85, "learning_rate": 3.8671789585480897e-07, "loss": 0.0482, "step": 177300 }, { "epoch": 49.85, "learning_rate": 3.6797550994908316e-07, "loss": 0.0409, "step": 177330 }, { "epoch": 49.86, "learning_rate": 3.492331240433574e-07, "loss": 0.0444, "step": 177360 }, { "epoch": 49.87, "learning_rate": 3.304907381376316e-07, "loss": 0.0411, "step": 177390 }, { "epoch": 49.88, "learning_rate": 3.117483522319058e-07, "loss": 0.0408, "step": 177420 }, { "epoch": 49.89, "learning_rate": 2.9300596632618e-07, "loss": 0.0443, "step": 177450 }, { "epoch": 49.9, "learning_rate": 2.7426358042045417e-07, "loss": 0.0386, "step": 177480 }, { "epoch": 49.9, "learning_rate": 2.5552119451472836e-07, "loss": 0.0462, "step": 177510 }, { "epoch": 49.91, "learning_rate": 2.3677880860900258e-07, "loss": 0.042, "step": 177540 }, { "epoch": 49.92, "learning_rate": 2.180364227032768e-07, "loss": 0.0422, "step": 177570 }, { "epoch": 49.93, "learning_rate": 1.9929403679755099e-07, "loss": 0.043, "step": 177600 }, { "epoch": 49.94, "learning_rate": 1.805516508918252e-07, "loss": 0.0374, "step": 177630 }, { "epoch": 49.95, "learning_rate": 1.6180926498609942e-07, "loss": 0.043, "step": 177660 }, { "epoch": 49.95, "learning_rate": 1.430668790803736e-07, "loss": 0.0419, "step": 177690 }, { "epoch": 49.96, "learning_rate": 1.243244931746478e-07, "loss": 0.0397, "step": 177720 }, { "epoch": 49.97, "learning_rate": 1.05582107268922e-07, "loss": 0.0488, "step": 177750 }, { "epoch": 49.98, "learning_rate": 8.68397213631962e-08, "loss": 0.0399, "step": 177780 }, { "epoch": 49.99, "learning_rate": 6.80973354574704e-08, "loss": 0.0426, "step": 177810 }, { "epoch": 50.0, "learning_rate": 4.9354949551744604e-08, "loss": 0.0428, "step": 177840 }, { "epoch": 50.0, "eval_loss": 0.11027602851390839, "eval_runtime": 645.5008, "eval_samples_per_second": 24.838, "eval_steps_per_second": 0.778, "eval_wer": 0.0915207511634572, "step": 177850 }, { "epoch": 50.0, "step": 177850, "total_flos": 3.938373027563576e+21, "train_loss": 0.1478050081201038, "train_runtime": 1439234.2576, "train_samples_per_second": 15.819, "train_steps_per_second": 0.124 } ], "max_steps": 177850, "num_train_epochs": 50, "total_flos": 3.938373027563576e+21, "trial_name": null, "trial_params": null }