{ "best_metric": null, "best_model_checkpoint": null, "epoch": 25.0, "global_step": 153725, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.02, "learning_rate": 2e-05, "loss": 13.0218, "step": 100 }, { "epoch": 0.02, "eval_loss": 12.945786476135254, "eval_runtime": 7.9731, "eval_samples_per_second": 12.542, "eval_wer": 1.0, "step": 100 }, { "epoch": 0.03, "learning_rate": 4e-05, "loss": 4.4749, "step": 200 }, { "epoch": 0.03, "eval_loss": 3.8371927738189697, "eval_runtime": 7.0147, "eval_samples_per_second": 14.256, "eval_wer": 1.0, "step": 200 }, { "epoch": 0.05, "learning_rate": 6e-05, "loss": 3.1121, "step": 300 }, { "epoch": 0.05, "eval_loss": 3.498441457748413, "eval_runtime": 8.8314, "eval_samples_per_second": 11.323, "eval_wer": 1.0, "step": 300 }, { "epoch": 0.07, "learning_rate": 8e-05, "loss": 3.0216, "step": 400 }, { "epoch": 0.07, "eval_loss": 3.28515625, "eval_runtime": 7.5144, "eval_samples_per_second": 13.308, "eval_wer": 1.0, "step": 400 }, { "epoch": 0.08, "learning_rate": 0.0001, "loss": 2.9786, "step": 500 }, { "epoch": 0.08, "eval_loss": 3.120776891708374, "eval_runtime": 7.7151, "eval_samples_per_second": 12.962, "eval_wer": 1.0, "step": 500 }, { "epoch": 0.1, "learning_rate": 9.993473649861316e-05, "loss": 2.9376, "step": 600 }, { "epoch": 0.1, "eval_loss": 2.971864700317383, "eval_runtime": 8.4632, "eval_samples_per_second": 11.816, "eval_wer": 1.0, "step": 600 }, { "epoch": 0.11, "learning_rate": 9.986947299722631e-05, "loss": 2.0802, "step": 700 }, { "epoch": 0.11, "eval_loss": 1.857584834098816, "eval_runtime": 9.723, "eval_samples_per_second": 10.285, "eval_wer": 0.8855054811205847, "step": 700 }, { "epoch": 0.13, "learning_rate": 9.980420949583945e-05, "loss": 1.0262, "step": 800 }, { "epoch": 0.13, "eval_loss": 1.1796859502792358, "eval_runtime": 7.4195, "eval_samples_per_second": 13.478, "eval_wer": 0.6942752740560292, "step": 800 }, { "epoch": 0.15, "learning_rate": 9.97389459944526e-05, "loss": 0.7875, "step": 900 }, { "epoch": 0.15, "eval_loss": 1.219588041305542, "eval_runtime": 9.0106, "eval_samples_per_second": 11.098, "eval_wer": 0.682095006090134, "step": 900 }, { "epoch": 0.16, "learning_rate": 9.967368249306576e-05, "loss": 0.688, "step": 1000 }, { "epoch": 0.16, "eval_loss": 0.8769925832748413, "eval_runtime": 8.365, "eval_samples_per_second": 11.955, "eval_wer": 0.6065773447015834, "step": 1000 }, { "epoch": 0.18, "learning_rate": 9.96084189916789e-05, "loss": 0.6377, "step": 1100 }, { "epoch": 0.18, "eval_loss": 0.7903584241867065, "eval_runtime": 7.3855, "eval_samples_per_second": 13.54, "eval_wer": 0.5700365408038977, "step": 1100 }, { "epoch": 0.2, "learning_rate": 9.954315549029206e-05, "loss": 0.5704, "step": 1200 }, { "epoch": 0.2, "eval_loss": 0.8232672214508057, "eval_runtime": 7.6284, "eval_samples_per_second": 13.109, "eval_wer": 0.5651644336175395, "step": 1200 }, { "epoch": 0.21, "learning_rate": 9.947789198890522e-05, "loss": 0.5187, "step": 1300 }, { "epoch": 0.21, "eval_loss": 0.7398794293403625, "eval_runtime": 8.3859, "eval_samples_per_second": 11.925, "eval_wer": 0.5237515225334958, "step": 1300 }, { "epoch": 0.23, "learning_rate": 9.941262848751835e-05, "loss": Infinity, "step": 1400 }, { "epoch": 0.23, "eval_loss": 0.6848248839378357, "eval_runtime": 8.3309, "eval_samples_per_second": 12.004, "eval_wer": 0.5261875761266748, "step": 1400 }, { "epoch": 0.24, "learning_rate": 9.934736498613151e-05, "loss": NaN, "step": 1500 }, { "epoch": 0.24, "eval_loss": 0.712200403213501, "eval_runtime": 8.7637, "eval_samples_per_second": 11.411, "eval_wer": 0.5408038976857491, "step": 1500 }, { "epoch": 0.26, "learning_rate": 9.928210148474466e-05, "loss": NaN, "step": 1600 }, { "epoch": 0.26, "eval_loss": 0.7104419469833374, "eval_runtime": 8.8754, "eval_samples_per_second": 11.267, "eval_wer": 0.5371498172959805, "step": 1600 }, { "epoch": 0.28, "learning_rate": 9.921683798335781e-05, "loss": NaN, "step": 1700 }, { "epoch": 0.28, "eval_loss": 0.6172800660133362, "eval_runtime": 7.0857, "eval_samples_per_second": 14.113, "eval_wer": 0.5018270401948843, "step": 1700 }, { "epoch": 0.29, "learning_rate": 9.915157448197096e-05, "loss": NaN, "step": 1800 }, { "epoch": 0.29, "eval_loss": 0.6506848335266113, "eval_runtime": 7.7525, "eval_samples_per_second": 12.899, "eval_wer": 0.5006090133982948, "step": 1800 }, { "epoch": 0.31, "learning_rate": 9.908631098058412e-05, "loss": NaN, "step": 1900 }, { "epoch": 0.31, "eval_loss": 0.6602973937988281, "eval_runtime": 7.4177, "eval_samples_per_second": 13.481, "eval_wer": 0.5042630937880633, "step": 1900 }, { "epoch": 0.33, "learning_rate": 9.902104747919726e-05, "loss": NaN, "step": 2000 }, { "epoch": 0.33, "eval_loss": 0.7591428160667419, "eval_runtime": 8.4029, "eval_samples_per_second": 11.901, "eval_wer": 0.4981729598051157, "step": 2000 }, { "epoch": 0.34, "learning_rate": 9.895578397781041e-05, "loss": NaN, "step": 2100 }, { "epoch": 0.34, "eval_loss": 0.645115077495575, "eval_runtime": 8.9522, "eval_samples_per_second": 11.17, "eval_wer": 0.47990255785627284, "step": 2100 }, { "epoch": 0.36, "learning_rate": 9.889052047642357e-05, "loss": NaN, "step": 2200 }, { "epoch": 0.36, "eval_loss": 0.7210723757743835, "eval_runtime": 8.4131, "eval_samples_per_second": 11.886, "eval_wer": 0.5152253349573691, "step": 2200 }, { "epoch": 0.37, "learning_rate": 9.882525697503671e-05, "loss": NaN, "step": 2300 }, { "epoch": 0.37, "eval_loss": 0.6183672547340393, "eval_runtime": 8.3896, "eval_samples_per_second": 11.92, "eval_wer": 0.4725943970767357, "step": 2300 }, { "epoch": 0.39, "learning_rate": 9.875999347364987e-05, "loss": NaN, "step": 2400 }, { "epoch": 0.39, "eval_loss": 0.6048241257667542, "eval_runtime": 10.2676, "eval_samples_per_second": 9.739, "eval_wer": 0.464068209500609, "step": 2400 }, { "epoch": 0.41, "learning_rate": 9.869472997226302e-05, "loss": NaN, "step": 2500 }, { "epoch": 0.41, "eval_loss": 0.6044276356697083, "eval_runtime": 8.3824, "eval_samples_per_second": 11.93, "eval_wer": 0.49573690621193667, "step": 2500 }, { "epoch": 0.42, "learning_rate": 9.862946647087616e-05, "loss": NaN, "step": 2600 }, { "epoch": 0.42, "eval_loss": 0.6002959609031677, "eval_runtime": 9.9471, "eval_samples_per_second": 10.053, "eval_wer": 0.4835566382460414, "step": 2600 }, { "epoch": 0.44, "learning_rate": 9.856420296948932e-05, "loss": NaN, "step": 2700 }, { "epoch": 0.44, "eval_loss": 0.5933263897895813, "eval_runtime": 9.0583, "eval_samples_per_second": 11.04, "eval_wer": 0.4835566382460414, "step": 2700 }, { "epoch": 0.46, "learning_rate": 9.849893946810246e-05, "loss": NaN, "step": 2800 }, { "epoch": 0.46, "eval_loss": 0.6014515161514282, "eval_runtime": 8.0695, "eval_samples_per_second": 12.392, "eval_wer": 0.46650426309378806, "step": 2800 }, { "epoch": 0.47, "learning_rate": 9.843367596671562e-05, "loss": NaN, "step": 2900 }, { "epoch": 0.47, "eval_loss": 0.5901432037353516, "eval_runtime": 6.798, "eval_samples_per_second": 14.71, "eval_wer": 0.4762484774665043, "step": 2900 }, { "epoch": 0.49, "learning_rate": 9.836841246532877e-05, "loss": NaN, "step": 3000 }, { "epoch": 0.49, "eval_loss": 0.626334011554718, "eval_runtime": 7.8972, "eval_samples_per_second": 12.663, "eval_wer": 0.5066991473812423, "step": 3000 }, { "epoch": 0.5, "learning_rate": 9.830314896394191e-05, "loss": NaN, "step": 3100 }, { "epoch": 0.5, "eval_loss": 0.5547911524772644, "eval_runtime": 9.1187, "eval_samples_per_second": 10.966, "eval_wer": 0.464068209500609, "step": 3100 }, { "epoch": 0.52, "learning_rate": 9.823788546255507e-05, "loss": NaN, "step": 3200 }, { "epoch": 0.52, "eval_loss": 0.5864753127098083, "eval_runtime": 8.1423, "eval_samples_per_second": 12.282, "eval_wer": 0.48112058465286234, "step": 3200 }, { "epoch": 0.54, "learning_rate": 9.817262196116822e-05, "loss": NaN, "step": 3300 }, { "epoch": 0.54, "eval_loss": 0.573021650314331, "eval_runtime": 7.0496, "eval_samples_per_second": 14.185, "eval_wer": 0.45554202192448234, "step": 3300 }, { "epoch": 0.55, "learning_rate": 9.810735845978138e-05, "loss": NaN, "step": 3400 }, { "epoch": 0.55, "eval_loss": 0.5912113785743713, "eval_runtime": 7.7808, "eval_samples_per_second": 12.852, "eval_wer": 0.4543239951278928, "step": 3400 }, { "epoch": 0.57, "learning_rate": 9.804209495839452e-05, "loss": NaN, "step": 3500 }, { "epoch": 0.57, "eval_loss": 0.5591552257537842, "eval_runtime": 8.6018, "eval_samples_per_second": 11.625, "eval_wer": 0.4835566382460414, "step": 3500 }, { "epoch": 0.59, "learning_rate": 9.797683145700768e-05, "loss": NaN, "step": 3600 }, { "epoch": 0.59, "eval_loss": 0.5811930298805237, "eval_runtime": 11.1558, "eval_samples_per_second": 8.964, "eval_wer": 0.47990255785627284, "step": 3600 }, { "epoch": 0.6, "learning_rate": 9.791156795562083e-05, "loss": NaN, "step": 3700 }, { "epoch": 0.6, "eval_loss": 0.634550154209137, "eval_runtime": 6.9892, "eval_samples_per_second": 14.308, "eval_wer": 0.464068209500609, "step": 3700 }, { "epoch": 0.62, "learning_rate": 9.784630445423397e-05, "loss": NaN, "step": 3800 }, { "epoch": 0.62, "eval_loss": 0.6496349573135376, "eval_runtime": 8.2428, "eval_samples_per_second": 12.132, "eval_wer": 0.4993909866017052, "step": 3800 }, { "epoch": 0.63, "learning_rate": 9.778104095284713e-05, "loss": NaN, "step": 3900 }, { "epoch": 0.63, "eval_loss": 0.6067304611206055, "eval_runtime": 7.9623, "eval_samples_per_second": 12.559, "eval_wer": 0.464068209500609, "step": 3900 }, { "epoch": 0.65, "learning_rate": 9.771577745146027e-05, "loss": NaN, "step": 4000 }, { "epoch": 0.65, "eval_loss": 0.6350998878479004, "eval_runtime": 7.586, "eval_samples_per_second": 13.182, "eval_wer": 0.47381242387332523, "step": 4000 }, { "epoch": 0.67, "learning_rate": 9.765051395007343e-05, "loss": NaN, "step": 4100 }, { "epoch": 0.67, "eval_loss": 0.54295814037323, "eval_runtime": 8.9327, "eval_samples_per_second": 11.195, "eval_wer": 0.45554202192448234, "step": 4100 }, { "epoch": 0.68, "learning_rate": 9.758525044868658e-05, "loss": NaN, "step": 4200 }, { "epoch": 0.68, "eval_loss": 0.6605328321456909, "eval_runtime": 9.5705, "eval_samples_per_second": 10.449, "eval_wer": 0.46528623629719856, "step": 4200 }, { "epoch": 0.7, "learning_rate": 9.751998694729972e-05, "loss": NaN, "step": 4300 }, { "epoch": 0.7, "eval_loss": 0.580009937286377, "eval_runtime": 10.5327, "eval_samples_per_second": 9.494, "eval_wer": 0.464068209500609, "step": 4300 }, { "epoch": 0.72, "learning_rate": 9.745472344591288e-05, "loss": NaN, "step": 4400 }, { "epoch": 0.72, "eval_loss": 0.579453706741333, "eval_runtime": 10.8819, "eval_samples_per_second": 9.19, "eval_wer": 0.46163215590742995, "step": 4400 }, { "epoch": 0.73, "learning_rate": 9.738945994452603e-05, "loss": NaN, "step": 4500 }, { "epoch": 0.73, "eval_loss": 0.655251145362854, "eval_runtime": 9.1533, "eval_samples_per_second": 10.925, "eval_wer": 0.4591961023142509, "step": 4500 }, { "epoch": 0.75, "learning_rate": 9.732419644313919e-05, "loss": NaN, "step": 4600 }, { "epoch": 0.75, "eval_loss": 0.5785291790962219, "eval_runtime": 6.6729, "eval_samples_per_second": 14.986, "eval_wer": 0.44336175395858707, "step": 4600 }, { "epoch": 0.76, "learning_rate": 9.725893294175233e-05, "loss": NaN, "step": 4700 }, { "epoch": 0.76, "eval_loss": 0.5562949776649475, "eval_runtime": 12.0553, "eval_samples_per_second": 8.295, "eval_wer": 0.4762484774665043, "step": 4700 }, { "epoch": 0.78, "learning_rate": 9.719366944036548e-05, "loss": NaN, "step": 4800 }, { "epoch": 0.78, "eval_loss": 0.6431012749671936, "eval_runtime": 10.2668, "eval_samples_per_second": 9.74, "eval_wer": 0.46041412911084045, "step": 4800 }, { "epoch": 0.8, "learning_rate": 9.712840593897863e-05, "loss": NaN, "step": 4900 }, { "epoch": 0.8, "eval_loss": 0.5410518050193787, "eval_runtime": 7.7698, "eval_samples_per_second": 12.87, "eval_wer": 0.44336175395858707, "step": 4900 }, { "epoch": 0.81, "learning_rate": 9.706314243759178e-05, "loss": NaN, "step": 5000 }, { "epoch": 0.81, "eval_loss": 0.5471655130386353, "eval_runtime": 9.2576, "eval_samples_per_second": 10.802, "eval_wer": 0.4591961023142509, "step": 5000 }, { "epoch": 0.83, "learning_rate": 9.699787893620494e-05, "loss": NaN, "step": 5100 }, { "epoch": 0.83, "eval_loss": 0.5607233643531799, "eval_runtime": 9.7403, "eval_samples_per_second": 10.267, "eval_wer": 0.4457978075517661, "step": 5100 }, { "epoch": 0.85, "learning_rate": 9.693261543481808e-05, "loss": NaN, "step": 5200 }, { "epoch": 0.85, "eval_loss": 0.5090478658676147, "eval_runtime": 7.6231, "eval_samples_per_second": 13.118, "eval_wer": 0.42509135200974424, "step": 5200 }, { "epoch": 0.86, "learning_rate": 9.686735193343124e-05, "loss": NaN, "step": 5300 }, { "epoch": 0.86, "eval_loss": 0.5385191440582275, "eval_runtime": 8.5521, "eval_samples_per_second": 11.693, "eval_wer": 0.44336175395858707, "step": 5300 }, { "epoch": 0.88, "learning_rate": 9.680208843204437e-05, "loss": NaN, "step": 5400 }, { "epoch": 0.88, "eval_loss": 0.5557727217674255, "eval_runtime": 7.4167, "eval_samples_per_second": 13.483, "eval_wer": 0.4591961023142509, "step": 5400 }, { "epoch": 0.89, "learning_rate": 9.673682493065753e-05, "loss": NaN, "step": 5500 }, { "epoch": 0.89, "eval_loss": 0.5240246653556824, "eval_runtime": 8.9322, "eval_samples_per_second": 11.195, "eval_wer": 0.42630937880633374, "step": 5500 }, { "epoch": 0.91, "learning_rate": 9.667156142927069e-05, "loss": NaN, "step": 5600 }, { "epoch": 0.91, "eval_loss": 0.5305324792861938, "eval_runtime": 6.8749, "eval_samples_per_second": 14.546, "eval_wer": 0.440925700365408, "step": 5600 }, { "epoch": 0.93, "learning_rate": 9.660629792788384e-05, "loss": NaN, "step": 5700 }, { "epoch": 0.93, "eval_loss": 0.4999062716960907, "eval_runtime": 8.9284, "eval_samples_per_second": 11.2, "eval_wer": 0.43727161997563946, "step": 5700 }, { "epoch": 0.94, "learning_rate": 9.6541034426497e-05, "loss": NaN, "step": 5800 }, { "epoch": 0.94, "eval_loss": 0.5356720089912415, "eval_runtime": 7.3019, "eval_samples_per_second": 13.695, "eval_wer": 0.4299634591961023, "step": 5800 }, { "epoch": 0.96, "learning_rate": 9.647577092511013e-05, "loss": NaN, "step": 5900 }, { "epoch": 0.96, "eval_loss": 0.5162432193756104, "eval_runtime": 7.7242, "eval_samples_per_second": 12.946, "eval_wer": 0.4177831912302071, "step": 5900 }, { "epoch": 0.98, "learning_rate": 9.641050742372329e-05, "loss": NaN, "step": 6000 }, { "epoch": 0.98, "eval_loss": 0.541946291923523, "eval_runtime": 8.7592, "eval_samples_per_second": 11.417, "eval_wer": 0.440925700365408, "step": 6000 }, { "epoch": 0.99, "learning_rate": 9.634524392233643e-05, "loss": NaN, "step": 6100 }, { "epoch": 0.99, "eval_loss": 0.5452945828437805, "eval_runtime": 8.1867, "eval_samples_per_second": 12.215, "eval_wer": 0.44336175395858707, "step": 6100 }, { "epoch": 1.01, "learning_rate": 9.627998042094959e-05, "loss": NaN, "step": 6200 }, { "epoch": 1.01, "eval_loss": 0.6135980486869812, "eval_runtime": 8.1992, "eval_samples_per_second": 12.196, "eval_wer": 0.44336175395858707, "step": 6200 }, { "epoch": 1.02, "learning_rate": 9.621471691956275e-05, "loss": NaN, "step": 6300 }, { "epoch": 1.02, "eval_loss": 0.5763392448425293, "eval_runtime": 8.7786, "eval_samples_per_second": 11.391, "eval_wer": 0.4457978075517661, "step": 6300 }, { "epoch": 1.04, "learning_rate": 9.61494534181759e-05, "loss": NaN, "step": 6400 }, { "epoch": 1.04, "eval_loss": 0.5169751048088074, "eval_runtime": 8.8344, "eval_samples_per_second": 11.319, "eval_wer": 0.44945188794153473, "step": 6400 }, { "epoch": 1.06, "learning_rate": 9.608418991678904e-05, "loss": NaN, "step": 6500 }, { "epoch": 1.06, "eval_loss": 0.5410892367362976, "eval_runtime": 8.9659, "eval_samples_per_second": 11.153, "eval_wer": 0.41291108404384896, "step": 6500 }, { "epoch": 1.07, "learning_rate": 9.601892641540218e-05, "loss": NaN, "step": 6600 }, { "epoch": 1.07, "eval_loss": 0.6024890542030334, "eval_runtime": 9.0589, "eval_samples_per_second": 11.039, "eval_wer": 0.46650426309378806, "step": 6600 }, { "epoch": 1.09, "learning_rate": 9.595366291401534e-05, "loss": NaN, "step": 6700 }, { "epoch": 1.09, "eval_loss": 0.5081002116203308, "eval_runtime": 6.9031, "eval_samples_per_second": 14.486, "eval_wer": 0.4445797807551766, "step": 6700 }, { "epoch": 1.11, "learning_rate": 9.588839941262849e-05, "loss": NaN, "step": 6800 }, { "epoch": 1.11, "eval_loss": 0.537754237651825, "eval_runtime": 6.9434, "eval_samples_per_second": 14.402, "eval_wer": 0.44336175395858707, "step": 6800 }, { "epoch": 1.12, "learning_rate": 9.582313591124165e-05, "loss": NaN, "step": 6900 }, { "epoch": 1.12, "eval_loss": 0.5683107972145081, "eval_runtime": 7.8602, "eval_samples_per_second": 12.722, "eval_wer": 0.4336175395858709, "step": 6900 }, { "epoch": 1.14, "learning_rate": 9.57578724098548e-05, "loss": NaN, "step": 7000 }, { "epoch": 1.14, "eval_loss": 0.6018743515014648, "eval_runtime": 7.5695, "eval_samples_per_second": 13.211, "eval_wer": 0.4348355663824604, "step": 7000 }, { "epoch": 1.15, "learning_rate": 9.569260890846794e-05, "loss": NaN, "step": 7100 }, { "epoch": 1.15, "eval_loss": 0.5463069677352905, "eval_runtime": 8.1373, "eval_samples_per_second": 12.289, "eval_wer": 0.42752740560292324, "step": 7100 }, { "epoch": 1.17, "learning_rate": 9.56273454070811e-05, "loss": NaN, "step": 7200 }, { "epoch": 1.17, "eval_loss": 0.5245855450630188, "eval_runtime": 7.3379, "eval_samples_per_second": 13.628, "eval_wer": 0.42752740560292324, "step": 7200 }, { "epoch": 1.19, "learning_rate": 9.556208190569424e-05, "loss": NaN, "step": 7300 }, { "epoch": 1.19, "eval_loss": 0.48042479157447815, "eval_runtime": 6.6664, "eval_samples_per_second": 15.001, "eval_wer": 0.4336175395858709, "step": 7300 }, { "epoch": 1.2, "learning_rate": 9.54968184043074e-05, "loss": NaN, "step": 7400 }, { "epoch": 1.2, "eval_loss": 0.4897633492946625, "eval_runtime": 6.6761, "eval_samples_per_second": 14.979, "eval_wer": 0.4445797807551766, "step": 7400 }, { "epoch": 1.22, "learning_rate": 9.543155490292054e-05, "loss": NaN, "step": 7500 }, { "epoch": 1.22, "eval_loss": 0.5400981903076172, "eval_runtime": 7.744, "eval_samples_per_second": 12.913, "eval_wer": 0.4238733252131547, "step": 7500 }, { "epoch": 1.24, "learning_rate": 9.536629140153369e-05, "loss": NaN, "step": 7600 }, { "epoch": 1.24, "eval_loss": 0.5461037158966064, "eval_runtime": 7.6292, "eval_samples_per_second": 13.108, "eval_wer": 0.43118148599269185, "step": 7600 }, { "epoch": 1.25, "learning_rate": 9.530102790014685e-05, "loss": NaN, "step": 7700 }, { "epoch": 1.25, "eval_loss": 0.4961685538291931, "eval_runtime": 7.2783, "eval_samples_per_second": 13.739, "eval_wer": 0.4226552984165652, "step": 7700 }, { "epoch": 1.27, "learning_rate": 9.523576439875999e-05, "loss": NaN, "step": 7800 }, { "epoch": 1.27, "eval_loss": 0.6107471585273743, "eval_runtime": 8.6517, "eval_samples_per_second": 11.558, "eval_wer": 0.438489646772229, "step": 7800 }, { "epoch": 1.28, "learning_rate": 9.517050089737315e-05, "loss": NaN, "step": 7900 }, { "epoch": 1.28, "eval_loss": 0.5769979953765869, "eval_runtime": 7.4406, "eval_samples_per_second": 13.44, "eval_wer": 0.43605359317904996, "step": 7900 }, { "epoch": 1.3, "learning_rate": 9.51052373959863e-05, "loss": NaN, "step": 8000 }, { "epoch": 1.3, "eval_loss": 0.5004762411117554, "eval_runtime": 8.9614, "eval_samples_per_second": 11.159, "eval_wer": 0.43239951278928135, "step": 8000 }, { "epoch": 1.32, "learning_rate": 9.503997389459946e-05, "loss": NaN, "step": 8100 }, { "epoch": 1.32, "eval_loss": 0.46339115500450134, "eval_runtime": 7.2515, "eval_samples_per_second": 13.79, "eval_wer": 0.4104750304506699, "step": 8100 }, { "epoch": 1.33, "learning_rate": 9.49747103932126e-05, "loss": NaN, "step": 8200 }, { "epoch": 1.33, "eval_loss": 0.5336301922798157, "eval_runtime": 8.7749, "eval_samples_per_second": 11.396, "eval_wer": 0.44336175395858707, "step": 8200 }, { "epoch": 1.35, "learning_rate": 9.490944689182575e-05, "loss": NaN, "step": 8300 }, { "epoch": 1.35, "eval_loss": 0.5296890139579773, "eval_runtime": 8.6952, "eval_samples_per_second": 11.501, "eval_wer": 0.4238733252131547, "step": 8300 }, { "epoch": 1.37, "learning_rate": 9.48441833904389e-05, "loss": NaN, "step": 8400 }, { "epoch": 1.37, "eval_loss": 0.5209415555000305, "eval_runtime": 8.7658, "eval_samples_per_second": 11.408, "eval_wer": 0.4482338611449452, "step": 8400 }, { "epoch": 1.38, "learning_rate": 9.477891988905205e-05, "loss": NaN, "step": 8500 }, { "epoch": 1.38, "eval_loss": 0.5313872694969177, "eval_runtime": 8.6447, "eval_samples_per_second": 11.568, "eval_wer": 0.4287454323995128, "step": 8500 }, { "epoch": 1.4, "learning_rate": 9.471365638766521e-05, "loss": NaN, "step": 8600 }, { "epoch": 1.4, "eval_loss": 0.5957339406013489, "eval_runtime": 9.3851, "eval_samples_per_second": 10.655, "eval_wer": 0.4445797807551766, "step": 8600 }, { "epoch": 1.41, "learning_rate": 9.464839288627835e-05, "loss": NaN, "step": 8700 }, { "epoch": 1.41, "eval_loss": 0.4665583074092865, "eval_runtime": 7.7597, "eval_samples_per_second": 12.887, "eval_wer": 0.4336175395858709, "step": 8700 }, { "epoch": 1.43, "learning_rate": 9.45831293848915e-05, "loss": NaN, "step": 8800 }, { "epoch": 1.43, "eval_loss": 0.5392510890960693, "eval_runtime": 8.1949, "eval_samples_per_second": 12.203, "eval_wer": 0.4336175395858709, "step": 8800 }, { "epoch": 1.45, "learning_rate": 9.451786588350466e-05, "loss": NaN, "step": 8900 }, { "epoch": 1.45, "eval_loss": 0.5618553161621094, "eval_runtime": 7.3195, "eval_samples_per_second": 13.662, "eval_wer": 0.4482338611449452, "step": 8900 }, { "epoch": 1.46, "learning_rate": 9.44526023821178e-05, "loss": NaN, "step": 9000 }, { "epoch": 1.46, "eval_loss": 0.6219630837440491, "eval_runtime": 7.7967, "eval_samples_per_second": 12.826, "eval_wer": 0.4713763702801462, "step": 9000 }, { "epoch": 1.48, "learning_rate": 9.438733888073096e-05, "loss": NaN, "step": 9100 }, { "epoch": 1.48, "eval_loss": 0.6084015369415283, "eval_runtime": 8.535, "eval_samples_per_second": 11.717, "eval_wer": 0.4470158343483557, "step": 9100 }, { "epoch": 1.5, "learning_rate": 9.43220753793441e-05, "loss": NaN, "step": 9200 }, { "epoch": 1.5, "eval_loss": 0.5832752585411072, "eval_runtime": 8.3754, "eval_samples_per_second": 11.94, "eval_wer": 0.43727161997563946, "step": 9200 }, { "epoch": 1.51, "learning_rate": 9.425681187795725e-05, "loss": NaN, "step": 9300 }, { "epoch": 1.51, "eval_loss": 0.5465306043624878, "eval_runtime": 6.9903, "eval_samples_per_second": 14.306, "eval_wer": 0.43118148599269185, "step": 9300 }, { "epoch": 1.53, "learning_rate": 9.419154837657041e-05, "loss": NaN, "step": 9400 }, { "epoch": 1.53, "eval_loss": 0.527911901473999, "eval_runtime": 7.4382, "eval_samples_per_second": 13.444, "eval_wer": 0.4518879415347138, "step": 9400 }, { "epoch": 1.54, "learning_rate": 9.412628487518356e-05, "loss": NaN, "step": 9500 }, { "epoch": 1.54, "eval_loss": 0.5745791792869568, "eval_runtime": 9.6658, "eval_samples_per_second": 10.346, "eval_wer": 0.4238733252131547, "step": 9500 }, { "epoch": 1.56, "learning_rate": 9.406102137379671e-05, "loss": NaN, "step": 9600 }, { "epoch": 1.56, "eval_loss": 0.6281310319900513, "eval_runtime": 10.5392, "eval_samples_per_second": 9.488, "eval_wer": 0.4531059683313033, "step": 9600 }, { "epoch": 1.58, "learning_rate": 9.399575787240986e-05, "loss": NaN, "step": 9700 }, { "epoch": 1.58, "eval_loss": 0.5570322871208191, "eval_runtime": 7.2179, "eval_samples_per_second": 13.854, "eval_wer": 0.44336175395858707, "step": 9700 }, { "epoch": 1.59, "learning_rate": 9.393049437102302e-05, "loss": NaN, "step": 9800 }, { "epoch": 1.59, "eval_loss": 0.5097599625587463, "eval_runtime": 8.5291, "eval_samples_per_second": 11.725, "eval_wer": 0.43605359317904996, "step": 9800 }, { "epoch": 1.61, "learning_rate": 9.386523086963615e-05, "loss": NaN, "step": 9900 }, { "epoch": 1.61, "eval_loss": 0.5071770548820496, "eval_runtime": 8.0326, "eval_samples_per_second": 12.449, "eval_wer": 0.4190012180267966, "step": 9900 }, { "epoch": 1.63, "learning_rate": 9.379996736824931e-05, "loss": NaN, "step": 10000 }, { "epoch": 1.63, "eval_loss": 0.5283228158950806, "eval_runtime": 7.0447, "eval_samples_per_second": 14.195, "eval_wer": 0.42752740560292324, "step": 10000 }, { "epoch": 1.64, "learning_rate": 9.373470386686247e-05, "loss": NaN, "step": 10100 }, { "epoch": 1.64, "eval_loss": 0.6241239309310913, "eval_runtime": 7.6906, "eval_samples_per_second": 13.003, "eval_wer": 0.45676004872107184, "step": 10100 }, { "epoch": 1.66, "learning_rate": 9.366944036547561e-05, "loss": NaN, "step": 10200 }, { "epoch": 1.66, "eval_loss": 0.5286669731140137, "eval_runtime": 7.6387, "eval_samples_per_second": 13.091, "eval_wer": 0.4445797807551766, "step": 10200 }, { "epoch": 1.68, "learning_rate": 9.360417686408877e-05, "loss": NaN, "step": 10300 }, { "epoch": 1.68, "eval_loss": 0.560374915599823, "eval_runtime": 7.7761, "eval_samples_per_second": 12.86, "eval_wer": 0.4518879415347138, "step": 10300 }, { "epoch": 1.69, "learning_rate": 9.353891336270192e-05, "loss": NaN, "step": 10400 }, { "epoch": 1.69, "eval_loss": 0.5197404623031616, "eval_runtime": 7.8548, "eval_samples_per_second": 12.731, "eval_wer": 0.4445797807551766, "step": 10400 }, { "epoch": 1.71, "learning_rate": 9.347364986131506e-05, "loss": NaN, "step": 10500 }, { "epoch": 1.71, "eval_loss": 0.5106395483016968, "eval_runtime": 8.6218, "eval_samples_per_second": 11.598, "eval_wer": 0.44214372716199757, "step": 10500 }, { "epoch": 1.72, "learning_rate": 9.34083863599282e-05, "loss": NaN, "step": 10600 }, { "epoch": 1.72, "eval_loss": 0.5029647350311279, "eval_runtime": 9.875, "eval_samples_per_second": 10.127, "eval_wer": 0.4445797807551766, "step": 10600 }, { "epoch": 1.74, "learning_rate": 9.334312285854136e-05, "loss": NaN, "step": 10700 }, { "epoch": 1.74, "eval_loss": 0.5408429503440857, "eval_runtime": 8.0516, "eval_samples_per_second": 12.42, "eval_wer": 0.4397076735688185, "step": 10700 }, { "epoch": 1.76, "learning_rate": 9.327785935715452e-05, "loss": NaN, "step": 10800 }, { "epoch": 1.76, "eval_loss": 0.599218487739563, "eval_runtime": 9.8313, "eval_samples_per_second": 10.172, "eval_wer": 0.43118148599269185, "step": 10800 }, { "epoch": 1.77, "learning_rate": 9.321259585576767e-05, "loss": NaN, "step": 10900 }, { "epoch": 1.77, "eval_loss": 0.5169634819030762, "eval_runtime": 7.002, "eval_samples_per_second": 14.282, "eval_wer": 0.4092570036540804, "step": 10900 }, { "epoch": 1.79, "learning_rate": 9.314733235438081e-05, "loss": NaN, "step": 11000 }, { "epoch": 1.79, "eval_loss": 0.5207093954086304, "eval_runtime": 7.4268, "eval_samples_per_second": 13.465, "eval_wer": 0.42752740560292324, "step": 11000 }, { "epoch": 1.81, "learning_rate": 9.308206885299396e-05, "loss": NaN, "step": 11100 }, { "epoch": 1.81, "eval_loss": 0.5467461347579956, "eval_runtime": 7.8754, "eval_samples_per_second": 12.698, "eval_wer": 0.4226552984165652, "step": 11100 }, { "epoch": 1.82, "learning_rate": 9.301680535160712e-05, "loss": NaN, "step": 11200 }, { "epoch": 1.82, "eval_loss": 0.49166274070739746, "eval_runtime": 7.5148, "eval_samples_per_second": 13.307, "eval_wer": 0.4104750304506699, "step": 11200 }, { "epoch": 1.84, "learning_rate": 9.295154185022028e-05, "loss": NaN, "step": 11300 }, { "epoch": 1.84, "eval_loss": 0.49259471893310547, "eval_runtime": 8.1781, "eval_samples_per_second": 12.228, "eval_wer": 0.4336175395858709, "step": 11300 }, { "epoch": 1.85, "learning_rate": 9.288627834883342e-05, "loss": NaN, "step": 11400 }, { "epoch": 1.85, "eval_loss": 0.666587233543396, "eval_runtime": 7.8835, "eval_samples_per_second": 12.685, "eval_wer": 0.43605359317904996, "step": 11400 }, { "epoch": 1.87, "learning_rate": 9.282101484744658e-05, "loss": NaN, "step": 11500 }, { "epoch": 1.87, "eval_loss": 0.5402622222900391, "eval_runtime": 7.727, "eval_samples_per_second": 12.942, "eval_wer": 0.42630937880633374, "step": 11500 }, { "epoch": 1.89, "learning_rate": 9.275575134605971e-05, "loss": NaN, "step": 11600 }, { "epoch": 1.89, "eval_loss": 0.5431535840034485, "eval_runtime": 8.2898, "eval_samples_per_second": 12.063, "eval_wer": 0.4397076735688185, "step": 11600 }, { "epoch": 1.9, "learning_rate": 9.269048784467287e-05, "loss": NaN, "step": 11700 }, { "epoch": 1.9, "eval_loss": 0.5058331489562988, "eval_runtime": 7.6428, "eval_samples_per_second": 13.084, "eval_wer": 0.4190012180267966, "step": 11700 }, { "epoch": 1.92, "learning_rate": 9.262522434328602e-05, "loss": NaN, "step": 11800 }, { "epoch": 1.92, "eval_loss": 0.5385850667953491, "eval_runtime": 9.2261, "eval_samples_per_second": 10.839, "eval_wer": 0.4579780755176614, "step": 11800 }, { "epoch": 1.94, "learning_rate": 9.255996084189917e-05, "loss": NaN, "step": 11900 }, { "epoch": 1.94, "eval_loss": 0.5211225748062134, "eval_runtime": 8.2929, "eval_samples_per_second": 12.058, "eval_wer": 0.4470158343483557, "step": 11900 }, { "epoch": 1.95, "learning_rate": 9.249469734051233e-05, "loss": NaN, "step": 12000 }, { "epoch": 1.95, "eval_loss": 0.44943609833717346, "eval_runtime": 7.5, "eval_samples_per_second": 13.333, "eval_wer": 0.4287454323995128, "step": 12000 }, { "epoch": 1.97, "learning_rate": 9.242943383912548e-05, "loss": NaN, "step": 12100 }, { "epoch": 1.97, "eval_loss": 0.44961708784103394, "eval_runtime": 8.559, "eval_samples_per_second": 11.684, "eval_wer": 0.4007308160779537, "step": 12100 }, { "epoch": 1.98, "learning_rate": 9.236417033773862e-05, "loss": NaN, "step": 12200 }, { "epoch": 1.98, "eval_loss": 0.5775151252746582, "eval_runtime": 8.2678, "eval_samples_per_second": 12.095, "eval_wer": 0.42630937880633374, "step": 12200 }, { "epoch": 2.0, "learning_rate": 9.229890683635177e-05, "loss": NaN, "step": 12300 }, { "epoch": 2.0, "eval_loss": 0.5101304054260254, "eval_runtime": 9.5041, "eval_samples_per_second": 10.522, "eval_wer": 0.4470158343483557, "step": 12300 }, { "epoch": 2.02, "learning_rate": 9.223364333496493e-05, "loss": NaN, "step": 12400 }, { "epoch": 2.02, "eval_loss": 0.5802700519561768, "eval_runtime": 8.978, "eval_samples_per_second": 11.138, "eval_wer": 0.42021924482338613, "step": 12400 }, { "epoch": 2.03, "learning_rate": 9.216837983357807e-05, "loss": NaN, "step": 12500 }, { "epoch": 2.03, "eval_loss": 0.4817795157432556, "eval_runtime": 8.6515, "eval_samples_per_second": 11.559, "eval_wer": 0.4177831912302071, "step": 12500 }, { "epoch": 2.05, "learning_rate": 9.210311633219123e-05, "loss": NaN, "step": 12600 }, { "epoch": 2.05, "eval_loss": 0.5166882276535034, "eval_runtime": 9.9407, "eval_samples_per_second": 10.06, "eval_wer": 0.44214372716199757, "step": 12600 }, { "epoch": 2.07, "learning_rate": 9.203785283080438e-05, "loss": NaN, "step": 12700 }, { "epoch": 2.07, "eval_loss": 0.49081742763519287, "eval_runtime": 7.4879, "eval_samples_per_second": 13.355, "eval_wer": 0.42752740560292324, "step": 12700 }, { "epoch": 2.08, "learning_rate": 9.197258932941752e-05, "loss": NaN, "step": 12800 }, { "epoch": 2.08, "eval_loss": 0.5209938287734985, "eval_runtime": 9.1719, "eval_samples_per_second": 10.903, "eval_wer": 0.4457978075517661, "step": 12800 }, { "epoch": 2.1, "learning_rate": 9.190732582803068e-05, "loss": NaN, "step": 12900 }, { "epoch": 2.1, "eval_loss": 0.4667002856731415, "eval_runtime": 8.2262, "eval_samples_per_second": 12.156, "eval_wer": 0.4190012180267966, "step": 12900 }, { "epoch": 2.11, "learning_rate": 9.184206232664382e-05, "loss": NaN, "step": 13000 }, { "epoch": 2.11, "eval_loss": 0.44741660356521606, "eval_runtime": 6.9715, "eval_samples_per_second": 14.344, "eval_wer": 0.42630937880633374, "step": 13000 }, { "epoch": 2.13, "learning_rate": 9.177679882525698e-05, "loss": NaN, "step": 13100 }, { "epoch": 2.13, "eval_loss": 0.45468372106552124, "eval_runtime": 8.1778, "eval_samples_per_second": 12.228, "eval_wer": 0.4177831912302071, "step": 13100 }, { "epoch": 2.15, "learning_rate": 9.171153532387013e-05, "loss": NaN, "step": 13200 }, { "epoch": 2.15, "eval_loss": 0.47137129306793213, "eval_runtime": 9.2926, "eval_samples_per_second": 10.761, "eval_wer": 0.43605359317904996, "step": 13200 }, { "epoch": 2.16, "learning_rate": 9.164627182248327e-05, "loss": NaN, "step": 13300 }, { "epoch": 2.16, "eval_loss": 0.505387544631958, "eval_runtime": 8.3638, "eval_samples_per_second": 11.956, "eval_wer": 0.415347137637028, "step": 13300 }, { "epoch": 2.18, "learning_rate": 9.158100832109643e-05, "loss": NaN, "step": 13400 }, { "epoch": 2.18, "eval_loss": 0.4471493661403656, "eval_runtime": 7.3344, "eval_samples_per_second": 13.634, "eval_wer": 0.4226552984165652, "step": 13400 }, { "epoch": 2.2, "learning_rate": 9.151574481970958e-05, "loss": NaN, "step": 13500 }, { "epoch": 2.2, "eval_loss": 0.4644159972667694, "eval_runtime": 9.2128, "eval_samples_per_second": 10.854, "eval_wer": 0.3995127892813642, "step": 13500 }, { "epoch": 2.21, "learning_rate": 9.145048131832274e-05, "loss": NaN, "step": 13600 }, { "epoch": 2.21, "eval_loss": 0.4804657995700836, "eval_runtime": 7.5792, "eval_samples_per_second": 13.194, "eval_wer": 0.415347137637028, "step": 13600 }, { "epoch": 2.23, "learning_rate": 9.138521781693588e-05, "loss": NaN, "step": 13700 }, { "epoch": 2.23, "eval_loss": 0.5253716111183167, "eval_runtime": 9.797, "eval_samples_per_second": 10.207, "eval_wer": 0.42752740560292324, "step": 13700 }, { "epoch": 2.24, "learning_rate": 9.131995431554904e-05, "loss": NaN, "step": 13800 }, { "epoch": 2.24, "eval_loss": 0.4461153745651245, "eval_runtime": 8.0888, "eval_samples_per_second": 12.363, "eval_wer": 0.4177831912302071, "step": 13800 }, { "epoch": 2.26, "learning_rate": 9.125469081416219e-05, "loss": NaN, "step": 13900 }, { "epoch": 2.26, "eval_loss": 0.5731090307235718, "eval_runtime": 8.4905, "eval_samples_per_second": 11.778, "eval_wer": 0.43118148599269185, "step": 13900 }, { "epoch": 2.28, "learning_rate": 9.118942731277533e-05, "loss": NaN, "step": 14000 }, { "epoch": 2.28, "eval_loss": 0.5009161829948425, "eval_runtime": 8.2825, "eval_samples_per_second": 12.074, "eval_wer": 0.42021924482338613, "step": 14000 }, { "epoch": 2.29, "learning_rate": 9.112416381138849e-05, "loss": NaN, "step": 14100 }, { "epoch": 2.29, "eval_loss": 0.4805867075920105, "eval_runtime": 8.9811, "eval_samples_per_second": 11.134, "eval_wer": 0.39707673568818513, "step": 14100 }, { "epoch": 2.31, "learning_rate": 9.105890031000163e-05, "loss": NaN, "step": 14200 }, { "epoch": 2.31, "eval_loss": 0.5124616026878357, "eval_runtime": 7.2004, "eval_samples_per_second": 13.888, "eval_wer": 0.3982947624847747, "step": 14200 }, { "epoch": 2.33, "learning_rate": 9.099363680861479e-05, "loss": NaN, "step": 14300 }, { "epoch": 2.33, "eval_loss": 0.45692193508148193, "eval_runtime": 7.2681, "eval_samples_per_second": 13.759, "eval_wer": 0.4177831912302071, "step": 14300 }, { "epoch": 2.34, "learning_rate": 9.092837330722794e-05, "loss": NaN, "step": 14400 }, { "epoch": 2.34, "eval_loss": 0.44331681728363037, "eval_runtime": 8.5939, "eval_samples_per_second": 11.636, "eval_wer": 0.4177831912302071, "step": 14400 }, { "epoch": 2.36, "learning_rate": 9.086310980584108e-05, "loss": NaN, "step": 14500 }, { "epoch": 2.36, "eval_loss": 0.494161456823349, "eval_runtime": 7.6191, "eval_samples_per_second": 13.125, "eval_wer": 0.4299634591961023, "step": 14500 }, { "epoch": 2.37, "learning_rate": 9.079784630445424e-05, "loss": NaN, "step": 14600 }, { "epoch": 2.37, "eval_loss": 0.5291484594345093, "eval_runtime": 7.9069, "eval_samples_per_second": 12.647, "eval_wer": 0.4177831912302071, "step": 14600 }, { "epoch": 2.39, "learning_rate": 9.073258280306739e-05, "loss": NaN, "step": 14700 }, { "epoch": 2.39, "eval_loss": 0.45012572407722473, "eval_runtime": 9.4293, "eval_samples_per_second": 10.605, "eval_wer": 0.4056029232643118, "step": 14700 }, { "epoch": 2.41, "learning_rate": 9.066731930168055e-05, "loss": NaN, "step": 14800 }, { "epoch": 2.41, "eval_loss": 0.44526755809783936, "eval_runtime": 7.9253, "eval_samples_per_second": 12.618, "eval_wer": 0.42021924482338613, "step": 14800 }, { "epoch": 2.42, "learning_rate": 9.060205580029369e-05, "loss": NaN, "step": 14900 }, { "epoch": 2.42, "eval_loss": 0.4633622467517853, "eval_runtime": 7.3284, "eval_samples_per_second": 13.646, "eval_wer": 0.42752740560292324, "step": 14900 }, { "epoch": 2.44, "learning_rate": 9.053679229890684e-05, "loss": NaN, "step": 15000 }, { "epoch": 2.44, "eval_loss": 0.45304596424102783, "eval_runtime": 8.2189, "eval_samples_per_second": 12.167, "eval_wer": 0.4190012180267966, "step": 15000 }, { "epoch": 2.46, "learning_rate": 9.047152879752e-05, "loss": NaN, "step": 15100 }, { "epoch": 2.46, "eval_loss": 0.563227653503418, "eval_runtime": 7.3261, "eval_samples_per_second": 13.65, "eval_wer": 0.4238733252131547, "step": 15100 }, { "epoch": 2.47, "learning_rate": 9.040626529613314e-05, "loss": NaN, "step": 15200 }, { "epoch": 2.47, "eval_loss": 0.4682408273220062, "eval_runtime": 9.085, "eval_samples_per_second": 11.007, "eval_wer": 0.43118148599269185, "step": 15200 }, { "epoch": 2.49, "learning_rate": 9.03410017947463e-05, "loss": NaN, "step": 15300 }, { "epoch": 2.49, "eval_loss": 0.4495187997817993, "eval_runtime": 8.9075, "eval_samples_per_second": 11.227, "eval_wer": 0.4007308160779537, "step": 15300 }, { "epoch": 2.5, "learning_rate": 9.027573829335944e-05, "loss": NaN, "step": 15400 }, { "epoch": 2.5, "eval_loss": 0.4402164816856384, "eval_runtime": 10.3596, "eval_samples_per_second": 9.653, "eval_wer": 0.4092570036540804, "step": 15400 }, { "epoch": 2.52, "learning_rate": 9.02104747919726e-05, "loss": NaN, "step": 15500 }, { "epoch": 2.52, "eval_loss": 0.45120611786842346, "eval_runtime": 8.2246, "eval_samples_per_second": 12.159, "eval_wer": 0.40803897685749085, "step": 15500 }, { "epoch": 2.54, "learning_rate": 9.014521129058573e-05, "loss": NaN, "step": 15600 }, { "epoch": 2.54, "eval_loss": 0.44330108165740967, "eval_runtime": 7.0996, "eval_samples_per_second": 14.085, "eval_wer": 0.4007308160779537, "step": 15600 }, { "epoch": 2.55, "learning_rate": 9.007994778919889e-05, "loss": NaN, "step": 15700 }, { "epoch": 2.55, "eval_loss": 0.42252305150032043, "eval_runtime": 7.1285, "eval_samples_per_second": 14.028, "eval_wer": 0.3934226552984166, "step": 15700 }, { "epoch": 2.57, "learning_rate": 9.001468428781205e-05, "loss": NaN, "step": 15800 }, { "epoch": 2.57, "eval_loss": 0.4437943696975708, "eval_runtime": 8.6965, "eval_samples_per_second": 11.499, "eval_wer": 0.41169305724725946, "step": 15800 }, { "epoch": 2.59, "learning_rate": 8.99494207864252e-05, "loss": NaN, "step": 15900 }, { "epoch": 2.59, "eval_loss": 0.47090038657188416, "eval_runtime": 7.2716, "eval_samples_per_second": 13.752, "eval_wer": 0.4056029232643118, "step": 15900 }, { "epoch": 2.6, "learning_rate": 8.988415728503836e-05, "loss": NaN, "step": 16000 }, { "epoch": 2.6, "eval_loss": 0.45720386505126953, "eval_runtime": 8.165, "eval_samples_per_second": 12.247, "eval_wer": 0.43118148599269185, "step": 16000 }, { "epoch": 2.62, "learning_rate": 8.981889378365149e-05, "loss": NaN, "step": 16100 }, { "epoch": 2.62, "eval_loss": 0.4764085114002228, "eval_runtime": 8.2382, "eval_samples_per_second": 12.139, "eval_wer": 0.4043848964677223, "step": 16100 }, { "epoch": 2.63, "learning_rate": 8.975363028226465e-05, "loss": NaN, "step": 16200 }, { "epoch": 2.63, "eval_loss": 0.4751797020435333, "eval_runtime": 9.3113, "eval_samples_per_second": 10.74, "eval_wer": 0.41412911084043846, "step": 16200 }, { "epoch": 2.65, "learning_rate": 8.968836678087779e-05, "loss": NaN, "step": 16300 }, { "epoch": 2.65, "eval_loss": 0.44270026683807373, "eval_runtime": 7.4624, "eval_samples_per_second": 13.401, "eval_wer": 0.40194884287454324, "step": 16300 }, { "epoch": 2.67, "learning_rate": 8.962310327949095e-05, "loss": NaN, "step": 16400 }, { "epoch": 2.67, "eval_loss": 0.4818960428237915, "eval_runtime": 7.8783, "eval_samples_per_second": 12.693, "eval_wer": 0.43118148599269185, "step": 16400 }, { "epoch": 2.68, "learning_rate": 8.955783977810411e-05, "loss": NaN, "step": 16500 }, { "epoch": 2.68, "eval_loss": 0.4510990083217621, "eval_runtime": 7.04, "eval_samples_per_second": 14.205, "eval_wer": 0.4043848964677223, "step": 16500 }, { "epoch": 2.7, "learning_rate": 8.949257627671725e-05, "loss": NaN, "step": 16600 }, { "epoch": 2.7, "eval_loss": 0.4735144078731537, "eval_runtime": 10.0014, "eval_samples_per_second": 9.999, "eval_wer": 0.3995127892813642, "step": 16600 }, { "epoch": 2.72, "learning_rate": 8.94273127753304e-05, "loss": NaN, "step": 16700 }, { "epoch": 2.72, "eval_loss": 0.4041927456855774, "eval_runtime": 6.9626, "eval_samples_per_second": 14.362, "eval_wer": 0.40316686967113274, "step": 16700 }, { "epoch": 2.73, "learning_rate": 8.936204927394354e-05, "loss": NaN, "step": 16800 }, { "epoch": 2.73, "eval_loss": 0.4579096734523773, "eval_runtime": 8.5814, "eval_samples_per_second": 11.653, "eval_wer": 0.42509135200974424, "step": 16800 }, { "epoch": 2.75, "learning_rate": 8.92967857725567e-05, "loss": NaN, "step": 16900 }, { "epoch": 2.75, "eval_loss": 0.46610623598098755, "eval_runtime": 7.2885, "eval_samples_per_second": 13.72, "eval_wer": 0.42143727161997563, "step": 16900 }, { "epoch": 2.76, "learning_rate": 8.923152227116985e-05, "loss": NaN, "step": 17000 }, { "epoch": 2.76, "eval_loss": 0.46158257126808167, "eval_runtime": 9.1346, "eval_samples_per_second": 10.947, "eval_wer": 0.4177831912302071, "step": 17000 }, { "epoch": 2.78, "learning_rate": 8.9166258769783e-05, "loss": NaN, "step": 17100 }, { "epoch": 2.78, "eval_loss": 0.46586254239082336, "eval_runtime": 8.0894, "eval_samples_per_second": 12.362, "eval_wer": 0.42509135200974424, "step": 17100 }, { "epoch": 2.8, "learning_rate": 8.910099526839616e-05, "loss": NaN, "step": 17200 }, { "epoch": 2.8, "eval_loss": 0.42319783568382263, "eval_runtime": 8.6611, "eval_samples_per_second": 11.546, "eval_wer": 0.4104750304506699, "step": 17200 }, { "epoch": 2.81, "learning_rate": 8.90357317670093e-05, "loss": NaN, "step": 17300 }, { "epoch": 2.81, "eval_loss": 0.45863696932792664, "eval_runtime": 8.0216, "eval_samples_per_second": 12.466, "eval_wer": 0.4092570036540804, "step": 17300 }, { "epoch": 2.83, "learning_rate": 8.897046826562245e-05, "loss": NaN, "step": 17400 }, { "epoch": 2.83, "eval_loss": 0.52719646692276, "eval_runtime": 7.6618, "eval_samples_per_second": 13.052, "eval_wer": 0.45066991473812423, "step": 17400 }, { "epoch": 2.85, "learning_rate": 8.89052047642356e-05, "loss": NaN, "step": 17500 }, { "epoch": 2.85, "eval_loss": 0.4623071551322937, "eval_runtime": 8.3826, "eval_samples_per_second": 11.929, "eval_wer": 0.4104750304506699, "step": 17500 }, { "epoch": 2.86, "learning_rate": 8.883994126284876e-05, "loss": NaN, "step": 17600 }, { "epoch": 2.86, "eval_loss": 0.47391974925994873, "eval_runtime": 8.8856, "eval_samples_per_second": 11.254, "eval_wer": 0.4092570036540804, "step": 17600 }, { "epoch": 2.88, "learning_rate": 8.877467776146192e-05, "loss": NaN, "step": 17700 }, { "epoch": 2.88, "eval_loss": 0.4068062901496887, "eval_runtime": 7.4887, "eval_samples_per_second": 13.353, "eval_wer": 0.392204628501827, "step": 17700 }, { "epoch": 2.89, "learning_rate": 8.870941426007505e-05, "loss": NaN, "step": 17800 }, { "epoch": 2.89, "eval_loss": 0.45875948667526245, "eval_runtime": 8.0538, "eval_samples_per_second": 12.416, "eval_wer": 0.42509135200974424, "step": 17800 }, { "epoch": 2.91, "learning_rate": 8.864415075868821e-05, "loss": NaN, "step": 17900 }, { "epoch": 2.91, "eval_loss": 0.5207622051239014, "eval_runtime": 8.8428, "eval_samples_per_second": 11.309, "eval_wer": 0.3995127892813642, "step": 17900 }, { "epoch": 2.93, "learning_rate": 8.857888725730135e-05, "loss": NaN, "step": 18000 }, { "epoch": 2.93, "eval_loss": 0.4633566737174988, "eval_runtime": 7.2767, "eval_samples_per_second": 13.743, "eval_wer": 0.40803897685749085, "step": 18000 }, { "epoch": 2.94, "learning_rate": 8.851362375591451e-05, "loss": NaN, "step": 18100 }, { "epoch": 2.94, "eval_loss": 0.4258524179458618, "eval_runtime": 7.062, "eval_samples_per_second": 14.16, "eval_wer": 0.3848964677222899, "step": 18100 }, { "epoch": 2.96, "learning_rate": 8.844836025452766e-05, "loss": NaN, "step": 18200 }, { "epoch": 2.96, "eval_loss": 0.42992159724235535, "eval_runtime": 7.4964, "eval_samples_per_second": 13.34, "eval_wer": 0.4043848964677223, "step": 18200 }, { "epoch": 2.98, "learning_rate": 8.838309675314082e-05, "loss": NaN, "step": 18300 }, { "epoch": 2.98, "eval_loss": 0.4557535946369171, "eval_runtime": 8.3341, "eval_samples_per_second": 11.999, "eval_wer": 0.4177831912302071, "step": 18300 }, { "epoch": 2.99, "learning_rate": 8.831783325175396e-05, "loss": NaN, "step": 18400 }, { "epoch": 2.99, "eval_loss": 0.4576800465583801, "eval_runtime": 7.8065, "eval_samples_per_second": 12.81, "eval_wer": 0.39707673568818513, "step": 18400 }, { "epoch": 3.01, "learning_rate": 8.82525697503671e-05, "loss": NaN, "step": 18500 }, { "epoch": 3.01, "eval_loss": 0.4770311713218689, "eval_runtime": 8.6894, "eval_samples_per_second": 11.508, "eval_wer": 0.4007308160779537, "step": 18500 }, { "epoch": 3.02, "learning_rate": 8.818730624898026e-05, "loss": NaN, "step": 18600 }, { "epoch": 3.02, "eval_loss": 0.44065818190574646, "eval_runtime": 9.5635, "eval_samples_per_second": 10.456, "eval_wer": 0.41169305724725946, "step": 18600 }, { "epoch": 3.04, "learning_rate": 8.812204274759341e-05, "loss": NaN, "step": 18700 }, { "epoch": 3.04, "eval_loss": 0.4866321086883545, "eval_runtime": 7.252, "eval_samples_per_second": 13.789, "eval_wer": 0.42143727161997563, "step": 18700 }, { "epoch": 3.06, "learning_rate": 8.805677924620657e-05, "loss": NaN, "step": 18800 }, { "epoch": 3.06, "eval_loss": 0.4869626760482788, "eval_runtime": 9.3184, "eval_samples_per_second": 10.731, "eval_wer": 0.415347137637028, "step": 18800 }, { "epoch": 3.07, "learning_rate": 8.799151574481971e-05, "loss": NaN, "step": 18900 }, { "epoch": 3.07, "eval_loss": 0.580832839012146, "eval_runtime": 8.0833, "eval_samples_per_second": 12.371, "eval_wer": 0.40803897685749085, "step": 18900 }, { "epoch": 3.09, "learning_rate": 8.792625224343286e-05, "loss": NaN, "step": 19000 }, { "epoch": 3.09, "eval_loss": 0.5339367389678955, "eval_runtime": 8.6454, "eval_samples_per_second": 11.567, "eval_wer": 0.39707673568818513, "step": 19000 }, { "epoch": 3.11, "learning_rate": 8.786098874204602e-05, "loss": NaN, "step": 19100 }, { "epoch": 3.11, "eval_loss": 0.47444137930870056, "eval_runtime": 8.4893, "eval_samples_per_second": 11.78, "eval_wer": 0.40682095006090135, "step": 19100 }, { "epoch": 3.12, "learning_rate": 8.779572524065916e-05, "loss": NaN, "step": 19200 }, { "epoch": 3.12, "eval_loss": 0.4808363616466522, "eval_runtime": 8.229, "eval_samples_per_second": 12.152, "eval_wer": 0.42143727161997563, "step": 19200 }, { "epoch": 3.14, "learning_rate": 8.773046173927232e-05, "loss": NaN, "step": 19300 }, { "epoch": 3.14, "eval_loss": 0.5487423539161682, "eval_runtime": 8.6936, "eval_samples_per_second": 11.503, "eval_wer": 0.4287454323995128, "step": 19300 }, { "epoch": 3.15, "learning_rate": 8.766519823788547e-05, "loss": NaN, "step": 19400 }, { "epoch": 3.15, "eval_loss": 0.5379164218902588, "eval_runtime": 7.8502, "eval_samples_per_second": 12.739, "eval_wer": 0.4238733252131547, "step": 19400 }, { "epoch": 3.17, "learning_rate": 8.759993473649861e-05, "loss": NaN, "step": 19500 }, { "epoch": 3.17, "eval_loss": 0.4747236669063568, "eval_runtime": 6.9979, "eval_samples_per_second": 14.29, "eval_wer": 0.40316686967113274, "step": 19500 }, { "epoch": 3.19, "learning_rate": 8.753467123511177e-05, "loss": NaN, "step": 19600 }, { "epoch": 3.19, "eval_loss": 0.4517196714878082, "eval_runtime": 6.8378, "eval_samples_per_second": 14.624, "eval_wer": 0.40194884287454324, "step": 19600 }, { "epoch": 3.2, "learning_rate": 8.746940773372492e-05, "loss": NaN, "step": 19700 }, { "epoch": 3.2, "eval_loss": 0.473175972700119, "eval_runtime": 7.9557, "eval_samples_per_second": 12.57, "eval_wer": 0.3861144945188794, "step": 19700 }, { "epoch": 3.22, "learning_rate": 8.740414423233807e-05, "loss": NaN, "step": 19800 }, { "epoch": 3.22, "eval_loss": 0.4839608371257782, "eval_runtime": 7.511, "eval_samples_per_second": 13.314, "eval_wer": 0.40194884287454324, "step": 19800 }, { "epoch": 3.24, "learning_rate": 8.733888073095122e-05, "loss": NaN, "step": 19900 }, { "epoch": 3.24, "eval_loss": 0.45369553565979004, "eval_runtime": 7.3681, "eval_samples_per_second": 13.572, "eval_wer": 0.37758830694275275, "step": 19900 }, { "epoch": 3.25, "learning_rate": 8.727361722956438e-05, "loss": NaN, "step": 20000 }, { "epoch": 3.25, "eval_loss": 0.44059714674949646, "eval_runtime": 8.867, "eval_samples_per_second": 11.278, "eval_wer": 0.3861144945188794, "step": 20000 }, { "epoch": 3.27, "learning_rate": 8.720835372817752e-05, "loss": NaN, "step": 20100 }, { "epoch": 3.27, "eval_loss": 0.4481971859931946, "eval_runtime": 7.089, "eval_samples_per_second": 14.106, "eval_wer": 0.40194884287454324, "step": 20100 }, { "epoch": 3.29, "learning_rate": 8.714309022679067e-05, "loss": NaN, "step": 20200 }, { "epoch": 3.29, "eval_loss": 0.49499496817588806, "eval_runtime": 9.068, "eval_samples_per_second": 11.028, "eval_wer": 0.40194884287454324, "step": 20200 }, { "epoch": 3.3, "learning_rate": 8.707782672540383e-05, "loss": NaN, "step": 20300 }, { "epoch": 3.3, "eval_loss": 0.4684819281101227, "eval_runtime": 8.8297, "eval_samples_per_second": 11.325, "eval_wer": 0.3946406820950061, "step": 20300 }, { "epoch": 3.32, "learning_rate": 8.701256322401697e-05, "loss": NaN, "step": 20400 }, { "epoch": 3.32, "eval_loss": 0.5416879057884216, "eval_runtime": 8.4935, "eval_samples_per_second": 11.774, "eval_wer": 0.3982947624847747, "step": 20400 }, { "epoch": 3.33, "learning_rate": 8.694729972263013e-05, "loss": NaN, "step": 20500 }, { "epoch": 3.33, "eval_loss": 0.49328354001045227, "eval_runtime": 7.5212, "eval_samples_per_second": 13.296, "eval_wer": 0.39585870889159563, "step": 20500 }, { "epoch": 3.35, "learning_rate": 8.688203622124328e-05, "loss": NaN, "step": 20600 }, { "epoch": 3.35, "eval_loss": 0.48222553730010986, "eval_runtime": 9.8089, "eval_samples_per_second": 10.195, "eval_wer": 0.4165651644336175, "step": 20600 }, { "epoch": 3.37, "learning_rate": 8.681677271985642e-05, "loss": NaN, "step": 20700 }, { "epoch": 3.37, "eval_loss": 0.4871315658092499, "eval_runtime": 8.0731, "eval_samples_per_second": 12.387, "eval_wer": 0.4104750304506699, "step": 20700 }, { "epoch": 3.38, "learning_rate": 8.675150921846958e-05, "loss": NaN, "step": 20800 }, { "epoch": 3.38, "eval_loss": 0.4995521605014801, "eval_runtime": 8.1255, "eval_samples_per_second": 12.307, "eval_wer": 0.42021924482338613, "step": 20800 }, { "epoch": 3.4, "learning_rate": 8.668624571708272e-05, "loss": NaN, "step": 20900 }, { "epoch": 3.4, "eval_loss": 0.46075180172920227, "eval_runtime": 7.3922, "eval_samples_per_second": 13.528, "eval_wer": 0.41412911084043846, "step": 20900 }, { "epoch": 3.42, "learning_rate": 8.662098221569588e-05, "loss": NaN, "step": 21000 }, { "epoch": 3.42, "eval_loss": 0.4704657793045044, "eval_runtime": 8.87, "eval_samples_per_second": 11.274, "eval_wer": 0.40316686967113274, "step": 21000 }, { "epoch": 3.43, "learning_rate": 8.655571871430903e-05, "loss": NaN, "step": 21100 }, { "epoch": 3.43, "eval_loss": 0.44366922974586487, "eval_runtime": 8.0362, "eval_samples_per_second": 12.444, "eval_wer": 0.3982947624847747, "step": 21100 }, { "epoch": 3.45, "learning_rate": 8.649045521292217e-05, "loss": NaN, "step": 21200 }, { "epoch": 3.45, "eval_loss": 0.5748487710952759, "eval_runtime": 8.4229, "eval_samples_per_second": 11.872, "eval_wer": 0.4226552984165652, "step": 21200 }, { "epoch": 3.46, "learning_rate": 8.642519171153532e-05, "loss": NaN, "step": 21300 }, { "epoch": 3.46, "eval_loss": 0.4763486385345459, "eval_runtime": 7.3956, "eval_samples_per_second": 13.522, "eval_wer": 0.3800243605359318, "step": 21300 }, { "epoch": 3.48, "learning_rate": 8.635992821014848e-05, "loss": NaN, "step": 21400 }, { "epoch": 3.48, "eval_loss": 0.45793360471725464, "eval_runtime": 7.217, "eval_samples_per_second": 13.856, "eval_wer": 0.4104750304506699, "step": 21400 }, { "epoch": 3.5, "learning_rate": 8.629466470876164e-05, "loss": NaN, "step": 21500 }, { "epoch": 3.5, "eval_loss": 0.4132789373397827, "eval_runtime": 9.7025, "eval_samples_per_second": 10.307, "eval_wer": 0.4056029232643118, "step": 21500 }, { "epoch": 3.51, "learning_rate": 8.622940120737478e-05, "loss": NaN, "step": 21600 }, { "epoch": 3.51, "eval_loss": 0.4666365385055542, "eval_runtime": 9.4541, "eval_samples_per_second": 10.577, "eval_wer": 0.40682095006090135, "step": 21600 }, { "epoch": 3.53, "learning_rate": 8.616413770598794e-05, "loss": NaN, "step": 21700 }, { "epoch": 3.53, "eval_loss": 0.43131592869758606, "eval_runtime": 7.5373, "eval_samples_per_second": 13.267, "eval_wer": 0.37758830694275275, "step": 21700 }, { "epoch": 3.55, "learning_rate": 8.609887420460107e-05, "loss": NaN, "step": 21800 }, { "epoch": 3.55, "eval_loss": 0.4624130129814148, "eval_runtime": 8.6512, "eval_samples_per_second": 11.559, "eval_wer": 0.3934226552984166, "step": 21800 }, { "epoch": 3.56, "learning_rate": 8.603361070321423e-05, "loss": NaN, "step": 21900 }, { "epoch": 3.56, "eval_loss": 0.47029244899749756, "eval_runtime": 7.0891, "eval_samples_per_second": 14.106, "eval_wer": 0.39707673568818513, "step": 21900 }, { "epoch": 3.58, "learning_rate": 8.596834720182738e-05, "loss": NaN, "step": 22000 }, { "epoch": 3.58, "eval_loss": 0.4115927219390869, "eval_runtime": 7.9478, "eval_samples_per_second": 12.582, "eval_wer": 0.38855054811205847, "step": 22000 }, { "epoch": 3.59, "learning_rate": 8.590308370044053e-05, "loss": NaN, "step": 22100 }, { "epoch": 3.59, "eval_loss": 0.4755612313747406, "eval_runtime": 8.2831, "eval_samples_per_second": 12.073, "eval_wer": 0.3848964677222899, "step": 22100 }, { "epoch": 3.61, "learning_rate": 8.583782019905369e-05, "loss": NaN, "step": 22200 }, { "epoch": 3.61, "eval_loss": 0.42175978422164917, "eval_runtime": 10.3113, "eval_samples_per_second": 9.698, "eval_wer": 0.38855054811205847, "step": 22200 }, { "epoch": 3.63, "learning_rate": 8.577255669766684e-05, "loss": NaN, "step": 22300 }, { "epoch": 3.63, "eval_loss": 0.4504680633544922, "eval_runtime": 8.4957, "eval_samples_per_second": 11.771, "eval_wer": 0.40316686967113274, "step": 22300 }, { "epoch": 3.64, "learning_rate": 8.570729319627998e-05, "loss": NaN, "step": 22400 }, { "epoch": 3.64, "eval_loss": 0.4168296754360199, "eval_runtime": 7.4037, "eval_samples_per_second": 13.507, "eval_wer": 0.40194884287454324, "step": 22400 }, { "epoch": 3.66, "learning_rate": 8.564202969489313e-05, "loss": NaN, "step": 22500 }, { "epoch": 3.66, "eval_loss": 0.3921906650066376, "eval_runtime": 7.4162, "eval_samples_per_second": 13.484, "eval_wer": 0.37271619975639464, "step": 22500 }, { "epoch": 3.68, "learning_rate": 8.557676619350629e-05, "loss": NaN, "step": 22600 }, { "epoch": 3.68, "eval_loss": 0.4271007478237152, "eval_runtime": 8.8145, "eval_samples_per_second": 11.345, "eval_wer": 0.38855054811205847, "step": 22600 }, { "epoch": 3.69, "learning_rate": 8.551150269211943e-05, "loss": NaN, "step": 22700 }, { "epoch": 3.69, "eval_loss": 0.416711688041687, "eval_runtime": 8.4178, "eval_samples_per_second": 11.88, "eval_wer": 0.40682095006090135, "step": 22700 }, { "epoch": 3.71, "learning_rate": 8.544623919073259e-05, "loss": NaN, "step": 22800 }, { "epoch": 3.71, "eval_loss": 0.42215126752853394, "eval_runtime": 7.8605, "eval_samples_per_second": 12.722, "eval_wer": 0.392204628501827, "step": 22800 }, { "epoch": 3.72, "learning_rate": 8.538097568934574e-05, "loss": NaN, "step": 22900 }, { "epoch": 3.72, "eval_loss": 0.4496414065361023, "eval_runtime": 7.9977, "eval_samples_per_second": 12.504, "eval_wer": 0.4177831912302071, "step": 22900 }, { "epoch": 3.74, "learning_rate": 8.531571218795888e-05, "loss": NaN, "step": 23000 }, { "epoch": 3.74, "eval_loss": 0.4615870714187622, "eval_runtime": 8.1022, "eval_samples_per_second": 12.342, "eval_wer": 0.38855054811205847, "step": 23000 }, { "epoch": 3.76, "learning_rate": 8.525044868657204e-05, "loss": NaN, "step": 23100 }, { "epoch": 3.76, "eval_loss": 0.4659249186515808, "eval_runtime": 8.1138, "eval_samples_per_second": 12.325, "eval_wer": 0.4007308160779537, "step": 23100 }, { "epoch": 3.77, "learning_rate": 8.518518518518518e-05, "loss": NaN, "step": 23200 }, { "epoch": 3.77, "eval_loss": 0.45942869782447815, "eval_runtime": 7.7263, "eval_samples_per_second": 12.943, "eval_wer": 0.36784409257003653, "step": 23200 }, { "epoch": 3.79, "learning_rate": 8.511992168379834e-05, "loss": NaN, "step": 23300 }, { "epoch": 3.79, "eval_loss": 0.4240889847278595, "eval_runtime": 7.2849, "eval_samples_per_second": 13.727, "eval_wer": 0.37880633373934225, "step": 23300 }, { "epoch": 3.81, "learning_rate": 8.505465818241149e-05, "loss": NaN, "step": 23400 }, { "epoch": 3.81, "eval_loss": 0.4439373314380646, "eval_runtime": 7.5713, "eval_samples_per_second": 13.208, "eval_wer": 0.39707673568818513, "step": 23400 }, { "epoch": 3.82, "learning_rate": 8.498939468102463e-05, "loss": NaN, "step": 23500 }, { "epoch": 3.82, "eval_loss": 0.4574301838874817, "eval_runtime": 7.723, "eval_samples_per_second": 12.948, "eval_wer": 0.39707673568818513, "step": 23500 }, { "epoch": 3.84, "learning_rate": 8.492413117963779e-05, "loss": NaN, "step": 23600 }, { "epoch": 3.84, "eval_loss": 0.41990235447883606, "eval_runtime": 7.2988, "eval_samples_per_second": 13.701, "eval_wer": 0.38246041412911086, "step": 23600 }, { "epoch": 3.85, "learning_rate": 8.485886767825094e-05, "loss": NaN, "step": 23700 }, { "epoch": 3.85, "eval_loss": 0.4570240080356598, "eval_runtime": 9.4247, "eval_samples_per_second": 10.61, "eval_wer": 0.3934226552984166, "step": 23700 }, { "epoch": 3.87, "learning_rate": 8.47936041768641e-05, "loss": NaN, "step": 23800 }, { "epoch": 3.87, "eval_loss": 0.42279544472694397, "eval_runtime": 7.429, "eval_samples_per_second": 13.461, "eval_wer": 0.37880633373934225, "step": 23800 }, { "epoch": 3.89, "learning_rate": 8.472834067547724e-05, "loss": NaN, "step": 23900 }, { "epoch": 3.89, "eval_loss": 0.4250124394893646, "eval_runtime": 8.7078, "eval_samples_per_second": 11.484, "eval_wer": 0.39585870889159563, "step": 23900 }, { "epoch": 3.9, "learning_rate": 8.46630771740904e-05, "loss": NaN, "step": 24000 }, { "epoch": 3.9, "eval_loss": 0.48117172718048096, "eval_runtime": 7.6756, "eval_samples_per_second": 13.028, "eval_wer": 0.40803897685749085, "step": 24000 }, { "epoch": 3.92, "learning_rate": 8.459781367270355e-05, "loss": NaN, "step": 24100 }, { "epoch": 3.92, "eval_loss": 0.4824243485927582, "eval_runtime": 9.2626, "eval_samples_per_second": 10.796, "eval_wer": 0.3812423873325213, "step": 24100 }, { "epoch": 3.94, "learning_rate": 8.453255017131669e-05, "loss": NaN, "step": 24200 }, { "epoch": 3.94, "eval_loss": 0.45317116379737854, "eval_runtime": 7.8742, "eval_samples_per_second": 12.7, "eval_wer": 0.39585870889159563, "step": 24200 }, { "epoch": 3.95, "learning_rate": 8.446728666992985e-05, "loss": NaN, "step": 24300 }, { "epoch": 3.95, "eval_loss": 0.5323064923286438, "eval_runtime": 7.1451, "eval_samples_per_second": 13.996, "eval_wer": 0.42509135200974424, "step": 24300 }, { "epoch": 3.97, "learning_rate": 8.4402023168543e-05, "loss": NaN, "step": 24400 }, { "epoch": 3.97, "eval_loss": 0.5017148852348328, "eval_runtime": 8.2004, "eval_samples_per_second": 12.194, "eval_wer": 0.40803897685749085, "step": 24400 }, { "epoch": 3.98, "learning_rate": 8.433675966715615e-05, "loss": NaN, "step": 24500 }, { "epoch": 3.98, "eval_loss": 0.4483763873577118, "eval_runtime": 7.3109, "eval_samples_per_second": 13.678, "eval_wer": 0.38246041412911086, "step": 24500 }, { "epoch": 4.0, "learning_rate": 8.42714961657693e-05, "loss": NaN, "step": 24600 }, { "epoch": 4.0, "eval_loss": 0.4591113030910492, "eval_runtime": 7.7451, "eval_samples_per_second": 12.911, "eval_wer": 0.3800243605359318, "step": 24600 }, { "epoch": 4.02, "learning_rate": 8.420623266438244e-05, "loss": NaN, "step": 24700 }, { "epoch": 4.02, "eval_loss": 0.45395427942276, "eval_runtime": 7.718, "eval_samples_per_second": 12.957, "eval_wer": 0.3763702801461632, "step": 24700 }, { "epoch": 4.03, "learning_rate": 8.41409691629956e-05, "loss": NaN, "step": 24800 }, { "epoch": 4.03, "eval_loss": 0.5075406432151794, "eval_runtime": 8.7905, "eval_samples_per_second": 11.376, "eval_wer": 0.40803897685749085, "step": 24800 }, { "epoch": 4.05, "learning_rate": 8.407570566160875e-05, "loss": NaN, "step": 24900 }, { "epoch": 4.05, "eval_loss": 0.5291510224342346, "eval_runtime": 8.3479, "eval_samples_per_second": 11.979, "eval_wer": 0.4104750304506699, "step": 24900 }, { "epoch": 4.07, "learning_rate": 8.40104421602219e-05, "loss": NaN, "step": 25000 }, { "epoch": 4.07, "eval_loss": 0.4835575819015503, "eval_runtime": 9.1852, "eval_samples_per_second": 10.887, "eval_wer": 0.3934226552984166, "step": 25000 }, { "epoch": 4.08, "learning_rate": 8.394517865883505e-05, "loss": NaN, "step": 25100 }, { "epoch": 4.08, "eval_loss": 0.4627467691898346, "eval_runtime": 8.3255, "eval_samples_per_second": 12.011, "eval_wer": 0.40803897685749085, "step": 25100 }, { "epoch": 4.1, "learning_rate": 8.38799151574482e-05, "loss": NaN, "step": 25200 }, { "epoch": 4.1, "eval_loss": 0.45444557070732117, "eval_runtime": 7.7259, "eval_samples_per_second": 12.943, "eval_wer": 0.40316686967113274, "step": 25200 }, { "epoch": 4.11, "learning_rate": 8.381465165606135e-05, "loss": NaN, "step": 25300 }, { "epoch": 4.11, "eval_loss": 0.4336519241333008, "eval_runtime": 7.905, "eval_samples_per_second": 12.65, "eval_wer": 0.3873325213154689, "step": 25300 }, { "epoch": 4.13, "learning_rate": 8.37493881546745e-05, "loss": NaN, "step": 25400 }, { "epoch": 4.13, "eval_loss": 0.44815555214881897, "eval_runtime": 8.3801, "eval_samples_per_second": 11.933, "eval_wer": 0.4104750304506699, "step": 25400 }, { "epoch": 4.15, "learning_rate": 8.368412465328766e-05, "loss": NaN, "step": 25500 }, { "epoch": 4.15, "eval_loss": 0.45955729484558105, "eval_runtime": 7.7863, "eval_samples_per_second": 12.843, "eval_wer": 0.38855054811205847, "step": 25500 }, { "epoch": 4.16, "learning_rate": 8.36188611519008e-05, "loss": NaN, "step": 25600 }, { "epoch": 4.16, "eval_loss": 0.47062352299690247, "eval_runtime": 9.5871, "eval_samples_per_second": 10.431, "eval_wer": 0.39707673568818513, "step": 25600 }, { "epoch": 4.18, "learning_rate": 8.355359765051396e-05, "loss": NaN, "step": 25700 }, { "epoch": 4.18, "eval_loss": 0.44303008913993835, "eval_runtime": 8.2157, "eval_samples_per_second": 12.172, "eval_wer": 0.3995127892813642, "step": 25700 }, { "epoch": 4.2, "learning_rate": 8.348833414912711e-05, "loss": NaN, "step": 25800 }, { "epoch": 4.2, "eval_loss": 0.527855396270752, "eval_runtime": 8.507, "eval_samples_per_second": 11.755, "eval_wer": 0.4104750304506699, "step": 25800 }, { "epoch": 4.21, "learning_rate": 8.342307064774025e-05, "loss": NaN, "step": 25900 }, { "epoch": 4.21, "eval_loss": 0.4706363379955292, "eval_runtime": 6.3997, "eval_samples_per_second": 15.626, "eval_wer": 0.4007308160779537, "step": 25900 }, { "epoch": 4.23, "learning_rate": 8.335780714635341e-05, "loss": NaN, "step": 26000 }, { "epoch": 4.23, "eval_loss": 0.46070727705955505, "eval_runtime": 6.6071, "eval_samples_per_second": 15.135, "eval_wer": 0.37880633373934225, "step": 26000 }, { "epoch": 4.24, "learning_rate": 8.329254364496656e-05, "loss": NaN, "step": 26100 }, { "epoch": 4.24, "eval_loss": 0.47955620288848877, "eval_runtime": 8.053, "eval_samples_per_second": 12.418, "eval_wer": 0.3812423873325213, "step": 26100 }, { "epoch": 4.26, "learning_rate": 8.322728014357972e-05, "loss": NaN, "step": 26200 }, { "epoch": 4.26, "eval_loss": 0.4731149971485138, "eval_runtime": 8.8267, "eval_samples_per_second": 11.329, "eval_wer": 0.40682095006090135, "step": 26200 }, { "epoch": 4.28, "learning_rate": 8.316201664219285e-05, "loss": NaN, "step": 26300 }, { "epoch": 4.28, "eval_loss": 0.4844764471054077, "eval_runtime": 7.374, "eval_samples_per_second": 13.561, "eval_wer": 0.39585870889159563, "step": 26300 }, { "epoch": 4.29, "learning_rate": 8.3096753140806e-05, "loss": NaN, "step": 26400 }, { "epoch": 4.29, "eval_loss": 0.4396247863769531, "eval_runtime": 9.6514, "eval_samples_per_second": 10.361, "eval_wer": 0.3751522533495737, "step": 26400 }, { "epoch": 4.31, "learning_rate": 8.303148963941916e-05, "loss": NaN, "step": 26500 }, { "epoch": 4.31, "eval_loss": 0.4746050238609314, "eval_runtime": 8.1321, "eval_samples_per_second": 12.297, "eval_wer": 0.38246041412911086, "step": 26500 }, { "epoch": 4.33, "learning_rate": 8.296622613803231e-05, "loss": NaN, "step": 26600 }, { "epoch": 4.33, "eval_loss": 0.4225209951400757, "eval_runtime": 7.7046, "eval_samples_per_second": 12.979, "eval_wer": 0.3702801461632156, "step": 26600 }, { "epoch": 4.34, "learning_rate": 8.290096263664547e-05, "loss": NaN, "step": 26700 }, { "epoch": 4.34, "eval_loss": 0.46304523944854736, "eval_runtime": 8.8314, "eval_samples_per_second": 11.323, "eval_wer": 0.40194884287454324, "step": 26700 }, { "epoch": 4.36, "learning_rate": 8.283569913525861e-05, "loss": NaN, "step": 26800 }, { "epoch": 4.36, "eval_loss": 0.45539891719818115, "eval_runtime": 8.3892, "eval_samples_per_second": 11.92, "eval_wer": 0.3848964677222899, "step": 26800 }, { "epoch": 4.37, "learning_rate": 8.277043563387176e-05, "loss": NaN, "step": 26900 }, { "epoch": 4.37, "eval_loss": 0.4747115671634674, "eval_runtime": 8.0532, "eval_samples_per_second": 12.417, "eval_wer": 0.3861144945188794, "step": 26900 }, { "epoch": 4.39, "learning_rate": 8.27051721324849e-05, "loss": NaN, "step": 27000 }, { "epoch": 4.39, "eval_loss": 0.4937517046928406, "eval_runtime": 8.6063, "eval_samples_per_second": 11.619, "eval_wer": 0.3982947624847747, "step": 27000 }, { "epoch": 4.41, "learning_rate": 8.263990863109806e-05, "loss": NaN, "step": 27100 }, { "epoch": 4.41, "eval_loss": 0.5522226095199585, "eval_runtime": 7.3096, "eval_samples_per_second": 13.681, "eval_wer": 0.38855054811205847, "step": 27100 }, { "epoch": 4.42, "learning_rate": 8.257464512971122e-05, "loss": NaN, "step": 27200 }, { "epoch": 4.42, "eval_loss": 0.48202434182167053, "eval_runtime": 7.8854, "eval_samples_per_second": 12.682, "eval_wer": 0.4056029232643118, "step": 27200 }, { "epoch": 4.44, "learning_rate": 8.250938162832437e-05, "loss": NaN, "step": 27300 }, { "epoch": 4.44, "eval_loss": 0.4578789472579956, "eval_runtime": 8.752, "eval_samples_per_second": 11.426, "eval_wer": 0.37393422655298414, "step": 27300 }, { "epoch": 4.46, "learning_rate": 8.244411812693752e-05, "loss": NaN, "step": 27400 }, { "epoch": 4.46, "eval_loss": 0.44214507937431335, "eval_runtime": 10.4981, "eval_samples_per_second": 9.526, "eval_wer": 0.3946406820950061, "step": 27400 }, { "epoch": 4.47, "learning_rate": 8.237885462555066e-05, "loss": NaN, "step": 27500 }, { "epoch": 4.47, "eval_loss": 0.43562430143356323, "eval_runtime": 7.8819, "eval_samples_per_second": 12.687, "eval_wer": 0.3848964677222899, "step": 27500 }, { "epoch": 4.49, "learning_rate": 8.231359112416381e-05, "loss": NaN, "step": 27600 }, { "epoch": 4.49, "eval_loss": 0.5293126106262207, "eval_runtime": 9.3755, "eval_samples_per_second": 10.666, "eval_wer": 0.3982947624847747, "step": 27600 }, { "epoch": 4.5, "learning_rate": 8.224832762277696e-05, "loss": NaN, "step": 27700 }, { "epoch": 4.5, "eval_loss": 0.4340215027332306, "eval_runtime": 8.0204, "eval_samples_per_second": 12.468, "eval_wer": 0.38855054811205847, "step": 27700 }, { "epoch": 4.52, "learning_rate": 8.218306412139012e-05, "loss": NaN, "step": 27800 }, { "epoch": 4.52, "eval_loss": 0.4252225160598755, "eval_runtime": 8.021, "eval_samples_per_second": 12.467, "eval_wer": 0.3763702801461632, "step": 27800 }, { "epoch": 4.54, "learning_rate": 8.211780062000328e-05, "loss": NaN, "step": 27900 }, { "epoch": 4.54, "eval_loss": 0.43396663665771484, "eval_runtime": 7.1016, "eval_samples_per_second": 14.081, "eval_wer": 0.38855054811205847, "step": 27900 }, { "epoch": 4.55, "learning_rate": 8.205253711861641e-05, "loss": NaN, "step": 28000 }, { "epoch": 4.55, "eval_loss": 0.4182353615760803, "eval_runtime": 9.2514, "eval_samples_per_second": 10.809, "eval_wer": 0.3800243605359318, "step": 28000 }, { "epoch": 4.57, "learning_rate": 8.198727361722957e-05, "loss": NaN, "step": 28100 }, { "epoch": 4.57, "eval_loss": 0.5017396211624146, "eval_runtime": 8.9953, "eval_samples_per_second": 11.117, "eval_wer": 0.40316686967113274, "step": 28100 }, { "epoch": 4.59, "learning_rate": 8.192201011584271e-05, "loss": NaN, "step": 28200 }, { "epoch": 4.59, "eval_loss": 0.4595078229904175, "eval_runtime": 9.3616, "eval_samples_per_second": 10.682, "eval_wer": 0.3909866017052375, "step": 28200 }, { "epoch": 4.6, "learning_rate": 8.185674661445587e-05, "loss": NaN, "step": 28300 }, { "epoch": 4.6, "eval_loss": 0.44491440057754517, "eval_runtime": 10.1045, "eval_samples_per_second": 9.897, "eval_wer": 0.3946406820950061, "step": 28300 }, { "epoch": 4.62, "learning_rate": 8.179148311306902e-05, "loss": NaN, "step": 28400 }, { "epoch": 4.62, "eval_loss": 0.4460849463939667, "eval_runtime": 9.8214, "eval_samples_per_second": 10.182, "eval_wer": 0.3909866017052375, "step": 28400 }, { "epoch": 4.63, "learning_rate": 8.172621961168218e-05, "loss": NaN, "step": 28500 }, { "epoch": 4.63, "eval_loss": 0.49524936079978943, "eval_runtime": 7.8304, "eval_samples_per_second": 12.771, "eval_wer": 0.40194884287454324, "step": 28500 }, { "epoch": 4.65, "learning_rate": 8.166095611029532e-05, "loss": NaN, "step": 28600 }, { "epoch": 4.65, "eval_loss": 0.481218159198761, "eval_runtime": 8.0581, "eval_samples_per_second": 12.41, "eval_wer": 0.4043848964677223, "step": 28600 }, { "epoch": 4.67, "learning_rate": 8.159569260890847e-05, "loss": NaN, "step": 28700 }, { "epoch": 4.67, "eval_loss": 0.4491060674190521, "eval_runtime": 7.4142, "eval_samples_per_second": 13.488, "eval_wer": 0.3909866017052375, "step": 28700 }, { "epoch": 4.68, "learning_rate": 8.153042910752162e-05, "loss": NaN, "step": 28800 }, { "epoch": 4.68, "eval_loss": 0.5148893594741821, "eval_runtime": 6.7875, "eval_samples_per_second": 14.733, "eval_wer": 0.3946406820950061, "step": 28800 }, { "epoch": 4.7, "learning_rate": 8.146516560613477e-05, "loss": NaN, "step": 28900 }, { "epoch": 4.7, "eval_loss": 0.46138709783554077, "eval_runtime": 7.3893, "eval_samples_per_second": 13.533, "eval_wer": 0.4007308160779537, "step": 28900 }, { "epoch": 4.72, "learning_rate": 8.139990210474793e-05, "loss": NaN, "step": 29000 }, { "epoch": 4.72, "eval_loss": 0.44223907589912415, "eval_runtime": 8.6011, "eval_samples_per_second": 11.626, "eval_wer": 0.3873325213154689, "step": 29000 }, { "epoch": 4.73, "learning_rate": 8.133463860336107e-05, "loss": NaN, "step": 29100 }, { "epoch": 4.73, "eval_loss": 0.471282958984375, "eval_runtime": 10.4884, "eval_samples_per_second": 9.534, "eval_wer": 0.40803897685749085, "step": 29100 }, { "epoch": 4.75, "learning_rate": 8.126937510197422e-05, "loss": NaN, "step": 29200 }, { "epoch": 4.75, "eval_loss": 0.43840956687927246, "eval_runtime": 8.0732, "eval_samples_per_second": 12.387, "eval_wer": 0.41412911084043846, "step": 29200 }, { "epoch": 4.77, "learning_rate": 8.120411160058738e-05, "loss": NaN, "step": 29300 }, { "epoch": 4.77, "eval_loss": 0.4980277717113495, "eval_runtime": 8.0117, "eval_samples_per_second": 12.482, "eval_wer": 0.4007308160779537, "step": 29300 }, { "epoch": 4.78, "learning_rate": 8.113884809920052e-05, "loss": NaN, "step": 29400 }, { "epoch": 4.78, "eval_loss": 0.46275556087493896, "eval_runtime": 8.4323, "eval_samples_per_second": 11.859, "eval_wer": 0.41169305724725946, "step": 29400 }, { "epoch": 4.8, "learning_rate": 8.107358459781368e-05, "loss": NaN, "step": 29500 }, { "epoch": 4.8, "eval_loss": 0.5011305809020996, "eval_runtime": 9.4028, "eval_samples_per_second": 10.635, "eval_wer": 0.39707673568818513, "step": 29500 }, { "epoch": 4.81, "learning_rate": 8.100832109642683e-05, "loss": NaN, "step": 29600 }, { "epoch": 4.81, "eval_loss": 0.4675903022289276, "eval_runtime": 8.4503, "eval_samples_per_second": 11.834, "eval_wer": 0.3861144945188794, "step": 29600 }, { "epoch": 4.83, "learning_rate": 8.094305759503997e-05, "loss": NaN, "step": 29700 }, { "epoch": 4.83, "eval_loss": 0.4845035970211029, "eval_runtime": 10.1458, "eval_samples_per_second": 9.856, "eval_wer": 0.40316686967113274, "step": 29700 }, { "epoch": 4.85, "learning_rate": 8.087779409365313e-05, "loss": NaN, "step": 29800 }, { "epoch": 4.85, "eval_loss": 0.47924065589904785, "eval_runtime": 9.6324, "eval_samples_per_second": 10.382, "eval_wer": 0.41169305724725946, "step": 29800 }, { "epoch": 4.86, "learning_rate": 8.081253059226628e-05, "loss": NaN, "step": 29900 }, { "epoch": 4.86, "eval_loss": 0.4541124701499939, "eval_runtime": 7.4256, "eval_samples_per_second": 13.467, "eval_wer": 0.4007308160779537, "step": 29900 }, { "epoch": 4.88, "learning_rate": 8.074726709087943e-05, "loss": NaN, "step": 30000 }, { "epoch": 4.88, "eval_loss": 0.4285271167755127, "eval_runtime": 6.7649, "eval_samples_per_second": 14.782, "eval_wer": 0.4056029232643118, "step": 30000 }, { "epoch": 4.9, "learning_rate": 8.068200358949258e-05, "loss": NaN, "step": 30100 }, { "epoch": 4.9, "eval_loss": 0.4844328761100769, "eval_runtime": 9.5693, "eval_samples_per_second": 10.45, "eval_wer": 0.3934226552984166, "step": 30100 }, { "epoch": 4.91, "learning_rate": 8.061674008810574e-05, "loss": NaN, "step": 30200 }, { "epoch": 4.91, "eval_loss": 0.4602464735507965, "eval_runtime": 10.2251, "eval_samples_per_second": 9.78, "eval_wer": 0.3909866017052375, "step": 30200 }, { "epoch": 4.93, "learning_rate": 8.055147658671888e-05, "loss": NaN, "step": 30300 }, { "epoch": 4.93, "eval_loss": 0.431302934885025, "eval_runtime": 8.621, "eval_samples_per_second": 11.6, "eval_wer": 0.3982947624847747, "step": 30300 }, { "epoch": 4.94, "learning_rate": 8.048621308533203e-05, "loss": NaN, "step": 30400 }, { "epoch": 4.94, "eval_loss": 0.4665343463420868, "eval_runtime": 8.6252, "eval_samples_per_second": 11.594, "eval_wer": 0.4092570036540804, "step": 30400 }, { "epoch": 4.96, "learning_rate": 8.042094958394519e-05, "loss": NaN, "step": 30500 }, { "epoch": 4.96, "eval_loss": 0.4470652639865875, "eval_runtime": 8.3879, "eval_samples_per_second": 11.922, "eval_wer": 0.3946406820950061, "step": 30500 }, { "epoch": 4.98, "learning_rate": 8.035568608255833e-05, "loss": NaN, "step": 30600 }, { "epoch": 4.98, "eval_loss": 0.4649478495121002, "eval_runtime": 8.0029, "eval_samples_per_second": 12.495, "eval_wer": 0.3934226552984166, "step": 30600 }, { "epoch": 4.99, "learning_rate": 8.029042258117149e-05, "loss": NaN, "step": 30700 }, { "epoch": 4.99, "eval_loss": 0.42199084162712097, "eval_runtime": 7.8648, "eval_samples_per_second": 12.715, "eval_wer": 0.38367844092570036, "step": 30700 }, { "epoch": 5.01, "learning_rate": 8.022515907978464e-05, "loss": NaN, "step": 30800 }, { "epoch": 5.01, "eval_loss": 0.43867814540863037, "eval_runtime": 10.0022, "eval_samples_per_second": 9.998, "eval_wer": 0.4092570036540804, "step": 30800 }, { "epoch": 5.03, "learning_rate": 8.015989557839778e-05, "loss": NaN, "step": 30900 }, { "epoch": 5.03, "eval_loss": 0.4615475535392761, "eval_runtime": 7.5843, "eval_samples_per_second": 13.185, "eval_wer": 0.4104750304506699, "step": 30900 }, { "epoch": 5.04, "learning_rate": 8.009463207701094e-05, "loss": NaN, "step": 31000 }, { "epoch": 5.04, "eval_loss": 0.4595627188682556, "eval_runtime": 8.6951, "eval_samples_per_second": 11.501, "eval_wer": 0.41169305724725946, "step": 31000 }, { "epoch": 5.06, "learning_rate": 8.002936857562408e-05, "loss": NaN, "step": 31100 }, { "epoch": 5.06, "eval_loss": 0.48309993743896484, "eval_runtime": 7.7623, "eval_samples_per_second": 12.883, "eval_wer": 0.41169305724725946, "step": 31100 }, { "epoch": 5.07, "learning_rate": 7.996410507423724e-05, "loss": NaN, "step": 31200 }, { "epoch": 5.07, "eval_loss": 0.4405969977378845, "eval_runtime": 8.6906, "eval_samples_per_second": 11.507, "eval_wer": 0.392204628501827, "step": 31200 }, { "epoch": 5.09, "learning_rate": 7.989884157285039e-05, "loss": NaN, "step": 31300 }, { "epoch": 5.09, "eval_loss": 0.46763721108436584, "eval_runtime": 8.1484, "eval_samples_per_second": 12.272, "eval_wer": 0.3909866017052375, "step": 31300 }, { "epoch": 5.11, "learning_rate": 7.983357807146353e-05, "loss": NaN, "step": 31400 }, { "epoch": 5.11, "eval_loss": 0.4569970369338989, "eval_runtime": 8.3373, "eval_samples_per_second": 11.994, "eval_wer": 0.41169305724725946, "step": 31400 }, { "epoch": 5.12, "learning_rate": 7.976831457007669e-05, "loss": NaN, "step": 31500 }, { "epoch": 5.12, "eval_loss": 0.4363997280597687, "eval_runtime": 8.1102, "eval_samples_per_second": 12.33, "eval_wer": 0.3848964677222899, "step": 31500 }, { "epoch": 5.14, "learning_rate": 7.970305106868984e-05, "loss": NaN, "step": 31600 }, { "epoch": 5.14, "eval_loss": 0.4483918249607086, "eval_runtime": 8.4558, "eval_samples_per_second": 11.826, "eval_wer": 0.38246041412911086, "step": 31600 }, { "epoch": 5.16, "learning_rate": 7.9637787567303e-05, "loss": NaN, "step": 31700 }, { "epoch": 5.16, "eval_loss": 0.40626582503318787, "eval_runtime": 7.4323, "eval_samples_per_second": 13.455, "eval_wer": 0.3751522533495737, "step": 31700 }, { "epoch": 5.17, "learning_rate": 7.957252406591614e-05, "loss": NaN, "step": 31800 }, { "epoch": 5.17, "eval_loss": 0.4829193949699402, "eval_runtime": 7.8066, "eval_samples_per_second": 12.81, "eval_wer": 0.40194884287454324, "step": 31800 }, { "epoch": 5.19, "learning_rate": 7.95072605645293e-05, "loss": NaN, "step": 31900 }, { "epoch": 5.19, "eval_loss": 0.49380388855934143, "eval_runtime": 8.2852, "eval_samples_per_second": 12.07, "eval_wer": 0.38246041412911086, "step": 31900 }, { "epoch": 5.2, "learning_rate": 7.944199706314243e-05, "loss": NaN, "step": 32000 }, { "epoch": 5.2, "eval_loss": 0.4846552014350891, "eval_runtime": 8.2309, "eval_samples_per_second": 12.149, "eval_wer": 0.3812423873325213, "step": 32000 }, { "epoch": 5.22, "learning_rate": 7.937673356175559e-05, "loss": NaN, "step": 32100 }, { "epoch": 5.22, "eval_loss": 0.4324251413345337, "eval_runtime": 7.5408, "eval_samples_per_second": 13.261, "eval_wer": 0.38976857490864797, "step": 32100 }, { "epoch": 5.24, "learning_rate": 7.931147006036875e-05, "loss": NaN, "step": 32200 }, { "epoch": 5.24, "eval_loss": 0.4314603805541992, "eval_runtime": 8.6415, "eval_samples_per_second": 11.572, "eval_wer": 0.3909866017052375, "step": 32200 }, { "epoch": 5.25, "learning_rate": 7.92462065589819e-05, "loss": NaN, "step": 32300 }, { "epoch": 5.25, "eval_loss": 0.4612935185432434, "eval_runtime": 8.2981, "eval_samples_per_second": 12.051, "eval_wer": 0.4092570036540804, "step": 32300 }, { "epoch": 5.27, "learning_rate": 7.918094305759505e-05, "loss": NaN, "step": 32400 }, { "epoch": 5.27, "eval_loss": 0.4439612329006195, "eval_runtime": 6.8526, "eval_samples_per_second": 14.593, "eval_wer": 0.3946406820950061, "step": 32400 }, { "epoch": 5.29, "learning_rate": 7.91156795562082e-05, "loss": NaN, "step": 32500 }, { "epoch": 5.29, "eval_loss": 0.5218726396560669, "eval_runtime": 10.5449, "eval_samples_per_second": 9.483, "eval_wer": 0.42143727161997563, "step": 32500 }, { "epoch": 5.3, "learning_rate": 7.905041605482134e-05, "loss": NaN, "step": 32600 }, { "epoch": 5.3, "eval_loss": 0.45300713181495667, "eval_runtime": 7.9081, "eval_samples_per_second": 12.645, "eval_wer": 0.3812423873325213, "step": 32600 }, { "epoch": 5.32, "learning_rate": 7.898515255343449e-05, "loss": NaN, "step": 32700 }, { "epoch": 5.32, "eval_loss": 0.46696189045906067, "eval_runtime": 8.375, "eval_samples_per_second": 11.94, "eval_wer": 0.36662606577344703, "step": 32700 }, { "epoch": 5.33, "learning_rate": 7.891988905204765e-05, "loss": NaN, "step": 32800 }, { "epoch": 5.33, "eval_loss": 0.4551876485347748, "eval_runtime": 8.9235, "eval_samples_per_second": 11.206, "eval_wer": 0.39707673568818513, "step": 32800 }, { "epoch": 5.35, "learning_rate": 7.88546255506608e-05, "loss": NaN, "step": 32900 }, { "epoch": 5.35, "eval_loss": 0.49849167466163635, "eval_runtime": 7.4164, "eval_samples_per_second": 13.484, "eval_wer": 0.3763702801461632, "step": 32900 }, { "epoch": 5.37, "learning_rate": 7.878936204927395e-05, "loss": NaN, "step": 33000 }, { "epoch": 5.37, "eval_loss": 0.4134560525417328, "eval_runtime": 8.9386, "eval_samples_per_second": 11.187, "eval_wer": 0.3800243605359318, "step": 33000 }, { "epoch": 5.38, "learning_rate": 7.87240985478871e-05, "loss": NaN, "step": 33100 }, { "epoch": 5.38, "eval_loss": 0.43791449069976807, "eval_runtime": 7.9006, "eval_samples_per_second": 12.657, "eval_wer": 0.37149817295980514, "step": 33100 }, { "epoch": 5.4, "learning_rate": 7.865883504650024e-05, "loss": NaN, "step": 33200 }, { "epoch": 5.4, "eval_loss": 0.3854129910469055, "eval_runtime": 8.888, "eval_samples_per_second": 11.251, "eval_wer": 0.3702801461632156, "step": 33200 }, { "epoch": 5.42, "learning_rate": 7.85935715451134e-05, "loss": NaN, "step": 33300 }, { "epoch": 5.42, "eval_loss": 0.45465293526649475, "eval_runtime": 7.5638, "eval_samples_per_second": 13.221, "eval_wer": 0.392204628501827, "step": 33300 }, { "epoch": 5.43, "learning_rate": 7.852830804372654e-05, "loss": NaN, "step": 33400 }, { "epoch": 5.43, "eval_loss": 0.4339330196380615, "eval_runtime": 7.2942, "eval_samples_per_second": 13.709, "eval_wer": 0.37880633373934225, "step": 33400 }, { "epoch": 5.45, "learning_rate": 7.84630445423397e-05, "loss": NaN, "step": 33500 }, { "epoch": 5.45, "eval_loss": 0.47783201932907104, "eval_runtime": 10.4013, "eval_samples_per_second": 9.614, "eval_wer": 0.38976857490864797, "step": 33500 }, { "epoch": 5.46, "learning_rate": 7.839778104095286e-05, "loss": NaN, "step": 33600 }, { "epoch": 5.46, "eval_loss": 0.451149582862854, "eval_runtime": 10.0363, "eval_samples_per_second": 9.964, "eval_wer": 0.3934226552984166, "step": 33600 }, { "epoch": 5.48, "learning_rate": 7.8332517539566e-05, "loss": NaN, "step": 33700 }, { "epoch": 5.48, "eval_loss": 0.4253043830394745, "eval_runtime": 7.7756, "eval_samples_per_second": 12.861, "eval_wer": 0.3751522533495737, "step": 33700 }, { "epoch": 5.5, "learning_rate": 7.826725403817915e-05, "loss": NaN, "step": 33800 }, { "epoch": 5.5, "eval_loss": 0.4464089274406433, "eval_runtime": 6.8445, "eval_samples_per_second": 14.61, "eval_wer": 0.38976857490864797, "step": 33800 }, { "epoch": 5.51, "learning_rate": 7.82019905367923e-05, "loss": NaN, "step": 33900 }, { "epoch": 5.51, "eval_loss": 0.4914042353630066, "eval_runtime": 8.3493, "eval_samples_per_second": 11.977, "eval_wer": 0.39585870889159563, "step": 33900 }, { "epoch": 5.53, "learning_rate": 7.813672703540546e-05, "loss": NaN, "step": 34000 }, { "epoch": 5.53, "eval_loss": 0.4946918487548828, "eval_runtime": 7.3641, "eval_samples_per_second": 13.579, "eval_wer": 0.3995127892813642, "step": 34000 }, { "epoch": 5.55, "learning_rate": 7.80714635340186e-05, "loss": NaN, "step": 34100 }, { "epoch": 5.55, "eval_loss": 0.5067921280860901, "eval_runtime": 8.8184, "eval_samples_per_second": 11.34, "eval_wer": 0.4092570036540804, "step": 34100 }, { "epoch": 5.56, "learning_rate": 7.800620003263176e-05, "loss": NaN, "step": 34200 }, { "epoch": 5.56, "eval_loss": 0.517976701259613, "eval_runtime": 8.7478, "eval_samples_per_second": 11.431, "eval_wer": 0.40682095006090135, "step": 34200 }, { "epoch": 5.58, "learning_rate": 7.79409365312449e-05, "loss": NaN, "step": 34300 }, { "epoch": 5.58, "eval_loss": 0.5033119916915894, "eval_runtime": 9.201, "eval_samples_per_second": 10.868, "eval_wer": 0.392204628501827, "step": 34300 }, { "epoch": 5.59, "learning_rate": 7.787567302985805e-05, "loss": NaN, "step": 34400 }, { "epoch": 5.59, "eval_loss": 0.49291473627090454, "eval_runtime": 11.455, "eval_samples_per_second": 8.73, "eval_wer": 0.40316686967113274, "step": 34400 }, { "epoch": 5.61, "learning_rate": 7.781040952847121e-05, "loss": NaN, "step": 34500 }, { "epoch": 5.61, "eval_loss": 0.4840911626815796, "eval_runtime": 9.864, "eval_samples_per_second": 10.138, "eval_wer": 0.39707673568818513, "step": 34500 }, { "epoch": 5.63, "learning_rate": 7.774514602708435e-05, "loss": NaN, "step": 34600 }, { "epoch": 5.63, "eval_loss": 0.4436954855918884, "eval_runtime": 7.5792, "eval_samples_per_second": 13.194, "eval_wer": 0.37393422655298414, "step": 34600 }, { "epoch": 5.64, "learning_rate": 7.767988252569751e-05, "loss": NaN, "step": 34700 }, { "epoch": 5.64, "eval_loss": 0.42483794689178467, "eval_runtime": 9.6007, "eval_samples_per_second": 10.416, "eval_wer": 0.36784409257003653, "step": 34700 }, { "epoch": 5.66, "learning_rate": 7.761461902431066e-05, "loss": NaN, "step": 34800 }, { "epoch": 5.66, "eval_loss": 0.4381932020187378, "eval_runtime": 8.7213, "eval_samples_per_second": 11.466, "eval_wer": 0.3909866017052375, "step": 34800 }, { "epoch": 5.68, "learning_rate": 7.75493555229238e-05, "loss": NaN, "step": 34900 }, { "epoch": 5.68, "eval_loss": 0.40743523836135864, "eval_runtime": 9.6342, "eval_samples_per_second": 10.38, "eval_wer": 0.38367844092570036, "step": 34900 }, { "epoch": 5.69, "learning_rate": 7.748409202153696e-05, "loss": NaN, "step": 35000 }, { "epoch": 5.69, "eval_loss": 0.4256589412689209, "eval_runtime": 7.6861, "eval_samples_per_second": 13.01, "eval_wer": 0.392204628501827, "step": 35000 }, { "epoch": 5.71, "learning_rate": 7.741882852015011e-05, "loss": NaN, "step": 35100 }, { "epoch": 5.71, "eval_loss": 0.41759517788887024, "eval_runtime": 7.5282, "eval_samples_per_second": 13.283, "eval_wer": 0.3946406820950061, "step": 35100 }, { "epoch": 5.72, "learning_rate": 7.735356501876327e-05, "loss": NaN, "step": 35200 }, { "epoch": 5.72, "eval_loss": 0.4593577980995178, "eval_runtime": 8.4088, "eval_samples_per_second": 11.892, "eval_wer": 0.4104750304506699, "step": 35200 }, { "epoch": 5.74, "learning_rate": 7.728830151737641e-05, "loss": NaN, "step": 35300 }, { "epoch": 5.74, "eval_loss": 0.4901994466781616, "eval_runtime": 7.524, "eval_samples_per_second": 13.291, "eval_wer": 0.4056029232643118, "step": 35300 }, { "epoch": 5.76, "learning_rate": 7.722303801598956e-05, "loss": NaN, "step": 35400 }, { "epoch": 5.76, "eval_loss": 0.47598525881767273, "eval_runtime": 8.5548, "eval_samples_per_second": 11.689, "eval_wer": 0.38246041412911086, "step": 35400 }, { "epoch": 5.77, "learning_rate": 7.715777451460271e-05, "loss": NaN, "step": 35500 }, { "epoch": 5.77, "eval_loss": 0.4955834150314331, "eval_runtime": 8.2229, "eval_samples_per_second": 12.161, "eval_wer": 0.3995127892813642, "step": 35500 }, { "epoch": 5.79, "learning_rate": 7.709251101321586e-05, "loss": NaN, "step": 35600 }, { "epoch": 5.79, "eval_loss": 0.5013775825500488, "eval_runtime": 7.3332, "eval_samples_per_second": 13.637, "eval_wer": 0.37758830694275275, "step": 35600 }, { "epoch": 5.81, "learning_rate": 7.702724751182902e-05, "loss": NaN, "step": 35700 }, { "epoch": 5.81, "eval_loss": 0.4535202085971832, "eval_runtime": 6.7442, "eval_samples_per_second": 14.828, "eval_wer": 0.3617539585870889, "step": 35700 }, { "epoch": 5.82, "learning_rate": 7.696198401044216e-05, "loss": NaN, "step": 35800 }, { "epoch": 5.82, "eval_loss": 0.43038153648376465, "eval_runtime": 7.9798, "eval_samples_per_second": 12.532, "eval_wer": 0.38367844092570036, "step": 35800 }, { "epoch": 5.84, "learning_rate": 7.689672050905532e-05, "loss": NaN, "step": 35900 }, { "epoch": 5.84, "eval_loss": 0.4333917200565338, "eval_runtime": 8.5583, "eval_samples_per_second": 11.685, "eval_wer": 0.3800243605359318, "step": 35900 }, { "epoch": 5.85, "learning_rate": 7.683145700766847e-05, "loss": NaN, "step": 36000 }, { "epoch": 5.85, "eval_loss": 0.49249768257141113, "eval_runtime": 9.3291, "eval_samples_per_second": 10.719, "eval_wer": 0.40316686967113274, "step": 36000 }, { "epoch": 5.87, "learning_rate": 7.676619350628161e-05, "loss": NaN, "step": 36100 }, { "epoch": 5.87, "eval_loss": 0.47578758001327515, "eval_runtime": 7.9207, "eval_samples_per_second": 12.625, "eval_wer": 0.38976857490864797, "step": 36100 }, { "epoch": 5.89, "learning_rate": 7.670093000489477e-05, "loss": NaN, "step": 36200 }, { "epoch": 5.89, "eval_loss": 0.44561660289764404, "eval_runtime": 6.6969, "eval_samples_per_second": 14.932, "eval_wer": 0.3873325213154689, "step": 36200 }, { "epoch": 5.9, "learning_rate": 7.663566650350792e-05, "loss": NaN, "step": 36300 }, { "epoch": 5.9, "eval_loss": 0.46735045313835144, "eval_runtime": 7.2262, "eval_samples_per_second": 13.839, "eval_wer": 0.39585870889159563, "step": 36300 }, { "epoch": 5.92, "learning_rate": 7.657040300212108e-05, "loss": NaN, "step": 36400 }, { "epoch": 5.92, "eval_loss": 0.42316126823425293, "eval_runtime": 8.7463, "eval_samples_per_second": 11.433, "eval_wer": 0.37758830694275275, "step": 36400 }, { "epoch": 5.94, "learning_rate": 7.65051395007342e-05, "loss": NaN, "step": 36500 }, { "epoch": 5.94, "eval_loss": 0.46479174494743347, "eval_runtime": 9.1318, "eval_samples_per_second": 10.951, "eval_wer": 0.39585870889159563, "step": 36500 }, { "epoch": 5.95, "learning_rate": 7.643987599934737e-05, "loss": NaN, "step": 36600 }, { "epoch": 5.95, "eval_loss": 0.42728888988494873, "eval_runtime": 8.4942, "eval_samples_per_second": 11.773, "eval_wer": 0.37758830694275275, "step": 36600 }, { "epoch": 5.97, "learning_rate": 7.637461249796052e-05, "loss": NaN, "step": 36700 }, { "epoch": 5.97, "eval_loss": 0.4792998433113098, "eval_runtime": 8.1451, "eval_samples_per_second": 12.277, "eval_wer": 0.4007308160779537, "step": 36700 }, { "epoch": 5.98, "learning_rate": 7.630934899657367e-05, "loss": NaN, "step": 36800 }, { "epoch": 5.98, "eval_loss": 0.4131828546524048, "eval_runtime": 6.536, "eval_samples_per_second": 15.3, "eval_wer": 0.3629719853836784, "step": 36800 }, { "epoch": 6.0, "learning_rate": 7.624408549518683e-05, "loss": NaN, "step": 36900 }, { "epoch": 6.0, "eval_loss": 0.5964876413345337, "eval_runtime": 8.3503, "eval_samples_per_second": 11.976, "eval_wer": 0.392204628501827, "step": 36900 }, { "epoch": 6.02, "learning_rate": 7.617882199379997e-05, "loss": NaN, "step": 37000 }, { "epoch": 6.02, "eval_loss": 0.5113080739974976, "eval_runtime": 7.8786, "eval_samples_per_second": 12.693, "eval_wer": 0.40803897685749085, "step": 37000 }, { "epoch": 6.03, "learning_rate": 7.611355849241312e-05, "loss": NaN, "step": 37100 }, { "epoch": 6.03, "eval_loss": 0.44438639283180237, "eval_runtime": 7.8581, "eval_samples_per_second": 12.726, "eval_wer": 0.3812423873325213, "step": 37100 }, { "epoch": 6.05, "learning_rate": 7.604829499102626e-05, "loss": NaN, "step": 37200 }, { "epoch": 6.05, "eval_loss": 0.44501668214797974, "eval_runtime": 6.8166, "eval_samples_per_second": 14.67, "eval_wer": 0.3861144945188794, "step": 37200 }, { "epoch": 6.07, "learning_rate": 7.598303148963942e-05, "loss": NaN, "step": 37300 }, { "epoch": 6.07, "eval_loss": 0.46016010642051697, "eval_runtime": 6.8605, "eval_samples_per_second": 14.576, "eval_wer": 0.37758830694275275, "step": 37300 }, { "epoch": 6.08, "learning_rate": 7.591776798825258e-05, "loss": NaN, "step": 37400 }, { "epoch": 6.08, "eval_loss": 0.4487974941730499, "eval_runtime": 8.698, "eval_samples_per_second": 11.497, "eval_wer": 0.392204628501827, "step": 37400 }, { "epoch": 6.1, "learning_rate": 7.585250448686573e-05, "loss": NaN, "step": 37500 }, { "epoch": 6.1, "eval_loss": 0.46871453523635864, "eval_runtime": 7.2092, "eval_samples_per_second": 13.871, "eval_wer": 0.3909866017052375, "step": 37500 }, { "epoch": 6.11, "learning_rate": 7.578724098547888e-05, "loss": NaN, "step": 37600 }, { "epoch": 6.11, "eval_loss": 0.5187182426452637, "eval_runtime": 8.235, "eval_samples_per_second": 12.143, "eval_wer": 0.3848964677222899, "step": 37600 }, { "epoch": 6.13, "learning_rate": 7.572197748409202e-05, "loss": NaN, "step": 37700 }, { "epoch": 6.13, "eval_loss": 0.4755428433418274, "eval_runtime": 8.6418, "eval_samples_per_second": 11.572, "eval_wer": 0.3909866017052375, "step": 37700 }, { "epoch": 6.15, "learning_rate": 7.565671398270517e-05, "loss": NaN, "step": 37800 }, { "epoch": 6.15, "eval_loss": 0.4716055393218994, "eval_runtime": 8.6568, "eval_samples_per_second": 11.552, "eval_wer": 0.39585870889159563, "step": 37800 }, { "epoch": 6.16, "learning_rate": 7.559145048131832e-05, "loss": NaN, "step": 37900 }, { "epoch": 6.16, "eval_loss": 0.43883880972862244, "eval_runtime": 8.0179, "eval_samples_per_second": 12.472, "eval_wer": 0.3861144945188794, "step": 37900 }, { "epoch": 6.18, "learning_rate": 7.552618697993148e-05, "loss": NaN, "step": 38000 }, { "epoch": 6.18, "eval_loss": 0.447729229927063, "eval_runtime": 7.3355, "eval_samples_per_second": 13.632, "eval_wer": 0.38855054811205847, "step": 38000 }, { "epoch": 6.2, "learning_rate": 7.546092347854464e-05, "loss": NaN, "step": 38100 }, { "epoch": 6.2, "eval_loss": 0.5071135759353638, "eval_runtime": 9.0115, "eval_samples_per_second": 11.097, "eval_wer": 0.4092570036540804, "step": 38100 }, { "epoch": 6.21, "learning_rate": 7.539565997715777e-05, "loss": NaN, "step": 38200 }, { "epoch": 6.21, "eval_loss": 0.45388340950012207, "eval_runtime": 7.6236, "eval_samples_per_second": 13.117, "eval_wer": 0.3873325213154689, "step": 38200 }, { "epoch": 6.23, "learning_rate": 7.533039647577093e-05, "loss": NaN, "step": 38300 }, { "epoch": 6.23, "eval_loss": 0.4727196991443634, "eval_runtime": 9.3783, "eval_samples_per_second": 10.663, "eval_wer": 0.392204628501827, "step": 38300 }, { "epoch": 6.24, "learning_rate": 7.526513297438407e-05, "loss": NaN, "step": 38400 }, { "epoch": 6.24, "eval_loss": 0.45815300941467285, "eval_runtime": 8.7937, "eval_samples_per_second": 11.372, "eval_wer": 0.3995127892813642, "step": 38400 }, { "epoch": 6.26, "learning_rate": 7.519986947299723e-05, "loss": NaN, "step": 38500 }, { "epoch": 6.26, "eval_loss": 0.45697593688964844, "eval_runtime": 7.849, "eval_samples_per_second": 12.74, "eval_wer": 0.38367844092570036, "step": 38500 }, { "epoch": 6.28, "learning_rate": 7.513460597161039e-05, "loss": NaN, "step": 38600 }, { "epoch": 6.28, "eval_loss": 0.4512711465358734, "eval_runtime": 8.0969, "eval_samples_per_second": 12.35, "eval_wer": 0.4056029232643118, "step": 38600 }, { "epoch": 6.29, "learning_rate": 7.506934247022354e-05, "loss": NaN, "step": 38700 }, { "epoch": 6.29, "eval_loss": 0.47323668003082275, "eval_runtime": 9.4309, "eval_samples_per_second": 10.603, "eval_wer": 0.4007308160779537, "step": 38700 }, { "epoch": 6.31, "learning_rate": 7.500407896883668e-05, "loss": NaN, "step": 38800 }, { "epoch": 6.31, "eval_loss": 0.46344485878944397, "eval_runtime": 7.4323, "eval_samples_per_second": 13.455, "eval_wer": 0.3909866017052375, "step": 38800 }, { "epoch": 6.33, "learning_rate": 7.493881546744983e-05, "loss": NaN, "step": 38900 }, { "epoch": 6.33, "eval_loss": 0.46373656392097473, "eval_runtime": 8.8968, "eval_samples_per_second": 11.24, "eval_wer": 0.4043848964677223, "step": 38900 }, { "epoch": 6.34, "learning_rate": 7.487355196606298e-05, "loss": NaN, "step": 39000 }, { "epoch": 6.34, "eval_loss": 0.5335507392883301, "eval_runtime": 7.8243, "eval_samples_per_second": 12.781, "eval_wer": 0.3982947624847747, "step": 39000 }, { "epoch": 6.36, "learning_rate": 7.480828846467613e-05, "loss": NaN, "step": 39100 }, { "epoch": 6.36, "eval_loss": 0.4426437318325043, "eval_runtime": 9.3026, "eval_samples_per_second": 10.75, "eval_wer": 0.38246041412911086, "step": 39100 }, { "epoch": 6.38, "learning_rate": 7.474302496328929e-05, "loss": NaN, "step": 39200 }, { "epoch": 6.38, "eval_loss": 0.4251578450202942, "eval_runtime": 7.5958, "eval_samples_per_second": 13.165, "eval_wer": 0.38976857490864797, "step": 39200 }, { "epoch": 6.39, "learning_rate": 7.467776146190245e-05, "loss": NaN, "step": 39300 }, { "epoch": 6.39, "eval_loss": 0.45868903398513794, "eval_runtime": 7.9208, "eval_samples_per_second": 12.625, "eval_wer": 0.37271619975639464, "step": 39300 }, { "epoch": 6.41, "learning_rate": 7.461249796051558e-05, "loss": NaN, "step": 39400 }, { "epoch": 6.41, "eval_loss": 0.4029034376144409, "eval_runtime": 7.9815, "eval_samples_per_second": 12.529, "eval_wer": 0.37271619975639464, "step": 39400 }, { "epoch": 6.42, "learning_rate": 7.454723445912874e-05, "loss": NaN, "step": 39500 }, { "epoch": 6.42, "eval_loss": 0.43351614475250244, "eval_runtime": 8.7741, "eval_samples_per_second": 11.397, "eval_wer": 0.3848964677222899, "step": 39500 }, { "epoch": 6.44, "learning_rate": 7.448197095774188e-05, "loss": NaN, "step": 39600 }, { "epoch": 6.44, "eval_loss": 0.4573790729045868, "eval_runtime": 7.9568, "eval_samples_per_second": 12.568, "eval_wer": 0.38367844092570036, "step": 39600 }, { "epoch": 6.46, "learning_rate": 7.441670745635504e-05, "loss": NaN, "step": 39700 }, { "epoch": 6.46, "eval_loss": 0.47754156589508057, "eval_runtime": 8.0778, "eval_samples_per_second": 12.38, "eval_wer": 0.3848964677222899, "step": 39700 }, { "epoch": 6.47, "learning_rate": 7.435144395496819e-05, "loss": NaN, "step": 39800 }, { "epoch": 6.47, "eval_loss": 0.5262435674667358, "eval_runtime": 9.0367, "eval_samples_per_second": 11.066, "eval_wer": 0.3934226552984166, "step": 39800 }, { "epoch": 6.49, "learning_rate": 7.428618045358133e-05, "loss": NaN, "step": 39900 }, { "epoch": 6.49, "eval_loss": 0.45043036341667175, "eval_runtime": 8.4329, "eval_samples_per_second": 11.858, "eval_wer": 0.38855054811205847, "step": 39900 }, { "epoch": 6.51, "learning_rate": 7.422091695219449e-05, "loss": NaN, "step": 40000 }, { "epoch": 6.51, "eval_loss": 0.5360258221626282, "eval_runtime": 8.3169, "eval_samples_per_second": 12.024, "eval_wer": 0.38976857490864797, "step": 40000 }, { "epoch": 6.52, "learning_rate": 7.415565345080763e-05, "loss": NaN, "step": 40100 }, { "epoch": 6.52, "eval_loss": 0.43279510736465454, "eval_runtime": 8.3411, "eval_samples_per_second": 11.989, "eval_wer": 0.37880633373934225, "step": 40100 }, { "epoch": 6.54, "learning_rate": 7.40903899494208e-05, "loss": NaN, "step": 40200 }, { "epoch": 6.54, "eval_loss": 0.436869353055954, "eval_runtime": 7.5681, "eval_samples_per_second": 13.213, "eval_wer": 0.37758830694275275, "step": 40200 }, { "epoch": 6.55, "learning_rate": 7.402512644803394e-05, "loss": NaN, "step": 40300 }, { "epoch": 6.55, "eval_loss": 0.48069870471954346, "eval_runtime": 7.7372, "eval_samples_per_second": 12.924, "eval_wer": 0.4177831912302071, "step": 40300 }, { "epoch": 6.57, "learning_rate": 7.39598629466471e-05, "loss": NaN, "step": 40400 }, { "epoch": 6.57, "eval_loss": 0.43905335664749146, "eval_runtime": 7.4851, "eval_samples_per_second": 13.36, "eval_wer": 0.3848964677222899, "step": 40400 }, { "epoch": 6.59, "learning_rate": 7.389459944526024e-05, "loss": NaN, "step": 40500 }, { "epoch": 6.59, "eval_loss": 0.45289239287376404, "eval_runtime": 8.056, "eval_samples_per_second": 12.413, "eval_wer": 0.3873325213154689, "step": 40500 }, { "epoch": 6.6, "learning_rate": 7.382933594387339e-05, "loss": NaN, "step": 40600 }, { "epoch": 6.6, "eval_loss": 0.4513566195964813, "eval_runtime": 8.3785, "eval_samples_per_second": 11.935, "eval_wer": 0.3848964677222899, "step": 40600 }, { "epoch": 6.62, "learning_rate": 7.376407244248655e-05, "loss": NaN, "step": 40700 }, { "epoch": 6.62, "eval_loss": 0.45488113164901733, "eval_runtime": 9.389, "eval_samples_per_second": 10.651, "eval_wer": 0.37149817295980514, "step": 40700 }, { "epoch": 6.64, "learning_rate": 7.369880894109969e-05, "loss": NaN, "step": 40800 }, { "epoch": 6.64, "eval_loss": 0.4812730550765991, "eval_runtime": 9.6857, "eval_samples_per_second": 10.324, "eval_wer": 0.37149817295980514, "step": 40800 }, { "epoch": 6.65, "learning_rate": 7.363354543971285e-05, "loss": NaN, "step": 40900 }, { "epoch": 6.65, "eval_loss": 0.4662674367427826, "eval_runtime": 9.1141, "eval_samples_per_second": 10.972, "eval_wer": 0.37271619975639464, "step": 40900 }, { "epoch": 6.67, "learning_rate": 7.3568281938326e-05, "loss": NaN, "step": 41000 }, { "epoch": 6.67, "eval_loss": 0.43189141154289246, "eval_runtime": 7.7905, "eval_samples_per_second": 12.836, "eval_wer": 0.38855054811205847, "step": 41000 }, { "epoch": 6.68, "learning_rate": 7.350301843693914e-05, "loss": NaN, "step": 41100 }, { "epoch": 6.68, "eval_loss": 0.4479624032974243, "eval_runtime": 6.7026, "eval_samples_per_second": 14.919, "eval_wer": 0.392204628501827, "step": 41100 }, { "epoch": 6.7, "learning_rate": 7.34377549355523e-05, "loss": NaN, "step": 41200 }, { "epoch": 6.7, "eval_loss": 0.5534685254096985, "eval_runtime": 7.9313, "eval_samples_per_second": 12.608, "eval_wer": 0.392204628501827, "step": 41200 }, { "epoch": 6.72, "learning_rate": 7.337249143416544e-05, "loss": NaN, "step": 41300 }, { "epoch": 6.72, "eval_loss": 0.42362719774246216, "eval_runtime": 7.9752, "eval_samples_per_second": 12.539, "eval_wer": 0.3763702801461632, "step": 41300 }, { "epoch": 6.73, "learning_rate": 7.33072279327786e-05, "loss": NaN, "step": 41400 }, { "epoch": 6.73, "eval_loss": 0.4316897690296173, "eval_runtime": 9.0445, "eval_samples_per_second": 11.056, "eval_wer": 0.3800243605359318, "step": 41400 }, { "epoch": 6.75, "learning_rate": 7.324196443139175e-05, "loss": NaN, "step": 41500 }, { "epoch": 6.75, "eval_loss": 0.4458038806915283, "eval_runtime": 8.5585, "eval_samples_per_second": 11.684, "eval_wer": 0.38246041412911086, "step": 41500 }, { "epoch": 6.77, "learning_rate": 7.31767009300049e-05, "loss": NaN, "step": 41600 }, { "epoch": 6.77, "eval_loss": 0.4252176582813263, "eval_runtime": 6.9682, "eval_samples_per_second": 14.351, "eval_wer": 0.38855054811205847, "step": 41600 }, { "epoch": 6.78, "learning_rate": 7.311143742861805e-05, "loss": NaN, "step": 41700 }, { "epoch": 6.78, "eval_loss": 0.42161300778388977, "eval_runtime": 8.2804, "eval_samples_per_second": 12.077, "eval_wer": 0.36053593179049936, "step": 41700 }, { "epoch": 6.8, "learning_rate": 7.30461739272312e-05, "loss": NaN, "step": 41800 }, { "epoch": 6.8, "eval_loss": 0.43236517906188965, "eval_runtime": 6.8741, "eval_samples_per_second": 14.547, "eval_wer": 0.3763702801461632, "step": 41800 }, { "epoch": 6.81, "learning_rate": 7.298091042584436e-05, "loss": NaN, "step": 41900 }, { "epoch": 6.81, "eval_loss": 0.42260417342185974, "eval_runtime": 8.7571, "eval_samples_per_second": 11.419, "eval_wer": 0.3763702801461632, "step": 41900 }, { "epoch": 6.83, "learning_rate": 7.29156469244575e-05, "loss": NaN, "step": 42000 }, { "epoch": 6.83, "eval_loss": 0.4526902735233307, "eval_runtime": 9.9377, "eval_samples_per_second": 10.063, "eval_wer": 0.364190012180268, "step": 42000 }, { "epoch": 6.85, "learning_rate": 7.285038342307066e-05, "loss": NaN, "step": 42100 }, { "epoch": 6.85, "eval_loss": 0.4244474768638611, "eval_runtime": 7.3805, "eval_samples_per_second": 13.549, "eval_wer": 0.3861144945188794, "step": 42100 }, { "epoch": 6.86, "learning_rate": 7.278511992168379e-05, "loss": NaN, "step": 42200 }, { "epoch": 6.86, "eval_loss": 0.3987332284450531, "eval_runtime": 7.9724, "eval_samples_per_second": 12.543, "eval_wer": 0.3690621193666261, "step": 42200 }, { "epoch": 6.88, "learning_rate": 7.271985642029695e-05, "loss": NaN, "step": 42300 }, { "epoch": 6.88, "eval_loss": 0.4404261112213135, "eval_runtime": 8.8576, "eval_samples_per_second": 11.29, "eval_wer": 0.38976857490864797, "step": 42300 }, { "epoch": 6.9, "learning_rate": 7.265459291891011e-05, "loss": NaN, "step": 42400 }, { "epoch": 6.9, "eval_loss": 0.4243963658809662, "eval_runtime": 9.9726, "eval_samples_per_second": 10.027, "eval_wer": 0.37758830694275275, "step": 42400 }, { "epoch": 6.91, "learning_rate": 7.258932941752325e-05, "loss": NaN, "step": 42500 }, { "epoch": 6.91, "eval_loss": 0.44823479652404785, "eval_runtime": 9.933, "eval_samples_per_second": 10.067, "eval_wer": 0.3995127892813642, "step": 42500 }, { "epoch": 6.93, "learning_rate": 7.252406591613641e-05, "loss": NaN, "step": 42600 }, { "epoch": 6.93, "eval_loss": 0.39962050318717957, "eval_runtime": 6.5522, "eval_samples_per_second": 15.262, "eval_wer": 0.3848964677222899, "step": 42600 }, { "epoch": 6.94, "learning_rate": 7.245880241474956e-05, "loss": NaN, "step": 42700 }, { "epoch": 6.94, "eval_loss": 0.43537867069244385, "eval_runtime": 7.7406, "eval_samples_per_second": 12.919, "eval_wer": 0.3812423873325213, "step": 42700 }, { "epoch": 6.96, "learning_rate": 7.23935389133627e-05, "loss": NaN, "step": 42800 }, { "epoch": 6.96, "eval_loss": 0.43869927525520325, "eval_runtime": 8.2951, "eval_samples_per_second": 12.055, "eval_wer": 0.392204628501827, "step": 42800 }, { "epoch": 6.98, "learning_rate": 7.232827541197585e-05, "loss": NaN, "step": 42900 }, { "epoch": 6.98, "eval_loss": 0.4649328589439392, "eval_runtime": 8.5972, "eval_samples_per_second": 11.632, "eval_wer": 0.4092570036540804, "step": 42900 }, { "epoch": 6.99, "learning_rate": 7.2263011910589e-05, "loss": NaN, "step": 43000 }, { "epoch": 6.99, "eval_loss": 0.3986141085624695, "eval_runtime": 10.2183, "eval_samples_per_second": 9.786, "eval_wer": 0.37149817295980514, "step": 43000 }, { "epoch": 7.01, "learning_rate": 7.219774840920217e-05, "loss": NaN, "step": 43100 }, { "epoch": 7.01, "eval_loss": 0.41271498799324036, "eval_runtime": 8.2539, "eval_samples_per_second": 12.116, "eval_wer": 0.39585870889159563, "step": 43100 }, { "epoch": 7.03, "learning_rate": 7.213248490781531e-05, "loss": NaN, "step": 43200 }, { "epoch": 7.03, "eval_loss": 0.42347651720046997, "eval_runtime": 6.7075, "eval_samples_per_second": 14.909, "eval_wer": 0.3848964677222899, "step": 43200 }, { "epoch": 7.04, "learning_rate": 7.206722140642846e-05, "loss": NaN, "step": 43300 }, { "epoch": 7.04, "eval_loss": 0.4063185453414917, "eval_runtime": 7.6729, "eval_samples_per_second": 13.033, "eval_wer": 0.36662606577344703, "step": 43300 }, { "epoch": 7.06, "learning_rate": 7.20019579050416e-05, "loss": NaN, "step": 43400 }, { "epoch": 7.06, "eval_loss": 0.49583899974823, "eval_runtime": 6.9774, "eval_samples_per_second": 14.332, "eval_wer": 0.38855054811205847, "step": 43400 }, { "epoch": 7.07, "learning_rate": 7.193669440365476e-05, "loss": NaN, "step": 43500 }, { "epoch": 7.07, "eval_loss": 0.4709340035915375, "eval_runtime": 7.0993, "eval_samples_per_second": 14.086, "eval_wer": 0.4056029232643118, "step": 43500 }, { "epoch": 7.09, "learning_rate": 7.18714309022679e-05, "loss": NaN, "step": 43600 }, { "epoch": 7.09, "eval_loss": 0.45330917835235596, "eval_runtime": 6.7893, "eval_samples_per_second": 14.729, "eval_wer": 0.3702801461632156, "step": 43600 }, { "epoch": 7.11, "learning_rate": 7.180616740088106e-05, "loss": NaN, "step": 43700 }, { "epoch": 7.11, "eval_loss": 0.444570392370224, "eval_runtime": 7.3413, "eval_samples_per_second": 13.622, "eval_wer": 0.4043848964677223, "step": 43700 }, { "epoch": 7.12, "learning_rate": 7.174090389949422e-05, "loss": NaN, "step": 43800 }, { "epoch": 7.12, "eval_loss": 0.42336639761924744, "eval_runtime": 7.0892, "eval_samples_per_second": 14.106, "eval_wer": 0.3690621193666261, "step": 43800 }, { "epoch": 7.14, "learning_rate": 7.167564039810735e-05, "loss": NaN, "step": 43900 }, { "epoch": 7.14, "eval_loss": 0.4557478427886963, "eval_runtime": 9.6857, "eval_samples_per_second": 10.325, "eval_wer": 0.38246041412911086, "step": 43900 }, { "epoch": 7.16, "learning_rate": 7.161037689672051e-05, "loss": NaN, "step": 44000 }, { "epoch": 7.16, "eval_loss": 0.4820619225502014, "eval_runtime": 8.8382, "eval_samples_per_second": 11.314, "eval_wer": 0.37393422655298414, "step": 44000 }, { "epoch": 7.17, "learning_rate": 7.154511339533366e-05, "loss": NaN, "step": 44100 }, { "epoch": 7.17, "eval_loss": 0.4444971978664398, "eval_runtime": 9.4662, "eval_samples_per_second": 10.564, "eval_wer": 0.38976857490864797, "step": 44100 }, { "epoch": 7.19, "learning_rate": 7.147984989394682e-05, "loss": NaN, "step": 44200 }, { "epoch": 7.19, "eval_loss": 0.4306584596633911, "eval_runtime": 9.2167, "eval_samples_per_second": 10.85, "eval_wer": 0.37758830694275275, "step": 44200 }, { "epoch": 7.2, "learning_rate": 7.141458639255996e-05, "loss": NaN, "step": 44300 }, { "epoch": 7.2, "eval_loss": 0.43316277861595154, "eval_runtime": 6.9757, "eval_samples_per_second": 14.336, "eval_wer": 0.364190012180268, "step": 44300 }, { "epoch": 7.22, "learning_rate": 7.13493228911731e-05, "loss": NaN, "step": 44400 }, { "epoch": 7.22, "eval_loss": 0.4009106755256653, "eval_runtime": 7.8376, "eval_samples_per_second": 12.759, "eval_wer": 0.3629719853836784, "step": 44400 }, { "epoch": 7.24, "learning_rate": 7.128405938978626e-05, "loss": NaN, "step": 44500 }, { "epoch": 7.24, "eval_loss": 0.3961714804172516, "eval_runtime": 7.8289, "eval_samples_per_second": 12.773, "eval_wer": 0.3629719853836784, "step": 44500 }, { "epoch": 7.25, "learning_rate": 7.121879588839941e-05, "loss": NaN, "step": 44600 }, { "epoch": 7.25, "eval_loss": 0.4771730303764343, "eval_runtime": 10.2069, "eval_samples_per_second": 9.797, "eval_wer": 0.3861144945188794, "step": 44600 }, { "epoch": 7.27, "learning_rate": 7.115353238701257e-05, "loss": NaN, "step": 44700 }, { "epoch": 7.27, "eval_loss": 0.41656962037086487, "eval_runtime": 8.6363, "eval_samples_per_second": 11.579, "eval_wer": 0.3751522533495737, "step": 44700 }, { "epoch": 7.29, "learning_rate": 7.108826888562571e-05, "loss": NaN, "step": 44800 }, { "epoch": 7.29, "eval_loss": 0.4536881744861603, "eval_runtime": 6.9673, "eval_samples_per_second": 14.353, "eval_wer": 0.3909866017052375, "step": 44800 }, { "epoch": 7.3, "learning_rate": 7.102300538423887e-05, "loss": NaN, "step": 44900 }, { "epoch": 7.3, "eval_loss": 0.4048987627029419, "eval_runtime": 7.9455, "eval_samples_per_second": 12.586, "eval_wer": 0.37758830694275275, "step": 44900 }, { "epoch": 7.32, "learning_rate": 7.095774188285202e-05, "loss": NaN, "step": 45000 }, { "epoch": 7.32, "eval_loss": 0.4246349334716797, "eval_runtime": 7.4556, "eval_samples_per_second": 13.413, "eval_wer": 0.3861144945188794, "step": 45000 }, { "epoch": 7.33, "learning_rate": 7.089247838146516e-05, "loss": NaN, "step": 45100 }, { "epoch": 7.33, "eval_loss": 0.49522098898887634, "eval_runtime": 6.8596, "eval_samples_per_second": 14.578, "eval_wer": 0.38246041412911086, "step": 45100 }, { "epoch": 7.35, "learning_rate": 7.082721488007832e-05, "loss": NaN, "step": 45200 }, { "epoch": 7.35, "eval_loss": 0.47712311148643494, "eval_runtime": 9.0655, "eval_samples_per_second": 11.031, "eval_wer": 0.40194884287454324, "step": 45200 }, { "epoch": 7.37, "learning_rate": 7.076195137869147e-05, "loss": NaN, "step": 45300 }, { "epoch": 7.37, "eval_loss": 0.407779723405838, "eval_runtime": 8.3949, "eval_samples_per_second": 11.912, "eval_wer": 0.3861144945188794, "step": 45300 }, { "epoch": 7.38, "learning_rate": 7.069668787730463e-05, "loss": NaN, "step": 45400 }, { "epoch": 7.38, "eval_loss": 0.42167598009109497, "eval_runtime": 7.6909, "eval_samples_per_second": 13.002, "eval_wer": 0.38976857490864797, "step": 45400 }, { "epoch": 7.4, "learning_rate": 7.063142437591777e-05, "loss": NaN, "step": 45500 }, { "epoch": 7.4, "eval_loss": 0.46571946144104004, "eval_runtime": 8.1474, "eval_samples_per_second": 12.274, "eval_wer": 0.3934226552984166, "step": 45500 }, { "epoch": 7.42, "learning_rate": 7.056616087453092e-05, "loss": NaN, "step": 45600 }, { "epoch": 7.42, "eval_loss": 0.40125495195388794, "eval_runtime": 7.1588, "eval_samples_per_second": 13.969, "eval_wer": 0.4007308160779537, "step": 45600 }, { "epoch": 7.43, "learning_rate": 7.050089737314407e-05, "loss": NaN, "step": 45700 }, { "epoch": 7.43, "eval_loss": 0.41013047099113464, "eval_runtime": 8.2392, "eval_samples_per_second": 12.137, "eval_wer": 0.39707673568818513, "step": 45700 }, { "epoch": 7.45, "learning_rate": 7.043563387175722e-05, "loss": NaN, "step": 45800 }, { "epoch": 7.45, "eval_loss": 0.3986717164516449, "eval_runtime": 6.5584, "eval_samples_per_second": 15.248, "eval_wer": 0.37393422655298414, "step": 45800 }, { "epoch": 7.46, "learning_rate": 7.037037037037038e-05, "loss": NaN, "step": 45900 }, { "epoch": 7.46, "eval_loss": 0.3988329768180847, "eval_runtime": 8.4951, "eval_samples_per_second": 11.771, "eval_wer": 0.3763702801461632, "step": 45900 }, { "epoch": 7.48, "learning_rate": 7.030510686898352e-05, "loss": NaN, "step": 46000 }, { "epoch": 7.48, "eval_loss": 0.45179134607315063, "eval_runtime": 9.3929, "eval_samples_per_second": 10.646, "eval_wer": 0.3800243605359318, "step": 46000 }, { "epoch": 7.5, "learning_rate": 7.023984336759667e-05, "loss": NaN, "step": 46100 }, { "epoch": 7.5, "eval_loss": 0.4907733201980591, "eval_runtime": 8.1588, "eval_samples_per_second": 12.257, "eval_wer": 0.41169305724725946, "step": 46100 }, { "epoch": 7.51, "learning_rate": 7.017457986620983e-05, "loss": NaN, "step": 46200 }, { "epoch": 7.51, "eval_loss": 0.4354599416255951, "eval_runtime": 7.4922, "eval_samples_per_second": 13.347, "eval_wer": 0.3909866017052375, "step": 46200 }, { "epoch": 7.53, "learning_rate": 7.010931636482297e-05, "loss": NaN, "step": 46300 }, { "epoch": 7.53, "eval_loss": 0.4466521441936493, "eval_runtime": 10.9543, "eval_samples_per_second": 9.129, "eval_wer": 0.3909866017052375, "step": 46300 }, { "epoch": 7.55, "learning_rate": 7.004405286343613e-05, "loss": NaN, "step": 46400 }, { "epoch": 7.55, "eval_loss": 0.4440977871417999, "eval_runtime": 9.6264, "eval_samples_per_second": 10.388, "eval_wer": 0.40316686967113274, "step": 46400 }, { "epoch": 7.56, "learning_rate": 6.997878936204928e-05, "loss": NaN, "step": 46500 }, { "epoch": 7.56, "eval_loss": 0.40619930624961853, "eval_runtime": 8.2096, "eval_samples_per_second": 12.181, "eval_wer": 0.37149817295980514, "step": 46500 }, { "epoch": 7.58, "learning_rate": 6.991352586066243e-05, "loss": NaN, "step": 46600 }, { "epoch": 7.58, "eval_loss": 0.4126388430595398, "eval_runtime": 8.8109, "eval_samples_per_second": 11.35, "eval_wer": 0.3909866017052375, "step": 46600 }, { "epoch": 7.59, "learning_rate": 6.984826235927558e-05, "loss": NaN, "step": 46700 }, { "epoch": 7.59, "eval_loss": 0.41685402393341064, "eval_runtime": 8.6911, "eval_samples_per_second": 11.506, "eval_wer": 0.3800243605359318, "step": 46700 }, { "epoch": 7.61, "learning_rate": 6.978299885788873e-05, "loss": NaN, "step": 46800 }, { "epoch": 7.61, "eval_loss": 0.42471861839294434, "eval_runtime": 6.7824, "eval_samples_per_second": 14.744, "eval_wer": 0.39585870889159563, "step": 46800 }, { "epoch": 7.63, "learning_rate": 6.971773535650188e-05, "loss": NaN, "step": 46900 }, { "epoch": 7.63, "eval_loss": 0.4128079116344452, "eval_runtime": 7.183, "eval_samples_per_second": 13.922, "eval_wer": 0.3946406820950061, "step": 46900 }, { "epoch": 7.64, "learning_rate": 6.965247185511503e-05, "loss": NaN, "step": 47000 }, { "epoch": 7.64, "eval_loss": 0.3996775448322296, "eval_runtime": 8.3343, "eval_samples_per_second": 11.999, "eval_wer": 0.3654080389768575, "step": 47000 }, { "epoch": 7.66, "learning_rate": 6.958720835372819e-05, "loss": NaN, "step": 47100 }, { "epoch": 7.66, "eval_loss": 0.3690239191055298, "eval_runtime": 6.5963, "eval_samples_per_second": 15.16, "eval_wer": 0.37880633373934225, "step": 47100 }, { "epoch": 7.68, "learning_rate": 6.952194485234133e-05, "loss": NaN, "step": 47200 }, { "epoch": 7.68, "eval_loss": 0.42326632142066956, "eval_runtime": 8.3908, "eval_samples_per_second": 11.918, "eval_wer": 0.3909866017052375, "step": 47200 }, { "epoch": 7.69, "learning_rate": 6.945668135095448e-05, "loss": NaN, "step": 47300 }, { "epoch": 7.69, "eval_loss": 0.39741602540016174, "eval_runtime": 8.5855, "eval_samples_per_second": 11.648, "eval_wer": 0.36784409257003653, "step": 47300 }, { "epoch": 7.71, "learning_rate": 6.939141784956764e-05, "loss": NaN, "step": 47400 }, { "epoch": 7.71, "eval_loss": 0.42626139521598816, "eval_runtime": 8.2558, "eval_samples_per_second": 12.113, "eval_wer": 0.3982947624847747, "step": 47400 }, { "epoch": 7.72, "learning_rate": 6.932615434818078e-05, "loss": NaN, "step": 47500 }, { "epoch": 7.72, "eval_loss": 0.41164088249206543, "eval_runtime": 7.9604, "eval_samples_per_second": 12.562, "eval_wer": 0.392204628501827, "step": 47500 }, { "epoch": 7.74, "learning_rate": 6.926089084679394e-05, "loss": NaN, "step": 47600 }, { "epoch": 7.74, "eval_loss": 0.41196590662002563, "eval_runtime": 7.4856, "eval_samples_per_second": 13.359, "eval_wer": 0.3654080389768575, "step": 47600 }, { "epoch": 7.76, "learning_rate": 6.919562734540709e-05, "loss": NaN, "step": 47700 }, { "epoch": 7.76, "eval_loss": 0.4575519263744354, "eval_runtime": 7.5753, "eval_samples_per_second": 13.201, "eval_wer": 0.392204628501827, "step": 47700 }, { "epoch": 7.77, "learning_rate": 6.913036384402023e-05, "loss": NaN, "step": 47800 }, { "epoch": 7.77, "eval_loss": 0.47335246205329895, "eval_runtime": 8.6796, "eval_samples_per_second": 11.521, "eval_wer": 0.40194884287454324, "step": 47800 }, { "epoch": 7.79, "learning_rate": 6.906510034263338e-05, "loss": NaN, "step": 47900 }, { "epoch": 7.79, "eval_loss": 0.46512919664382935, "eval_runtime": 7.9927, "eval_samples_per_second": 12.511, "eval_wer": 0.3873325213154689, "step": 47900 }, { "epoch": 7.81, "learning_rate": 6.899983684124653e-05, "loss": NaN, "step": 48000 }, { "epoch": 7.81, "eval_loss": 0.45921266078948975, "eval_runtime": 8.1681, "eval_samples_per_second": 12.243, "eval_wer": 0.3946406820950061, "step": 48000 }, { "epoch": 7.82, "learning_rate": 6.89345733398597e-05, "loss": NaN, "step": 48100 }, { "epoch": 7.82, "eval_loss": 0.4549075961112976, "eval_runtime": 9.0376, "eval_samples_per_second": 11.065, "eval_wer": 0.38246041412911086, "step": 48100 }, { "epoch": 7.84, "learning_rate": 6.886930983847284e-05, "loss": NaN, "step": 48200 }, { "epoch": 7.84, "eval_loss": 0.45289474725723267, "eval_runtime": 7.9376, "eval_samples_per_second": 12.598, "eval_wer": 0.3873325213154689, "step": 48200 }, { "epoch": 7.85, "learning_rate": 6.8804046337086e-05, "loss": NaN, "step": 48300 }, { "epoch": 7.85, "eval_loss": 0.4604376256465912, "eval_runtime": 8.0346, "eval_samples_per_second": 12.446, "eval_wer": 0.3861144945188794, "step": 48300 }, { "epoch": 7.87, "learning_rate": 6.873878283569913e-05, "loss": NaN, "step": 48400 }, { "epoch": 7.87, "eval_loss": 0.42993414402008057, "eval_runtime": 9.3655, "eval_samples_per_second": 10.677, "eval_wer": 0.38367844092570036, "step": 48400 }, { "epoch": 7.89, "learning_rate": 6.867351933431229e-05, "loss": NaN, "step": 48500 }, { "epoch": 7.89, "eval_loss": 0.5003374218940735, "eval_runtime": 9.3394, "eval_samples_per_second": 10.707, "eval_wer": 0.3946406820950061, "step": 48500 }, { "epoch": 7.9, "learning_rate": 6.860825583292543e-05, "loss": NaN, "step": 48600 }, { "epoch": 7.9, "eval_loss": 0.4476844072341919, "eval_runtime": 8.2996, "eval_samples_per_second": 12.049, "eval_wer": 0.3982947624847747, "step": 48600 }, { "epoch": 7.92, "learning_rate": 6.854299233153859e-05, "loss": NaN, "step": 48700 }, { "epoch": 7.92, "eval_loss": 0.4162767827510834, "eval_runtime": 7.2206, "eval_samples_per_second": 13.849, "eval_wer": 0.3861144945188794, "step": 48700 }, { "epoch": 7.94, "learning_rate": 6.847772883015175e-05, "loss": NaN, "step": 48800 }, { "epoch": 7.94, "eval_loss": 0.5044607520103455, "eval_runtime": 8.7024, "eval_samples_per_second": 11.491, "eval_wer": 0.3909866017052375, "step": 48800 }, { "epoch": 7.95, "learning_rate": 6.84124653287649e-05, "loss": NaN, "step": 48900 }, { "epoch": 7.95, "eval_loss": 0.42168164253234863, "eval_runtime": 6.5122, "eval_samples_per_second": 15.356, "eval_wer": 0.3800243605359318, "step": 48900 }, { "epoch": 7.97, "learning_rate": 6.834720182737804e-05, "loss": NaN, "step": 49000 }, { "epoch": 7.97, "eval_loss": 0.4774813950061798, "eval_runtime": 8.4021, "eval_samples_per_second": 11.902, "eval_wer": 0.3873325213154689, "step": 49000 }, { "epoch": 7.99, "learning_rate": 6.828193832599119e-05, "loss": NaN, "step": 49100 }, { "epoch": 7.99, "eval_loss": 0.47412794828414917, "eval_runtime": 7.8667, "eval_samples_per_second": 12.712, "eval_wer": 0.3946406820950061, "step": 49100 }, { "epoch": 8.0, "learning_rate": 6.821667482460434e-05, "loss": NaN, "step": 49200 }, { "epoch": 8.0, "eval_loss": 0.4439965784549713, "eval_runtime": 8.4464, "eval_samples_per_second": 11.839, "eval_wer": 0.3873325213154689, "step": 49200 }, { "epoch": 8.02, "learning_rate": 6.815141132321749e-05, "loss": NaN, "step": 49300 }, { "epoch": 8.02, "eval_loss": 0.47220298647880554, "eval_runtime": 8.4551, "eval_samples_per_second": 11.827, "eval_wer": 0.38367844092570036, "step": 49300 }, { "epoch": 8.03, "learning_rate": 6.808614782183065e-05, "loss": NaN, "step": 49400 }, { "epoch": 8.03, "eval_loss": 0.41892436146736145, "eval_runtime": 7.9787, "eval_samples_per_second": 12.533, "eval_wer": 0.37880633373934225, "step": 49400 }, { "epoch": 8.05, "learning_rate": 6.802088432044379e-05, "loss": NaN, "step": 49500 }, { "epoch": 8.05, "eval_loss": 0.4536736309528351, "eval_runtime": 7.9322, "eval_samples_per_second": 12.607, "eval_wer": 0.39585870889159563, "step": 49500 }, { "epoch": 8.07, "learning_rate": 6.795562081905694e-05, "loss": NaN, "step": 49600 }, { "epoch": 8.07, "eval_loss": 0.45775213837623596, "eval_runtime": 8.207, "eval_samples_per_second": 12.185, "eval_wer": 0.3873325213154689, "step": 49600 }, { "epoch": 8.08, "learning_rate": 6.78903573176701e-05, "loss": NaN, "step": 49700 }, { "epoch": 8.08, "eval_loss": 0.44402602314949036, "eval_runtime": 8.5892, "eval_samples_per_second": 11.643, "eval_wer": 0.38976857490864797, "step": 49700 }, { "epoch": 8.1, "learning_rate": 6.782509381628324e-05, "loss": NaN, "step": 49800 }, { "epoch": 8.1, "eval_loss": 0.46547335386276245, "eval_runtime": 9.3683, "eval_samples_per_second": 10.674, "eval_wer": 0.3934226552984166, "step": 49800 }, { "epoch": 8.12, "learning_rate": 6.77598303148964e-05, "loss": NaN, "step": 49900 }, { "epoch": 8.12, "eval_loss": 0.46032240986824036, "eval_runtime": 8.8425, "eval_samples_per_second": 11.309, "eval_wer": 0.3848964677222899, "step": 49900 }, { "epoch": 8.13, "learning_rate": 6.769456681350955e-05, "loss": NaN, "step": 50000 }, { "epoch": 8.13, "eval_loss": 0.4585595726966858, "eval_runtime": 8.5708, "eval_samples_per_second": 11.667, "eval_wer": 0.3848964677222899, "step": 50000 }, { "epoch": 8.15, "learning_rate": 6.762930331212269e-05, "loss": NaN, "step": 50100 }, { "epoch": 8.15, "eval_loss": 0.41307058930397034, "eval_runtime": 7.0952, "eval_samples_per_second": 14.094, "eval_wer": 0.37271619975639464, "step": 50100 }, { "epoch": 8.16, "learning_rate": 6.756403981073585e-05, "loss": NaN, "step": 50200 }, { "epoch": 8.16, "eval_loss": 0.41041550040245056, "eval_runtime": 7.1426, "eval_samples_per_second": 14.001, "eval_wer": 0.36784409257003653, "step": 50200 }, { "epoch": 8.18, "learning_rate": 6.7498776309349e-05, "loss": NaN, "step": 50300 }, { "epoch": 8.18, "eval_loss": 0.44717052578926086, "eval_runtime": 7.0047, "eval_samples_per_second": 14.276, "eval_wer": 0.39707673568818513, "step": 50300 }, { "epoch": 8.2, "learning_rate": 6.743351280796215e-05, "loss": NaN, "step": 50400 }, { "epoch": 8.2, "eval_loss": 0.5247046947479248, "eval_runtime": 7.6638, "eval_samples_per_second": 13.048, "eval_wer": 0.3982947624847747, "step": 50400 }, { "epoch": 8.21, "learning_rate": 6.73682493065753e-05, "loss": NaN, "step": 50500 }, { "epoch": 8.21, "eval_loss": 0.5030866861343384, "eval_runtime": 7.6449, "eval_samples_per_second": 13.081, "eval_wer": 0.38246041412911086, "step": 50500 }, { "epoch": 8.23, "learning_rate": 6.730298580518846e-05, "loss": NaN, "step": 50600 }, { "epoch": 8.23, "eval_loss": 0.4644200801849365, "eval_runtime": 7.0234, "eval_samples_per_second": 14.238, "eval_wer": 0.364190012180268, "step": 50600 }, { "epoch": 8.25, "learning_rate": 6.72377223038016e-05, "loss": NaN, "step": 50700 }, { "epoch": 8.25, "eval_loss": 0.4306560158729553, "eval_runtime": 8.0867, "eval_samples_per_second": 12.366, "eval_wer": 0.3800243605359318, "step": 50700 }, { "epoch": 8.26, "learning_rate": 6.717245880241475e-05, "loss": NaN, "step": 50800 }, { "epoch": 8.26, "eval_loss": 0.45848017930984497, "eval_runtime": 8.7036, "eval_samples_per_second": 11.489, "eval_wer": 0.39707673568818513, "step": 50800 }, { "epoch": 8.28, "learning_rate": 6.71071953010279e-05, "loss": NaN, "step": 50900 }, { "epoch": 8.28, "eval_loss": 0.5098088979721069, "eval_runtime": 7.2954, "eval_samples_per_second": 13.707, "eval_wer": 0.3861144945188794, "step": 50900 }, { "epoch": 8.29, "learning_rate": 6.704193179964105e-05, "loss": NaN, "step": 51000 }, { "epoch": 8.29, "eval_loss": 0.5031391382217407, "eval_runtime": 7.9446, "eval_samples_per_second": 12.587, "eval_wer": 0.3934226552984166, "step": 51000 }, { "epoch": 8.31, "learning_rate": 6.697666829825421e-05, "loss": NaN, "step": 51100 }, { "epoch": 8.31, "eval_loss": 0.455885648727417, "eval_runtime": 8.4028, "eval_samples_per_second": 11.901, "eval_wer": 0.392204628501827, "step": 51100 }, { "epoch": 8.33, "learning_rate": 6.691140479686736e-05, "loss": NaN, "step": 51200 }, { "epoch": 8.33, "eval_loss": 0.4358394145965576, "eval_runtime": 9.3301, "eval_samples_per_second": 10.718, "eval_wer": 0.3702801461632156, "step": 51200 }, { "epoch": 8.34, "learning_rate": 6.68461412954805e-05, "loss": NaN, "step": 51300 }, { "epoch": 8.34, "eval_loss": 0.4508705139160156, "eval_runtime": 7.2511, "eval_samples_per_second": 13.791, "eval_wer": 0.37880633373934225, "step": 51300 }, { "epoch": 8.36, "learning_rate": 6.678087779409366e-05, "loss": NaN, "step": 51400 }, { "epoch": 8.36, "eval_loss": 0.5324064493179321, "eval_runtime": 7.3965, "eval_samples_per_second": 13.52, "eval_wer": 0.37880633373934225, "step": 51400 }, { "epoch": 8.38, "learning_rate": 6.67156142927068e-05, "loss": NaN, "step": 51500 }, { "epoch": 8.38, "eval_loss": 0.4332933723926544, "eval_runtime": 7.9068, "eval_samples_per_second": 12.647, "eval_wer": 0.3751522533495737, "step": 51500 }, { "epoch": 8.39, "learning_rate": 6.665035079131996e-05, "loss": NaN, "step": 51600 }, { "epoch": 8.39, "eval_loss": 0.5386966466903687, "eval_runtime": 6.9317, "eval_samples_per_second": 14.426, "eval_wer": 0.364190012180268, "step": 51600 }, { "epoch": 8.41, "learning_rate": 6.658508728993311e-05, "loss": NaN, "step": 51700 }, { "epoch": 8.41, "eval_loss": 0.47883322834968567, "eval_runtime": 8.0805, "eval_samples_per_second": 12.376, "eval_wer": 0.3861144945188794, "step": 51700 }, { "epoch": 8.42, "learning_rate": 6.651982378854625e-05, "loss": NaN, "step": 51800 }, { "epoch": 8.42, "eval_loss": 0.49707546830177307, "eval_runtime": 6.9503, "eval_samples_per_second": 14.388, "eval_wer": 0.3763702801461632, "step": 51800 }, { "epoch": 8.44, "learning_rate": 6.645456028715941e-05, "loss": NaN, "step": 51900 }, { "epoch": 8.44, "eval_loss": 0.4724676012992859, "eval_runtime": 8.5223, "eval_samples_per_second": 11.734, "eval_wer": 0.37758830694275275, "step": 51900 }, { "epoch": 8.46, "learning_rate": 6.638929678577256e-05, "loss": NaN, "step": 52000 }, { "epoch": 8.46, "eval_loss": 0.49637308716773987, "eval_runtime": 6.8621, "eval_samples_per_second": 14.573, "eval_wer": 0.37393422655298414, "step": 52000 }, { "epoch": 8.47, "learning_rate": 6.632403328438572e-05, "loss": NaN, "step": 52100 }, { "epoch": 8.47, "eval_loss": 0.46207770705223083, "eval_runtime": 9.6685, "eval_samples_per_second": 10.343, "eval_wer": 0.3812423873325213, "step": 52100 }, { "epoch": 8.49, "learning_rate": 6.625876978299886e-05, "loss": NaN, "step": 52200 }, { "epoch": 8.49, "eval_loss": 0.47856566309928894, "eval_runtime": 9.3206, "eval_samples_per_second": 10.729, "eval_wer": 0.3751522533495737, "step": 52200 }, { "epoch": 8.51, "learning_rate": 6.619350628161202e-05, "loss": NaN, "step": 52300 }, { "epoch": 8.51, "eval_loss": 0.49372223019599915, "eval_runtime": 8.558, "eval_samples_per_second": 11.685, "eval_wer": 0.3873325213154689, "step": 52300 }, { "epoch": 8.52, "learning_rate": 6.612824278022516e-05, "loss": NaN, "step": 52400 }, { "epoch": 8.52, "eval_loss": 0.4097326695919037, "eval_runtime": 7.8765, "eval_samples_per_second": 12.696, "eval_wer": 0.3568818514007308, "step": 52400 }, { "epoch": 8.54, "learning_rate": 6.606297927883831e-05, "loss": NaN, "step": 52500 }, { "epoch": 8.54, "eval_loss": 0.510248601436615, "eval_runtime": 8.7686, "eval_samples_per_second": 11.404, "eval_wer": 0.3751522533495737, "step": 52500 }, { "epoch": 8.55, "learning_rate": 6.599771577745147e-05, "loss": NaN, "step": 52600 }, { "epoch": 8.55, "eval_loss": 0.4330621063709259, "eval_runtime": 7.4599, "eval_samples_per_second": 13.405, "eval_wer": 0.36662606577344703, "step": 52600 }, { "epoch": 8.57, "learning_rate": 6.593245227606461e-05, "loss": NaN, "step": 52700 }, { "epoch": 8.57, "eval_loss": 0.4965771436691284, "eval_runtime": 9.6722, "eval_samples_per_second": 10.339, "eval_wer": 0.392204628501827, "step": 52700 }, { "epoch": 8.59, "learning_rate": 6.586718877467777e-05, "loss": NaN, "step": 52800 }, { "epoch": 8.59, "eval_loss": 0.5258552432060242, "eval_runtime": 8.3154, "eval_samples_per_second": 12.026, "eval_wer": 0.3934226552984166, "step": 52800 }, { "epoch": 8.6, "learning_rate": 6.58019252732909e-05, "loss": NaN, "step": 52900 }, { "epoch": 8.6, "eval_loss": 0.47305095195770264, "eval_runtime": 8.8487, "eval_samples_per_second": 11.301, "eval_wer": 0.3873325213154689, "step": 52900 }, { "epoch": 8.62, "learning_rate": 6.573666177190406e-05, "loss": NaN, "step": 53000 }, { "epoch": 8.62, "eval_loss": 0.5063592791557312, "eval_runtime": 8.5975, "eval_samples_per_second": 11.631, "eval_wer": 0.39585870889159563, "step": 53000 }, { "epoch": 8.64, "learning_rate": 6.567139827051722e-05, "loss": NaN, "step": 53100 }, { "epoch": 8.64, "eval_loss": 0.5428659319877625, "eval_runtime": 8.4203, "eval_samples_per_second": 11.876, "eval_wer": 0.3800243605359318, "step": 53100 }, { "epoch": 8.65, "learning_rate": 6.560613476913037e-05, "loss": NaN, "step": 53200 }, { "epoch": 8.65, "eval_loss": 0.44813072681427, "eval_runtime": 8.2801, "eval_samples_per_second": 12.077, "eval_wer": 0.37880633373934225, "step": 53200 }, { "epoch": 8.67, "learning_rate": 6.554087126774353e-05, "loss": NaN, "step": 53300 }, { "epoch": 8.67, "eval_loss": 0.4521804451942444, "eval_runtime": 8.2143, "eval_samples_per_second": 12.174, "eval_wer": 0.37393422655298414, "step": 53300 }, { "epoch": 8.68, "learning_rate": 6.547560776635667e-05, "loss": NaN, "step": 53400 }, { "epoch": 8.68, "eval_loss": 0.45459070801734924, "eval_runtime": 8.9144, "eval_samples_per_second": 11.218, "eval_wer": 0.37149817295980514, "step": 53400 }, { "epoch": 8.7, "learning_rate": 6.541034426496982e-05, "loss": NaN, "step": 53500 }, { "epoch": 8.7, "eval_loss": 0.5054107904434204, "eval_runtime": 6.4804, "eval_samples_per_second": 15.431, "eval_wer": 0.3763702801461632, "step": 53500 }, { "epoch": 8.72, "learning_rate": 6.534508076358296e-05, "loss": NaN, "step": 53600 }, { "epoch": 8.72, "eval_loss": 0.4579046666622162, "eval_runtime": 6.6279, "eval_samples_per_second": 15.088, "eval_wer": 0.3702801461632156, "step": 53600 }, { "epoch": 8.73, "learning_rate": 6.527981726219612e-05, "loss": NaN, "step": 53700 }, { "epoch": 8.73, "eval_loss": 0.4322802722454071, "eval_runtime": 9.2316, "eval_samples_per_second": 10.832, "eval_wer": 0.3763702801461632, "step": 53700 }, { "epoch": 8.75, "learning_rate": 6.521455376080928e-05, "loss": NaN, "step": 53800 }, { "epoch": 8.75, "eval_loss": 0.42796722054481506, "eval_runtime": 7.68, "eval_samples_per_second": 13.021, "eval_wer": 0.37271619975639464, "step": 53800 }, { "epoch": 8.77, "learning_rate": 6.514929025942242e-05, "loss": NaN, "step": 53900 }, { "epoch": 8.77, "eval_loss": 0.44873932003974915, "eval_runtime": 7.9481, "eval_samples_per_second": 12.582, "eval_wer": 0.38855054811205847, "step": 53900 }, { "epoch": 8.78, "learning_rate": 6.508402675803558e-05, "loss": NaN, "step": 54000 }, { "epoch": 8.78, "eval_loss": 0.4511549472808838, "eval_runtime": 9.1786, "eval_samples_per_second": 10.895, "eval_wer": 0.3654080389768575, "step": 54000 }, { "epoch": 8.8, "learning_rate": 6.501876325664871e-05, "loss": NaN, "step": 54100 }, { "epoch": 8.8, "eval_loss": 0.42401379346847534, "eval_runtime": 7.9905, "eval_samples_per_second": 12.515, "eval_wer": 0.3629719853836784, "step": 54100 }, { "epoch": 8.81, "learning_rate": 6.495349975526187e-05, "loss": NaN, "step": 54200 }, { "epoch": 8.81, "eval_loss": 0.4265538156032562, "eval_runtime": 9.2408, "eval_samples_per_second": 10.822, "eval_wer": 0.3751522533495737, "step": 54200 }, { "epoch": 8.83, "learning_rate": 6.488823625387502e-05, "loss": NaN, "step": 54300 }, { "epoch": 8.83, "eval_loss": 0.505720853805542, "eval_runtime": 8.1012, "eval_samples_per_second": 12.344, "eval_wer": 0.37393422655298414, "step": 54300 }, { "epoch": 8.85, "learning_rate": 6.482297275248818e-05, "loss": NaN, "step": 54400 }, { "epoch": 8.85, "eval_loss": 0.4096541702747345, "eval_runtime": 7.7623, "eval_samples_per_second": 12.883, "eval_wer": 0.37149817295980514, "step": 54400 }, { "epoch": 8.86, "learning_rate": 6.475770925110133e-05, "loss": NaN, "step": 54500 }, { "epoch": 8.86, "eval_loss": 0.4086014926433563, "eval_runtime": 8.886, "eval_samples_per_second": 11.254, "eval_wer": 0.3763702801461632, "step": 54500 }, { "epoch": 8.88, "learning_rate": 6.469244574971447e-05, "loss": NaN, "step": 54600 }, { "epoch": 8.88, "eval_loss": 0.43217840790748596, "eval_runtime": 7.9198, "eval_samples_per_second": 12.627, "eval_wer": 0.36662606577344703, "step": 54600 }, { "epoch": 8.9, "learning_rate": 6.462718224832762e-05, "loss": NaN, "step": 54700 }, { "epoch": 8.9, "eval_loss": 0.428193062543869, "eval_runtime": 8.0067, "eval_samples_per_second": 12.49, "eval_wer": 0.3873325213154689, "step": 54700 }, { "epoch": 8.91, "learning_rate": 6.456191874694077e-05, "loss": NaN, "step": 54800 }, { "epoch": 8.91, "eval_loss": 0.43840643763542175, "eval_runtime": 8.3593, "eval_samples_per_second": 11.963, "eval_wer": 0.37393422655298414, "step": 54800 }, { "epoch": 8.93, "learning_rate": 6.449665524555393e-05, "loss": NaN, "step": 54900 }, { "epoch": 8.93, "eval_loss": 0.41468119621276855, "eval_runtime": 7.1084, "eval_samples_per_second": 14.068, "eval_wer": 0.36784409257003653, "step": 54900 }, { "epoch": 8.94, "learning_rate": 6.443139174416707e-05, "loss": NaN, "step": 55000 }, { "epoch": 8.94, "eval_loss": 0.4655587673187256, "eval_runtime": 7.4051, "eval_samples_per_second": 13.504, "eval_wer": 0.364190012180268, "step": 55000 }, { "epoch": 8.96, "learning_rate": 6.436612824278023e-05, "loss": NaN, "step": 55100 }, { "epoch": 8.96, "eval_loss": 0.4038917124271393, "eval_runtime": 8.3584, "eval_samples_per_second": 11.964, "eval_wer": 0.36784409257003653, "step": 55100 }, { "epoch": 8.98, "learning_rate": 6.430086474139338e-05, "loss": NaN, "step": 55200 }, { "epoch": 8.98, "eval_loss": 0.39275607466697693, "eval_runtime": 7.452, "eval_samples_per_second": 13.419, "eval_wer": 0.36784409257003653, "step": 55200 }, { "epoch": 8.99, "learning_rate": 6.423560124000652e-05, "loss": NaN, "step": 55300 }, { "epoch": 8.99, "eval_loss": 0.4186645448207855, "eval_runtime": 8.5472, "eval_samples_per_second": 11.7, "eval_wer": 0.364190012180268, "step": 55300 }, { "epoch": 9.01, "learning_rate": 6.417033773861968e-05, "loss": NaN, "step": 55400 }, { "epoch": 9.01, "eval_loss": 0.44433704018592834, "eval_runtime": 7.986, "eval_samples_per_second": 12.522, "eval_wer": 0.36662606577344703, "step": 55400 }, { "epoch": 9.03, "learning_rate": 6.410507423723283e-05, "loss": NaN, "step": 55500 }, { "epoch": 9.03, "eval_loss": 0.43365246057510376, "eval_runtime": 7.3226, "eval_samples_per_second": 13.656, "eval_wer": 0.35931790499390986, "step": 55500 }, { "epoch": 9.04, "learning_rate": 6.403981073584599e-05, "loss": NaN, "step": 55600 }, { "epoch": 9.04, "eval_loss": 0.4543744623661041, "eval_runtime": 8.7477, "eval_samples_per_second": 11.432, "eval_wer": 0.37271619975639464, "step": 55600 }, { "epoch": 9.06, "learning_rate": 6.397454723445913e-05, "loss": NaN, "step": 55700 }, { "epoch": 9.06, "eval_loss": 0.43953046202659607, "eval_runtime": 7.711, "eval_samples_per_second": 12.968, "eval_wer": 0.3934226552984166, "step": 55700 }, { "epoch": 9.07, "learning_rate": 6.390928373307228e-05, "loss": NaN, "step": 55800 }, { "epoch": 9.07, "eval_loss": 0.43022480607032776, "eval_runtime": 7.9745, "eval_samples_per_second": 12.54, "eval_wer": 0.36053593179049936, "step": 55800 }, { "epoch": 9.09, "learning_rate": 6.384402023168543e-05, "loss": NaN, "step": 55900 }, { "epoch": 9.09, "eval_loss": 0.4893076419830322, "eval_runtime": 8.1627, "eval_samples_per_second": 12.251, "eval_wer": 0.3507917174177832, "step": 55900 }, { "epoch": 9.11, "learning_rate": 6.377875673029858e-05, "loss": NaN, "step": 56000 }, { "epoch": 9.11, "eval_loss": 0.4135149419307709, "eval_runtime": 7.9225, "eval_samples_per_second": 12.622, "eval_wer": 0.3763702801461632, "step": 56000 }, { "epoch": 9.12, "learning_rate": 6.371349322891174e-05, "loss": NaN, "step": 56100 }, { "epoch": 9.12, "eval_loss": 0.4469653069972992, "eval_runtime": 8.096, "eval_samples_per_second": 12.352, "eval_wer": 0.3800243605359318, "step": 56100 }, { "epoch": 9.14, "learning_rate": 6.364822972752488e-05, "loss": NaN, "step": 56200 }, { "epoch": 9.14, "eval_loss": 0.42649006843566895, "eval_runtime": 8.89, "eval_samples_per_second": 11.249, "eval_wer": 0.3690621193666261, "step": 56200 }, { "epoch": 9.16, "learning_rate": 6.358296622613803e-05, "loss": NaN, "step": 56300 }, { "epoch": 9.16, "eval_loss": 0.46478691697120667, "eval_runtime": 7.1008, "eval_samples_per_second": 14.083, "eval_wer": 0.36784409257003653, "step": 56300 }, { "epoch": 9.17, "learning_rate": 6.351770272475119e-05, "loss": NaN, "step": 56400 }, { "epoch": 9.17, "eval_loss": 0.45123374462127686, "eval_runtime": 8.3492, "eval_samples_per_second": 11.977, "eval_wer": 0.37393422655298414, "step": 56400 }, { "epoch": 9.19, "learning_rate": 6.345243922336433e-05, "loss": NaN, "step": 56500 }, { "epoch": 9.19, "eval_loss": 0.42654842138290405, "eval_runtime": 6.8554, "eval_samples_per_second": 14.587, "eval_wer": 0.3812423873325213, "step": 56500 }, { "epoch": 9.2, "learning_rate": 6.338717572197749e-05, "loss": NaN, "step": 56600 }, { "epoch": 9.2, "eval_loss": 0.4205102026462555, "eval_runtime": 8.9024, "eval_samples_per_second": 11.233, "eval_wer": 0.37271619975639464, "step": 56600 }, { "epoch": 9.22, "learning_rate": 6.332191222059064e-05, "loss": NaN, "step": 56700 }, { "epoch": 9.22, "eval_loss": 0.4153713583946228, "eval_runtime": 8.0624, "eval_samples_per_second": 12.403, "eval_wer": 0.35931790499390986, "step": 56700 }, { "epoch": 9.24, "learning_rate": 6.32566487192038e-05, "loss": NaN, "step": 56800 }, { "epoch": 9.24, "eval_loss": 0.4380166232585907, "eval_runtime": 7.3533, "eval_samples_per_second": 13.599, "eval_wer": 0.3471376370280146, "step": 56800 }, { "epoch": 9.25, "learning_rate": 6.319138521781694e-05, "loss": NaN, "step": 56900 }, { "epoch": 9.25, "eval_loss": 0.3888612389564514, "eval_runtime": 9.3301, "eval_samples_per_second": 10.718, "eval_wer": 0.3520097442143727, "step": 56900 }, { "epoch": 9.27, "learning_rate": 6.312612171643009e-05, "loss": NaN, "step": 57000 }, { "epoch": 9.27, "eval_loss": 0.39410483837127686, "eval_runtime": 8.4812, "eval_samples_per_second": 11.791, "eval_wer": 0.3568818514007308, "step": 57000 }, { "epoch": 9.29, "learning_rate": 6.306085821504324e-05, "loss": NaN, "step": 57100 }, { "epoch": 9.29, "eval_loss": 0.4467742443084717, "eval_runtime": 7.367, "eval_samples_per_second": 13.574, "eval_wer": 0.35931790499390986, "step": 57100 }, { "epoch": 9.3, "learning_rate": 6.299559471365639e-05, "loss": NaN, "step": 57200 }, { "epoch": 9.3, "eval_loss": 0.47365981340408325, "eval_runtime": 8.3932, "eval_samples_per_second": 11.914, "eval_wer": 0.3800243605359318, "step": 57200 }, { "epoch": 9.32, "learning_rate": 6.293033121226955e-05, "loss": NaN, "step": 57300 }, { "epoch": 9.32, "eval_loss": 0.4668024182319641, "eval_runtime": 8.2093, "eval_samples_per_second": 12.181, "eval_wer": 0.3690621193666261, "step": 57300 }, { "epoch": 9.33, "learning_rate": 6.286506771088269e-05, "loss": NaN, "step": 57400 }, { "epoch": 9.33, "eval_loss": 0.4525511860847473, "eval_runtime": 9.8628, "eval_samples_per_second": 10.139, "eval_wer": 0.37758830694275275, "step": 57400 }, { "epoch": 9.35, "learning_rate": 6.279980420949584e-05, "loss": NaN, "step": 57500 }, { "epoch": 9.35, "eval_loss": 0.45667481422424316, "eval_runtime": 7.42, "eval_samples_per_second": 13.477, "eval_wer": 0.38367844092570036, "step": 57500 }, { "epoch": 9.37, "learning_rate": 6.2734540708109e-05, "loss": NaN, "step": 57600 }, { "epoch": 9.37, "eval_loss": 0.4748976230621338, "eval_runtime": 7.9502, "eval_samples_per_second": 12.578, "eval_wer": 0.37271619975639464, "step": 57600 }, { "epoch": 9.38, "learning_rate": 6.266927720672214e-05, "loss": NaN, "step": 57700 }, { "epoch": 9.38, "eval_loss": 0.41124123334884644, "eval_runtime": 8.7336, "eval_samples_per_second": 11.45, "eval_wer": 0.3629719853836784, "step": 57700 }, { "epoch": 9.4, "learning_rate": 6.26040137053353e-05, "loss": NaN, "step": 57800 }, { "epoch": 9.4, "eval_loss": 0.4126984477043152, "eval_runtime": 7.3596, "eval_samples_per_second": 13.588, "eval_wer": 0.3654080389768575, "step": 57800 }, { "epoch": 9.42, "learning_rate": 6.253875020394845e-05, "loss": NaN, "step": 57900 }, { "epoch": 9.42, "eval_loss": 0.41617000102996826, "eval_runtime": 8.9616, "eval_samples_per_second": 11.159, "eval_wer": 0.3617539585870889, "step": 57900 }, { "epoch": 9.43, "learning_rate": 6.247348670256159e-05, "loss": NaN, "step": 58000 }, { "epoch": 9.43, "eval_loss": 0.4667081832885742, "eval_runtime": 7.9176, "eval_samples_per_second": 12.63, "eval_wer": 0.37271619975639464, "step": 58000 }, { "epoch": 9.45, "learning_rate": 6.240822320117474e-05, "loss": NaN, "step": 58100 }, { "epoch": 9.45, "eval_loss": 0.4130760431289673, "eval_runtime": 9.1619, "eval_samples_per_second": 10.915, "eval_wer": 0.3520097442143727, "step": 58100 }, { "epoch": 9.46, "learning_rate": 6.23429596997879e-05, "loss": NaN, "step": 58200 }, { "epoch": 9.46, "eval_loss": 0.3896174728870392, "eval_runtime": 6.9796, "eval_samples_per_second": 14.328, "eval_wer": 0.3507917174177832, "step": 58200 }, { "epoch": 9.48, "learning_rate": 6.227769619840105e-05, "loss": NaN, "step": 58300 }, { "epoch": 9.48, "eval_loss": 0.44675758481025696, "eval_runtime": 10.5739, "eval_samples_per_second": 9.457, "eval_wer": 0.37393422655298414, "step": 58300 }, { "epoch": 9.5, "learning_rate": 6.22124326970142e-05, "loss": NaN, "step": 58400 }, { "epoch": 9.5, "eval_loss": 0.45445725321769714, "eval_runtime": 8.0137, "eval_samples_per_second": 12.479, "eval_wer": 0.35322777101096225, "step": 58400 }, { "epoch": 9.51, "learning_rate": 6.214716919562736e-05, "loss": NaN, "step": 58500 }, { "epoch": 9.51, "eval_loss": 0.47014904022216797, "eval_runtime": 8.4495, "eval_samples_per_second": 11.835, "eval_wer": 0.36784409257003653, "step": 58500 }, { "epoch": 9.53, "learning_rate": 6.208190569424049e-05, "loss": NaN, "step": 58600 }, { "epoch": 9.53, "eval_loss": 0.42686671018600464, "eval_runtime": 7.4504, "eval_samples_per_second": 13.422, "eval_wer": 0.36053593179049936, "step": 58600 }, { "epoch": 9.55, "learning_rate": 6.201664219285365e-05, "loss": NaN, "step": 58700 }, { "epoch": 9.55, "eval_loss": 0.45379403233528137, "eval_runtime": 7.6774, "eval_samples_per_second": 13.025, "eval_wer": 0.3617539585870889, "step": 58700 }, { "epoch": 9.56, "learning_rate": 6.19513786914668e-05, "loss": NaN, "step": 58800 }, { "epoch": 9.56, "eval_loss": 0.4386783838272095, "eval_runtime": 9.7583, "eval_samples_per_second": 10.248, "eval_wer": 0.36662606577344703, "step": 58800 }, { "epoch": 9.58, "learning_rate": 6.188611519007995e-05, "loss": NaN, "step": 58900 }, { "epoch": 9.58, "eval_loss": 0.40192508697509766, "eval_runtime": 9.6879, "eval_samples_per_second": 10.322, "eval_wer": 0.35809987819732036, "step": 58900 }, { "epoch": 9.6, "learning_rate": 6.182085168869311e-05, "loss": NaN, "step": 59000 }, { "epoch": 9.6, "eval_loss": 0.46459415555000305, "eval_runtime": 8.441, "eval_samples_per_second": 11.847, "eval_wer": 0.35931790499390986, "step": 59000 }, { "epoch": 9.61, "learning_rate": 6.175558818730625e-05, "loss": NaN, "step": 59100 }, { "epoch": 9.61, "eval_loss": 0.41784995794296265, "eval_runtime": 7.9289, "eval_samples_per_second": 12.612, "eval_wer": 0.38246041412911086, "step": 59100 }, { "epoch": 9.63, "learning_rate": 6.16903246859194e-05, "loss": NaN, "step": 59200 }, { "epoch": 9.63, "eval_loss": 0.44782283902168274, "eval_runtime": 6.8119, "eval_samples_per_second": 14.68, "eval_wer": 0.37758830694275275, "step": 59200 }, { "epoch": 9.64, "learning_rate": 6.162506118453255e-05, "loss": NaN, "step": 59300 }, { "epoch": 9.64, "eval_loss": 0.40649664402008057, "eval_runtime": 7.3722, "eval_samples_per_second": 13.564, "eval_wer": 0.3520097442143727, "step": 59300 }, { "epoch": 9.66, "learning_rate": 6.15597976831457e-05, "loss": NaN, "step": 59400 }, { "epoch": 9.66, "eval_loss": 0.405249685049057, "eval_runtime": 7.7895, "eval_samples_per_second": 12.838, "eval_wer": 0.3690621193666261, "step": 59400 }, { "epoch": 9.68, "learning_rate": 6.149453418175886e-05, "loss": NaN, "step": 59500 }, { "epoch": 9.68, "eval_loss": 0.37005943059921265, "eval_runtime": 7.3848, "eval_samples_per_second": 13.541, "eval_wer": 0.3507917174177832, "step": 59500 }, { "epoch": 9.69, "learning_rate": 6.142927068037201e-05, "loss": NaN, "step": 59600 }, { "epoch": 9.69, "eval_loss": 0.4289380609989166, "eval_runtime": 8.9702, "eval_samples_per_second": 11.148, "eval_wer": 0.36053593179049936, "step": 59600 }, { "epoch": 9.71, "learning_rate": 6.136400717898515e-05, "loss": NaN, "step": 59700 }, { "epoch": 9.71, "eval_loss": 0.39418941736221313, "eval_runtime": 7.4148, "eval_samples_per_second": 13.487, "eval_wer": 0.3654080389768575, "step": 59700 }, { "epoch": 9.73, "learning_rate": 6.12987436775983e-05, "loss": NaN, "step": 59800 }, { "epoch": 9.73, "eval_loss": 0.44876864552497864, "eval_runtime": 10.228, "eval_samples_per_second": 9.777, "eval_wer": 0.3556638246041413, "step": 59800 }, { "epoch": 9.74, "learning_rate": 6.123348017621146e-05, "loss": NaN, "step": 59900 }, { "epoch": 9.74, "eval_loss": 0.49101337790489197, "eval_runtime": 8.1552, "eval_samples_per_second": 12.262, "eval_wer": 0.3848964677222899, "step": 59900 }, { "epoch": 9.76, "learning_rate": 6.11682166748246e-05, "loss": NaN, "step": 60000 }, { "epoch": 9.76, "eval_loss": 0.3982294797897339, "eval_runtime": 8.4742, "eval_samples_per_second": 11.8, "eval_wer": 0.37149817295980514, "step": 60000 }, { "epoch": 9.77, "learning_rate": 6.110295317343776e-05, "loss": NaN, "step": 60100 }, { "epoch": 9.77, "eval_loss": 0.3967539668083191, "eval_runtime": 6.4434, "eval_samples_per_second": 15.52, "eval_wer": 0.36053593179049936, "step": 60100 }, { "epoch": 9.79, "learning_rate": 6.103768967205092e-05, "loss": NaN, "step": 60200 }, { "epoch": 9.79, "eval_loss": 0.4385029673576355, "eval_runtime": 7.5002, "eval_samples_per_second": 13.333, "eval_wer": 0.3617539585870889, "step": 60200 }, { "epoch": 9.81, "learning_rate": 6.097242617066406e-05, "loss": NaN, "step": 60300 }, { "epoch": 9.81, "eval_loss": 0.4130534827709198, "eval_runtime": 8.817, "eval_samples_per_second": 11.342, "eval_wer": 0.3751522533495737, "step": 60300 }, { "epoch": 9.82, "learning_rate": 6.090716266927721e-05, "loss": NaN, "step": 60400 }, { "epoch": 9.82, "eval_loss": 0.5191701650619507, "eval_runtime": 7.9727, "eval_samples_per_second": 12.543, "eval_wer": 0.37880633373934225, "step": 60400 }, { "epoch": 9.84, "learning_rate": 6.084189916789036e-05, "loss": NaN, "step": 60500 }, { "epoch": 9.84, "eval_loss": 0.4418995678424835, "eval_runtime": 9.1327, "eval_samples_per_second": 10.95, "eval_wer": 0.37880633373934225, "step": 60500 }, { "epoch": 9.86, "learning_rate": 6.077663566650351e-05, "loss": NaN, "step": 60600 }, { "epoch": 9.86, "eval_loss": 0.4954804480075836, "eval_runtime": 9.5074, "eval_samples_per_second": 10.518, "eval_wer": 0.4056029232643118, "step": 60600 }, { "epoch": 9.87, "learning_rate": 6.0711372165116665e-05, "loss": NaN, "step": 60700 }, { "epoch": 9.87, "eval_loss": 0.45987486839294434, "eval_runtime": 6.9269, "eval_samples_per_second": 14.436, "eval_wer": 0.36784409257003653, "step": 60700 }, { "epoch": 9.89, "learning_rate": 6.064610866372982e-05, "loss": NaN, "step": 60800 }, { "epoch": 9.89, "eval_loss": 0.38861092925071716, "eval_runtime": 9.0697, "eval_samples_per_second": 11.026, "eval_wer": 0.35931790499390986, "step": 60800 }, { "epoch": 9.9, "learning_rate": 6.0580845162342956e-05, "loss": NaN, "step": 60900 }, { "epoch": 9.9, "eval_loss": 0.38833603262901306, "eval_runtime": 7.6516, "eval_samples_per_second": 13.069, "eval_wer": 0.364190012180268, "step": 60900 }, { "epoch": 9.92, "learning_rate": 6.0515581660956114e-05, "loss": NaN, "step": 61000 }, { "epoch": 9.92, "eval_loss": 0.44373536109924316, "eval_runtime": 7.1189, "eval_samples_per_second": 14.047, "eval_wer": 0.35809987819732036, "step": 61000 }, { "epoch": 9.94, "learning_rate": 6.0450318159569266e-05, "loss": NaN, "step": 61100 }, { "epoch": 9.94, "eval_loss": 0.41120070219039917, "eval_runtime": 7.3599, "eval_samples_per_second": 13.587, "eval_wer": 0.3459196102314251, "step": 61100 }, { "epoch": 9.95, "learning_rate": 6.038505465818242e-05, "loss": NaN, "step": 61200 }, { "epoch": 9.95, "eval_loss": 0.41615867614746094, "eval_runtime": 9.4386, "eval_samples_per_second": 10.595, "eval_wer": 0.3568818514007308, "step": 61200 }, { "epoch": 9.97, "learning_rate": 6.031979115679557e-05, "loss": NaN, "step": 61300 }, { "epoch": 9.97, "eval_loss": 0.4973611831665039, "eval_runtime": 8.1559, "eval_samples_per_second": 12.261, "eval_wer": 0.3702801461632156, "step": 61300 }, { "epoch": 9.99, "learning_rate": 6.025452765540871e-05, "loss": NaN, "step": 61400 }, { "epoch": 9.99, "eval_loss": 0.448307603597641, "eval_runtime": 9.8048, "eval_samples_per_second": 10.199, "eval_wer": 0.3690621193666261, "step": 61400 }, { "epoch": 10.0, "learning_rate": 6.018926415402186e-05, "loss": NaN, "step": 61500 }, { "epoch": 10.0, "eval_loss": 0.5115909576416016, "eval_runtime": 7.945, "eval_samples_per_second": 12.587, "eval_wer": 0.37393422655298414, "step": 61500 }, { "epoch": 10.02, "learning_rate": 6.012400065263501e-05, "loss": NaN, "step": 61600 }, { "epoch": 10.02, "eval_loss": 0.42501771450042725, "eval_runtime": 9.4293, "eval_samples_per_second": 10.605, "eval_wer": 0.3690621193666261, "step": 61600 }, { "epoch": 10.03, "learning_rate": 6.005873715124817e-05, "loss": NaN, "step": 61700 }, { "epoch": 10.03, "eval_loss": 0.4137573540210724, "eval_runtime": 8.5889, "eval_samples_per_second": 11.643, "eval_wer": 0.3520097442143727, "step": 61700 }, { "epoch": 10.05, "learning_rate": 5.999347364986132e-05, "loss": NaN, "step": 61800 }, { "epoch": 10.05, "eval_loss": 0.4213745892047882, "eval_runtime": 9.5865, "eval_samples_per_second": 10.431, "eval_wer": 0.36053593179049936, "step": 61800 }, { "epoch": 10.07, "learning_rate": 5.9928210148474475e-05, "loss": NaN, "step": 61900 }, { "epoch": 10.07, "eval_loss": 0.4096081256866455, "eval_runtime": 8.1463, "eval_samples_per_second": 12.275, "eval_wer": 0.3690621193666261, "step": 61900 }, { "epoch": 10.08, "learning_rate": 5.986294664708761e-05, "loss": NaN, "step": 62000 }, { "epoch": 10.08, "eval_loss": 0.41392749547958374, "eval_runtime": 9.4692, "eval_samples_per_second": 10.561, "eval_wer": 0.36662606577344703, "step": 62000 }, { "epoch": 10.1, "learning_rate": 5.9797683145700765e-05, "loss": NaN, "step": 62100 }, { "epoch": 10.1, "eval_loss": 0.41633856296539307, "eval_runtime": 8.7223, "eval_samples_per_second": 11.465, "eval_wer": 0.3690621193666261, "step": 62100 }, { "epoch": 10.12, "learning_rate": 5.973241964431392e-05, "loss": NaN, "step": 62200 }, { "epoch": 10.12, "eval_loss": 0.45410457253456116, "eval_runtime": 7.382, "eval_samples_per_second": 13.546, "eval_wer": 0.3520097442143727, "step": 62200 }, { "epoch": 10.13, "learning_rate": 5.966715614292707e-05, "loss": NaN, "step": 62300 }, { "epoch": 10.13, "eval_loss": 0.456071674823761, "eval_runtime": 8.3133, "eval_samples_per_second": 12.029, "eval_wer": 0.3690621193666261, "step": 62300 }, { "epoch": 10.15, "learning_rate": 5.960189264154023e-05, "loss": NaN, "step": 62400 }, { "epoch": 10.15, "eval_loss": 0.4523433446884155, "eval_runtime": 7.4187, "eval_samples_per_second": 13.479, "eval_wer": 0.35931790499390986, "step": 62400 }, { "epoch": 10.16, "learning_rate": 5.953662914015338e-05, "loss": NaN, "step": 62500 }, { "epoch": 10.16, "eval_loss": 0.4045345187187195, "eval_runtime": 9.0224, "eval_samples_per_second": 11.083, "eval_wer": 0.3556638246041413, "step": 62500 }, { "epoch": 10.18, "learning_rate": 5.947136563876652e-05, "loss": NaN, "step": 62600 }, { "epoch": 10.18, "eval_loss": 0.4067111313343048, "eval_runtime": 7.5666, "eval_samples_per_second": 13.216, "eval_wer": 0.364190012180268, "step": 62600 }, { "epoch": 10.2, "learning_rate": 5.940610213737967e-05, "loss": NaN, "step": 62700 }, { "epoch": 10.2, "eval_loss": 0.4985601007938385, "eval_runtime": 10.6701, "eval_samples_per_second": 9.372, "eval_wer": 0.3812423873325213, "step": 62700 }, { "epoch": 10.21, "learning_rate": 5.934083863599282e-05, "loss": NaN, "step": 62800 }, { "epoch": 10.21, "eval_loss": 0.4605454206466675, "eval_runtime": 7.6443, "eval_samples_per_second": 13.082, "eval_wer": 0.37880633373934225, "step": 62800 }, { "epoch": 10.23, "learning_rate": 5.9275575134605974e-05, "loss": NaN, "step": 62900 }, { "epoch": 10.23, "eval_loss": 0.41414105892181396, "eval_runtime": 9.3718, "eval_samples_per_second": 10.67, "eval_wer": 0.35931790499390986, "step": 62900 }, { "epoch": 10.25, "learning_rate": 5.9210311633219125e-05, "loss": NaN, "step": 63000 }, { "epoch": 10.25, "eval_loss": 0.4487077593803406, "eval_runtime": 8.7749, "eval_samples_per_second": 11.396, "eval_wer": 0.37149817295980514, "step": 63000 }, { "epoch": 10.26, "learning_rate": 5.914504813183227e-05, "loss": NaN, "step": 63100 }, { "epoch": 10.26, "eval_loss": 0.5015296339988708, "eval_runtime": 7.5183, "eval_samples_per_second": 13.301, "eval_wer": 0.3861144945188794, "step": 63100 }, { "epoch": 10.28, "learning_rate": 5.907978463044542e-05, "loss": NaN, "step": 63200 }, { "epoch": 10.28, "eval_loss": 0.49254322052001953, "eval_runtime": 7.8387, "eval_samples_per_second": 12.757, "eval_wer": 0.3617539585870889, "step": 63200 }, { "epoch": 10.29, "learning_rate": 5.9014521129058574e-05, "loss": NaN, "step": 63300 }, { "epoch": 10.29, "eval_loss": 0.4693681001663208, "eval_runtime": 9.0717, "eval_samples_per_second": 11.023, "eval_wer": 0.3812423873325213, "step": 63300 }, { "epoch": 10.31, "learning_rate": 5.8949257627671726e-05, "loss": NaN, "step": 63400 }, { "epoch": 10.31, "eval_loss": 0.4481465220451355, "eval_runtime": 8.4682, "eval_samples_per_second": 11.809, "eval_wer": 0.3702801461632156, "step": 63400 }, { "epoch": 10.33, "learning_rate": 5.888399412628488e-05, "loss": NaN, "step": 63500 }, { "epoch": 10.33, "eval_loss": 0.43376660346984863, "eval_runtime": 9.0956, "eval_samples_per_second": 10.994, "eval_wer": 0.3702801461632156, "step": 63500 }, { "epoch": 10.34, "learning_rate": 5.881873062489803e-05, "loss": NaN, "step": 63600 }, { "epoch": 10.34, "eval_loss": 0.4156494438648224, "eval_runtime": 8.4037, "eval_samples_per_second": 11.899, "eval_wer": 0.35444579780755175, "step": 63600 }, { "epoch": 10.36, "learning_rate": 5.8753467123511175e-05, "loss": NaN, "step": 63700 }, { "epoch": 10.36, "eval_loss": 0.4458553194999695, "eval_runtime": 8.7165, "eval_samples_per_second": 11.473, "eval_wer": 0.37393422655298414, "step": 63700 }, { "epoch": 10.38, "learning_rate": 5.868820362212433e-05, "loss": NaN, "step": 63800 }, { "epoch": 10.38, "eval_loss": 0.466782808303833, "eval_runtime": 8.1618, "eval_samples_per_second": 12.252, "eval_wer": 0.3873325213154689, "step": 63800 }, { "epoch": 10.39, "learning_rate": 5.862294012073748e-05, "loss": NaN, "step": 63900 }, { "epoch": 10.39, "eval_loss": 0.5930745601654053, "eval_runtime": 9.5258, "eval_samples_per_second": 10.498, "eval_wer": 0.39707673568818513, "step": 63900 }, { "epoch": 10.41, "learning_rate": 5.855767661935063e-05, "loss": NaN, "step": 64000 }, { "epoch": 10.41, "eval_loss": 0.45110756158828735, "eval_runtime": 9.4694, "eval_samples_per_second": 10.56, "eval_wer": 0.3617539585870889, "step": 64000 }, { "epoch": 10.42, "learning_rate": 5.849241311796378e-05, "loss": NaN, "step": 64100 }, { "epoch": 10.42, "eval_loss": 0.4962243139743805, "eval_runtime": 8.4633, "eval_samples_per_second": 11.816, "eval_wer": 0.3800243605359318, "step": 64100 }, { "epoch": 10.44, "learning_rate": 5.8427149616576935e-05, "loss": NaN, "step": 64200 }, { "epoch": 10.44, "eval_loss": 0.43860459327697754, "eval_runtime": 8.0809, "eval_samples_per_second": 12.375, "eval_wer": 0.3568818514007308, "step": 64200 }, { "epoch": 10.46, "learning_rate": 5.836188611519008e-05, "loss": NaN, "step": 64300 }, { "epoch": 10.46, "eval_loss": 0.4754991829395294, "eval_runtime": 10.3787, "eval_samples_per_second": 9.635, "eval_wer": 0.3800243605359318, "step": 64300 }, { "epoch": 10.47, "learning_rate": 5.829662261380323e-05, "loss": NaN, "step": 64400 }, { "epoch": 10.47, "eval_loss": 0.44975659251213074, "eval_runtime": 8.6363, "eval_samples_per_second": 11.579, "eval_wer": 0.37393422655298414, "step": 64400 }, { "epoch": 10.49, "learning_rate": 5.8231359112416384e-05, "loss": NaN, "step": 64500 }, { "epoch": 10.49, "eval_loss": 0.4558520019054413, "eval_runtime": 8.2941, "eval_samples_per_second": 12.057, "eval_wer": 0.37271619975639464, "step": 64500 }, { "epoch": 10.51, "learning_rate": 5.8166095611029536e-05, "loss": NaN, "step": 64600 }, { "epoch": 10.51, "eval_loss": 0.40871143341064453, "eval_runtime": 8.7219, "eval_samples_per_second": 11.465, "eval_wer": 0.3556638246041413, "step": 64600 }, { "epoch": 10.52, "learning_rate": 5.810083210964269e-05, "loss": NaN, "step": 64700 }, { "epoch": 10.52, "eval_loss": 0.5071795582771301, "eval_runtime": 8.6766, "eval_samples_per_second": 11.525, "eval_wer": 0.3848964677222899, "step": 64700 }, { "epoch": 10.54, "learning_rate": 5.803556860825583e-05, "loss": NaN, "step": 64800 }, { "epoch": 10.54, "eval_loss": 0.4381246864795685, "eval_runtime": 7.7019, "eval_samples_per_second": 12.984, "eval_wer": 0.364190012180268, "step": 64800 }, { "epoch": 10.55, "learning_rate": 5.7970305106868985e-05, "loss": NaN, "step": 64900 }, { "epoch": 10.55, "eval_loss": 0.42241111397743225, "eval_runtime": 6.9119, "eval_samples_per_second": 14.468, "eval_wer": 0.3520097442143727, "step": 64900 }, { "epoch": 10.57, "learning_rate": 5.790504160548214e-05, "loss": NaN, "step": 65000 }, { "epoch": 10.57, "eval_loss": 0.44368839263916016, "eval_runtime": 8.9514, "eval_samples_per_second": 11.171, "eval_wer": 0.37393422655298414, "step": 65000 }, { "epoch": 10.59, "learning_rate": 5.783977810409529e-05, "loss": NaN, "step": 65100 }, { "epoch": 10.59, "eval_loss": 0.4559805393218994, "eval_runtime": 9.0066, "eval_samples_per_second": 11.103, "eval_wer": 0.3702801461632156, "step": 65100 }, { "epoch": 10.6, "learning_rate": 5.777451460270844e-05, "loss": NaN, "step": 65200 }, { "epoch": 10.6, "eval_loss": 0.3956843912601471, "eval_runtime": 8.016, "eval_samples_per_second": 12.475, "eval_wer": 0.3800243605359318, "step": 65200 }, { "epoch": 10.62, "learning_rate": 5.770925110132159e-05, "loss": NaN, "step": 65300 }, { "epoch": 10.62, "eval_loss": 0.3806883990764618, "eval_runtime": 6.54, "eval_samples_per_second": 15.291, "eval_wer": 0.3568818514007308, "step": 65300 }, { "epoch": 10.64, "learning_rate": 5.764398759993474e-05, "loss": NaN, "step": 65400 }, { "epoch": 10.64, "eval_loss": 0.4815838634967804, "eval_runtime": 8.6182, "eval_samples_per_second": 11.603, "eval_wer": 0.37758830694275275, "step": 65400 }, { "epoch": 10.65, "learning_rate": 5.757872409854789e-05, "loss": NaN, "step": 65500 }, { "epoch": 10.65, "eval_loss": 0.42734912037849426, "eval_runtime": 7.7612, "eval_samples_per_second": 12.885, "eval_wer": 0.3702801461632156, "step": 65500 }, { "epoch": 10.67, "learning_rate": 5.751346059716104e-05, "loss": NaN, "step": 65600 }, { "epoch": 10.67, "eval_loss": 0.453123539686203, "eval_runtime": 8.3059, "eval_samples_per_second": 12.04, "eval_wer": 0.3861144945188794, "step": 65600 }, { "epoch": 10.68, "learning_rate": 5.744819709577419e-05, "loss": NaN, "step": 65700 }, { "epoch": 10.68, "eval_loss": 0.47986891865730286, "eval_runtime": 8.2303, "eval_samples_per_second": 12.15, "eval_wer": 0.3763702801461632, "step": 65700 }, { "epoch": 10.7, "learning_rate": 5.7382933594387345e-05, "loss": NaN, "step": 65800 }, { "epoch": 10.7, "eval_loss": 0.3873835802078247, "eval_runtime": 7.8326, "eval_samples_per_second": 12.767, "eval_wer": 0.3568818514007308, "step": 65800 }, { "epoch": 10.72, "learning_rate": 5.73176700930005e-05, "loss": NaN, "step": 65900 }, { "epoch": 10.72, "eval_loss": 0.41347476840019226, "eval_runtime": 10.5146, "eval_samples_per_second": 9.511, "eval_wer": 0.36784409257003653, "step": 65900 }, { "epoch": 10.73, "learning_rate": 5.7252406591613636e-05, "loss": NaN, "step": 66000 }, { "epoch": 10.73, "eval_loss": 0.39395031332969666, "eval_runtime": 7.1626, "eval_samples_per_second": 13.961, "eval_wer": 0.3629719853836784, "step": 66000 }, { "epoch": 10.75, "learning_rate": 5.7187143090226794e-05, "loss": NaN, "step": 66100 }, { "epoch": 10.75, "eval_loss": 0.38374292850494385, "eval_runtime": 8.2206, "eval_samples_per_second": 12.165, "eval_wer": 0.3690621193666261, "step": 66100 }, { "epoch": 10.77, "learning_rate": 5.7121879588839946e-05, "loss": NaN, "step": 66200 }, { "epoch": 10.77, "eval_loss": 0.4342725872993469, "eval_runtime": 8.1692, "eval_samples_per_second": 12.241, "eval_wer": 0.37149817295980514, "step": 66200 }, { "epoch": 10.78, "learning_rate": 5.70566160874531e-05, "loss": NaN, "step": 66300 }, { "epoch": 10.78, "eval_loss": 0.4155646562576294, "eval_runtime": 6.8934, "eval_samples_per_second": 14.507, "eval_wer": 0.3690621193666261, "step": 66300 }, { "epoch": 10.8, "learning_rate": 5.699135258606625e-05, "loss": NaN, "step": 66400 }, { "epoch": 10.8, "eval_loss": 0.410979300737381, "eval_runtime": 7.7957, "eval_samples_per_second": 12.828, "eval_wer": 0.37149817295980514, "step": 66400 }, { "epoch": 10.81, "learning_rate": 5.692608908467939e-05, "loss": NaN, "step": 66500 }, { "epoch": 10.81, "eval_loss": 0.3924597203731537, "eval_runtime": 7.8199, "eval_samples_per_second": 12.788, "eval_wer": 0.3702801461632156, "step": 66500 }, { "epoch": 10.83, "learning_rate": 5.686082558329254e-05, "loss": NaN, "step": 66600 }, { "epoch": 10.83, "eval_loss": 0.4514992833137512, "eval_runtime": 8.7106, "eval_samples_per_second": 11.48, "eval_wer": 0.3763702801461632, "step": 66600 }, { "epoch": 10.85, "learning_rate": 5.679556208190569e-05, "loss": NaN, "step": 66700 }, { "epoch": 10.85, "eval_loss": 0.46335548162460327, "eval_runtime": 6.7296, "eval_samples_per_second": 14.86, "eval_wer": 0.37271619975639464, "step": 66700 }, { "epoch": 10.86, "learning_rate": 5.673029858051885e-05, "loss": NaN, "step": 66800 }, { "epoch": 10.86, "eval_loss": 0.48735862970352173, "eval_runtime": 8.529, "eval_samples_per_second": 11.725, "eval_wer": 0.38367844092570036, "step": 66800 }, { "epoch": 10.88, "learning_rate": 5.6665035079132e-05, "loss": NaN, "step": 66900 }, { "epoch": 10.88, "eval_loss": 0.4417389929294586, "eval_runtime": 8.1548, "eval_samples_per_second": 12.263, "eval_wer": 0.364190012180268, "step": 66900 }, { "epoch": 10.9, "learning_rate": 5.6599771577745155e-05, "loss": NaN, "step": 67000 }, { "epoch": 10.9, "eval_loss": 0.38281384110450745, "eval_runtime": 7.2321, "eval_samples_per_second": 13.827, "eval_wer": 0.34957369062119364, "step": 67000 }, { "epoch": 10.91, "learning_rate": 5.653450807635829e-05, "loss": NaN, "step": 67100 }, { "epoch": 10.91, "eval_loss": 0.4453480839729309, "eval_runtime": 9.8708, "eval_samples_per_second": 10.131, "eval_wer": 0.37149817295980514, "step": 67100 }, { "epoch": 10.93, "learning_rate": 5.6469244574971445e-05, "loss": NaN, "step": 67200 }, { "epoch": 10.93, "eval_loss": 0.43574249744415283, "eval_runtime": 6.7934, "eval_samples_per_second": 14.72, "eval_wer": 0.3654080389768575, "step": 67200 }, { "epoch": 10.94, "learning_rate": 5.64039810735846e-05, "loss": NaN, "step": 67300 }, { "epoch": 10.94, "eval_loss": 0.4049379825592041, "eval_runtime": 7.1607, "eval_samples_per_second": 13.965, "eval_wer": 0.35931790499390986, "step": 67300 }, { "epoch": 10.96, "learning_rate": 5.6338717572197756e-05, "loss": NaN, "step": 67400 }, { "epoch": 10.96, "eval_loss": 0.40730178356170654, "eval_runtime": 8.7286, "eval_samples_per_second": 11.457, "eval_wer": 0.36784409257003653, "step": 67400 }, { "epoch": 10.98, "learning_rate": 5.627345407081091e-05, "loss": NaN, "step": 67500 }, { "epoch": 10.98, "eval_loss": 0.42172133922576904, "eval_runtime": 7.5099, "eval_samples_per_second": 13.316, "eval_wer": 0.3617539585870889, "step": 67500 }, { "epoch": 10.99, "learning_rate": 5.620819056942406e-05, "loss": NaN, "step": 67600 }, { "epoch": 10.99, "eval_loss": 0.4412268400192261, "eval_runtime": 8.7502, "eval_samples_per_second": 11.428, "eval_wer": 0.3848964677222899, "step": 67600 }, { "epoch": 11.01, "learning_rate": 5.61429270680372e-05, "loss": NaN, "step": 67700 }, { "epoch": 11.01, "eval_loss": 0.4201769232749939, "eval_runtime": 9.2704, "eval_samples_per_second": 10.787, "eval_wer": 0.364190012180268, "step": 67700 }, { "epoch": 11.03, "learning_rate": 5.607766356665035e-05, "loss": NaN, "step": 67800 }, { "epoch": 11.03, "eval_loss": 0.418453574180603, "eval_runtime": 8.1205, "eval_samples_per_second": 12.315, "eval_wer": 0.37758830694275275, "step": 67800 }, { "epoch": 11.04, "learning_rate": 5.60124000652635e-05, "loss": NaN, "step": 67900 }, { "epoch": 11.04, "eval_loss": 0.4066586196422577, "eval_runtime": 7.045, "eval_samples_per_second": 14.194, "eval_wer": 0.36053593179049936, "step": 67900 }, { "epoch": 11.06, "learning_rate": 5.5947136563876653e-05, "loss": NaN, "step": 68000 }, { "epoch": 11.06, "eval_loss": 0.43720924854278564, "eval_runtime": 8.1791, "eval_samples_per_second": 12.226, "eval_wer": 0.3800243605359318, "step": 68000 }, { "epoch": 11.07, "learning_rate": 5.588187306248981e-05, "loss": NaN, "step": 68100 }, { "epoch": 11.07, "eval_loss": 0.40105950832366943, "eval_runtime": 9.6195, "eval_samples_per_second": 10.396, "eval_wer": 0.37880633373934225, "step": 68100 }, { "epoch": 11.09, "learning_rate": 5.581660956110295e-05, "loss": NaN, "step": 68200 }, { "epoch": 11.09, "eval_loss": 0.365195631980896, "eval_runtime": 6.5706, "eval_samples_per_second": 15.219, "eval_wer": 0.3447015834348356, "step": 68200 }, { "epoch": 11.11, "learning_rate": 5.57513460597161e-05, "loss": NaN, "step": 68300 }, { "epoch": 11.11, "eval_loss": 0.4046388268470764, "eval_runtime": 8.1044, "eval_samples_per_second": 12.339, "eval_wer": 0.3617539585870889, "step": 68300 }, { "epoch": 11.12, "learning_rate": 5.5686082558329254e-05, "loss": NaN, "step": 68400 }, { "epoch": 11.12, "eval_loss": 0.39111071825027466, "eval_runtime": 6.8887, "eval_samples_per_second": 14.517, "eval_wer": 0.35931790499390986, "step": 68400 }, { "epoch": 11.14, "learning_rate": 5.5620819056942406e-05, "loss": NaN, "step": 68500 }, { "epoch": 11.14, "eval_loss": 0.4509762227535248, "eval_runtime": 8.7816, "eval_samples_per_second": 11.388, "eval_wer": 0.36053593179049936, "step": 68500 }, { "epoch": 11.16, "learning_rate": 5.555555555555556e-05, "loss": NaN, "step": 68600 }, { "epoch": 11.16, "eval_loss": 0.43242478370666504, "eval_runtime": 9.8683, "eval_samples_per_second": 10.133, "eval_wer": 0.37271619975639464, "step": 68600 }, { "epoch": 11.17, "learning_rate": 5.549029205416871e-05, "loss": NaN, "step": 68700 }, { "epoch": 11.17, "eval_loss": 0.3907853364944458, "eval_runtime": 7.1506, "eval_samples_per_second": 13.985, "eval_wer": 0.3617539585870889, "step": 68700 }, { "epoch": 11.19, "learning_rate": 5.5425028552781855e-05, "loss": NaN, "step": 68800 }, { "epoch": 11.19, "eval_loss": 0.5252321362495422, "eval_runtime": 7.5772, "eval_samples_per_second": 13.197, "eval_wer": 0.3751522533495737, "step": 68800 }, { "epoch": 11.21, "learning_rate": 5.535976505139501e-05, "loss": NaN, "step": 68900 }, { "epoch": 11.21, "eval_loss": 0.3976127505302429, "eval_runtime": 8.8027, "eval_samples_per_second": 11.36, "eval_wer": 0.35809987819732036, "step": 68900 }, { "epoch": 11.22, "learning_rate": 5.529450155000816e-05, "loss": NaN, "step": 69000 }, { "epoch": 11.22, "eval_loss": 0.3901364505290985, "eval_runtime": 7.7268, "eval_samples_per_second": 12.942, "eval_wer": 0.364190012180268, "step": 69000 }, { "epoch": 11.24, "learning_rate": 5.522923804862131e-05, "loss": NaN, "step": 69100 }, { "epoch": 11.24, "eval_loss": 0.42438361048698425, "eval_runtime": 7.1569, "eval_samples_per_second": 13.972, "eval_wer": 0.3751522533495737, "step": 69100 }, { "epoch": 11.25, "learning_rate": 5.516397454723446e-05, "loss": NaN, "step": 69200 }, { "epoch": 11.25, "eval_loss": 0.4562244415283203, "eval_runtime": 8.5825, "eval_samples_per_second": 11.652, "eval_wer": 0.3800243605359318, "step": 69200 }, { "epoch": 11.27, "learning_rate": 5.5098711045847615e-05, "loss": NaN, "step": 69300 }, { "epoch": 11.27, "eval_loss": 0.4827350974082947, "eval_runtime": 7.0866, "eval_samples_per_second": 14.111, "eval_wer": 0.37149817295980514, "step": 69300 }, { "epoch": 11.29, "learning_rate": 5.503344754446076e-05, "loss": NaN, "step": 69400 }, { "epoch": 11.29, "eval_loss": 0.43090012669563293, "eval_runtime": 7.5916, "eval_samples_per_second": 13.172, "eval_wer": 0.36784409257003653, "step": 69400 }, { "epoch": 11.3, "learning_rate": 5.496818404307391e-05, "loss": NaN, "step": 69500 }, { "epoch": 11.3, "eval_loss": 0.42443668842315674, "eval_runtime": 8.0483, "eval_samples_per_second": 12.425, "eval_wer": 0.36053593179049936, "step": 69500 }, { "epoch": 11.32, "learning_rate": 5.4902920541687064e-05, "loss": NaN, "step": 69600 }, { "epoch": 11.32, "eval_loss": 0.42483994364738464, "eval_runtime": 8.6393, "eval_samples_per_second": 11.575, "eval_wer": 0.37880633373934225, "step": 69600 }, { "epoch": 11.34, "learning_rate": 5.4837657040300216e-05, "loss": NaN, "step": 69700 }, { "epoch": 11.34, "eval_loss": 0.47487872838974, "eval_runtime": 7.5637, "eval_samples_per_second": 13.221, "eval_wer": 0.37149817295980514, "step": 69700 }, { "epoch": 11.35, "learning_rate": 5.477239353891337e-05, "loss": NaN, "step": 69800 }, { "epoch": 11.35, "eval_loss": 0.4218917191028595, "eval_runtime": 9.9857, "eval_samples_per_second": 10.014, "eval_wer": 0.3995127892813642, "step": 69800 }, { "epoch": 11.37, "learning_rate": 5.470713003752651e-05, "loss": NaN, "step": 69900 }, { "epoch": 11.37, "eval_loss": 0.4314954876899719, "eval_runtime": 9.0835, "eval_samples_per_second": 11.009, "eval_wer": 0.3751522533495737, "step": 69900 }, { "epoch": 11.38, "learning_rate": 5.4641866536139665e-05, "loss": NaN, "step": 70000 }, { "epoch": 11.38, "eval_loss": 0.38264960050582886, "eval_runtime": 8.6353, "eval_samples_per_second": 11.58, "eval_wer": 0.3751522533495737, "step": 70000 }, { "epoch": 11.4, "learning_rate": 5.457660303475282e-05, "loss": NaN, "step": 70100 }, { "epoch": 11.4, "eval_loss": 0.3891557455062866, "eval_runtime": 8.2828, "eval_samples_per_second": 12.073, "eval_wer": 0.3812423873325213, "step": 70100 }, { "epoch": 11.42, "learning_rate": 5.451133953336597e-05, "loss": NaN, "step": 70200 }, { "epoch": 11.42, "eval_loss": 0.4659789800643921, "eval_runtime": 7.9385, "eval_samples_per_second": 12.597, "eval_wer": 0.37758830694275275, "step": 70200 }, { "epoch": 11.43, "learning_rate": 5.444607603197912e-05, "loss": NaN, "step": 70300 }, { "epoch": 11.43, "eval_loss": 0.4575248062610626, "eval_runtime": 7.6225, "eval_samples_per_second": 13.119, "eval_wer": 0.3702801461632156, "step": 70300 }, { "epoch": 11.45, "learning_rate": 5.438081253059227e-05, "loss": NaN, "step": 70400 }, { "epoch": 11.45, "eval_loss": 0.4173835515975952, "eval_runtime": 7.9279, "eval_samples_per_second": 12.614, "eval_wer": 0.36053593179049936, "step": 70400 }, { "epoch": 11.47, "learning_rate": 5.431554902920542e-05, "loss": NaN, "step": 70500 }, { "epoch": 11.47, "eval_loss": 0.4074372947216034, "eval_runtime": 8.2601, "eval_samples_per_second": 12.106, "eval_wer": 0.3556638246041413, "step": 70500 }, { "epoch": 11.48, "learning_rate": 5.425028552781857e-05, "loss": NaN, "step": 70600 }, { "epoch": 11.48, "eval_loss": 0.4152701497077942, "eval_runtime": 8.2546, "eval_samples_per_second": 12.114, "eval_wer": 0.3617539585870889, "step": 70600 }, { "epoch": 11.5, "learning_rate": 5.418502202643172e-05, "loss": NaN, "step": 70700 }, { "epoch": 11.5, "eval_loss": 0.422438383102417, "eval_runtime": 7.4806, "eval_samples_per_second": 13.368, "eval_wer": 0.3556638246041413, "step": 70700 }, { "epoch": 11.51, "learning_rate": 5.411975852504487e-05, "loss": NaN, "step": 70800 }, { "epoch": 11.51, "eval_loss": 0.40204957127571106, "eval_runtime": 8.0201, "eval_samples_per_second": 12.469, "eval_wer": 0.3654080389768575, "step": 70800 }, { "epoch": 11.53, "learning_rate": 5.4054495023658025e-05, "loss": NaN, "step": 70900 }, { "epoch": 11.53, "eval_loss": 0.4267421066761017, "eval_runtime": 8.9633, "eval_samples_per_second": 11.157, "eval_wer": 0.36053593179049936, "step": 70900 }, { "epoch": 11.55, "learning_rate": 5.398923152227118e-05, "loss": NaN, "step": 71000 }, { "epoch": 11.55, "eval_loss": 0.4199873208999634, "eval_runtime": 8.0756, "eval_samples_per_second": 12.383, "eval_wer": 0.3617539585870889, "step": 71000 }, { "epoch": 11.56, "learning_rate": 5.392396802088432e-05, "loss": NaN, "step": 71100 }, { "epoch": 11.56, "eval_loss": 0.4814501702785492, "eval_runtime": 8.2177, "eval_samples_per_second": 12.169, "eval_wer": 0.3690621193666261, "step": 71100 }, { "epoch": 11.58, "learning_rate": 5.3858704519497474e-05, "loss": NaN, "step": 71200 }, { "epoch": 11.58, "eval_loss": 0.4721526801586151, "eval_runtime": 9.4886, "eval_samples_per_second": 10.539, "eval_wer": 0.36784409257003653, "step": 71200 }, { "epoch": 11.6, "learning_rate": 5.3793441018110626e-05, "loss": NaN, "step": 71300 }, { "epoch": 11.6, "eval_loss": 0.41694724559783936, "eval_runtime": 8.7547, "eval_samples_per_second": 11.422, "eval_wer": 0.3556638246041413, "step": 71300 }, { "epoch": 11.61, "learning_rate": 5.372817751672378e-05, "loss": NaN, "step": 71400 }, { "epoch": 11.61, "eval_loss": 0.43105384707450867, "eval_runtime": 8.4226, "eval_samples_per_second": 11.873, "eval_wer": 0.35322777101096225, "step": 71400 }, { "epoch": 11.63, "learning_rate": 5.366291401533693e-05, "loss": NaN, "step": 71500 }, { "epoch": 11.63, "eval_loss": 0.43795666098594666, "eval_runtime": 7.2699, "eval_samples_per_second": 13.755, "eval_wer": 0.36784409257003653, "step": 71500 }, { "epoch": 11.64, "learning_rate": 5.359765051395007e-05, "loss": NaN, "step": 71600 }, { "epoch": 11.64, "eval_loss": 0.4947461783885956, "eval_runtime": 7.7101, "eval_samples_per_second": 12.97, "eval_wer": 0.36662606577344703, "step": 71600 }, { "epoch": 11.66, "learning_rate": 5.353238701256322e-05, "loss": NaN, "step": 71700 }, { "epoch": 11.66, "eval_loss": 0.4540432095527649, "eval_runtime": 6.9467, "eval_samples_per_second": 14.395, "eval_wer": 0.35931790499390986, "step": 71700 }, { "epoch": 11.68, "learning_rate": 5.346712351117638e-05, "loss": NaN, "step": 71800 }, { "epoch": 11.68, "eval_loss": 0.3812675476074219, "eval_runtime": 7.2252, "eval_samples_per_second": 13.84, "eval_wer": 0.3471376370280146, "step": 71800 }, { "epoch": 11.69, "learning_rate": 5.340186000978953e-05, "loss": NaN, "step": 71900 }, { "epoch": 11.69, "eval_loss": 0.3847273290157318, "eval_runtime": 7.6934, "eval_samples_per_second": 12.998, "eval_wer": 0.3568818514007308, "step": 71900 }, { "epoch": 11.71, "learning_rate": 5.333659650840268e-05, "loss": NaN, "step": 72000 }, { "epoch": 11.71, "eval_loss": 0.4283711910247803, "eval_runtime": 8.7201, "eval_samples_per_second": 11.468, "eval_wer": 0.3751522533495737, "step": 72000 }, { "epoch": 11.73, "learning_rate": 5.3271333007015835e-05, "loss": NaN, "step": 72100 }, { "epoch": 11.73, "eval_loss": 0.4184917211532593, "eval_runtime": 7.324, "eval_samples_per_second": 13.654, "eval_wer": 0.3568818514007308, "step": 72100 }, { "epoch": 11.74, "learning_rate": 5.320606950562897e-05, "loss": NaN, "step": 72200 }, { "epoch": 11.74, "eval_loss": 0.4423336088657379, "eval_runtime": 8.1944, "eval_samples_per_second": 12.203, "eval_wer": 0.37758830694275275, "step": 72200 }, { "epoch": 11.76, "learning_rate": 5.3140806004242125e-05, "loss": NaN, "step": 72300 }, { "epoch": 11.76, "eval_loss": 0.3999084234237671, "eval_runtime": 8.6145, "eval_samples_per_second": 11.608, "eval_wer": 0.36053593179049936, "step": 72300 }, { "epoch": 11.77, "learning_rate": 5.307554250285528e-05, "loss": NaN, "step": 72400 }, { "epoch": 11.77, "eval_loss": 0.428960919380188, "eval_runtime": 7.2399, "eval_samples_per_second": 13.812, "eval_wer": 0.36053593179049936, "step": 72400 }, { "epoch": 11.79, "learning_rate": 5.3010279001468436e-05, "loss": NaN, "step": 72500 }, { "epoch": 11.79, "eval_loss": 0.3995371162891388, "eval_runtime": 7.3237, "eval_samples_per_second": 13.654, "eval_wer": 0.35322777101096225, "step": 72500 }, { "epoch": 11.81, "learning_rate": 5.294501550008159e-05, "loss": NaN, "step": 72600 }, { "epoch": 11.81, "eval_loss": 0.3626769185066223, "eval_runtime": 8.6716, "eval_samples_per_second": 11.532, "eval_wer": 0.35322777101096225, "step": 72600 }, { "epoch": 11.82, "learning_rate": 5.287975199869474e-05, "loss": NaN, "step": 72700 }, { "epoch": 11.82, "eval_loss": 0.4408608675003052, "eval_runtime": 8.3313, "eval_samples_per_second": 12.003, "eval_wer": 0.38976857490864797, "step": 72700 }, { "epoch": 11.84, "learning_rate": 5.281448849730788e-05, "loss": NaN, "step": 72800 }, { "epoch": 11.84, "eval_loss": 0.39294520020484924, "eval_runtime": 9.9612, "eval_samples_per_second": 10.039, "eval_wer": 0.36784409257003653, "step": 72800 }, { "epoch": 11.86, "learning_rate": 5.274922499592103e-05, "loss": NaN, "step": 72900 }, { "epoch": 11.86, "eval_loss": 0.4848403036594391, "eval_runtime": 7.6218, "eval_samples_per_second": 13.12, "eval_wer": 0.37149817295980514, "step": 72900 }, { "epoch": 11.87, "learning_rate": 5.268396149453418e-05, "loss": NaN, "step": 73000 }, { "epoch": 11.87, "eval_loss": 0.41433045268058777, "eval_runtime": 8.3506, "eval_samples_per_second": 11.975, "eval_wer": 0.37271619975639464, "step": 73000 }, { "epoch": 11.89, "learning_rate": 5.2618697993147333e-05, "loss": NaN, "step": 73100 }, { "epoch": 11.89, "eval_loss": 0.38409173488616943, "eval_runtime": 7.2038, "eval_samples_per_second": 13.881, "eval_wer": 0.35444579780755175, "step": 73100 }, { "epoch": 11.9, "learning_rate": 5.255343449176049e-05, "loss": NaN, "step": 73200 }, { "epoch": 11.9, "eval_loss": 0.4268048405647278, "eval_runtime": 9.8281, "eval_samples_per_second": 10.175, "eval_wer": 0.38976857490864797, "step": 73200 }, { "epoch": 11.92, "learning_rate": 5.248817099037363e-05, "loss": NaN, "step": 73300 }, { "epoch": 11.92, "eval_loss": 0.43448886275291443, "eval_runtime": 7.4958, "eval_samples_per_second": 13.341, "eval_wer": 0.3556638246041413, "step": 73300 }, { "epoch": 11.94, "learning_rate": 5.242290748898678e-05, "loss": NaN, "step": 73400 }, { "epoch": 11.94, "eval_loss": 0.43121451139450073, "eval_runtime": 9.4109, "eval_samples_per_second": 10.626, "eval_wer": 0.37880633373934225, "step": 73400 }, { "epoch": 11.95, "learning_rate": 5.2357643987599934e-05, "loss": NaN, "step": 73500 }, { "epoch": 11.95, "eval_loss": 0.3783913552761078, "eval_runtime": 7.8278, "eval_samples_per_second": 12.775, "eval_wer": 0.364190012180268, "step": 73500 }, { "epoch": 11.97, "learning_rate": 5.2292380486213086e-05, "loss": NaN, "step": 73600 }, { "epoch": 11.97, "eval_loss": 0.4278438687324524, "eval_runtime": 9.8748, "eval_samples_per_second": 10.127, "eval_wer": 0.32399512789281365, "step": 73600 }, { "epoch": 11.99, "learning_rate": 5.222711698482624e-05, "loss": NaN, "step": 73700 }, { "epoch": 11.99, "eval_loss": 0.3995451331138611, "eval_runtime": 6.8971, "eval_samples_per_second": 14.499, "eval_wer": 0.3629719853836784, "step": 73700 }, { "epoch": 12.0, "learning_rate": 5.21618534834394e-05, "loss": NaN, "step": 73800 }, { "epoch": 12.0, "eval_loss": 0.43313267827033997, "eval_runtime": 6.688, "eval_samples_per_second": 14.952, "eval_wer": 0.36053593179049936, "step": 73800 }, { "epoch": 12.02, "learning_rate": 5.2096589982052535e-05, "loss": NaN, "step": 73900 }, { "epoch": 12.02, "eval_loss": 0.3490147292613983, "eval_runtime": 8.1685, "eval_samples_per_second": 12.242, "eval_wer": 0.3447015834348356, "step": 73900 }, { "epoch": 12.03, "learning_rate": 5.203132648066569e-05, "loss": NaN, "step": 74000 }, { "epoch": 12.03, "eval_loss": 0.37458693981170654, "eval_runtime": 8.6478, "eval_samples_per_second": 11.564, "eval_wer": 0.3520097442143727, "step": 74000 }, { "epoch": 12.05, "learning_rate": 5.196606297927884e-05, "loss": NaN, "step": 74100 }, { "epoch": 12.05, "eval_loss": 0.3997301459312439, "eval_runtime": 9.0658, "eval_samples_per_second": 11.031, "eval_wer": 0.3617539585870889, "step": 74100 }, { "epoch": 12.07, "learning_rate": 5.190079947789199e-05, "loss": NaN, "step": 74200 }, { "epoch": 12.07, "eval_loss": 0.4225488305091858, "eval_runtime": 8.5571, "eval_samples_per_second": 11.686, "eval_wer": 0.364190012180268, "step": 74200 }, { "epoch": 12.08, "learning_rate": 5.183553597650514e-05, "loss": NaN, "step": 74300 }, { "epoch": 12.08, "eval_loss": 0.4431927800178528, "eval_runtime": 7.6665, "eval_samples_per_second": 13.044, "eval_wer": 0.34957369062119364, "step": 74300 }, { "epoch": 12.1, "learning_rate": 5.1770272475118295e-05, "loss": NaN, "step": 74400 }, { "epoch": 12.1, "eval_loss": 0.39965328574180603, "eval_runtime": 6.9617, "eval_samples_per_second": 14.364, "eval_wer": 0.36053593179049936, "step": 74400 }, { "epoch": 12.12, "learning_rate": 5.170500897373144e-05, "loss": NaN, "step": 74500 }, { "epoch": 12.12, "eval_loss": 0.4133952260017395, "eval_runtime": 10.1253, "eval_samples_per_second": 9.876, "eval_wer": 0.36053593179049936, "step": 74500 }, { "epoch": 12.13, "learning_rate": 5.163974547234459e-05, "loss": NaN, "step": 74600 }, { "epoch": 12.13, "eval_loss": 0.436084508895874, "eval_runtime": 9.4077, "eval_samples_per_second": 10.63, "eval_wer": 0.35931790499390986, "step": 74600 }, { "epoch": 12.15, "learning_rate": 5.1574481970957744e-05, "loss": NaN, "step": 74700 }, { "epoch": 12.15, "eval_loss": 0.42807960510253906, "eval_runtime": 8.0262, "eval_samples_per_second": 12.459, "eval_wer": 0.3520097442143727, "step": 74700 }, { "epoch": 12.16, "learning_rate": 5.1509218469570896e-05, "loss": NaN, "step": 74800 }, { "epoch": 12.16, "eval_loss": 0.6679572463035583, "eval_runtime": 9.4255, "eval_samples_per_second": 10.61, "eval_wer": 0.35444579780755175, "step": 74800 }, { "epoch": 12.18, "learning_rate": 5.144395496818405e-05, "loss": NaN, "step": 74900 }, { "epoch": 12.18, "eval_loss": 0.3985752463340759, "eval_runtime": 7.9339, "eval_samples_per_second": 12.604, "eval_wer": 0.35809987819732036, "step": 74900 }, { "epoch": 12.2, "learning_rate": 5.137869146679719e-05, "loss": NaN, "step": 75000 }, { "epoch": 12.2, "eval_loss": 0.3972986936569214, "eval_runtime": 9.0029, "eval_samples_per_second": 11.108, "eval_wer": 0.35322777101096225, "step": 75000 }, { "epoch": 12.21, "learning_rate": 5.1313427965410345e-05, "loss": NaN, "step": 75100 }, { "epoch": 12.21, "eval_loss": 0.41875389218330383, "eval_runtime": 7.5122, "eval_samples_per_second": 13.312, "eval_wer": 0.3556638246041413, "step": 75100 }, { "epoch": 12.23, "learning_rate": 5.1248164464023497e-05, "loss": NaN, "step": 75200 }, { "epoch": 12.23, "eval_loss": 0.4159642159938812, "eval_runtime": 7.1412, "eval_samples_per_second": 14.003, "eval_wer": 0.33617539585870887, "step": 75200 }, { "epoch": 12.25, "learning_rate": 5.118290096263665e-05, "loss": NaN, "step": 75300 }, { "epoch": 12.25, "eval_loss": 0.44466495513916016, "eval_runtime": 9.1084, "eval_samples_per_second": 10.979, "eval_wer": 0.34957369062119364, "step": 75300 }, { "epoch": 12.26, "learning_rate": 5.11176374612498e-05, "loss": NaN, "step": 75400 }, { "epoch": 12.26, "eval_loss": 0.45291373133659363, "eval_runtime": 10.9268, "eval_samples_per_second": 9.152, "eval_wer": 0.3654080389768575, "step": 75400 }, { "epoch": 12.28, "learning_rate": 5.105237395986295e-05, "loss": NaN, "step": 75500 }, { "epoch": 12.28, "eval_loss": 0.429513156414032, "eval_runtime": 7.1347, "eval_samples_per_second": 14.016, "eval_wer": 0.3507917174177832, "step": 75500 }, { "epoch": 12.29, "learning_rate": 5.09871104584761e-05, "loss": NaN, "step": 75600 }, { "epoch": 12.29, "eval_loss": 0.43607571721076965, "eval_runtime": 8.106, "eval_samples_per_second": 12.336, "eval_wer": 0.36662606577344703, "step": 75600 }, { "epoch": 12.31, "learning_rate": 5.092184695708925e-05, "loss": NaN, "step": 75700 }, { "epoch": 12.31, "eval_loss": 0.505099356174469, "eval_runtime": 9.0741, "eval_samples_per_second": 11.02, "eval_wer": 0.36053593179049936, "step": 75700 }, { "epoch": 12.33, "learning_rate": 5.08565834557024e-05, "loss": NaN, "step": 75800 }, { "epoch": 12.33, "eval_loss": 0.5338563919067383, "eval_runtime": 9.1994, "eval_samples_per_second": 10.87, "eval_wer": 0.35322777101096225, "step": 75800 }, { "epoch": 12.34, "learning_rate": 5.079131995431555e-05, "loss": NaN, "step": 75900 }, { "epoch": 12.34, "eval_loss": 0.43960484862327576, "eval_runtime": 10.6506, "eval_samples_per_second": 9.389, "eval_wer": 0.364190012180268, "step": 75900 }, { "epoch": 12.36, "learning_rate": 5.0726056452928705e-05, "loss": NaN, "step": 76000 }, { "epoch": 12.36, "eval_loss": 0.4200018644332886, "eval_runtime": 8.4143, "eval_samples_per_second": 11.885, "eval_wer": 0.3459196102314251, "step": 76000 }, { "epoch": 12.38, "learning_rate": 5.066079295154186e-05, "loss": NaN, "step": 76100 }, { "epoch": 12.38, "eval_loss": 0.44790372252464294, "eval_runtime": 9.2667, "eval_samples_per_second": 10.791, "eval_wer": 0.36053593179049936, "step": 76100 }, { "epoch": 12.39, "learning_rate": 5.0595529450155e-05, "loss": NaN, "step": 76200 }, { "epoch": 12.39, "eval_loss": 0.4088483154773712, "eval_runtime": 9.4703, "eval_samples_per_second": 10.559, "eval_wer": 0.35809987819732036, "step": 76200 }, { "epoch": 12.41, "learning_rate": 5.0530265948768154e-05, "loss": NaN, "step": 76300 }, { "epoch": 12.41, "eval_loss": 0.4267137944698334, "eval_runtime": 8.6069, "eval_samples_per_second": 11.619, "eval_wer": 0.3763702801461632, "step": 76300 }, { "epoch": 12.42, "learning_rate": 5.0465002447381306e-05, "loss": NaN, "step": 76400 }, { "epoch": 12.42, "eval_loss": 0.4056796133518219, "eval_runtime": 7.7712, "eval_samples_per_second": 12.868, "eval_wer": 0.37149817295980514, "step": 76400 }, { "epoch": 12.44, "learning_rate": 5.039973894599446e-05, "loss": NaN, "step": 76500 }, { "epoch": 12.44, "eval_loss": 0.3797760307788849, "eval_runtime": 8.4756, "eval_samples_per_second": 11.799, "eval_wer": 0.341047503045067, "step": 76500 }, { "epoch": 12.46, "learning_rate": 5.033447544460761e-05, "loss": NaN, "step": 76600 }, { "epoch": 12.46, "eval_loss": 0.3841753900051117, "eval_runtime": 9.2622, "eval_samples_per_second": 10.797, "eval_wer": 0.3617539585870889, "step": 76600 }, { "epoch": 12.47, "learning_rate": 5.026921194322075e-05, "loss": NaN, "step": 76700 }, { "epoch": 12.47, "eval_loss": 0.3942345380783081, "eval_runtime": 7.1118, "eval_samples_per_second": 14.061, "eval_wer": 0.3459196102314251, "step": 76700 }, { "epoch": 12.49, "learning_rate": 5.02039484418339e-05, "loss": NaN, "step": 76800 }, { "epoch": 12.49, "eval_loss": 0.4500068426132202, "eval_runtime": 8.7652, "eval_samples_per_second": 11.409, "eval_wer": 0.36784409257003653, "step": 76800 }, { "epoch": 12.51, "learning_rate": 5.013868494044706e-05, "loss": NaN, "step": 76900 }, { "epoch": 12.51, "eval_loss": 0.36947688460350037, "eval_runtime": 7.5264, "eval_samples_per_second": 13.286, "eval_wer": 0.35322777101096225, "step": 76900 }, { "epoch": 12.52, "learning_rate": 5.007342143906021e-05, "loss": NaN, "step": 77000 }, { "epoch": 12.52, "eval_loss": 0.4559879004955292, "eval_runtime": 7.0948, "eval_samples_per_second": 14.095, "eval_wer": 0.36053593179049936, "step": 77000 }, { "epoch": 12.54, "learning_rate": 5.000815793767336e-05, "loss": NaN, "step": 77100 }, { "epoch": 12.54, "eval_loss": 0.4029790759086609, "eval_runtime": 8.456, "eval_samples_per_second": 11.826, "eval_wer": 0.34835566382460414, "step": 77100 }, { "epoch": 12.55, "learning_rate": 4.994289443628651e-05, "loss": NaN, "step": 77200 }, { "epoch": 12.55, "eval_loss": 0.3982163369655609, "eval_runtime": 7.6143, "eval_samples_per_second": 13.133, "eval_wer": 0.34226552984165654, "step": 77200 }, { "epoch": 12.57, "learning_rate": 4.987763093489966e-05, "loss": NaN, "step": 77300 }, { "epoch": 12.57, "eval_loss": 0.5170900225639343, "eval_runtime": 8.925, "eval_samples_per_second": 11.204, "eval_wer": 0.36784409257003653, "step": 77300 }, { "epoch": 12.59, "learning_rate": 4.9812367433512805e-05, "loss": NaN, "step": 77400 }, { "epoch": 12.59, "eval_loss": 0.42326900362968445, "eval_runtime": 8.9522, "eval_samples_per_second": 11.17, "eval_wer": 0.35931790499390986, "step": 77400 }, { "epoch": 12.6, "learning_rate": 4.9747103932125964e-05, "loss": NaN, "step": 77500 }, { "epoch": 12.6, "eval_loss": 0.4721744656562805, "eval_runtime": 9.3092, "eval_samples_per_second": 10.742, "eval_wer": 0.3763702801461632, "step": 77500 }, { "epoch": 12.62, "learning_rate": 4.9681840430739115e-05, "loss": NaN, "step": 77600 }, { "epoch": 12.62, "eval_loss": 0.40708309412002563, "eval_runtime": 8.9646, "eval_samples_per_second": 11.155, "eval_wer": 0.36053593179049936, "step": 77600 }, { "epoch": 12.64, "learning_rate": 4.961657692935226e-05, "loss": NaN, "step": 77700 }, { "epoch": 12.64, "eval_loss": 0.3885576128959656, "eval_runtime": 6.9779, "eval_samples_per_second": 14.331, "eval_wer": 0.3471376370280146, "step": 77700 }, { "epoch": 12.65, "learning_rate": 4.955131342796541e-05, "loss": NaN, "step": 77800 }, { "epoch": 12.65, "eval_loss": 0.39132988452911377, "eval_runtime": 9.1207, "eval_samples_per_second": 10.964, "eval_wer": 0.33617539585870887, "step": 77800 }, { "epoch": 12.67, "learning_rate": 4.9486049926578564e-05, "loss": NaN, "step": 77900 }, { "epoch": 12.67, "eval_loss": 0.40842190384864807, "eval_runtime": 7.0913, "eval_samples_per_second": 14.102, "eval_wer": 0.35809987819732036, "step": 77900 }, { "epoch": 12.68, "learning_rate": 4.942078642519171e-05, "loss": NaN, "step": 78000 }, { "epoch": 12.68, "eval_loss": 0.3725109398365021, "eval_runtime": 7.7538, "eval_samples_per_second": 12.897, "eval_wer": 0.35809987819732036, "step": 78000 }, { "epoch": 12.7, "learning_rate": 4.935552292380486e-05, "loss": NaN, "step": 78100 }, { "epoch": 12.7, "eval_loss": 0.5190932750701904, "eval_runtime": 8.1388, "eval_samples_per_second": 12.287, "eval_wer": 0.34835566382460414, "step": 78100 }, { "epoch": 12.72, "learning_rate": 4.929025942241802e-05, "loss": NaN, "step": 78200 }, { "epoch": 12.72, "eval_loss": 0.37530940771102905, "eval_runtime": 7.1222, "eval_samples_per_second": 14.041, "eval_wer": 0.35322777101096225, "step": 78200 }, { "epoch": 12.73, "learning_rate": 4.9224995921031165e-05, "loss": NaN, "step": 78300 }, { "epoch": 12.73, "eval_loss": 0.4114912748336792, "eval_runtime": 7.8419, "eval_samples_per_second": 12.752, "eval_wer": 0.36053593179049936, "step": 78300 }, { "epoch": 12.75, "learning_rate": 4.915973241964432e-05, "loss": NaN, "step": 78400 }, { "epoch": 12.75, "eval_loss": 0.4053696095943451, "eval_runtime": 6.6142, "eval_samples_per_second": 15.119, "eval_wer": 0.3507917174177832, "step": 78400 }, { "epoch": 12.77, "learning_rate": 4.909446891825747e-05, "loss": NaN, "step": 78500 }, { "epoch": 12.77, "eval_loss": 0.39146101474761963, "eval_runtime": 9.407, "eval_samples_per_second": 10.63, "eval_wer": 0.3556638246041413, "step": 78500 }, { "epoch": 12.78, "learning_rate": 4.9029205416870614e-05, "loss": NaN, "step": 78600 }, { "epoch": 12.78, "eval_loss": 0.40449854731559753, "eval_runtime": 7.3375, "eval_samples_per_second": 13.629, "eval_wer": 0.3568818514007308, "step": 78600 }, { "epoch": 12.8, "learning_rate": 4.8963941915483766e-05, "loss": NaN, "step": 78700 }, { "epoch": 12.8, "eval_loss": 0.4020620584487915, "eval_runtime": 10.3327, "eval_samples_per_second": 9.678, "eval_wer": 0.35809987819732036, "step": 78700 }, { "epoch": 12.82, "learning_rate": 4.889867841409692e-05, "loss": NaN, "step": 78800 }, { "epoch": 12.82, "eval_loss": 0.39416953921318054, "eval_runtime": 7.3981, "eval_samples_per_second": 13.517, "eval_wer": 0.3507917174177832, "step": 78800 }, { "epoch": 12.83, "learning_rate": 4.883341491271007e-05, "loss": NaN, "step": 78900 }, { "epoch": 12.83, "eval_loss": 0.3987289369106293, "eval_runtime": 8.9882, "eval_samples_per_second": 11.126, "eval_wer": 0.3507917174177832, "step": 78900 }, { "epoch": 12.85, "learning_rate": 4.876815141132322e-05, "loss": NaN, "step": 79000 }, { "epoch": 12.85, "eval_loss": 0.3875060975551605, "eval_runtime": 8.7165, "eval_samples_per_second": 11.472, "eval_wer": 0.35809987819732036, "step": 79000 }, { "epoch": 12.86, "learning_rate": 4.870288790993637e-05, "loss": NaN, "step": 79100 }, { "epoch": 12.86, "eval_loss": 0.4113094210624695, "eval_runtime": 9.2773, "eval_samples_per_second": 10.779, "eval_wer": 0.3702801461632156, "step": 79100 }, { "epoch": 12.88, "learning_rate": 4.863762440854952e-05, "loss": NaN, "step": 79200 }, { "epoch": 12.88, "eval_loss": 0.4063952565193176, "eval_runtime": 8.6562, "eval_samples_per_second": 11.552, "eval_wer": 0.3751522533495737, "step": 79200 }, { "epoch": 12.9, "learning_rate": 4.857236090716267e-05, "loss": NaN, "step": 79300 }, { "epoch": 12.9, "eval_loss": 0.3837190270423889, "eval_runtime": 7.4933, "eval_samples_per_second": 13.345, "eval_wer": 0.3568818514007308, "step": 79300 }, { "epoch": 12.91, "learning_rate": 4.850709740577582e-05, "loss": NaN, "step": 79400 }, { "epoch": 12.91, "eval_loss": 0.40857169032096863, "eval_runtime": 8.4689, "eval_samples_per_second": 11.808, "eval_wer": 0.3568818514007308, "step": 79400 }, { "epoch": 12.93, "learning_rate": 4.8441833904388975e-05, "loss": NaN, "step": 79500 }, { "epoch": 12.93, "eval_loss": 0.3926541209220886, "eval_runtime": 6.7162, "eval_samples_per_second": 14.889, "eval_wer": 0.3459196102314251, "step": 79500 }, { "epoch": 12.95, "learning_rate": 4.837657040300213e-05, "loss": NaN, "step": 79600 }, { "epoch": 12.95, "eval_loss": 0.4522092044353485, "eval_runtime": 8.4503, "eval_samples_per_second": 11.834, "eval_wer": 0.35322777101096225, "step": 79600 }, { "epoch": 12.96, "learning_rate": 4.831130690161527e-05, "loss": NaN, "step": 79700 }, { "epoch": 12.96, "eval_loss": 0.4004019498825073, "eval_runtime": 7.2333, "eval_samples_per_second": 13.825, "eval_wer": 0.35809987819732036, "step": 79700 }, { "epoch": 12.98, "learning_rate": 4.8246043400228424e-05, "loss": NaN, "step": 79800 }, { "epoch": 12.98, "eval_loss": 0.36814793944358826, "eval_runtime": 9.1464, "eval_samples_per_second": 10.933, "eval_wer": 0.34348355663824603, "step": 79800 }, { "epoch": 12.99, "learning_rate": 4.8180779898841576e-05, "loss": NaN, "step": 79900 }, { "epoch": 12.99, "eval_loss": 0.3880935609340668, "eval_runtime": 8.0402, "eval_samples_per_second": 12.438, "eval_wer": 0.364190012180268, "step": 79900 }, { "epoch": 13.01, "learning_rate": 4.811551639745472e-05, "loss": NaN, "step": 80000 }, { "epoch": 13.01, "eval_loss": 0.39711371064186096, "eval_runtime": 8.0714, "eval_samples_per_second": 12.389, "eval_wer": 0.3520097442143727, "step": 80000 }, { "epoch": 13.03, "learning_rate": 4.805025289606788e-05, "loss": NaN, "step": 80100 }, { "epoch": 13.03, "eval_loss": 0.4093989133834839, "eval_runtime": 8.8057, "eval_samples_per_second": 11.356, "eval_wer": 0.3568818514007308, "step": 80100 }, { "epoch": 13.04, "learning_rate": 4.798498939468103e-05, "loss": NaN, "step": 80200 }, { "epoch": 13.04, "eval_loss": 0.39422935247421265, "eval_runtime": 8.3368, "eval_samples_per_second": 11.995, "eval_wer": 0.36784409257003653, "step": 80200 }, { "epoch": 13.06, "learning_rate": 4.7919725893294177e-05, "loss": NaN, "step": 80300 }, { "epoch": 13.06, "eval_loss": 0.40601789951324463, "eval_runtime": 7.678, "eval_samples_per_second": 13.024, "eval_wer": 0.36053593179049936, "step": 80300 }, { "epoch": 13.08, "learning_rate": 4.785446239190733e-05, "loss": NaN, "step": 80400 }, { "epoch": 13.08, "eval_loss": 0.42190930247306824, "eval_runtime": 7.1522, "eval_samples_per_second": 13.982, "eval_wer": 0.3568818514007308, "step": 80400 }, { "epoch": 13.09, "learning_rate": 4.778919889052048e-05, "loss": NaN, "step": 80500 }, { "epoch": 13.09, "eval_loss": 0.45500144362449646, "eval_runtime": 7.293, "eval_samples_per_second": 13.712, "eval_wer": 0.3568818514007308, "step": 80500 }, { "epoch": 13.11, "learning_rate": 4.7723935389133625e-05, "loss": NaN, "step": 80600 }, { "epoch": 13.11, "eval_loss": 0.4279215335845947, "eval_runtime": 8.0851, "eval_samples_per_second": 12.368, "eval_wer": 0.364190012180268, "step": 80600 }, { "epoch": 13.12, "learning_rate": 4.7658671887746784e-05, "loss": NaN, "step": 80700 }, { "epoch": 13.12, "eval_loss": 0.379155695438385, "eval_runtime": 8.3158, "eval_samples_per_second": 12.025, "eval_wer": 0.3447015834348356, "step": 80700 }, { "epoch": 13.14, "learning_rate": 4.759340838635993e-05, "loss": NaN, "step": 80800 }, { "epoch": 13.14, "eval_loss": 0.41694533824920654, "eval_runtime": 9.1011, "eval_samples_per_second": 10.988, "eval_wer": 0.3702801461632156, "step": 80800 }, { "epoch": 13.16, "learning_rate": 4.752814488497308e-05, "loss": NaN, "step": 80900 }, { "epoch": 13.16, "eval_loss": 0.43820008635520935, "eval_runtime": 8.0662, "eval_samples_per_second": 12.397, "eval_wer": 0.35931790499390986, "step": 80900 }, { "epoch": 13.17, "learning_rate": 4.746288138358623e-05, "loss": NaN, "step": 81000 }, { "epoch": 13.17, "eval_loss": 0.38130292296409607, "eval_runtime": 6.6507, "eval_samples_per_second": 15.036, "eval_wer": 0.3471376370280146, "step": 81000 }, { "epoch": 13.19, "learning_rate": 4.739761788219938e-05, "loss": NaN, "step": 81100 }, { "epoch": 13.19, "eval_loss": 0.4210968315601349, "eval_runtime": 8.56, "eval_samples_per_second": 11.682, "eval_wer": 0.35322777101096225, "step": 81100 }, { "epoch": 13.21, "learning_rate": 4.733235438081253e-05, "loss": NaN, "step": 81200 }, { "epoch": 13.21, "eval_loss": 0.379304438829422, "eval_runtime": 7.6806, "eval_samples_per_second": 13.02, "eval_wer": 0.3373934226552984, "step": 81200 }, { "epoch": 13.22, "learning_rate": 4.726709087942568e-05, "loss": NaN, "step": 81300 }, { "epoch": 13.22, "eval_loss": 0.4642069935798645, "eval_runtime": 7.3598, "eval_samples_per_second": 13.587, "eval_wer": 0.3629719853836784, "step": 81300 }, { "epoch": 13.24, "learning_rate": 4.7201827378038834e-05, "loss": NaN, "step": 81400 }, { "epoch": 13.24, "eval_loss": 0.39892637729644775, "eval_runtime": 8.1349, "eval_samples_per_second": 12.293, "eval_wer": 0.35444579780755175, "step": 81400 }, { "epoch": 13.25, "learning_rate": 4.7136563876651986e-05, "loss": NaN, "step": 81500 }, { "epoch": 13.25, "eval_loss": 0.3699035942554474, "eval_runtime": 7.0381, "eval_samples_per_second": 14.208, "eval_wer": 0.3386114494518879, "step": 81500 }, { "epoch": 13.27, "learning_rate": 4.707130037526514e-05, "loss": NaN, "step": 81600 }, { "epoch": 13.27, "eval_loss": 0.4748342037200928, "eval_runtime": 8.5553, "eval_samples_per_second": 11.689, "eval_wer": 0.3654080389768575, "step": 81600 }, { "epoch": 13.29, "learning_rate": 4.700603687387828e-05, "loss": NaN, "step": 81700 }, { "epoch": 13.29, "eval_loss": 0.4026525616645813, "eval_runtime": 6.9498, "eval_samples_per_second": 14.389, "eval_wer": 0.36053593179049936, "step": 81700 }, { "epoch": 13.3, "learning_rate": 4.6940773372491435e-05, "loss": NaN, "step": 81800 }, { "epoch": 13.3, "eval_loss": 0.4426953196525574, "eval_runtime": 9.5632, "eval_samples_per_second": 10.457, "eval_wer": 0.36053593179049936, "step": 81800 }, { "epoch": 13.32, "learning_rate": 4.687550987110459e-05, "loss": NaN, "step": 81900 }, { "epoch": 13.32, "eval_loss": 0.4907471835613251, "eval_runtime": 9.1012, "eval_samples_per_second": 10.988, "eval_wer": 0.38246041412911086, "step": 81900 }, { "epoch": 13.34, "learning_rate": 4.681024636971774e-05, "loss": NaN, "step": 82000 }, { "epoch": 13.34, "eval_loss": 0.39570945501327515, "eval_runtime": 9.1482, "eval_samples_per_second": 10.931, "eval_wer": 0.35931790499390986, "step": 82000 }, { "epoch": 13.35, "learning_rate": 4.674498286833089e-05, "loss": NaN, "step": 82100 }, { "epoch": 13.35, "eval_loss": 0.39692896604537964, "eval_runtime": 8.067, "eval_samples_per_second": 12.396, "eval_wer": 0.3520097442143727, "step": 82100 }, { "epoch": 13.37, "learning_rate": 4.667971936694404e-05, "loss": NaN, "step": 82200 }, { "epoch": 13.37, "eval_loss": 0.41192084550857544, "eval_runtime": 8.128, "eval_samples_per_second": 12.303, "eval_wer": 0.3617539585870889, "step": 82200 }, { "epoch": 13.38, "learning_rate": 4.661445586555719e-05, "loss": NaN, "step": 82300 }, { "epoch": 13.38, "eval_loss": 0.38953062891960144, "eval_runtime": 9.918, "eval_samples_per_second": 10.083, "eval_wer": 0.36053593179049936, "step": 82300 }, { "epoch": 13.4, "learning_rate": 4.654919236417034e-05, "loss": NaN, "step": 82400 }, { "epoch": 13.4, "eval_loss": 0.37186986207962036, "eval_runtime": 8.1376, "eval_samples_per_second": 12.289, "eval_wer": 0.34835566382460414, "step": 82400 }, { "epoch": 13.42, "learning_rate": 4.6483928862783485e-05, "loss": NaN, "step": 82500 }, { "epoch": 13.42, "eval_loss": 0.40984976291656494, "eval_runtime": 8.9721, "eval_samples_per_second": 11.146, "eval_wer": 0.34226552984165654, "step": 82500 }, { "epoch": 13.43, "learning_rate": 4.6418665361396643e-05, "loss": NaN, "step": 82600 }, { "epoch": 13.43, "eval_loss": 0.4037730097770691, "eval_runtime": 6.8614, "eval_samples_per_second": 14.574, "eval_wer": 0.34226552984165654, "step": 82600 }, { "epoch": 13.45, "learning_rate": 4.6353401860009795e-05, "loss": NaN, "step": 82700 }, { "epoch": 13.45, "eval_loss": 0.38672852516174316, "eval_runtime": 7.8242, "eval_samples_per_second": 12.781, "eval_wer": 0.3556638246041413, "step": 82700 }, { "epoch": 13.47, "learning_rate": 4.628813835862294e-05, "loss": NaN, "step": 82800 }, { "epoch": 13.47, "eval_loss": 0.41303497552871704, "eval_runtime": 7.7371, "eval_samples_per_second": 12.925, "eval_wer": 0.34957369062119364, "step": 82800 }, { "epoch": 13.48, "learning_rate": 4.622287485723609e-05, "loss": NaN, "step": 82900 }, { "epoch": 13.48, "eval_loss": 0.3807326853275299, "eval_runtime": 8.6603, "eval_samples_per_second": 11.547, "eval_wer": 0.35444579780755175, "step": 82900 }, { "epoch": 13.5, "learning_rate": 4.6157611355849244e-05, "loss": NaN, "step": 83000 }, { "epoch": 13.5, "eval_loss": 0.3885740637779236, "eval_runtime": 8.1938, "eval_samples_per_second": 12.204, "eval_wer": 0.34348355663824603, "step": 83000 }, { "epoch": 13.51, "learning_rate": 4.609234785446239e-05, "loss": NaN, "step": 83100 }, { "epoch": 13.51, "eval_loss": 0.40991002321243286, "eval_runtime": 8.0699, "eval_samples_per_second": 12.392, "eval_wer": 0.34957369062119364, "step": 83100 }, { "epoch": 13.53, "learning_rate": 4.602708435307554e-05, "loss": NaN, "step": 83200 }, { "epoch": 13.53, "eval_loss": 0.45967453718185425, "eval_runtime": 9.6326, "eval_samples_per_second": 10.381, "eval_wer": 0.3654080389768575, "step": 83200 }, { "epoch": 13.55, "learning_rate": 4.59618208516887e-05, "loss": NaN, "step": 83300 }, { "epoch": 13.55, "eval_loss": 0.41274598240852356, "eval_runtime": 7.4414, "eval_samples_per_second": 13.438, "eval_wer": 0.3520097442143727, "step": 83300 }, { "epoch": 13.56, "learning_rate": 4.5896557350301845e-05, "loss": NaN, "step": 83400 }, { "epoch": 13.56, "eval_loss": 0.39359050989151, "eval_runtime": 7.6776, "eval_samples_per_second": 13.025, "eval_wer": 0.3520097442143727, "step": 83400 }, { "epoch": 13.58, "learning_rate": 4.5831293848915e-05, "loss": NaN, "step": 83500 }, { "epoch": 13.58, "eval_loss": 0.3984470069408417, "eval_runtime": 8.3263, "eval_samples_per_second": 12.01, "eval_wer": 0.3556638246041413, "step": 83500 }, { "epoch": 13.6, "learning_rate": 4.576603034752815e-05, "loss": NaN, "step": 83600 }, { "epoch": 13.6, "eval_loss": 0.39405977725982666, "eval_runtime": 7.0798, "eval_samples_per_second": 14.125, "eval_wer": 0.35809987819732036, "step": 83600 }, { "epoch": 13.61, "learning_rate": 4.5700766846141294e-05, "loss": NaN, "step": 83700 }, { "epoch": 13.61, "eval_loss": 0.45130589604377747, "eval_runtime": 7.6376, "eval_samples_per_second": 13.093, "eval_wer": 0.3629719853836784, "step": 83700 }, { "epoch": 13.63, "learning_rate": 4.5635503344754446e-05, "loss": NaN, "step": 83800 }, { "epoch": 13.63, "eval_loss": 0.4328234791755676, "eval_runtime": 6.7166, "eval_samples_per_second": 14.889, "eval_wer": 0.3520097442143727, "step": 83800 }, { "epoch": 13.64, "learning_rate": 4.55702398433676e-05, "loss": NaN, "step": 83900 }, { "epoch": 13.64, "eval_loss": 0.40169548988342285, "eval_runtime": 8.601, "eval_samples_per_second": 11.626, "eval_wer": 0.35444579780755175, "step": 83900 }, { "epoch": 13.66, "learning_rate": 4.550497634198075e-05, "loss": NaN, "step": 84000 }, { "epoch": 13.66, "eval_loss": 0.40670937299728394, "eval_runtime": 8.6181, "eval_samples_per_second": 11.603, "eval_wer": 0.36662606577344703, "step": 84000 }, { "epoch": 13.68, "learning_rate": 4.54397128405939e-05, "loss": NaN, "step": 84100 }, { "epoch": 13.68, "eval_loss": 0.4055994153022766, "eval_runtime": 8.9478, "eval_samples_per_second": 11.176, "eval_wer": 0.3556638246041413, "step": 84100 }, { "epoch": 13.69, "learning_rate": 4.537444933920705e-05, "loss": NaN, "step": 84200 }, { "epoch": 13.69, "eval_loss": 0.37059950828552246, "eval_runtime": 8.4585, "eval_samples_per_second": 11.822, "eval_wer": 0.3520097442143727, "step": 84200 }, { "epoch": 13.71, "learning_rate": 4.53091858378202e-05, "loss": NaN, "step": 84300 }, { "epoch": 13.71, "eval_loss": 0.3316919207572937, "eval_runtime": 7.6508, "eval_samples_per_second": 13.071, "eval_wer": 0.32521315468940315, "step": 84300 }, { "epoch": 13.73, "learning_rate": 4.524392233643335e-05, "loss": NaN, "step": 84400 }, { "epoch": 13.73, "eval_loss": 0.38926997780799866, "eval_runtime": 7.2992, "eval_samples_per_second": 13.7, "eval_wer": 0.3459196102314251, "step": 84400 }, { "epoch": 13.74, "learning_rate": 4.51786588350465e-05, "loss": NaN, "step": 84500 }, { "epoch": 13.74, "eval_loss": 0.3776205778121948, "eval_runtime": 7.205, "eval_samples_per_second": 13.879, "eval_wer": 0.3398294762484775, "step": 84500 }, { "epoch": 13.76, "learning_rate": 4.5113395333659655e-05, "loss": NaN, "step": 84600 }, { "epoch": 13.76, "eval_loss": 0.4353153705596924, "eval_runtime": 8.1838, "eval_samples_per_second": 12.219, "eval_wer": 0.34957369062119364, "step": 84600 }, { "epoch": 13.77, "learning_rate": 4.5048131832272807e-05, "loss": NaN, "step": 84700 }, { "epoch": 13.77, "eval_loss": 0.3977775573730469, "eval_runtime": 8.5838, "eval_samples_per_second": 11.65, "eval_wer": 0.34226552984165654, "step": 84700 }, { "epoch": 13.79, "learning_rate": 4.498286833088595e-05, "loss": NaN, "step": 84800 }, { "epoch": 13.79, "eval_loss": 0.3765636384487152, "eval_runtime": 7.8414, "eval_samples_per_second": 12.753, "eval_wer": 0.34226552984165654, "step": 84800 }, { "epoch": 13.81, "learning_rate": 4.4917604829499104e-05, "loss": NaN, "step": 84900 }, { "epoch": 13.81, "eval_loss": 0.3906586766242981, "eval_runtime": 9.8562, "eval_samples_per_second": 10.146, "eval_wer": 0.36053593179049936, "step": 84900 }, { "epoch": 13.82, "learning_rate": 4.4852341328112256e-05, "loss": NaN, "step": 85000 }, { "epoch": 13.82, "eval_loss": 0.39076992869377136, "eval_runtime": 7.9184, "eval_samples_per_second": 12.629, "eval_wer": 0.34348355663824603, "step": 85000 }, { "epoch": 13.84, "learning_rate": 4.478707782672541e-05, "loss": NaN, "step": 85100 }, { "epoch": 13.84, "eval_loss": 0.38430699706077576, "eval_runtime": 7.852, "eval_samples_per_second": 12.736, "eval_wer": 0.3471376370280146, "step": 85100 }, { "epoch": 13.86, "learning_rate": 4.472181432533856e-05, "loss": NaN, "step": 85200 }, { "epoch": 13.86, "eval_loss": 0.36845266819000244, "eval_runtime": 7.4373, "eval_samples_per_second": 13.446, "eval_wer": 0.3459196102314251, "step": 85200 }, { "epoch": 13.87, "learning_rate": 4.465655082395171e-05, "loss": NaN, "step": 85300 }, { "epoch": 13.87, "eval_loss": 0.39804258942604065, "eval_runtime": 9.8439, "eval_samples_per_second": 10.159, "eval_wer": 0.3459196102314251, "step": 85300 }, { "epoch": 13.89, "learning_rate": 4.4591287322564856e-05, "loss": NaN, "step": 85400 }, { "epoch": 13.89, "eval_loss": 0.3661288321018219, "eval_runtime": 8.5748, "eval_samples_per_second": 11.662, "eval_wer": 0.3398294762484775, "step": 85400 }, { "epoch": 13.9, "learning_rate": 4.452602382117801e-05, "loss": NaN, "step": 85500 }, { "epoch": 13.9, "eval_loss": 0.3940080404281616, "eval_runtime": 8.4536, "eval_samples_per_second": 11.829, "eval_wer": 0.35444579780755175, "step": 85500 }, { "epoch": 13.92, "learning_rate": 4.446076031979116e-05, "loss": NaN, "step": 85600 }, { "epoch": 13.92, "eval_loss": 0.38597309589385986, "eval_runtime": 7.5301, "eval_samples_per_second": 13.28, "eval_wer": 0.3471376370280146, "step": 85600 }, { "epoch": 13.94, "learning_rate": 4.4395496818404305e-05, "loss": NaN, "step": 85700 }, { "epoch": 13.94, "eval_loss": 0.3475070297718048, "eval_runtime": 7.4895, "eval_samples_per_second": 13.352, "eval_wer": 0.3447015834348356, "step": 85700 }, { "epoch": 13.95, "learning_rate": 4.4330233317017464e-05, "loss": NaN, "step": 85800 }, { "epoch": 13.95, "eval_loss": 0.3472925126552582, "eval_runtime": 7.1585, "eval_samples_per_second": 13.969, "eval_wer": 0.3459196102314251, "step": 85800 }, { "epoch": 13.97, "learning_rate": 4.426496981563061e-05, "loss": NaN, "step": 85900 }, { "epoch": 13.97, "eval_loss": 0.4307803213596344, "eval_runtime": 8.4562, "eval_samples_per_second": 11.826, "eval_wer": 0.35444579780755175, "step": 85900 }, { "epoch": 13.99, "learning_rate": 4.419970631424376e-05, "loss": NaN, "step": 86000 }, { "epoch": 13.99, "eval_loss": 0.3824266791343689, "eval_runtime": 7.6614, "eval_samples_per_second": 13.052, "eval_wer": 0.35444579780755175, "step": 86000 }, { "epoch": 14.0, "learning_rate": 4.413444281285691e-05, "loss": NaN, "step": 86100 }, { "epoch": 14.0, "eval_loss": 0.4147208333015442, "eval_runtime": 8.0603, "eval_samples_per_second": 12.407, "eval_wer": 0.34348355663824603, "step": 86100 }, { "epoch": 14.02, "learning_rate": 4.406917931147006e-05, "loss": NaN, "step": 86200 }, { "epoch": 14.02, "eval_loss": 0.37703704833984375, "eval_runtime": 8.6635, "eval_samples_per_second": 11.543, "eval_wer": 0.35322777101096225, "step": 86200 }, { "epoch": 14.03, "learning_rate": 4.400391581008321e-05, "loss": NaN, "step": 86300 }, { "epoch": 14.03, "eval_loss": 0.38355034589767456, "eval_runtime": 8.3757, "eval_samples_per_second": 11.939, "eval_wer": 0.3507917174177832, "step": 86300 }, { "epoch": 14.05, "learning_rate": 4.393865230869636e-05, "loss": NaN, "step": 86400 }, { "epoch": 14.05, "eval_loss": 0.4052790403366089, "eval_runtime": 9.7614, "eval_samples_per_second": 10.244, "eval_wer": 0.3398294762484775, "step": 86400 }, { "epoch": 14.07, "learning_rate": 4.3873388807309514e-05, "loss": NaN, "step": 86500 }, { "epoch": 14.07, "eval_loss": 0.3577238917350769, "eval_runtime": 7.8702, "eval_samples_per_second": 12.706, "eval_wer": 0.34348355663824603, "step": 86500 }, { "epoch": 14.08, "learning_rate": 4.3808125305922666e-05, "loss": NaN, "step": 86600 }, { "epoch": 14.08, "eval_loss": 0.3567332327365875, "eval_runtime": 8.207, "eval_samples_per_second": 12.185, "eval_wer": 0.3373934226552984, "step": 86600 }, { "epoch": 14.1, "learning_rate": 4.374286180453582e-05, "loss": NaN, "step": 86700 }, { "epoch": 14.1, "eval_loss": 0.46958306431770325, "eval_runtime": 7.2452, "eval_samples_per_second": 13.802, "eval_wer": 0.35444579780755175, "step": 86700 }, { "epoch": 14.12, "learning_rate": 4.367759830314896e-05, "loss": NaN, "step": 86800 }, { "epoch": 14.12, "eval_loss": 0.37138259410858154, "eval_runtime": 8.0019, "eval_samples_per_second": 12.497, "eval_wer": 0.3325213154689403, "step": 86800 }, { "epoch": 14.13, "learning_rate": 4.3612334801762115e-05, "loss": 0.1053, "step": 86900 }, { "epoch": 14.13, "eval_loss": 0.3933388590812683, "eval_runtime": 7.7892, "eval_samples_per_second": 12.838, "eval_wer": 0.35444579780755175, "step": 86900 }, { "epoch": 14.15, "learning_rate": 4.354707130037527e-05, "loss": 0.1085, "step": 87000 }, { "epoch": 14.15, "eval_loss": 0.4454494118690491, "eval_runtime": 9.0708, "eval_samples_per_second": 11.024, "eval_wer": 0.34835566382460414, "step": 87000 }, { "epoch": 14.16, "learning_rate": 4.348180779898842e-05, "loss": 0.1044, "step": 87100 }, { "epoch": 14.16, "eval_loss": 0.35896095633506775, "eval_runtime": 7.3353, "eval_samples_per_second": 13.633, "eval_wer": 0.341047503045067, "step": 87100 }, { "epoch": 14.18, "learning_rate": 4.341654429760157e-05, "loss": 0.1131, "step": 87200 }, { "epoch": 14.18, "eval_loss": 0.4209243655204773, "eval_runtime": 7.4199, "eval_samples_per_second": 13.477, "eval_wer": 0.3459196102314251, "step": 87200 }, { "epoch": 14.2, "learning_rate": 4.335128079621472e-05, "loss": 0.1069, "step": 87300 }, { "epoch": 14.2, "eval_loss": 0.4241653084754944, "eval_runtime": 7.8927, "eval_samples_per_second": 12.67, "eval_wer": 0.341047503045067, "step": 87300 }, { "epoch": 14.21, "learning_rate": 4.328601729482787e-05, "loss": 0.1042, "step": 87400 }, { "epoch": 14.21, "eval_loss": 0.3520914912223816, "eval_runtime": 7.2723, "eval_samples_per_second": 13.751, "eval_wer": 0.3459196102314251, "step": 87400 }, { "epoch": 14.23, "learning_rate": 4.322075379344102e-05, "loss": 0.1017, "step": 87500 }, { "epoch": 14.23, "eval_loss": 0.3735422194004059, "eval_runtime": 7.8531, "eval_samples_per_second": 12.734, "eval_wer": 0.3337393422655298, "step": 87500 }, { "epoch": 14.25, "learning_rate": 4.315549029205417e-05, "loss": 0.099, "step": 87600 }, { "epoch": 14.25, "eval_loss": 0.4072035253047943, "eval_runtime": 6.9486, "eval_samples_per_second": 14.391, "eval_wer": 0.3520097442143727, "step": 87600 }, { "epoch": 14.26, "learning_rate": 4.3090226790667323e-05, "loss": 0.1119, "step": 87700 }, { "epoch": 14.26, "eval_loss": 0.4090457856655121, "eval_runtime": 9.1301, "eval_samples_per_second": 10.953, "eval_wer": 0.33008526187576126, "step": 87700 }, { "epoch": 14.28, "learning_rate": 4.3024963289280475e-05, "loss": 0.1072, "step": 87800 }, { "epoch": 14.28, "eval_loss": 0.3945271372795105, "eval_runtime": 8.9475, "eval_samples_per_second": 11.176, "eval_wer": 0.3556638246041413, "step": 87800 }, { "epoch": 14.3, "learning_rate": 4.295969978789362e-05, "loss": 0.1132, "step": 87900 }, { "epoch": 14.3, "eval_loss": 0.3662361800670624, "eval_runtime": 7.1294, "eval_samples_per_second": 14.026, "eval_wer": 0.33617539585870887, "step": 87900 }, { "epoch": 14.31, "learning_rate": 4.289443628650677e-05, "loss": 0.1037, "step": 88000 }, { "epoch": 14.31, "eval_loss": 0.3741585910320282, "eval_runtime": 7.5993, "eval_samples_per_second": 13.159, "eval_wer": 0.3398294762484775, "step": 88000 }, { "epoch": 14.33, "learning_rate": 4.2829172785119924e-05, "loss": 0.1045, "step": 88100 }, { "epoch": 14.33, "eval_loss": 0.41879794001579285, "eval_runtime": 7.0732, "eval_samples_per_second": 14.138, "eval_wer": 0.3568818514007308, "step": 88100 }, { "epoch": 14.34, "learning_rate": 4.276390928373307e-05, "loss": 0.0999, "step": 88200 }, { "epoch": 14.34, "eval_loss": 0.39614391326904297, "eval_runtime": 9.6972, "eval_samples_per_second": 10.312, "eval_wer": 0.35444579780755175, "step": 88200 }, { "epoch": 14.36, "learning_rate": 4.269864578234623e-05, "loss": 0.1047, "step": 88300 }, { "epoch": 14.36, "eval_loss": 0.3773258328437805, "eval_runtime": 8.0348, "eval_samples_per_second": 12.446, "eval_wer": 0.34835566382460414, "step": 88300 }, { "epoch": 14.38, "learning_rate": 4.263338228095938e-05, "loss": 0.114, "step": 88400 }, { "epoch": 14.38, "eval_loss": 0.37774306535720825, "eval_runtime": 7.4926, "eval_samples_per_second": 13.346, "eval_wer": 0.34835566382460414, "step": 88400 }, { "epoch": 14.39, "learning_rate": 4.2568118779572525e-05, "loss": 0.1038, "step": 88500 }, { "epoch": 14.39, "eval_loss": 0.3713986575603485, "eval_runtime": 7.4849, "eval_samples_per_second": 13.36, "eval_wer": 0.34957369062119364, "step": 88500 }, { "epoch": 14.41, "learning_rate": 4.250285527818568e-05, "loss": 0.0978, "step": 88600 }, { "epoch": 14.41, "eval_loss": 0.3625016510486603, "eval_runtime": 7.1558, "eval_samples_per_second": 13.975, "eval_wer": 0.3398294762484775, "step": 88600 }, { "epoch": 14.43, "learning_rate": 4.243759177679883e-05, "loss": 0.0954, "step": 88700 }, { "epoch": 14.43, "eval_loss": 0.40445342659950256, "eval_runtime": 7.6543, "eval_samples_per_second": 13.064, "eval_wer": 0.34835566382460414, "step": 88700 }, { "epoch": 14.44, "learning_rate": 4.2372328275411974e-05, "loss": 0.1027, "step": 88800 }, { "epoch": 14.44, "eval_loss": 0.4006795585155487, "eval_runtime": 7.2382, "eval_samples_per_second": 13.816, "eval_wer": 0.34226552984165654, "step": 88800 }, { "epoch": 14.46, "learning_rate": 4.2307064774025126e-05, "loss": Infinity, "step": 88900 }, { "epoch": 14.46, "eval_loss": 0.35563650727272034, "eval_runtime": 8.396, "eval_samples_per_second": 11.91, "eval_wer": 0.34957369062119364, "step": 88900 }, { "epoch": 14.47, "learning_rate": 4.2241801272638285e-05, "loss": NaN, "step": 89000 }, { "epoch": 14.47, "eval_loss": 0.3528667688369751, "eval_runtime": 7.9985, "eval_samples_per_second": 12.502, "eval_wer": 0.34835566382460414, "step": 89000 }, { "epoch": 14.49, "learning_rate": 4.217653777125143e-05, "loss": NaN, "step": 89100 }, { "epoch": 14.49, "eval_loss": 0.416147381067276, "eval_runtime": 7.9316, "eval_samples_per_second": 12.608, "eval_wer": 0.35444579780755175, "step": 89100 }, { "epoch": 14.51, "learning_rate": 4.211127426986458e-05, "loss": NaN, "step": 89200 }, { "epoch": 14.51, "eval_loss": 0.4058997631072998, "eval_runtime": 8.2486, "eval_samples_per_second": 12.123, "eval_wer": 0.3520097442143727, "step": 89200 }, { "epoch": 14.52, "learning_rate": 4.204601076847773e-05, "loss": NaN, "step": 89300 }, { "epoch": 14.52, "eval_loss": 0.38170912861824036, "eval_runtime": 9.2084, "eval_samples_per_second": 10.86, "eval_wer": 0.3398294762484775, "step": 89300 }, { "epoch": 14.54, "learning_rate": 4.198074726709088e-05, "loss": NaN, "step": 89400 }, { "epoch": 14.54, "eval_loss": 0.37428218126296997, "eval_runtime": 8.1719, "eval_samples_per_second": 12.237, "eval_wer": 0.341047503045067, "step": 89400 }, { "epoch": 14.56, "learning_rate": 4.191548376570403e-05, "loss": NaN, "step": 89500 }, { "epoch": 14.56, "eval_loss": 0.3986841142177582, "eval_runtime": 10.8754, "eval_samples_per_second": 9.195, "eval_wer": 0.34835566382460414, "step": 89500 }, { "epoch": 14.57, "learning_rate": 4.185022026431718e-05, "loss": NaN, "step": 89600 }, { "epoch": 14.57, "eval_loss": 0.38741618394851685, "eval_runtime": 9.3064, "eval_samples_per_second": 10.745, "eval_wer": 0.3520097442143727, "step": 89600 }, { "epoch": 14.59, "learning_rate": 4.1784956762930335e-05, "loss": NaN, "step": 89700 }, { "epoch": 14.59, "eval_loss": 0.4405732750892639, "eval_runtime": 7.6728, "eval_samples_per_second": 13.033, "eval_wer": 0.3471376370280146, "step": 89700 }, { "epoch": 14.6, "learning_rate": 4.1719693261543487e-05, "loss": NaN, "step": 89800 }, { "epoch": 14.6, "eval_loss": 0.3700186014175415, "eval_runtime": 7.4389, "eval_samples_per_second": 13.443, "eval_wer": 0.341047503045067, "step": 89800 }, { "epoch": 14.62, "learning_rate": 4.165442976015663e-05, "loss": NaN, "step": 89900 }, { "epoch": 14.62, "eval_loss": 0.4012463092803955, "eval_runtime": 8.227, "eval_samples_per_second": 12.155, "eval_wer": 0.3386114494518879, "step": 89900 }, { "epoch": 14.64, "learning_rate": 4.1589166258769784e-05, "loss": NaN, "step": 90000 }, { "epoch": 14.64, "eval_loss": 0.4593057930469513, "eval_runtime": 7.5267, "eval_samples_per_second": 13.286, "eval_wer": 0.3471376370280146, "step": 90000 }, { "epoch": 14.65, "learning_rate": 4.1523902757382936e-05, "loss": NaN, "step": 90100 }, { "epoch": 14.65, "eval_loss": 0.3738018870353699, "eval_runtime": 8.684, "eval_samples_per_second": 11.515, "eval_wer": 0.3325213154689403, "step": 90100 }, { "epoch": 14.67, "learning_rate": 4.145863925599609e-05, "loss": NaN, "step": 90200 }, { "epoch": 14.67, "eval_loss": 0.4285886287689209, "eval_runtime": 8.4528, "eval_samples_per_second": 11.83, "eval_wer": 0.35322777101096225, "step": 90200 }, { "epoch": 14.69, "learning_rate": 4.139337575460924e-05, "loss": NaN, "step": 90300 }, { "epoch": 14.69, "eval_loss": 0.3823952078819275, "eval_runtime": 8.2181, "eval_samples_per_second": 12.168, "eval_wer": 0.33008526187576126, "step": 90300 }, { "epoch": 14.7, "learning_rate": 4.132811225322239e-05, "loss": NaN, "step": 90400 }, { "epoch": 14.7, "eval_loss": 0.4831365644931793, "eval_runtime": 9.718, "eval_samples_per_second": 10.29, "eval_wer": 0.3373934226552984, "step": 90400 }, { "epoch": 14.72, "learning_rate": 4.1262848751835536e-05, "loss": NaN, "step": 90500 }, { "epoch": 14.72, "eval_loss": 0.40132513642311096, "eval_runtime": 8.1178, "eval_samples_per_second": 12.319, "eval_wer": 0.34835566382460414, "step": 90500 }, { "epoch": 14.73, "learning_rate": 4.119758525044869e-05, "loss": NaN, "step": 90600 }, { "epoch": 14.73, "eval_loss": 0.40187588334083557, "eval_runtime": 9.5226, "eval_samples_per_second": 10.501, "eval_wer": 0.35931790499390986, "step": 90600 }, { "epoch": 14.75, "learning_rate": 4.113232174906184e-05, "loss": NaN, "step": 90700 }, { "epoch": 14.75, "eval_loss": 0.46043136715888977, "eval_runtime": 10.1706, "eval_samples_per_second": 9.832, "eval_wer": 0.364190012180268, "step": 90700 }, { "epoch": 14.77, "learning_rate": 4.106705824767499e-05, "loss": NaN, "step": 90800 }, { "epoch": 14.77, "eval_loss": 0.37815314531326294, "eval_runtime": 8.7882, "eval_samples_per_second": 11.379, "eval_wer": 0.3459196102314251, "step": 90800 }, { "epoch": 14.78, "learning_rate": 4.1001794746288144e-05, "loss": NaN, "step": 90900 }, { "epoch": 14.78, "eval_loss": 0.4232279658317566, "eval_runtime": 9.4671, "eval_samples_per_second": 10.563, "eval_wer": 0.3556638246041413, "step": 90900 }, { "epoch": 14.8, "learning_rate": 4.093653124490129e-05, "loss": NaN, "step": 91000 }, { "epoch": 14.8, "eval_loss": 0.42844250798225403, "eval_runtime": 8.6741, "eval_samples_per_second": 11.529, "eval_wer": 0.3654080389768575, "step": 91000 }, { "epoch": 14.82, "learning_rate": 4.087126774351444e-05, "loss": NaN, "step": 91100 }, { "epoch": 14.82, "eval_loss": 0.3949730396270752, "eval_runtime": 7.3535, "eval_samples_per_second": 13.599, "eval_wer": 0.34348355663824603, "step": 91100 }, { "epoch": 14.83, "learning_rate": 4.080600424212759e-05, "loss": NaN, "step": 91200 }, { "epoch": 14.83, "eval_loss": 0.4596826136112213, "eval_runtime": 7.979, "eval_samples_per_second": 12.533, "eval_wer": 0.34226552984165654, "step": 91200 }, { "epoch": 14.85, "learning_rate": 4.074074074074074e-05, "loss": NaN, "step": 91300 }, { "epoch": 14.85, "eval_loss": 0.3969116508960724, "eval_runtime": 7.3471, "eval_samples_per_second": 13.611, "eval_wer": 0.34348355663824603, "step": 91300 }, { "epoch": 14.86, "learning_rate": 4.067547723935389e-05, "loss": NaN, "step": 91400 }, { "epoch": 14.86, "eval_loss": 0.42892399430274963, "eval_runtime": 7.7448, "eval_samples_per_second": 12.912, "eval_wer": 0.33617539585870887, "step": 91400 }, { "epoch": 14.88, "learning_rate": 4.061021373796705e-05, "loss": NaN, "step": 91500 }, { "epoch": 14.88, "eval_loss": 0.3805890679359436, "eval_runtime": 7.337, "eval_samples_per_second": 13.629, "eval_wer": 0.3398294762484775, "step": 91500 }, { "epoch": 14.9, "learning_rate": 4.0544950236580194e-05, "loss": NaN, "step": 91600 }, { "epoch": 14.9, "eval_loss": 0.34959712624549866, "eval_runtime": 9.7552, "eval_samples_per_second": 10.251, "eval_wer": 0.30572472594397077, "step": 91600 }, { "epoch": 14.91, "learning_rate": 4.0479686735193346e-05, "loss": NaN, "step": 91700 }, { "epoch": 14.91, "eval_loss": 0.3602063059806824, "eval_runtime": 6.6405, "eval_samples_per_second": 15.059, "eval_wer": 0.3373934226552984, "step": 91700 }, { "epoch": 14.93, "learning_rate": 4.04144232338065e-05, "loss": NaN, "step": 91800 }, { "epoch": 14.93, "eval_loss": 0.442261666059494, "eval_runtime": 10.1904, "eval_samples_per_second": 9.813, "eval_wer": 0.34835566382460414, "step": 91800 }, { "epoch": 14.95, "learning_rate": 4.034915973241964e-05, "loss": NaN, "step": 91900 }, { "epoch": 14.95, "eval_loss": 0.3955381512641907, "eval_runtime": 9.4798, "eval_samples_per_second": 10.549, "eval_wer": 0.3398294762484775, "step": 91900 }, { "epoch": 14.96, "learning_rate": 4.0283896231032795e-05, "loss": NaN, "step": 92000 }, { "epoch": 14.96, "eval_loss": 0.3891383409500122, "eval_runtime": 8.2087, "eval_samples_per_second": 12.182, "eval_wer": 0.3215590742996346, "step": 92000 }, { "epoch": 14.98, "learning_rate": 4.021863272964595e-05, "loss": NaN, "step": 92100 }, { "epoch": 14.98, "eval_loss": 0.38750743865966797, "eval_runtime": 7.6982, "eval_samples_per_second": 12.99, "eval_wer": 0.3325213154689403, "step": 92100 }, { "epoch": 14.99, "learning_rate": 4.01533692282591e-05, "loss": NaN, "step": 92200 }, { "epoch": 14.99, "eval_loss": 0.45837047696113586, "eval_runtime": 7.4055, "eval_samples_per_second": 13.504, "eval_wer": 0.3507917174177832, "step": 92200 }, { "epoch": 15.01, "learning_rate": 4.008810572687225e-05, "loss": NaN, "step": 92300 }, { "epoch": 15.01, "eval_loss": 0.4188990890979767, "eval_runtime": 8.4196, "eval_samples_per_second": 11.877, "eval_wer": 0.37271619975639464, "step": 92300 }, { "epoch": 15.03, "learning_rate": 4.00228422254854e-05, "loss": NaN, "step": 92400 }, { "epoch": 15.03, "eval_loss": 0.4422924816608429, "eval_runtime": 8.3856, "eval_samples_per_second": 11.925, "eval_wer": 0.35322777101096225, "step": 92400 }, { "epoch": 15.04, "learning_rate": 3.995757872409855e-05, "loss": NaN, "step": 92500 }, { "epoch": 15.04, "eval_loss": 0.414529412984848, "eval_runtime": 8.9456, "eval_samples_per_second": 11.179, "eval_wer": 0.35931790499390986, "step": 92500 }, { "epoch": 15.06, "learning_rate": 3.98923152227117e-05, "loss": NaN, "step": 92600 }, { "epoch": 15.06, "eval_loss": 0.3688591718673706, "eval_runtime": 8.5338, "eval_samples_per_second": 11.718, "eval_wer": 0.33495736906211937, "step": 92600 }, { "epoch": 15.08, "learning_rate": 3.982705172132485e-05, "loss": NaN, "step": 92700 }, { "epoch": 15.08, "eval_loss": 0.396541565656662, "eval_runtime": 8.586, "eval_samples_per_second": 11.647, "eval_wer": 0.3337393422655298, "step": 92700 }, { "epoch": 15.09, "learning_rate": 3.9761788219938e-05, "loss": NaN, "step": 92800 }, { "epoch": 15.09, "eval_loss": 0.4621961712837219, "eval_runtime": 9.2469, "eval_samples_per_second": 10.814, "eval_wer": 0.3507917174177832, "step": 92800 }, { "epoch": 15.11, "learning_rate": 3.9696524718551155e-05, "loss": NaN, "step": 92900 }, { "epoch": 15.11, "eval_loss": 0.39792075753211975, "eval_runtime": 7.6153, "eval_samples_per_second": 13.131, "eval_wer": 0.3447015834348356, "step": 92900 }, { "epoch": 15.12, "learning_rate": 3.96312612171643e-05, "loss": NaN, "step": 93000 }, { "epoch": 15.12, "eval_loss": 0.4314855635166168, "eval_runtime": 8.7472, "eval_samples_per_second": 11.432, "eval_wer": 0.34835566382460414, "step": 93000 }, { "epoch": 15.14, "learning_rate": 3.956599771577745e-05, "loss": NaN, "step": 93100 }, { "epoch": 15.14, "eval_loss": 0.4228772222995758, "eval_runtime": 6.9716, "eval_samples_per_second": 14.344, "eval_wer": 0.34835566382460414, "step": 93100 }, { "epoch": 15.16, "learning_rate": 3.9500734214390604e-05, "loss": NaN, "step": 93200 }, { "epoch": 15.16, "eval_loss": 0.4500848054885864, "eval_runtime": 8.5782, "eval_samples_per_second": 11.657, "eval_wer": 0.3629719853836784, "step": 93200 }, { "epoch": 15.17, "learning_rate": 3.943547071300375e-05, "loss": NaN, "step": 93300 }, { "epoch": 15.17, "eval_loss": 0.4819047451019287, "eval_runtime": 7.8844, "eval_samples_per_second": 12.683, "eval_wer": 0.3313032886723508, "step": 93300 }, { "epoch": 15.19, "learning_rate": 3.937020721161691e-05, "loss": NaN, "step": 93400 }, { "epoch": 15.19, "eval_loss": 0.40653935074806213, "eval_runtime": 8.8297, "eval_samples_per_second": 11.325, "eval_wer": 0.3568818514007308, "step": 93400 }, { "epoch": 15.21, "learning_rate": 3.930494371023006e-05, "loss": NaN, "step": 93500 }, { "epoch": 15.21, "eval_loss": 0.4287218451499939, "eval_runtime": 8.8101, "eval_samples_per_second": 11.351, "eval_wer": 0.3568818514007308, "step": 93500 }, { "epoch": 15.22, "learning_rate": 3.9239680208843205e-05, "loss": NaN, "step": 93600 }, { "epoch": 15.22, "eval_loss": 0.3936750888824463, "eval_runtime": 8.9968, "eval_samples_per_second": 11.115, "eval_wer": 0.33495736906211937, "step": 93600 }, { "epoch": 15.24, "learning_rate": 3.917441670745636e-05, "loss": NaN, "step": 93700 }, { "epoch": 15.24, "eval_loss": 0.4512450098991394, "eval_runtime": 9.9939, "eval_samples_per_second": 10.006, "eval_wer": 0.35444579780755175, "step": 93700 }, { "epoch": 15.25, "learning_rate": 3.910915320606951e-05, "loss": NaN, "step": 93800 }, { "epoch": 15.25, "eval_loss": 0.38099244236946106, "eval_runtime": 8.1003, "eval_samples_per_second": 12.345, "eval_wer": 0.33008526187576126, "step": 93800 }, { "epoch": 15.27, "learning_rate": 3.9043889704682654e-05, "loss": NaN, "step": 93900 }, { "epoch": 15.27, "eval_loss": 0.4231901466846466, "eval_runtime": 8.4197, "eval_samples_per_second": 11.877, "eval_wer": 0.35809987819732036, "step": 93900 }, { "epoch": 15.29, "learning_rate": 3.8978626203295806e-05, "loss": NaN, "step": 94000 }, { "epoch": 15.29, "eval_loss": 0.41978344321250916, "eval_runtime": 9.9333, "eval_samples_per_second": 10.067, "eval_wer": 0.34348355663824603, "step": 94000 }, { "epoch": 15.3, "learning_rate": 3.8913362701908965e-05, "loss": NaN, "step": 94100 }, { "epoch": 15.3, "eval_loss": 0.35810530185699463, "eval_runtime": 8.2325, "eval_samples_per_second": 12.147, "eval_wer": 0.32886723507917176, "step": 94100 }, { "epoch": 15.32, "learning_rate": 3.884809920052211e-05, "loss": NaN, "step": 94200 }, { "epoch": 15.32, "eval_loss": 0.40189048647880554, "eval_runtime": 7.9965, "eval_samples_per_second": 12.505, "eval_wer": 0.3325213154689403, "step": 94200 }, { "epoch": 15.34, "learning_rate": 3.878283569913526e-05, "loss": NaN, "step": 94300 }, { "epoch": 15.34, "eval_loss": 0.39003273844718933, "eval_runtime": 9.1613, "eval_samples_per_second": 10.916, "eval_wer": 0.34835566382460414, "step": 94300 }, { "epoch": 15.35, "learning_rate": 3.871757219774841e-05, "loss": NaN, "step": 94400 }, { "epoch": 15.35, "eval_loss": 0.37178894877433777, "eval_runtime": 8.3496, "eval_samples_per_second": 11.977, "eval_wer": 0.3373934226552984, "step": 94400 }, { "epoch": 15.37, "learning_rate": 3.865230869636156e-05, "loss": NaN, "step": 94500 }, { "epoch": 15.37, "eval_loss": 0.43365535140037537, "eval_runtime": 7.7206, "eval_samples_per_second": 12.952, "eval_wer": 0.3337393422655298, "step": 94500 }, { "epoch": 15.38, "learning_rate": 3.858704519497471e-05, "loss": NaN, "step": 94600 }, { "epoch": 15.38, "eval_loss": 0.4589609205722809, "eval_runtime": 9.1951, "eval_samples_per_second": 10.875, "eval_wer": 0.3507917174177832, "step": 94600 }, { "epoch": 15.4, "learning_rate": 3.852178169358786e-05, "loss": NaN, "step": 94700 }, { "epoch": 15.4, "eval_loss": 0.424941748380661, "eval_runtime": 7.5287, "eval_samples_per_second": 13.283, "eval_wer": 0.34226552984165654, "step": 94700 }, { "epoch": 15.42, "learning_rate": 3.8456518192201015e-05, "loss": NaN, "step": 94800 }, { "epoch": 15.42, "eval_loss": 0.3637240529060364, "eval_runtime": 7.2763, "eval_samples_per_second": 13.743, "eval_wer": 0.33617539585870887, "step": 94800 }, { "epoch": 15.43, "learning_rate": 3.8391254690814166e-05, "loss": NaN, "step": 94900 }, { "epoch": 15.43, "eval_loss": 0.4193127453327179, "eval_runtime": 8.6177, "eval_samples_per_second": 11.604, "eval_wer": 0.34957369062119364, "step": 94900 }, { "epoch": 15.45, "learning_rate": 3.832599118942731e-05, "loss": NaN, "step": 95000 }, { "epoch": 15.45, "eval_loss": 0.4117446839809418, "eval_runtime": 8.8573, "eval_samples_per_second": 11.29, "eval_wer": 0.35322777101096225, "step": 95000 }, { "epoch": 15.47, "learning_rate": 3.8260727688040464e-05, "loss": NaN, "step": 95100 }, { "epoch": 15.47, "eval_loss": 0.4040590226650238, "eval_runtime": 8.3094, "eval_samples_per_second": 12.035, "eval_wer": 0.3325213154689403, "step": 95100 }, { "epoch": 15.48, "learning_rate": 3.8195464186653615e-05, "loss": NaN, "step": 95200 }, { "epoch": 15.48, "eval_loss": 0.4011731445789337, "eval_runtime": 8.1566, "eval_samples_per_second": 12.26, "eval_wer": 0.3447015834348356, "step": 95200 }, { "epoch": 15.5, "learning_rate": 3.813020068526677e-05, "loss": NaN, "step": 95300 }, { "epoch": 15.5, "eval_loss": 0.4071398675441742, "eval_runtime": 8.9786, "eval_samples_per_second": 11.138, "eval_wer": 0.3690621193666261, "step": 95300 }, { "epoch": 15.51, "learning_rate": 3.806493718387992e-05, "loss": NaN, "step": 95400 }, { "epoch": 15.51, "eval_loss": 0.4124356806278229, "eval_runtime": 7.7821, "eval_samples_per_second": 12.85, "eval_wer": 0.36053593179049936, "step": 95400 }, { "epoch": 15.53, "learning_rate": 3.799967368249307e-05, "loss": NaN, "step": 95500 }, { "epoch": 15.53, "eval_loss": 0.43873709440231323, "eval_runtime": 8.5817, "eval_samples_per_second": 11.653, "eval_wer": 0.35322777101096225, "step": 95500 }, { "epoch": 15.55, "learning_rate": 3.7934410181106216e-05, "loss": NaN, "step": 95600 }, { "epoch": 15.55, "eval_loss": 0.43614262342453003, "eval_runtime": 7.3882, "eval_samples_per_second": 13.535, "eval_wer": 0.35322777101096225, "step": 95600 }, { "epoch": 15.56, "learning_rate": 3.786914667971937e-05, "loss": NaN, "step": 95700 }, { "epoch": 15.56, "eval_loss": 0.4307575225830078, "eval_runtime": 7.3712, "eval_samples_per_second": 13.566, "eval_wer": 0.3617539585870889, "step": 95700 }, { "epoch": 15.58, "learning_rate": 3.780388317833252e-05, "loss": NaN, "step": 95800 }, { "epoch": 15.58, "eval_loss": 0.39022716879844666, "eval_runtime": 8.1214, "eval_samples_per_second": 12.313, "eval_wer": 0.34348355663824603, "step": 95800 }, { "epoch": 15.6, "learning_rate": 3.773861967694567e-05, "loss": NaN, "step": 95900 }, { "epoch": 15.6, "eval_loss": 0.5400065779685974, "eval_runtime": 9.4699, "eval_samples_per_second": 10.56, "eval_wer": 0.34226552984165654, "step": 95900 }, { "epoch": 15.61, "learning_rate": 3.7673356175558824e-05, "loss": NaN, "step": 96000 }, { "epoch": 15.61, "eval_loss": 0.4195316433906555, "eval_runtime": 6.7762, "eval_samples_per_second": 14.758, "eval_wer": 0.3471376370280146, "step": 96000 }, { "epoch": 15.63, "learning_rate": 3.760809267417197e-05, "loss": NaN, "step": 96100 }, { "epoch": 15.63, "eval_loss": 0.5240188837051392, "eval_runtime": 7.6344, "eval_samples_per_second": 13.099, "eval_wer": 0.35931790499390986, "step": 96100 }, { "epoch": 15.64, "learning_rate": 3.754282917278512e-05, "loss": NaN, "step": 96200 }, { "epoch": 15.64, "eval_loss": 0.4596652686595917, "eval_runtime": 8.7291, "eval_samples_per_second": 11.456, "eval_wer": 0.3471376370280146, "step": 96200 }, { "epoch": 15.66, "learning_rate": 3.747756567139827e-05, "loss": NaN, "step": 96300 }, { "epoch": 15.66, "eval_loss": 0.5023432374000549, "eval_runtime": 10.5167, "eval_samples_per_second": 9.509, "eval_wer": 0.3459196102314251, "step": 96300 }, { "epoch": 15.68, "learning_rate": 3.741230217001142e-05, "loss": NaN, "step": 96400 }, { "epoch": 15.68, "eval_loss": 0.42950576543807983, "eval_runtime": 9.5929, "eval_samples_per_second": 10.424, "eval_wer": 0.3617539585870889, "step": 96400 }, { "epoch": 15.69, "learning_rate": 3.734703866862457e-05, "loss": NaN, "step": 96500 }, { "epoch": 15.69, "eval_loss": 0.6256393194198608, "eval_runtime": 8.8475, "eval_samples_per_second": 11.303, "eval_wer": 0.3617539585870889, "step": 96500 }, { "epoch": 15.71, "learning_rate": 3.728177516723773e-05, "loss": NaN, "step": 96600 }, { "epoch": 15.71, "eval_loss": 0.40215057134628296, "eval_runtime": 7.4719, "eval_samples_per_second": 13.383, "eval_wer": 0.34835566382460414, "step": 96600 }, { "epoch": 15.73, "learning_rate": 3.7216511665850874e-05, "loss": NaN, "step": 96700 }, { "epoch": 15.73, "eval_loss": 0.5013496279716492, "eval_runtime": 8.1012, "eval_samples_per_second": 12.344, "eval_wer": 0.3520097442143727, "step": 96700 }, { "epoch": 15.74, "learning_rate": 3.7151248164464026e-05, "loss": NaN, "step": 96800 }, { "epoch": 15.74, "eval_loss": 0.4012104868888855, "eval_runtime": 6.7403, "eval_samples_per_second": 14.836, "eval_wer": 0.3459196102314251, "step": 96800 }, { "epoch": 15.76, "learning_rate": 3.708598466307718e-05, "loss": NaN, "step": 96900 }, { "epoch": 15.76, "eval_loss": 0.39129239320755005, "eval_runtime": 7.4628, "eval_samples_per_second": 13.4, "eval_wer": 0.35322777101096225, "step": 96900 }, { "epoch": 15.77, "learning_rate": 3.702072116169032e-05, "loss": NaN, "step": 97000 }, { "epoch": 15.77, "eval_loss": 0.4360794126987457, "eval_runtime": 7.5057, "eval_samples_per_second": 13.323, "eval_wer": 0.35444579780755175, "step": 97000 }, { "epoch": 15.79, "learning_rate": 3.6955457660303475e-05, "loss": NaN, "step": 97100 }, { "epoch": 15.79, "eval_loss": 0.42406460642814636, "eval_runtime": 7.6982, "eval_samples_per_second": 12.99, "eval_wer": 0.3398294762484775, "step": 97100 }, { "epoch": 15.81, "learning_rate": 3.689019415891663e-05, "loss": NaN, "step": 97200 }, { "epoch": 15.81, "eval_loss": 0.4149155020713806, "eval_runtime": 6.9699, "eval_samples_per_second": 14.347, "eval_wer": 0.3556638246041413, "step": 97200 }, { "epoch": 15.82, "learning_rate": 3.682493065752978e-05, "loss": NaN, "step": 97300 }, { "epoch": 15.82, "eval_loss": 0.4104059934616089, "eval_runtime": 7.1554, "eval_samples_per_second": 13.976, "eval_wer": 0.34226552984165654, "step": 97300 }, { "epoch": 15.84, "learning_rate": 3.675966715614293e-05, "loss": NaN, "step": 97400 }, { "epoch": 15.84, "eval_loss": 0.3772718906402588, "eval_runtime": 7.8874, "eval_samples_per_second": 12.678, "eval_wer": 0.3447015834348356, "step": 97400 }, { "epoch": 15.86, "learning_rate": 3.669440365475608e-05, "loss": NaN, "step": 97500 }, { "epoch": 15.86, "eval_loss": 0.37940847873687744, "eval_runtime": 6.9895, "eval_samples_per_second": 14.307, "eval_wer": 0.3373934226552984, "step": 97500 }, { "epoch": 15.87, "learning_rate": 3.662914015336923e-05, "loss": NaN, "step": 97600 }, { "epoch": 15.87, "eval_loss": 0.41447925567626953, "eval_runtime": 7.7777, "eval_samples_per_second": 12.857, "eval_wer": 0.36053593179049936, "step": 97600 }, { "epoch": 15.89, "learning_rate": 3.656387665198238e-05, "loss": NaN, "step": 97700 }, { "epoch": 15.89, "eval_loss": 0.41132599115371704, "eval_runtime": 8.7663, "eval_samples_per_second": 11.407, "eval_wer": 0.37149817295980514, "step": 97700 }, { "epoch": 15.91, "learning_rate": 3.649861315059553e-05, "loss": NaN, "step": 97800 }, { "epoch": 15.91, "eval_loss": 0.5543003678321838, "eval_runtime": 9.1096, "eval_samples_per_second": 10.977, "eval_wer": 0.35444579780755175, "step": 97800 }, { "epoch": 15.92, "learning_rate": 3.643334964920868e-05, "loss": NaN, "step": 97900 }, { "epoch": 15.92, "eval_loss": 0.4039764106273651, "eval_runtime": 8.5411, "eval_samples_per_second": 11.708, "eval_wer": 0.34226552984165654, "step": 97900 }, { "epoch": 15.94, "learning_rate": 3.6368086147821835e-05, "loss": NaN, "step": 98000 }, { "epoch": 15.94, "eval_loss": 0.39489075541496277, "eval_runtime": 7.4333, "eval_samples_per_second": 13.453, "eval_wer": 0.3459196102314251, "step": 98000 }, { "epoch": 15.95, "learning_rate": 3.630282264643498e-05, "loss": NaN, "step": 98100 }, { "epoch": 15.95, "eval_loss": 0.44759106636047363, "eval_runtime": 7.8336, "eval_samples_per_second": 12.766, "eval_wer": 0.35931790499390986, "step": 98100 }, { "epoch": 15.97, "learning_rate": 3.623755914504813e-05, "loss": NaN, "step": 98200 }, { "epoch": 15.97, "eval_loss": 0.42032337188720703, "eval_runtime": 9.2764, "eval_samples_per_second": 10.78, "eval_wer": 0.36053593179049936, "step": 98200 }, { "epoch": 15.99, "learning_rate": 3.6172295643661284e-05, "loss": NaN, "step": 98300 }, { "epoch": 15.99, "eval_loss": 0.3860644996166229, "eval_runtime": 7.7163, "eval_samples_per_second": 12.96, "eval_wer": 0.34226552984165654, "step": 98300 }, { "epoch": 16.0, "learning_rate": 3.6107032142274436e-05, "loss": NaN, "step": 98400 }, { "epoch": 16.0, "eval_loss": 0.5123631954193115, "eval_runtime": 8.6602, "eval_samples_per_second": 11.547, "eval_wer": 0.3459196102314251, "step": 98400 }, { "epoch": 16.02, "learning_rate": 3.604176864088759e-05, "loss": NaN, "step": 98500 }, { "epoch": 16.02, "eval_loss": 0.39611780643463135, "eval_runtime": 7.1716, "eval_samples_per_second": 13.944, "eval_wer": 0.3459196102314251, "step": 98500 }, { "epoch": 16.04, "learning_rate": 3.597650513950074e-05, "loss": NaN, "step": 98600 }, { "epoch": 16.04, "eval_loss": 0.47687721252441406, "eval_runtime": 7.4875, "eval_samples_per_second": 13.356, "eval_wer": 0.3556638246041413, "step": 98600 }, { "epoch": 16.05, "learning_rate": 3.5911241638113885e-05, "loss": NaN, "step": 98700 }, { "epoch": 16.05, "eval_loss": 0.5570668578147888, "eval_runtime": 9.3365, "eval_samples_per_second": 10.711, "eval_wer": 0.35931790499390986, "step": 98700 }, { "epoch": 16.07, "learning_rate": 3.584597813672704e-05, "loss": NaN, "step": 98800 }, { "epoch": 16.07, "eval_loss": 0.4510762691497803, "eval_runtime": 8.9657, "eval_samples_per_second": 11.154, "eval_wer": 0.3629719853836784, "step": 98800 }, { "epoch": 16.08, "learning_rate": 3.578071463534019e-05, "loss": NaN, "step": 98900 }, { "epoch": 16.08, "eval_loss": 0.41739127039909363, "eval_runtime": 8.5583, "eval_samples_per_second": 11.685, "eval_wer": 0.3459196102314251, "step": 98900 }, { "epoch": 16.1, "learning_rate": 3.5715451133953334e-05, "loss": NaN, "step": 99000 }, { "epoch": 16.1, "eval_loss": 0.36998283863067627, "eval_runtime": 9.3054, "eval_samples_per_second": 10.747, "eval_wer": 0.33008526187576126, "step": 99000 }, { "epoch": 16.12, "learning_rate": 3.565018763256649e-05, "loss": NaN, "step": 99100 }, { "epoch": 16.12, "eval_loss": 0.4438319504261017, "eval_runtime": 7.1139, "eval_samples_per_second": 14.057, "eval_wer": 0.35931790499390986, "step": 99100 }, { "epoch": 16.13, "learning_rate": 3.5584924131179645e-05, "loss": NaN, "step": 99200 }, { "epoch": 16.13, "eval_loss": 0.42432862520217896, "eval_runtime": 7.9048, "eval_samples_per_second": 12.651, "eval_wer": 0.30450669914738127, "step": 99200 }, { "epoch": 16.15, "learning_rate": 3.551966062979279e-05, "loss": NaN, "step": 99300 }, { "epoch": 16.15, "eval_loss": 0.39224445819854736, "eval_runtime": 7.1957, "eval_samples_per_second": 13.897, "eval_wer": 0.3447015834348356, "step": 99300 }, { "epoch": 16.17, "learning_rate": 3.545439712840594e-05, "loss": NaN, "step": 99400 }, { "epoch": 16.17, "eval_loss": 0.44131773710250854, "eval_runtime": 8.1898, "eval_samples_per_second": 12.21, "eval_wer": 0.3507917174177832, "step": 99400 }, { "epoch": 16.18, "learning_rate": 3.538913362701909e-05, "loss": NaN, "step": 99500 }, { "epoch": 16.18, "eval_loss": 0.38120517134666443, "eval_runtime": 6.6009, "eval_samples_per_second": 15.149, "eval_wer": 0.3398294762484775, "step": 99500 }, { "epoch": 16.2, "learning_rate": 3.532387012563224e-05, "loss": NaN, "step": 99600 }, { "epoch": 16.2, "eval_loss": 0.4235430955886841, "eval_runtime": 9.0979, "eval_samples_per_second": 10.991, "eval_wer": 0.3447015834348356, "step": 99600 }, { "epoch": 16.21, "learning_rate": 3.525860662424539e-05, "loss": NaN, "step": 99700 }, { "epoch": 16.21, "eval_loss": 0.39221322536468506, "eval_runtime": 7.4156, "eval_samples_per_second": 13.485, "eval_wer": 0.3507917174177832, "step": 99700 }, { "epoch": 16.23, "learning_rate": 3.519334312285854e-05, "loss": NaN, "step": 99800 }, { "epoch": 16.23, "eval_loss": 0.49404698610305786, "eval_runtime": 7.4446, "eval_samples_per_second": 13.433, "eval_wer": 0.3556638246041413, "step": 99800 }, { "epoch": 16.25, "learning_rate": 3.5128079621471695e-05, "loss": NaN, "step": 99900 }, { "epoch": 16.25, "eval_loss": 0.4537053406238556, "eval_runtime": 9.1442, "eval_samples_per_second": 10.936, "eval_wer": 0.3471376370280146, "step": 99900 }, { "epoch": 16.26, "learning_rate": 3.5062816120084846e-05, "loss": NaN, "step": 100000 }, { "epoch": 16.26, "eval_loss": 0.42373108863830566, "eval_runtime": 8.1063, "eval_samples_per_second": 12.336, "eval_wer": 0.33617539585870887, "step": 100000 }, { "epoch": 16.28, "learning_rate": 3.499755261869799e-05, "loss": NaN, "step": 100100 }, { "epoch": 16.28, "eval_loss": 0.5141391754150391, "eval_runtime": 9.0075, "eval_samples_per_second": 11.102, "eval_wer": 0.3459196102314251, "step": 100100 }, { "epoch": 16.3, "learning_rate": 3.4932289117311143e-05, "loss": NaN, "step": 100200 }, { "epoch": 16.3, "eval_loss": 0.4039132297039032, "eval_runtime": 9.3683, "eval_samples_per_second": 10.674, "eval_wer": 0.3459196102314251, "step": 100200 }, { "epoch": 16.31, "learning_rate": 3.4867025615924295e-05, "loss": NaN, "step": 100300 }, { "epoch": 16.31, "eval_loss": 0.46978646516799927, "eval_runtime": 6.7436, "eval_samples_per_second": 14.829, "eval_wer": 0.3471376370280146, "step": 100300 }, { "epoch": 16.33, "learning_rate": 3.480176211453745e-05, "loss": NaN, "step": 100400 }, { "epoch": 16.33, "eval_loss": 0.41287657618522644, "eval_runtime": 8.0877, "eval_samples_per_second": 12.364, "eval_wer": 0.3471376370280146, "step": 100400 }, { "epoch": 16.34, "learning_rate": 3.47364986131506e-05, "loss": NaN, "step": 100500 }, { "epoch": 16.34, "eval_loss": 0.4684438407421112, "eval_runtime": 8.5044, "eval_samples_per_second": 11.759, "eval_wer": 0.3520097442143727, "step": 100500 }, { "epoch": 16.36, "learning_rate": 3.467123511176375e-05, "loss": NaN, "step": 100600 }, { "epoch": 16.36, "eval_loss": 0.4466744363307953, "eval_runtime": 8.8741, "eval_samples_per_second": 11.269, "eval_wer": 0.35809987819732036, "step": 100600 }, { "epoch": 16.38, "learning_rate": 3.4605971610376896e-05, "loss": NaN, "step": 100700 }, { "epoch": 16.38, "eval_loss": 0.38788944482803345, "eval_runtime": 7.8104, "eval_samples_per_second": 12.803, "eval_wer": 0.33008526187576126, "step": 100700 }, { "epoch": 16.39, "learning_rate": 3.454070810899005e-05, "loss": NaN, "step": 100800 }, { "epoch": 16.39, "eval_loss": 0.40568241477012634, "eval_runtime": 9.8132, "eval_samples_per_second": 10.19, "eval_wer": 0.341047503045067, "step": 100800 }, { "epoch": 16.41, "learning_rate": 3.44754446076032e-05, "loss": NaN, "step": 100900 }, { "epoch": 16.41, "eval_loss": 0.43558773398399353, "eval_runtime": 7.63, "eval_samples_per_second": 13.106, "eval_wer": 0.3568818514007308, "step": 100900 }, { "epoch": 16.43, "learning_rate": 3.441018110621635e-05, "loss": NaN, "step": 101000 }, { "epoch": 16.43, "eval_loss": 0.4001496136188507, "eval_runtime": 6.8773, "eval_samples_per_second": 14.541, "eval_wer": 0.3471376370280146, "step": 101000 }, { "epoch": 16.44, "learning_rate": 3.4344917604829504e-05, "loss": NaN, "step": 101100 }, { "epoch": 16.44, "eval_loss": 0.4105696976184845, "eval_runtime": 7.7809, "eval_samples_per_second": 12.852, "eval_wer": 0.3325213154689403, "step": 101100 }, { "epoch": 16.46, "learning_rate": 3.427965410344265e-05, "loss": NaN, "step": 101200 }, { "epoch": 16.46, "eval_loss": 0.4008920192718506, "eval_runtime": 7.3769, "eval_samples_per_second": 13.556, "eval_wer": 0.34348355663824603, "step": 101200 }, { "epoch": 16.47, "learning_rate": 3.42143906020558e-05, "loss": NaN, "step": 101300 }, { "epoch": 16.47, "eval_loss": 0.4045610725879669, "eval_runtime": 8.9725, "eval_samples_per_second": 11.145, "eval_wer": 0.341047503045067, "step": 101300 }, { "epoch": 16.49, "learning_rate": 3.414912710066895e-05, "loss": NaN, "step": 101400 }, { "epoch": 16.49, "eval_loss": 0.43567919731140137, "eval_runtime": 8.8256, "eval_samples_per_second": 11.331, "eval_wer": 0.36053593179049936, "step": 101400 }, { "epoch": 16.51, "learning_rate": 3.40838635992821e-05, "loss": NaN, "step": 101500 }, { "epoch": 16.51, "eval_loss": 0.41516247391700745, "eval_runtime": 7.2706, "eval_samples_per_second": 13.754, "eval_wer": 0.35444579780755175, "step": 101500 }, { "epoch": 16.52, "learning_rate": 3.401860009789526e-05, "loss": NaN, "step": 101600 }, { "epoch": 16.52, "eval_loss": 0.3579968512058258, "eval_runtime": 7.7267, "eval_samples_per_second": 12.942, "eval_wer": 0.34226552984165654, "step": 101600 }, { "epoch": 16.54, "learning_rate": 3.395333659650841e-05, "loss": NaN, "step": 101700 }, { "epoch": 16.54, "eval_loss": 0.3978956639766693, "eval_runtime": 7.5352, "eval_samples_per_second": 13.271, "eval_wer": 0.3373934226552984, "step": 101700 }, { "epoch": 16.56, "learning_rate": 3.3888073095121554e-05, "loss": NaN, "step": 101800 }, { "epoch": 16.56, "eval_loss": 0.4536603093147278, "eval_runtime": 7.7523, "eval_samples_per_second": 12.899, "eval_wer": 0.3105968331303289, "step": 101800 }, { "epoch": 16.57, "learning_rate": 3.3822809593734706e-05, "loss": NaN, "step": 101900 }, { "epoch": 16.57, "eval_loss": 0.44562357664108276, "eval_runtime": 7.9874, "eval_samples_per_second": 12.52, "eval_wer": 0.3447015834348356, "step": 101900 }, { "epoch": 16.59, "learning_rate": 3.375754609234786e-05, "loss": NaN, "step": 102000 }, { "epoch": 16.59, "eval_loss": 0.4070366322994232, "eval_runtime": 7.5818, "eval_samples_per_second": 13.189, "eval_wer": 0.33495736906211937, "step": 102000 }, { "epoch": 16.6, "learning_rate": 3.3692282590961e-05, "loss": NaN, "step": 102100 }, { "epoch": 16.6, "eval_loss": 0.4052729904651642, "eval_runtime": 9.8038, "eval_samples_per_second": 10.2, "eval_wer": 0.3398294762484775, "step": 102100 }, { "epoch": 16.62, "learning_rate": 3.3627019089574155e-05, "loss": NaN, "step": 102200 }, { "epoch": 16.62, "eval_loss": 0.43835657835006714, "eval_runtime": 9.1381, "eval_samples_per_second": 10.943, "eval_wer": 0.3276492082825822, "step": 102200 }, { "epoch": 16.64, "learning_rate": 3.3561755588187313e-05, "loss": NaN, "step": 102300 }, { "epoch": 16.64, "eval_loss": 0.3671765923500061, "eval_runtime": 8.8073, "eval_samples_per_second": 11.354, "eval_wer": 0.33008526187576126, "step": 102300 }, { "epoch": 16.65, "learning_rate": 3.349649208680046e-05, "loss": NaN, "step": 102400 }, { "epoch": 16.65, "eval_loss": 0.3550013303756714, "eval_runtime": 8.81, "eval_samples_per_second": 11.351, "eval_wer": 0.3276492082825822, "step": 102400 }, { "epoch": 16.67, "learning_rate": 3.343122858541361e-05, "loss": NaN, "step": 102500 }, { "epoch": 16.67, "eval_loss": 0.37561336159706116, "eval_runtime": 8.2237, "eval_samples_per_second": 12.16, "eval_wer": 0.341047503045067, "step": 102500 }, { "epoch": 16.69, "learning_rate": 3.336596508402676e-05, "loss": NaN, "step": 102600 }, { "epoch": 16.69, "eval_loss": 0.42471256852149963, "eval_runtime": 10.0, "eval_samples_per_second": 10.0, "eval_wer": 0.341047503045067, "step": 102600 }, { "epoch": 16.7, "learning_rate": 3.330070158263991e-05, "loss": NaN, "step": 102700 }, { "epoch": 16.7, "eval_loss": 0.43302589654922485, "eval_runtime": 8.4874, "eval_samples_per_second": 11.782, "eval_wer": 0.3337393422655298, "step": 102700 }, { "epoch": 16.72, "learning_rate": 3.323543808125306e-05, "loss": NaN, "step": 102800 }, { "epoch": 16.72, "eval_loss": 0.3747265636920929, "eval_runtime": 8.2183, "eval_samples_per_second": 12.168, "eval_wer": 0.3398294762484775, "step": 102800 }, { "epoch": 16.73, "learning_rate": 3.317017457986621e-05, "loss": NaN, "step": 102900 }, { "epoch": 16.73, "eval_loss": 0.44977033138275146, "eval_runtime": 9.9224, "eval_samples_per_second": 10.078, "eval_wer": 0.33617539585870887, "step": 102900 }, { "epoch": 16.75, "learning_rate": 3.310491107847936e-05, "loss": NaN, "step": 103000 }, { "epoch": 16.75, "eval_loss": 0.3952389061450958, "eval_runtime": 7.7792, "eval_samples_per_second": 12.855, "eval_wer": 0.35322777101096225, "step": 103000 }, { "epoch": 16.77, "learning_rate": 3.3039647577092515e-05, "loss": NaN, "step": 103100 }, { "epoch": 16.77, "eval_loss": 0.40458202362060547, "eval_runtime": 8.518, "eval_samples_per_second": 11.74, "eval_wer": 0.3386114494518879, "step": 103100 }, { "epoch": 16.78, "learning_rate": 3.297438407570566e-05, "loss": NaN, "step": 103200 }, { "epoch": 16.78, "eval_loss": 0.4162432849407196, "eval_runtime": 9.1287, "eval_samples_per_second": 10.954, "eval_wer": 0.33617539585870887, "step": 103200 }, { "epoch": 16.8, "learning_rate": 3.290912057431881e-05, "loss": NaN, "step": 103300 }, { "epoch": 16.8, "eval_loss": 0.4272727966308594, "eval_runtime": 10.4704, "eval_samples_per_second": 9.551, "eval_wer": 0.3471376370280146, "step": 103300 }, { "epoch": 16.82, "learning_rate": 3.2843857072931964e-05, "loss": NaN, "step": 103400 }, { "epoch": 16.82, "eval_loss": 0.40407755970954895, "eval_runtime": 9.8048, "eval_samples_per_second": 10.199, "eval_wer": 0.3471376370280146, "step": 103400 }, { "epoch": 16.83, "learning_rate": 3.2778593571545116e-05, "loss": NaN, "step": 103500 }, { "epoch": 16.83, "eval_loss": 0.36328965425491333, "eval_runtime": 7.0675, "eval_samples_per_second": 14.149, "eval_wer": 0.3337393422655298, "step": 103500 }, { "epoch": 16.85, "learning_rate": 3.271333007015827e-05, "loss": NaN, "step": 103600 }, { "epoch": 16.85, "eval_loss": 0.3919774293899536, "eval_runtime": 8.2233, "eval_samples_per_second": 12.161, "eval_wer": 0.3227771010962241, "step": 103600 }, { "epoch": 16.86, "learning_rate": 3.264806656877142e-05, "loss": NaN, "step": 103700 }, { "epoch": 16.86, "eval_loss": 0.41714799404144287, "eval_runtime": 7.8888, "eval_samples_per_second": 12.676, "eval_wer": 0.3459196102314251, "step": 103700 }, { "epoch": 16.88, "learning_rate": 3.2582803067384565e-05, "loss": NaN, "step": 103800 }, { "epoch": 16.88, "eval_loss": 0.3970955014228821, "eval_runtime": 8.7637, "eval_samples_per_second": 11.411, "eval_wer": 0.34348355663824603, "step": 103800 }, { "epoch": 16.9, "learning_rate": 3.251753956599772e-05, "loss": NaN, "step": 103900 }, { "epoch": 16.9, "eval_loss": 0.39458972215652466, "eval_runtime": 7.5247, "eval_samples_per_second": 13.29, "eval_wer": 0.3313032886723508, "step": 103900 }, { "epoch": 16.91, "learning_rate": 3.245227606461087e-05, "loss": NaN, "step": 104000 }, { "epoch": 16.91, "eval_loss": 0.3992546498775482, "eval_runtime": 7.666, "eval_samples_per_second": 13.045, "eval_wer": 0.34348355663824603, "step": 104000 }, { "epoch": 16.93, "learning_rate": 3.2387012563224014e-05, "loss": NaN, "step": 104100 }, { "epoch": 16.93, "eval_loss": 0.3565240502357483, "eval_runtime": 6.8455, "eval_samples_per_second": 14.608, "eval_wer": 0.3313032886723508, "step": 104100 }, { "epoch": 16.95, "learning_rate": 3.232174906183717e-05, "loss": NaN, "step": 104200 }, { "epoch": 16.95, "eval_loss": 0.39272624254226685, "eval_runtime": 8.7645, "eval_samples_per_second": 11.41, "eval_wer": 0.3398294762484775, "step": 104200 }, { "epoch": 16.96, "learning_rate": 3.2256485560450325e-05, "loss": NaN, "step": 104300 }, { "epoch": 16.96, "eval_loss": 0.377750962972641, "eval_runtime": 7.4931, "eval_samples_per_second": 13.346, "eval_wer": 0.32886723507917176, "step": 104300 }, { "epoch": 16.98, "learning_rate": 3.219122205906347e-05, "loss": NaN, "step": 104400 }, { "epoch": 16.98, "eval_loss": 0.3803618550300598, "eval_runtime": 7.7196, "eval_samples_per_second": 12.954, "eval_wer": 0.32521315468940315, "step": 104400 }, { "epoch": 16.99, "learning_rate": 3.212595855767662e-05, "loss": NaN, "step": 104500 }, { "epoch": 16.99, "eval_loss": 0.4160638153553009, "eval_runtime": 7.8399, "eval_samples_per_second": 12.755, "eval_wer": 0.35931790499390986, "step": 104500 }, { "epoch": 17.01, "learning_rate": 3.206069505628977e-05, "loss": NaN, "step": 104600 }, { "epoch": 17.01, "eval_loss": 0.3985629677772522, "eval_runtime": 7.8601, "eval_samples_per_second": 12.723, "eval_wer": 0.36662606577344703, "step": 104600 }, { "epoch": 17.03, "learning_rate": 3.199543155490292e-05, "loss": NaN, "step": 104700 }, { "epoch": 17.03, "eval_loss": 0.362797349691391, "eval_runtime": 7.5799, "eval_samples_per_second": 13.193, "eval_wer": 0.33495736906211937, "step": 104700 }, { "epoch": 17.04, "learning_rate": 3.193016805351608e-05, "loss": NaN, "step": 104800 }, { "epoch": 17.04, "eval_loss": 0.46020495891571045, "eval_runtime": 10.2517, "eval_samples_per_second": 9.754, "eval_wer": 0.35322777101096225, "step": 104800 }, { "epoch": 17.06, "learning_rate": 3.186490455212922e-05, "loss": NaN, "step": 104900 }, { "epoch": 17.06, "eval_loss": 0.4332337975502014, "eval_runtime": 8.5335, "eval_samples_per_second": 11.719, "eval_wer": 0.33617539585870887, "step": 104900 }, { "epoch": 17.08, "learning_rate": 3.1799641050742374e-05, "loss": NaN, "step": 105000 }, { "epoch": 17.08, "eval_loss": 0.39707785844802856, "eval_runtime": 9.4106, "eval_samples_per_second": 10.626, "eval_wer": 0.34348355663824603, "step": 105000 }, { "epoch": 17.09, "learning_rate": 3.1734377549355526e-05, "loss": NaN, "step": 105100 }, { "epoch": 17.09, "eval_loss": 0.4423673152923584, "eval_runtime": 7.0369, "eval_samples_per_second": 14.211, "eval_wer": 0.3373934226552984, "step": 105100 }, { "epoch": 17.11, "learning_rate": 3.166911404796867e-05, "loss": NaN, "step": 105200 }, { "epoch": 17.11, "eval_loss": 0.4622967541217804, "eval_runtime": 8.2948, "eval_samples_per_second": 12.056, "eval_wer": 0.3654080389768575, "step": 105200 }, { "epoch": 17.12, "learning_rate": 3.1603850546581823e-05, "loss": NaN, "step": 105300 }, { "epoch": 17.12, "eval_loss": 0.47677239775657654, "eval_runtime": 7.7449, "eval_samples_per_second": 12.912, "eval_wer": 0.34348355663824603, "step": 105300 }, { "epoch": 17.14, "learning_rate": 3.1538587045194975e-05, "loss": NaN, "step": 105400 }, { "epoch": 17.14, "eval_loss": 0.3996973931789398, "eval_runtime": 8.3747, "eval_samples_per_second": 11.941, "eval_wer": 0.3471376370280146, "step": 105400 }, { "epoch": 17.16, "learning_rate": 3.147332354380813e-05, "loss": NaN, "step": 105500 }, { "epoch": 17.16, "eval_loss": 0.45852556824684143, "eval_runtime": 7.9151, "eval_samples_per_second": 12.634, "eval_wer": 0.34957369062119364, "step": 105500 }, { "epoch": 17.17, "learning_rate": 3.140806004242128e-05, "loss": NaN, "step": 105600 }, { "epoch": 17.17, "eval_loss": 0.3811168670654297, "eval_runtime": 7.7269, "eval_samples_per_second": 12.942, "eval_wer": 0.32886723507917176, "step": 105600 }, { "epoch": 17.19, "learning_rate": 3.134279654103443e-05, "loss": NaN, "step": 105700 }, { "epoch": 17.19, "eval_loss": 0.3853236436843872, "eval_runtime": 8.0078, "eval_samples_per_second": 12.488, "eval_wer": 0.32521315468940315, "step": 105700 }, { "epoch": 17.21, "learning_rate": 3.1277533039647576e-05, "loss": NaN, "step": 105800 }, { "epoch": 17.21, "eval_loss": 0.43565693497657776, "eval_runtime": 8.6327, "eval_samples_per_second": 11.584, "eval_wer": 0.3690621193666261, "step": 105800 }, { "epoch": 17.22, "learning_rate": 3.121226953826073e-05, "loss": NaN, "step": 105900 }, { "epoch": 17.22, "eval_loss": 0.40283602476119995, "eval_runtime": 7.4114, "eval_samples_per_second": 13.493, "eval_wer": 0.3264311814859927, "step": 105900 }, { "epoch": 17.24, "learning_rate": 3.114700603687388e-05, "loss": NaN, "step": 106000 }, { "epoch": 17.24, "eval_loss": 0.4006456434726715, "eval_runtime": 7.4096, "eval_samples_per_second": 13.496, "eval_wer": 0.3325213154689403, "step": 106000 }, { "epoch": 17.25, "learning_rate": 3.108174253548703e-05, "loss": NaN, "step": 106100 }, { "epoch": 17.25, "eval_loss": 0.43152371048927307, "eval_runtime": 7.2864, "eval_samples_per_second": 13.724, "eval_wer": 0.3386114494518879, "step": 106100 }, { "epoch": 17.27, "learning_rate": 3.1016479034100184e-05, "loss": NaN, "step": 106200 }, { "epoch": 17.27, "eval_loss": 0.3727237582206726, "eval_runtime": 9.6507, "eval_samples_per_second": 10.362, "eval_wer": 0.3227771010962241, "step": 106200 }, { "epoch": 17.29, "learning_rate": 3.095121553271333e-05, "loss": NaN, "step": 106300 }, { "epoch": 17.29, "eval_loss": 0.4210117757320404, "eval_runtime": 10.0021, "eval_samples_per_second": 9.998, "eval_wer": 0.3264311814859927, "step": 106300 }, { "epoch": 17.3, "learning_rate": 3.088595203132648e-05, "loss": NaN, "step": 106400 }, { "epoch": 17.3, "eval_loss": 0.40674594044685364, "eval_runtime": 9.4605, "eval_samples_per_second": 10.57, "eval_wer": 0.34226552984165654, "step": 106400 }, { "epoch": 17.32, "learning_rate": 3.082068852993963e-05, "loss": NaN, "step": 106500 }, { "epoch": 17.32, "eval_loss": 0.42881014943122864, "eval_runtime": 8.646, "eval_samples_per_second": 11.566, "eval_wer": 0.3325213154689403, "step": 106500 }, { "epoch": 17.34, "learning_rate": 3.075542502855278e-05, "loss": NaN, "step": 106600 }, { "epoch": 17.34, "eval_loss": 0.3960503339767456, "eval_runtime": 7.5435, "eval_samples_per_second": 13.256, "eval_wer": 0.3313032886723508, "step": 106600 }, { "epoch": 17.35, "learning_rate": 3.069016152716594e-05, "loss": NaN, "step": 106700 }, { "epoch": 17.35, "eval_loss": 0.5093197226524353, "eval_runtime": 8.4275, "eval_samples_per_second": 11.866, "eval_wer": 0.34226552984165654, "step": 106700 }, { "epoch": 17.37, "learning_rate": 3.062489802577909e-05, "loss": NaN, "step": 106800 }, { "epoch": 17.37, "eval_loss": 0.4141642451286316, "eval_runtime": 8.7304, "eval_samples_per_second": 11.454, "eval_wer": 0.3459196102314251, "step": 106800 }, { "epoch": 17.38, "learning_rate": 3.0559634524392234e-05, "loss": NaN, "step": 106900 }, { "epoch": 17.38, "eval_loss": 0.3708423376083374, "eval_runtime": 9.1322, "eval_samples_per_second": 10.95, "eval_wer": 0.3276492082825822, "step": 106900 }, { "epoch": 17.4, "learning_rate": 3.0494371023005386e-05, "loss": NaN, "step": 107000 }, { "epoch": 17.4, "eval_loss": 0.43578729033470154, "eval_runtime": 8.1187, "eval_samples_per_second": 12.317, "eval_wer": 0.3398294762484775, "step": 107000 }, { "epoch": 17.42, "learning_rate": 3.0429107521618538e-05, "loss": NaN, "step": 107100 }, { "epoch": 17.42, "eval_loss": 0.38338860869407654, "eval_runtime": 8.1539, "eval_samples_per_second": 12.264, "eval_wer": 0.32521315468940315, "step": 107100 }, { "epoch": 17.43, "learning_rate": 3.0363844020231686e-05, "loss": NaN, "step": 107200 }, { "epoch": 17.43, "eval_loss": 0.3750736713409424, "eval_runtime": 8.3902, "eval_samples_per_second": 11.919, "eval_wer": 0.34348355663824603, "step": 107200 }, { "epoch": 17.45, "learning_rate": 3.0298580518844838e-05, "loss": NaN, "step": 107300 }, { "epoch": 17.45, "eval_loss": 0.39097708463668823, "eval_runtime": 9.385, "eval_samples_per_second": 10.655, "eval_wer": 0.34348355663824603, "step": 107300 }, { "epoch": 17.47, "learning_rate": 3.023331701745799e-05, "loss": NaN, "step": 107400 }, { "epoch": 17.47, "eval_loss": 0.4204353094100952, "eval_runtime": 8.9165, "eval_samples_per_second": 11.215, "eval_wer": 0.35444579780755175, "step": 107400 }, { "epoch": 17.48, "learning_rate": 3.016805351607114e-05, "loss": NaN, "step": 107500 }, { "epoch": 17.48, "eval_loss": 0.40133535861968994, "eval_runtime": 8.5063, "eval_samples_per_second": 11.756, "eval_wer": 0.34226552984165654, "step": 107500 }, { "epoch": 17.5, "learning_rate": 3.010279001468429e-05, "loss": NaN, "step": 107600 }, { "epoch": 17.5, "eval_loss": 0.3767768144607544, "eval_runtime": 7.8527, "eval_samples_per_second": 12.735, "eval_wer": 0.32521315468940315, "step": 107600 }, { "epoch": 17.52, "learning_rate": 3.0037526513297442e-05, "loss": NaN, "step": 107700 }, { "epoch": 17.52, "eval_loss": 0.3812255859375, "eval_runtime": 8.1107, "eval_samples_per_second": 12.329, "eval_wer": 0.3398294762484775, "step": 107700 }, { "epoch": 17.53, "learning_rate": 2.997226301191059e-05, "loss": NaN, "step": 107800 }, { "epoch": 17.53, "eval_loss": 0.40557724237442017, "eval_runtime": 8.1245, "eval_samples_per_second": 12.308, "eval_wer": 0.33008526187576126, "step": 107800 }, { "epoch": 17.55, "learning_rate": 2.9906999510523743e-05, "loss": NaN, "step": 107900 }, { "epoch": 17.55, "eval_loss": 0.42703160643577576, "eval_runtime": 8.9403, "eval_samples_per_second": 11.185, "eval_wer": 0.3471376370280146, "step": 107900 }, { "epoch": 17.56, "learning_rate": 2.9841736009136888e-05, "loss": NaN, "step": 108000 }, { "epoch": 17.56, "eval_loss": 0.38233357667922974, "eval_runtime": 7.8203, "eval_samples_per_second": 12.787, "eval_wer": 0.34835566382460414, "step": 108000 }, { "epoch": 17.58, "learning_rate": 2.9776472507750043e-05, "loss": NaN, "step": 108100 }, { "epoch": 17.58, "eval_loss": 0.4634896218776703, "eval_runtime": 8.3672, "eval_samples_per_second": 11.951, "eval_wer": 0.3520097442143727, "step": 108100 }, { "epoch": 17.6, "learning_rate": 2.9711209006363195e-05, "loss": NaN, "step": 108200 }, { "epoch": 17.6, "eval_loss": 0.3950602412223816, "eval_runtime": 8.3188, "eval_samples_per_second": 12.021, "eval_wer": 0.33617539585870887, "step": 108200 }, { "epoch": 17.61, "learning_rate": 2.964594550497634e-05, "loss": NaN, "step": 108300 }, { "epoch": 17.61, "eval_loss": 0.3925233781337738, "eval_runtime": 6.759, "eval_samples_per_second": 14.795, "eval_wer": 0.3373934226552984, "step": 108300 }, { "epoch": 17.63, "learning_rate": 2.9580682003589492e-05, "loss": NaN, "step": 108400 }, { "epoch": 17.63, "eval_loss": 0.49706822633743286, "eval_runtime": 9.3441, "eval_samples_per_second": 10.702, "eval_wer": 0.35809987819732036, "step": 108400 }, { "epoch": 17.65, "learning_rate": 2.9515418502202647e-05, "loss": NaN, "step": 108500 }, { "epoch": 17.65, "eval_loss": 0.4032347798347473, "eval_runtime": 8.8075, "eval_samples_per_second": 11.354, "eval_wer": 0.3398294762484775, "step": 108500 }, { "epoch": 17.66, "learning_rate": 2.9450155000815793e-05, "loss": NaN, "step": 108600 }, { "epoch": 17.66, "eval_loss": 0.39194339513778687, "eval_runtime": 10.3759, "eval_samples_per_second": 9.638, "eval_wer": 0.32521315468940315, "step": 108600 }, { "epoch": 17.68, "learning_rate": 2.9384891499428945e-05, "loss": NaN, "step": 108700 }, { "epoch": 17.68, "eval_loss": 0.36986175179481506, "eval_runtime": 7.8636, "eval_samples_per_second": 12.717, "eval_wer": 0.32886723507917176, "step": 108700 }, { "epoch": 17.69, "learning_rate": 2.93196279980421e-05, "loss": NaN, "step": 108800 }, { "epoch": 17.69, "eval_loss": 0.3867470920085907, "eval_runtime": 8.137, "eval_samples_per_second": 12.289, "eval_wer": 0.34348355663824603, "step": 108800 }, { "epoch": 17.71, "learning_rate": 2.9254364496655245e-05, "loss": NaN, "step": 108900 }, { "epoch": 17.71, "eval_loss": 0.3782542943954468, "eval_runtime": 8.4236, "eval_samples_per_second": 11.871, "eval_wer": 0.3325213154689403, "step": 108900 }, { "epoch": 17.73, "learning_rate": 2.9189100995268397e-05, "loss": NaN, "step": 109000 }, { "epoch": 17.73, "eval_loss": 0.4252021312713623, "eval_runtime": 8.512, "eval_samples_per_second": 11.748, "eval_wer": 0.3325213154689403, "step": 109000 }, { "epoch": 17.74, "learning_rate": 2.9123837493881552e-05, "loss": NaN, "step": 109100 }, { "epoch": 17.74, "eval_loss": 0.3819904327392578, "eval_runtime": 6.8511, "eval_samples_per_second": 14.596, "eval_wer": 0.3373934226552984, "step": 109100 }, { "epoch": 17.76, "learning_rate": 2.9058573992494697e-05, "loss": NaN, "step": 109200 }, { "epoch": 17.76, "eval_loss": 0.3850736618041992, "eval_runtime": 8.4679, "eval_samples_per_second": 11.809, "eval_wer": 0.33008526187576126, "step": 109200 }, { "epoch": 17.78, "learning_rate": 2.899331049110785e-05, "loss": NaN, "step": 109300 }, { "epoch": 17.78, "eval_loss": 0.4139541685581207, "eval_runtime": 7.6909, "eval_samples_per_second": 13.002, "eval_wer": 0.3386114494518879, "step": 109300 }, { "epoch": 17.79, "learning_rate": 2.8928046989721e-05, "loss": NaN, "step": 109400 }, { "epoch": 17.79, "eval_loss": 0.4256812334060669, "eval_runtime": 7.0399, "eval_samples_per_second": 14.205, "eval_wer": 0.3507917174177832, "step": 109400 }, { "epoch": 17.81, "learning_rate": 2.886278348833415e-05, "loss": NaN, "step": 109500 }, { "epoch": 17.81, "eval_loss": 0.4498865008354187, "eval_runtime": 9.6258, "eval_samples_per_second": 10.389, "eval_wer": 0.3471376370280146, "step": 109500 }, { "epoch": 17.82, "learning_rate": 2.87975199869473e-05, "loss": NaN, "step": 109600 }, { "epoch": 17.82, "eval_loss": 0.4236893057823181, "eval_runtime": 9.1871, "eval_samples_per_second": 10.885, "eval_wer": 0.3617539585870889, "step": 109600 }, { "epoch": 17.84, "learning_rate": 2.873225648556045e-05, "loss": NaN, "step": 109700 }, { "epoch": 17.84, "eval_loss": 0.46277669072151184, "eval_runtime": 9.6292, "eval_samples_per_second": 10.385, "eval_wer": 0.35809987819732036, "step": 109700 }, { "epoch": 17.86, "learning_rate": 2.8666992984173602e-05, "loss": NaN, "step": 109800 }, { "epoch": 17.86, "eval_loss": 0.46583592891693115, "eval_runtime": 7.8086, "eval_samples_per_second": 12.806, "eval_wer": 0.35322777101096225, "step": 109800 }, { "epoch": 17.87, "learning_rate": 2.8601729482786754e-05, "loss": NaN, "step": 109900 }, { "epoch": 17.87, "eval_loss": 0.3932786285877228, "eval_runtime": 6.8409, "eval_samples_per_second": 14.618, "eval_wer": 0.3373934226552984, "step": 109900 }, { "epoch": 17.89, "learning_rate": 2.8536465981399902e-05, "loss": NaN, "step": 110000 }, { "epoch": 17.89, "eval_loss": 0.40608084201812744, "eval_runtime": 7.3141, "eval_samples_per_second": 13.672, "eval_wer": 0.3373934226552984, "step": 110000 }, { "epoch": 17.91, "learning_rate": 2.8471202480013054e-05, "loss": NaN, "step": 110100 }, { "epoch": 17.91, "eval_loss": 0.4084034860134125, "eval_runtime": 7.1928, "eval_samples_per_second": 13.903, "eval_wer": 0.3373934226552984, "step": 110100 }, { "epoch": 17.92, "learning_rate": 2.8405938978626206e-05, "loss": NaN, "step": 110200 }, { "epoch": 17.92, "eval_loss": 0.40555787086486816, "eval_runtime": 8.5682, "eval_samples_per_second": 11.671, "eval_wer": 0.3459196102314251, "step": 110200 }, { "epoch": 17.94, "learning_rate": 2.8340675477239355e-05, "loss": NaN, "step": 110300 }, { "epoch": 17.94, "eval_loss": 0.4647526443004608, "eval_runtime": 8.7905, "eval_samples_per_second": 11.376, "eval_wer": 0.341047503045067, "step": 110300 }, { "epoch": 17.95, "learning_rate": 2.8275411975852507e-05, "loss": NaN, "step": 110400 }, { "epoch": 17.95, "eval_loss": 0.3823550343513489, "eval_runtime": 8.631, "eval_samples_per_second": 11.586, "eval_wer": 0.341047503045067, "step": 110400 }, { "epoch": 17.97, "learning_rate": 2.821014847446566e-05, "loss": NaN, "step": 110500 }, { "epoch": 17.97, "eval_loss": 0.4006991982460022, "eval_runtime": 7.1345, "eval_samples_per_second": 14.016, "eval_wer": 0.3471376370280146, "step": 110500 }, { "epoch": 17.99, "learning_rate": 2.8144884973078807e-05, "loss": NaN, "step": 110600 }, { "epoch": 17.99, "eval_loss": 0.3922583758831024, "eval_runtime": 6.9349, "eval_samples_per_second": 14.42, "eval_wer": 0.3507917174177832, "step": 110600 }, { "epoch": 18.0, "learning_rate": 2.807962147169196e-05, "loss": NaN, "step": 110700 }, { "epoch": 18.0, "eval_loss": 0.3946372866630554, "eval_runtime": 6.8519, "eval_samples_per_second": 14.594, "eval_wer": 0.341047503045067, "step": 110700 }, { "epoch": 18.02, "learning_rate": 2.801435797030511e-05, "loss": NaN, "step": 110800 }, { "epoch": 18.02, "eval_loss": 0.4183802306652069, "eval_runtime": 7.1866, "eval_samples_per_second": 13.915, "eval_wer": 0.341047503045067, "step": 110800 }, { "epoch": 18.04, "learning_rate": 2.7949094468918256e-05, "loss": NaN, "step": 110900 }, { "epoch": 18.04, "eval_loss": 0.37478265166282654, "eval_runtime": 8.3068, "eval_samples_per_second": 12.038, "eval_wer": 0.3471376370280146, "step": 110900 }, { "epoch": 18.05, "learning_rate": 2.788383096753141e-05, "loss": NaN, "step": 111000 }, { "epoch": 18.05, "eval_loss": 0.3887958526611328, "eval_runtime": 7.7706, "eval_samples_per_second": 12.869, "eval_wer": 0.34957369062119364, "step": 111000 }, { "epoch": 18.07, "learning_rate": 2.7818567466144557e-05, "loss": NaN, "step": 111100 }, { "epoch": 18.07, "eval_loss": 0.3766718804836273, "eval_runtime": 7.7942, "eval_samples_per_second": 12.83, "eval_wer": 0.3447015834348356, "step": 111100 }, { "epoch": 18.08, "learning_rate": 2.775330396475771e-05, "loss": NaN, "step": 111200 }, { "epoch": 18.08, "eval_loss": 0.39117416739463806, "eval_runtime": 8.1811, "eval_samples_per_second": 12.223, "eval_wer": 0.341047503045067, "step": 111200 }, { "epoch": 18.1, "learning_rate": 2.7688040463370864e-05, "loss": NaN, "step": 111300 }, { "epoch": 18.1, "eval_loss": 0.41156256198883057, "eval_runtime": 8.6071, "eval_samples_per_second": 11.618, "eval_wer": 0.341047503045067, "step": 111300 }, { "epoch": 18.12, "learning_rate": 2.762277696198401e-05, "loss": NaN, "step": 111400 }, { "epoch": 18.12, "eval_loss": 0.39620694518089294, "eval_runtime": 8.9372, "eval_samples_per_second": 11.189, "eval_wer": 0.35322777101096225, "step": 111400 }, { "epoch": 18.13, "learning_rate": 2.755751346059716e-05, "loss": NaN, "step": 111500 }, { "epoch": 18.13, "eval_loss": 0.40653663873672485, "eval_runtime": 7.1536, "eval_samples_per_second": 13.979, "eval_wer": 0.3313032886723508, "step": 111500 }, { "epoch": 18.15, "learning_rate": 2.7492249959210313e-05, "loss": NaN, "step": 111600 }, { "epoch": 18.15, "eval_loss": 0.43940940499305725, "eval_runtime": 7.214, "eval_samples_per_second": 13.862, "eval_wer": 0.34835566382460414, "step": 111600 }, { "epoch": 18.17, "learning_rate": 2.742698645782346e-05, "loss": NaN, "step": 111700 }, { "epoch": 18.17, "eval_loss": 0.43023011088371277, "eval_runtime": 9.4948, "eval_samples_per_second": 10.532, "eval_wer": 0.35931790499390986, "step": 111700 }, { "epoch": 18.18, "learning_rate": 2.7361722956436613e-05, "loss": NaN, "step": 111800 }, { "epoch": 18.18, "eval_loss": 0.47506821155548096, "eval_runtime": 8.7209, "eval_samples_per_second": 11.467, "eval_wer": 0.3507917174177832, "step": 111800 }, { "epoch": 18.2, "learning_rate": 2.7296459455049765e-05, "loss": NaN, "step": 111900 }, { "epoch": 18.2, "eval_loss": 0.4082556962966919, "eval_runtime": 9.4452, "eval_samples_per_second": 10.587, "eval_wer": 0.364190012180268, "step": 111900 }, { "epoch": 18.21, "learning_rate": 2.7231195953662914e-05, "loss": NaN, "step": 112000 }, { "epoch": 18.21, "eval_loss": 0.44821274280548096, "eval_runtime": 7.7256, "eval_samples_per_second": 12.944, "eval_wer": 0.3313032886723508, "step": 112000 }, { "epoch": 18.23, "learning_rate": 2.7165932452276066e-05, "loss": NaN, "step": 112100 }, { "epoch": 18.23, "eval_loss": 0.4030204117298126, "eval_runtime": 8.0067, "eval_samples_per_second": 12.49, "eval_wer": 0.3507917174177832, "step": 112100 }, { "epoch": 18.25, "learning_rate": 2.7100668950889218e-05, "loss": NaN, "step": 112200 }, { "epoch": 18.25, "eval_loss": 0.3854163885116577, "eval_runtime": 8.2701, "eval_samples_per_second": 12.092, "eval_wer": 0.3398294762484775, "step": 112200 }, { "epoch": 18.26, "learning_rate": 2.7035405449502366e-05, "loss": NaN, "step": 112300 }, { "epoch": 18.26, "eval_loss": 0.4053157866001129, "eval_runtime": 7.0908, "eval_samples_per_second": 14.103, "eval_wer": 0.3313032886723508, "step": 112300 }, { "epoch": 18.28, "learning_rate": 2.6970141948115518e-05, "loss": NaN, "step": 112400 }, { "epoch": 18.28, "eval_loss": 0.3890162706375122, "eval_runtime": 7.2231, "eval_samples_per_second": 13.844, "eval_wer": 0.33008526187576126, "step": 112400 }, { "epoch": 18.3, "learning_rate": 2.690487844672867e-05, "loss": NaN, "step": 112500 }, { "epoch": 18.3, "eval_loss": 0.3915853500366211, "eval_runtime": 8.7452, "eval_samples_per_second": 11.435, "eval_wer": 0.3447015834348356, "step": 112500 }, { "epoch": 18.31, "learning_rate": 2.683961494534182e-05, "loss": NaN, "step": 112600 }, { "epoch": 18.31, "eval_loss": 0.3701234459877014, "eval_runtime": 7.3669, "eval_samples_per_second": 13.574, "eval_wer": 0.3313032886723508, "step": 112600 }, { "epoch": 18.33, "learning_rate": 2.677435144395497e-05, "loss": NaN, "step": 112700 }, { "epoch": 18.33, "eval_loss": 0.399958074092865, "eval_runtime": 8.536, "eval_samples_per_second": 11.715, "eval_wer": 0.34226552984165654, "step": 112700 }, { "epoch": 18.34, "learning_rate": 2.670908794256812e-05, "loss": NaN, "step": 112800 }, { "epoch": 18.34, "eval_loss": 0.3959391117095947, "eval_runtime": 7.6581, "eval_samples_per_second": 13.058, "eval_wer": 0.341047503045067, "step": 112800 }, { "epoch": 18.36, "learning_rate": 2.664382444118127e-05, "loss": NaN, "step": 112900 }, { "epoch": 18.36, "eval_loss": 0.4151996672153473, "eval_runtime": 8.5593, "eval_samples_per_second": 11.683, "eval_wer": 0.3398294762484775, "step": 112900 }, { "epoch": 18.38, "learning_rate": 2.6578560939794423e-05, "loss": NaN, "step": 113000 }, { "epoch": 18.38, "eval_loss": 0.388653039932251, "eval_runtime": 7.3021, "eval_samples_per_second": 13.695, "eval_wer": 0.341047503045067, "step": 113000 }, { "epoch": 18.39, "learning_rate": 2.6513297438407568e-05, "loss": NaN, "step": 113100 }, { "epoch": 18.39, "eval_loss": 0.3932548761367798, "eval_runtime": 7.3475, "eval_samples_per_second": 13.61, "eval_wer": 0.3447015834348356, "step": 113100 }, { "epoch": 18.41, "learning_rate": 2.6448033937020723e-05, "loss": NaN, "step": 113200 }, { "epoch": 18.41, "eval_loss": 0.5715663433074951, "eval_runtime": 6.4752, "eval_samples_per_second": 15.444, "eval_wer": 0.3459196102314251, "step": 113200 }, { "epoch": 18.43, "learning_rate": 2.6382770435633875e-05, "loss": NaN, "step": 113300 }, { "epoch": 18.43, "eval_loss": 0.5505608320236206, "eval_runtime": 8.5504, "eval_samples_per_second": 11.695, "eval_wer": 0.3459196102314251, "step": 113300 }, { "epoch": 18.44, "learning_rate": 2.631750693424702e-05, "loss": NaN, "step": 113400 }, { "epoch": 18.44, "eval_loss": 0.4306776523590088, "eval_runtime": 8.0297, "eval_samples_per_second": 12.454, "eval_wer": 0.33008526187576126, "step": 113400 }, { "epoch": 18.46, "learning_rate": 2.6252243432860175e-05, "loss": NaN, "step": 113500 }, { "epoch": 18.46, "eval_loss": 0.3789026737213135, "eval_runtime": 8.1239, "eval_samples_per_second": 12.309, "eval_wer": 0.3325213154689403, "step": 113500 }, { "epoch": 18.47, "learning_rate": 2.6186979931473327e-05, "loss": NaN, "step": 113600 }, { "epoch": 18.47, "eval_loss": 0.42162245512008667, "eval_runtime": 8.6954, "eval_samples_per_second": 11.5, "eval_wer": 0.35322777101096225, "step": 113600 }, { "epoch": 18.49, "learning_rate": 2.6121716430086473e-05, "loss": NaN, "step": 113700 }, { "epoch": 18.49, "eval_loss": 0.5023617744445801, "eval_runtime": 9.6846, "eval_samples_per_second": 10.326, "eval_wer": 0.3507917174177832, "step": 113700 }, { "epoch": 18.51, "learning_rate": 2.6056452928699628e-05, "loss": NaN, "step": 113800 }, { "epoch": 18.51, "eval_loss": 0.395231693983078, "eval_runtime": 9.953, "eval_samples_per_second": 10.047, "eval_wer": 0.3471376370280146, "step": 113800 }, { "epoch": 18.52, "learning_rate": 2.599118942731278e-05, "loss": NaN, "step": 113900 }, { "epoch": 18.52, "eval_loss": 0.39416807889938354, "eval_runtime": 7.819, "eval_samples_per_second": 12.789, "eval_wer": 0.33617539585870887, "step": 113900 }, { "epoch": 18.54, "learning_rate": 2.5925925925925925e-05, "loss": NaN, "step": 114000 }, { "epoch": 18.54, "eval_loss": 0.5159714221954346, "eval_runtime": 7.203, "eval_samples_per_second": 13.883, "eval_wer": 0.3337393422655298, "step": 114000 }, { "epoch": 18.56, "learning_rate": 2.5860662424539077e-05, "loss": NaN, "step": 114100 }, { "epoch": 18.56, "eval_loss": 0.39711394906044006, "eval_runtime": 8.1764, "eval_samples_per_second": 12.23, "eval_wer": 0.341047503045067, "step": 114100 }, { "epoch": 18.57, "learning_rate": 2.5795398923152232e-05, "loss": NaN, "step": 114200 }, { "epoch": 18.57, "eval_loss": 0.3980695605278015, "eval_runtime": 7.8237, "eval_samples_per_second": 12.782, "eval_wer": 0.341047503045067, "step": 114200 }, { "epoch": 18.59, "learning_rate": 2.5730135421765377e-05, "loss": NaN, "step": 114300 }, { "epoch": 18.59, "eval_loss": 0.39846745133399963, "eval_runtime": 9.4234, "eval_samples_per_second": 10.612, "eval_wer": 0.3398294762484775, "step": 114300 }, { "epoch": 18.6, "learning_rate": 2.566487192037853e-05, "loss": NaN, "step": 114400 }, { "epoch": 18.6, "eval_loss": 0.4071855843067169, "eval_runtime": 7.858, "eval_samples_per_second": 12.726, "eval_wer": 0.341047503045067, "step": 114400 }, { "epoch": 18.62, "learning_rate": 2.5599608418991678e-05, "loss": NaN, "step": 114500 }, { "epoch": 18.62, "eval_loss": 0.41952818632125854, "eval_runtime": 8.1596, "eval_samples_per_second": 12.256, "eval_wer": 0.3447015834348356, "step": 114500 }, { "epoch": 18.64, "learning_rate": 2.553434491760483e-05, "loss": NaN, "step": 114600 }, { "epoch": 18.64, "eval_loss": 0.44777679443359375, "eval_runtime": 8.1577, "eval_samples_per_second": 12.258, "eval_wer": 0.3325213154689403, "step": 114600 }, { "epoch": 18.65, "learning_rate": 2.546908141621798e-05, "loss": NaN, "step": 114700 }, { "epoch": 18.65, "eval_loss": 0.39139124751091003, "eval_runtime": 7.223, "eval_samples_per_second": 13.845, "eval_wer": 0.32399512789281365, "step": 114700 }, { "epoch": 18.67, "learning_rate": 2.540381791483113e-05, "loss": NaN, "step": 114800 }, { "epoch": 18.67, "eval_loss": 0.40552714467048645, "eval_runtime": 8.0589, "eval_samples_per_second": 12.409, "eval_wer": 0.3313032886723508, "step": 114800 }, { "epoch": 18.69, "learning_rate": 2.5338554413444282e-05, "loss": NaN, "step": 114900 }, { "epoch": 18.69, "eval_loss": 0.4118463397026062, "eval_runtime": 8.077, "eval_samples_per_second": 12.381, "eval_wer": 0.3276492082825822, "step": 114900 }, { "epoch": 18.7, "learning_rate": 2.5273290912057434e-05, "loss": NaN, "step": 115000 }, { "epoch": 18.7, "eval_loss": 0.4166834354400635, "eval_runtime": 8.1784, "eval_samples_per_second": 12.227, "eval_wer": 0.34348355663824603, "step": 115000 }, { "epoch": 18.72, "learning_rate": 2.5208027410670582e-05, "loss": NaN, "step": 115100 }, { "epoch": 18.72, "eval_loss": 0.4071851074695587, "eval_runtime": 10.5991, "eval_samples_per_second": 9.435, "eval_wer": 0.3276492082825822, "step": 115100 }, { "epoch": 18.73, "learning_rate": 2.5142763909283734e-05, "loss": NaN, "step": 115200 }, { "epoch": 18.73, "eval_loss": 0.44569680094718933, "eval_runtime": 7.985, "eval_samples_per_second": 12.523, "eval_wer": 0.3398294762484775, "step": 115200 }, { "epoch": 18.75, "learning_rate": 2.5077500407896886e-05, "loss": NaN, "step": 115300 }, { "epoch": 18.75, "eval_loss": 0.4303815960884094, "eval_runtime": 7.2375, "eval_samples_per_second": 13.817, "eval_wer": 0.3337393422655298, "step": 115300 }, { "epoch": 18.77, "learning_rate": 2.5012236906510035e-05, "loss": NaN, "step": 115400 }, { "epoch": 18.77, "eval_loss": 0.4490242898464203, "eval_runtime": 8.2404, "eval_samples_per_second": 12.135, "eval_wer": 0.34226552984165654, "step": 115400 }, { "epoch": 18.78, "learning_rate": 2.4946973405123187e-05, "loss": NaN, "step": 115500 }, { "epoch": 18.78, "eval_loss": 0.49515098333358765, "eval_runtime": 7.3002, "eval_samples_per_second": 13.698, "eval_wer": 0.3373934226552984, "step": 115500 }, { "epoch": 18.8, "learning_rate": 2.4881709903736335e-05, "loss": NaN, "step": 115600 }, { "epoch": 18.8, "eval_loss": 0.4241500496864319, "eval_runtime": 8.6244, "eval_samples_per_second": 11.595, "eval_wer": 0.3276492082825822, "step": 115600 }, { "epoch": 18.82, "learning_rate": 2.4816446402349487e-05, "loss": NaN, "step": 115700 }, { "epoch": 18.82, "eval_loss": 0.4969961941242218, "eval_runtime": 8.4269, "eval_samples_per_second": 11.867, "eval_wer": 0.34835566382460414, "step": 115700 }, { "epoch": 18.83, "learning_rate": 2.475118290096264e-05, "loss": NaN, "step": 115800 }, { "epoch": 18.83, "eval_loss": 0.5238353610038757, "eval_runtime": 8.3935, "eval_samples_per_second": 11.914, "eval_wer": 0.34226552984165654, "step": 115800 }, { "epoch": 18.85, "learning_rate": 2.4685919399575788e-05, "loss": NaN, "step": 115900 }, { "epoch": 18.85, "eval_loss": 0.43089020252227783, "eval_runtime": 7.219, "eval_samples_per_second": 13.852, "eval_wer": 0.32034104750304504, "step": 115900 }, { "epoch": 18.86, "learning_rate": 2.462065589818894e-05, "loss": NaN, "step": 116000 }, { "epoch": 18.86, "eval_loss": 0.41796696186065674, "eval_runtime": 7.5558, "eval_samples_per_second": 13.235, "eval_wer": 0.3313032886723508, "step": 116000 }, { "epoch": 18.88, "learning_rate": 2.455539239680209e-05, "loss": NaN, "step": 116100 }, { "epoch": 18.88, "eval_loss": 0.4422737956047058, "eval_runtime": 7.9398, "eval_samples_per_second": 12.595, "eval_wer": 0.32886723507917176, "step": 116100 }, { "epoch": 18.9, "learning_rate": 2.449012889541524e-05, "loss": NaN, "step": 116200 }, { "epoch": 18.9, "eval_loss": 0.43862995505332947, "eval_runtime": 8.9085, "eval_samples_per_second": 11.225, "eval_wer": 0.3337393422655298, "step": 116200 }, { "epoch": 18.91, "learning_rate": 2.442486539402839e-05, "loss": NaN, "step": 116300 }, { "epoch": 18.91, "eval_loss": 0.4497430920600891, "eval_runtime": 9.2945, "eval_samples_per_second": 10.759, "eval_wer": 0.3447015834348356, "step": 116300 }, { "epoch": 18.93, "learning_rate": 2.4359601892641544e-05, "loss": NaN, "step": 116400 }, { "epoch": 18.93, "eval_loss": 0.4064001739025116, "eval_runtime": 9.3152, "eval_samples_per_second": 10.735, "eval_wer": 0.3276492082825822, "step": 116400 }, { "epoch": 18.95, "learning_rate": 2.4294338391254692e-05, "loss": NaN, "step": 116500 }, { "epoch": 18.95, "eval_loss": 0.5357220768928528, "eval_runtime": 10.268, "eval_samples_per_second": 9.739, "eval_wer": 0.35444579780755175, "step": 116500 }, { "epoch": 18.96, "learning_rate": 2.422907488986784e-05, "loss": NaN, "step": 116600 }, { "epoch": 18.96, "eval_loss": 0.4020291864871979, "eval_runtime": 6.8978, "eval_samples_per_second": 14.497, "eval_wer": 0.341047503045067, "step": 116600 }, { "epoch": 18.98, "learning_rate": 2.4163811388480993e-05, "loss": NaN, "step": 116700 }, { "epoch": 18.98, "eval_loss": 0.5173760056495667, "eval_runtime": 8.2411, "eval_samples_per_second": 12.134, "eval_wer": 0.3447015834348356, "step": 116700 }, { "epoch": 18.99, "learning_rate": 2.4098547887094145e-05, "loss": NaN, "step": 116800 }, { "epoch": 18.99, "eval_loss": 0.4323920011520386, "eval_runtime": 8.3858, "eval_samples_per_second": 11.925, "eval_wer": 0.3556638246041413, "step": 116800 }, { "epoch": 19.01, "learning_rate": 2.4033284385707293e-05, "loss": NaN, "step": 116900 }, { "epoch": 19.01, "eval_loss": 0.4196859300136566, "eval_runtime": 8.9105, "eval_samples_per_second": 11.223, "eval_wer": 0.33617539585870887, "step": 116900 }, { "epoch": 19.03, "learning_rate": 2.3968020884320445e-05, "loss": NaN, "step": 117000 }, { "epoch": 19.03, "eval_loss": 0.4224309027194977, "eval_runtime": 7.9389, "eval_samples_per_second": 12.596, "eval_wer": 0.3325213154689403, "step": 117000 }, { "epoch": 19.04, "learning_rate": 2.3902757382933597e-05, "loss": NaN, "step": 117100 }, { "epoch": 19.04, "eval_loss": 0.44540169835090637, "eval_runtime": 8.0457, "eval_samples_per_second": 12.429, "eval_wer": 0.33008526187576126, "step": 117100 }, { "epoch": 19.06, "learning_rate": 2.3837493881546746e-05, "loss": NaN, "step": 117200 }, { "epoch": 19.06, "eval_loss": 0.5561581254005432, "eval_runtime": 8.6307, "eval_samples_per_second": 11.587, "eval_wer": 0.32521315468940315, "step": 117200 }, { "epoch": 19.08, "learning_rate": 2.3772230380159897e-05, "loss": NaN, "step": 117300 }, { "epoch": 19.08, "eval_loss": 0.49928075075149536, "eval_runtime": 7.705, "eval_samples_per_second": 12.979, "eval_wer": 0.3386114494518879, "step": 117300 }, { "epoch": 19.09, "learning_rate": 2.370696687877305e-05, "loss": NaN, "step": 117400 }, { "epoch": 19.09, "eval_loss": 0.36428502202033997, "eval_runtime": 8.6228, "eval_samples_per_second": 11.597, "eval_wer": 0.32886723507917176, "step": 117400 }, { "epoch": 19.11, "learning_rate": 2.3641703377386198e-05, "loss": NaN, "step": 117500 }, { "epoch": 19.11, "eval_loss": 0.4284897744655609, "eval_runtime": 9.3991, "eval_samples_per_second": 10.639, "eval_wer": 0.3373934226552984, "step": 117500 }, { "epoch": 19.13, "learning_rate": 2.357643987599935e-05, "loss": NaN, "step": 117600 }, { "epoch": 19.13, "eval_loss": 0.4161425828933716, "eval_runtime": 7.4568, "eval_samples_per_second": 13.411, "eval_wer": 0.3313032886723508, "step": 117600 }, { "epoch": 19.14, "learning_rate": 2.35111763746125e-05, "loss": NaN, "step": 117700 }, { "epoch": 19.14, "eval_loss": 0.4765840470790863, "eval_runtime": 9.8648, "eval_samples_per_second": 10.137, "eval_wer": 0.34226552984165654, "step": 117700 }, { "epoch": 19.16, "learning_rate": 2.344591287322565e-05, "loss": NaN, "step": 117800 }, { "epoch": 19.16, "eval_loss": 0.41543564200401306, "eval_runtime": 7.7288, "eval_samples_per_second": 12.939, "eval_wer": 0.32886723507917176, "step": 117800 }, { "epoch": 19.17, "learning_rate": 2.33806493718388e-05, "loss": NaN, "step": 117900 }, { "epoch": 19.17, "eval_loss": 0.4077683985233307, "eval_runtime": 6.5049, "eval_samples_per_second": 15.373, "eval_wer": 0.32886723507917176, "step": 117900 }, { "epoch": 19.19, "learning_rate": 2.331538587045195e-05, "loss": NaN, "step": 118000 }, { "epoch": 19.19, "eval_loss": 0.4288666546344757, "eval_runtime": 7.3525, "eval_samples_per_second": 13.601, "eval_wer": 0.3325213154689403, "step": 118000 }, { "epoch": 19.21, "learning_rate": 2.3250122369065103e-05, "loss": NaN, "step": 118100 }, { "epoch": 19.21, "eval_loss": 0.3833557963371277, "eval_runtime": 8.6001, "eval_samples_per_second": 11.628, "eval_wer": 0.32521315468940315, "step": 118100 }, { "epoch": 19.22, "learning_rate": 2.318485886767825e-05, "loss": NaN, "step": 118200 }, { "epoch": 19.22, "eval_loss": 0.4251144528388977, "eval_runtime": 8.0377, "eval_samples_per_second": 12.441, "eval_wer": 0.315468940316687, "step": 118200 }, { "epoch": 19.24, "learning_rate": 2.3119595366291403e-05, "loss": NaN, "step": 118300 }, { "epoch": 19.24, "eval_loss": 0.48235252499580383, "eval_runtime": 9.9197, "eval_samples_per_second": 10.081, "eval_wer": 0.3373934226552984, "step": 118300 }, { "epoch": 19.26, "learning_rate": 2.305433186490455e-05, "loss": NaN, "step": 118400 }, { "epoch": 19.26, "eval_loss": 0.45876410603523254, "eval_runtime": 8.0238, "eval_samples_per_second": 12.463, "eval_wer": 0.3398294762484775, "step": 118400 }, { "epoch": 19.27, "learning_rate": 2.2989068363517704e-05, "loss": NaN, "step": 118500 }, { "epoch": 19.27, "eval_loss": 0.42962944507598877, "eval_runtime": 7.6922, "eval_samples_per_second": 13.0, "eval_wer": 0.32886723507917176, "step": 118500 }, { "epoch": 19.29, "learning_rate": 2.2923804862130855e-05, "loss": NaN, "step": 118600 }, { "epoch": 19.29, "eval_loss": 0.43103399872779846, "eval_runtime": 8.5247, "eval_samples_per_second": 11.731, "eval_wer": 0.3313032886723508, "step": 118600 }, { "epoch": 19.3, "learning_rate": 2.2858541360744004e-05, "loss": NaN, "step": 118700 }, { "epoch": 19.3, "eval_loss": 0.41755372285842896, "eval_runtime": 7.9327, "eval_samples_per_second": 12.606, "eval_wer": 0.3264311814859927, "step": 118700 }, { "epoch": 19.32, "learning_rate": 2.2793277859357156e-05, "loss": NaN, "step": 118800 }, { "epoch": 19.32, "eval_loss": 0.40416061878204346, "eval_runtime": 7.7154, "eval_samples_per_second": 12.961, "eval_wer": 0.3215590742996346, "step": 118800 }, { "epoch": 19.34, "learning_rate": 2.2728014357970308e-05, "loss": NaN, "step": 118900 }, { "epoch": 19.34, "eval_loss": 0.42045220732688904, "eval_runtime": 7.9703, "eval_samples_per_second": 12.547, "eval_wer": 0.3325213154689403, "step": 118900 }, { "epoch": 19.35, "learning_rate": 2.2662750856583456e-05, "loss": NaN, "step": 119000 }, { "epoch": 19.35, "eval_loss": 0.4497748613357544, "eval_runtime": 8.152, "eval_samples_per_second": 12.267, "eval_wer": 0.33495736906211937, "step": 119000 }, { "epoch": 19.37, "learning_rate": 2.2597487355196608e-05, "loss": NaN, "step": 119100 }, { "epoch": 19.37, "eval_loss": 0.4549383819103241, "eval_runtime": 8.0924, "eval_samples_per_second": 12.357, "eval_wer": 0.3447015834348356, "step": 119100 }, { "epoch": 19.39, "learning_rate": 2.253222385380976e-05, "loss": NaN, "step": 119200 }, { "epoch": 19.39, "eval_loss": 0.4458554983139038, "eval_runtime": 8.5049, "eval_samples_per_second": 11.758, "eval_wer": 0.33495736906211937, "step": 119200 }, { "epoch": 19.4, "learning_rate": 2.246696035242291e-05, "loss": NaN, "step": 119300 }, { "epoch": 19.4, "eval_loss": 0.43120619654655457, "eval_runtime": 7.0431, "eval_samples_per_second": 14.198, "eval_wer": 0.3264311814859927, "step": 119300 }, { "epoch": 19.42, "learning_rate": 2.2401696851036057e-05, "loss": NaN, "step": 119400 }, { "epoch": 19.42, "eval_loss": 0.4251594841480255, "eval_runtime": 7.4385, "eval_samples_per_second": 13.444, "eval_wer": 0.3386114494518879, "step": 119400 }, { "epoch": 19.43, "learning_rate": 2.233643334964921e-05, "loss": NaN, "step": 119500 }, { "epoch": 19.43, "eval_loss": 0.42931661009788513, "eval_runtime": 9.2934, "eval_samples_per_second": 10.76, "eval_wer": 0.3507917174177832, "step": 119500 }, { "epoch": 19.45, "learning_rate": 2.227116984826236e-05, "loss": NaN, "step": 119600 }, { "epoch": 19.45, "eval_loss": 0.42289912700653076, "eval_runtime": 9.665, "eval_samples_per_second": 10.347, "eval_wer": 0.3398294762484775, "step": 119600 }, { "epoch": 19.47, "learning_rate": 2.220590634687551e-05, "loss": NaN, "step": 119700 }, { "epoch": 19.47, "eval_loss": 0.487996369600296, "eval_runtime": 8.5886, "eval_samples_per_second": 11.643, "eval_wer": 0.34348355663824603, "step": 119700 }, { "epoch": 19.48, "learning_rate": 2.214064284548866e-05, "loss": NaN, "step": 119800 }, { "epoch": 19.48, "eval_loss": 0.550142228603363, "eval_runtime": 9.4924, "eval_samples_per_second": 10.535, "eval_wer": 0.3556638246041413, "step": 119800 }, { "epoch": 19.5, "learning_rate": 2.2075379344101813e-05, "loss": NaN, "step": 119900 }, { "epoch": 19.5, "eval_loss": 0.43226540088653564, "eval_runtime": 7.492, "eval_samples_per_second": 13.348, "eval_wer": 0.32886723507917176, "step": 119900 }, { "epoch": 19.52, "learning_rate": 2.2010115842714962e-05, "loss": NaN, "step": 120000 }, { "epoch": 19.52, "eval_loss": 0.3998276889324188, "eval_runtime": 7.4602, "eval_samples_per_second": 13.404, "eval_wer": 0.3325213154689403, "step": 120000 }, { "epoch": 19.53, "learning_rate": 2.194485234132811e-05, "loss": NaN, "step": 120100 }, { "epoch": 19.53, "eval_loss": 0.4583325982093811, "eval_runtime": 7.7177, "eval_samples_per_second": 12.957, "eval_wer": 0.34348355663824603, "step": 120100 }, { "epoch": 19.55, "learning_rate": 2.1879588839941266e-05, "loss": NaN, "step": 120200 }, { "epoch": 19.55, "eval_loss": 0.44406771659851074, "eval_runtime": 8.2416, "eval_samples_per_second": 12.134, "eval_wer": 0.341047503045067, "step": 120200 }, { "epoch": 19.56, "learning_rate": 2.1814325338554414e-05, "loss": NaN, "step": 120300 }, { "epoch": 19.56, "eval_loss": 0.41883566975593567, "eval_runtime": 7.3107, "eval_samples_per_second": 13.679, "eval_wer": 0.34348355663824603, "step": 120300 }, { "epoch": 19.58, "learning_rate": 2.1749061837167563e-05, "loss": NaN, "step": 120400 }, { "epoch": 19.58, "eval_loss": 0.4323764741420746, "eval_runtime": 8.8296, "eval_samples_per_second": 11.325, "eval_wer": 0.341047503045067, "step": 120400 }, { "epoch": 19.6, "learning_rate": 2.1683798335780718e-05, "loss": NaN, "step": 120500 }, { "epoch": 19.6, "eval_loss": 0.41844385862350464, "eval_runtime": 8.8708, "eval_samples_per_second": 11.273, "eval_wer": 0.34957369062119364, "step": 120500 }, { "epoch": 19.61, "learning_rate": 2.1618534834393867e-05, "loss": NaN, "step": 120600 }, { "epoch": 19.61, "eval_loss": 0.39420318603515625, "eval_runtime": 9.8796, "eval_samples_per_second": 10.122, "eval_wer": 0.3325213154689403, "step": 120600 }, { "epoch": 19.63, "learning_rate": 2.1553271333007015e-05, "loss": NaN, "step": 120700 }, { "epoch": 19.63, "eval_loss": 0.475872278213501, "eval_runtime": 8.1761, "eval_samples_per_second": 12.231, "eval_wer": 0.3471376370280146, "step": 120700 }, { "epoch": 19.65, "learning_rate": 2.148800783162017e-05, "loss": NaN, "step": 120800 }, { "epoch": 19.65, "eval_loss": 0.4005354642868042, "eval_runtime": 8.1599, "eval_samples_per_second": 12.255, "eval_wer": 0.34226552984165654, "step": 120800 }, { "epoch": 19.66, "learning_rate": 2.142274433023332e-05, "loss": NaN, "step": 120900 }, { "epoch": 19.66, "eval_loss": 0.3836045563220978, "eval_runtime": 8.6109, "eval_samples_per_second": 11.613, "eval_wer": 0.3459196102314251, "step": 120900 }, { "epoch": 19.68, "learning_rate": 2.1357480828846468e-05, "loss": NaN, "step": 121000 }, { "epoch": 19.68, "eval_loss": 0.36968758702278137, "eval_runtime": 8.2911, "eval_samples_per_second": 12.061, "eval_wer": 0.33495736906211937, "step": 121000 }, { "epoch": 19.69, "learning_rate": 2.129221732745962e-05, "loss": NaN, "step": 121100 }, { "epoch": 19.69, "eval_loss": 0.4322676360607147, "eval_runtime": 8.1328, "eval_samples_per_second": 12.296, "eval_wer": 0.34348355663824603, "step": 121100 }, { "epoch": 19.71, "learning_rate": 2.122695382607277e-05, "loss": NaN, "step": 121200 }, { "epoch": 19.71, "eval_loss": 0.42114943265914917, "eval_runtime": 9.3436, "eval_samples_per_second": 10.703, "eval_wer": 0.341047503045067, "step": 121200 }, { "epoch": 19.73, "learning_rate": 2.116169032468592e-05, "loss": NaN, "step": 121300 }, { "epoch": 19.73, "eval_loss": 0.40339621901512146, "eval_runtime": 7.8643, "eval_samples_per_second": 12.716, "eval_wer": 0.3337393422655298, "step": 121300 }, { "epoch": 19.74, "learning_rate": 2.1096426823299072e-05, "loss": NaN, "step": 121400 }, { "epoch": 19.74, "eval_loss": 0.3980773985385895, "eval_runtime": 7.5335, "eval_samples_per_second": 13.274, "eval_wer": 0.3373934226552984, "step": 121400 }, { "epoch": 19.76, "learning_rate": 2.1031163321912224e-05, "loss": NaN, "step": 121500 }, { "epoch": 19.76, "eval_loss": 0.5062117576599121, "eval_runtime": 8.2053, "eval_samples_per_second": 12.187, "eval_wer": 0.3471376370280146, "step": 121500 }, { "epoch": 19.78, "learning_rate": 2.0965899820525372e-05, "loss": NaN, "step": 121600 }, { "epoch": 19.78, "eval_loss": 0.4986831247806549, "eval_runtime": 8.3443, "eval_samples_per_second": 11.984, "eval_wer": 0.3447015834348356, "step": 121600 }, { "epoch": 19.79, "learning_rate": 2.090063631913852e-05, "loss": NaN, "step": 121700 }, { "epoch": 19.79, "eval_loss": 0.5382255911827087, "eval_runtime": 9.0263, "eval_samples_per_second": 11.079, "eval_wer": 0.3568818514007308, "step": 121700 }, { "epoch": 19.81, "learning_rate": 2.0835372817751673e-05, "loss": NaN, "step": 121800 }, { "epoch": 19.81, "eval_loss": 0.5431269407272339, "eval_runtime": 10.0339, "eval_samples_per_second": 9.966, "eval_wer": 0.3471376370280146, "step": 121800 }, { "epoch": 19.82, "learning_rate": 2.0770109316364825e-05, "loss": NaN, "step": 121900 }, { "epoch": 19.82, "eval_loss": 0.39853399991989136, "eval_runtime": 8.1763, "eval_samples_per_second": 12.231, "eval_wer": 0.3373934226552984, "step": 121900 }, { "epoch": 19.84, "learning_rate": 2.0704845814977973e-05, "loss": NaN, "step": 122000 }, { "epoch": 19.84, "eval_loss": 0.563309907913208, "eval_runtime": 7.9985, "eval_samples_per_second": 12.502, "eval_wer": 0.3447015834348356, "step": 122000 }, { "epoch": 19.86, "learning_rate": 2.0639582313591125e-05, "loss": NaN, "step": 122100 }, { "epoch": 19.86, "eval_loss": 0.38848280906677246, "eval_runtime": 7.9406, "eval_samples_per_second": 12.593, "eval_wer": 0.33495736906211937, "step": 122100 }, { "epoch": 19.87, "learning_rate": 2.0574318812204277e-05, "loss": NaN, "step": 122200 }, { "epoch": 19.87, "eval_loss": 0.3947732448577881, "eval_runtime": 8.1644, "eval_samples_per_second": 12.248, "eval_wer": 0.35444579780755175, "step": 122200 }, { "epoch": 19.89, "learning_rate": 2.0509055310817426e-05, "loss": NaN, "step": 122300 }, { "epoch": 19.89, "eval_loss": 0.4206204116344452, "eval_runtime": 8.6753, "eval_samples_per_second": 11.527, "eval_wer": 0.3471376370280146, "step": 122300 }, { "epoch": 19.91, "learning_rate": 2.0443791809430577e-05, "loss": NaN, "step": 122400 }, { "epoch": 19.91, "eval_loss": 0.41722992062568665, "eval_runtime": 7.7422, "eval_samples_per_second": 12.916, "eval_wer": 0.341047503045067, "step": 122400 }, { "epoch": 19.92, "learning_rate": 2.0378528308043726e-05, "loss": NaN, "step": 122500 }, { "epoch": 19.92, "eval_loss": 0.4375925362110138, "eval_runtime": 6.9864, "eval_samples_per_second": 14.313, "eval_wer": 0.34348355663824603, "step": 122500 }, { "epoch": 19.94, "learning_rate": 2.0313264806656878e-05, "loss": NaN, "step": 122600 }, { "epoch": 19.94, "eval_loss": 0.40097764134407043, "eval_runtime": 6.79, "eval_samples_per_second": 14.728, "eval_wer": 0.33617539585870887, "step": 122600 }, { "epoch": 19.95, "learning_rate": 2.024800130527003e-05, "loss": NaN, "step": 122700 }, { "epoch": 19.95, "eval_loss": 0.4545166790485382, "eval_runtime": 7.8384, "eval_samples_per_second": 12.758, "eval_wer": 0.3398294762484775, "step": 122700 }, { "epoch": 19.97, "learning_rate": 2.0182737803883178e-05, "loss": NaN, "step": 122800 }, { "epoch": 19.97, "eval_loss": 0.3846965730190277, "eval_runtime": 7.3303, "eval_samples_per_second": 13.642, "eval_wer": 0.3264311814859927, "step": 122800 }, { "epoch": 19.99, "learning_rate": 2.011747430249633e-05, "loss": NaN, "step": 122900 }, { "epoch": 19.99, "eval_loss": 0.38395482301712036, "eval_runtime": 7.3923, "eval_samples_per_second": 13.528, "eval_wer": 0.3373934226552984, "step": 122900 }, { "epoch": 20.0, "learning_rate": 2.0052210801109482e-05, "loss": NaN, "step": 123000 }, { "epoch": 20.0, "eval_loss": 0.43827033042907715, "eval_runtime": 8.7235, "eval_samples_per_second": 11.463, "eval_wer": 0.3507917174177832, "step": 123000 }, { "epoch": 20.02, "learning_rate": 1.998694729972263e-05, "loss": NaN, "step": 123100 }, { "epoch": 20.02, "eval_loss": 0.43740010261535645, "eval_runtime": 8.0253, "eval_samples_per_second": 12.461, "eval_wer": 0.34348355663824603, "step": 123100 }, { "epoch": 20.04, "learning_rate": 1.9921683798335783e-05, "loss": NaN, "step": 123200 }, { "epoch": 20.04, "eval_loss": 0.3877253830432892, "eval_runtime": 7.9016, "eval_samples_per_second": 12.656, "eval_wer": 0.33008526187576126, "step": 123200 }, { "epoch": 20.05, "learning_rate": 1.985642029694893e-05, "loss": NaN, "step": 123300 }, { "epoch": 20.05, "eval_loss": 0.46851950883865356, "eval_runtime": 8.2945, "eval_samples_per_second": 12.056, "eval_wer": 0.3690621193666261, "step": 123300 }, { "epoch": 20.07, "learning_rate": 1.9791156795562083e-05, "loss": NaN, "step": 123400 }, { "epoch": 20.07, "eval_loss": 0.5597333312034607, "eval_runtime": 8.7953, "eval_samples_per_second": 11.37, "eval_wer": 0.34835566382460414, "step": 123400 }, { "epoch": 20.08, "learning_rate": 1.972589329417523e-05, "loss": NaN, "step": 123500 }, { "epoch": 20.08, "eval_loss": 0.4044766128063202, "eval_runtime": 8.1152, "eval_samples_per_second": 12.323, "eval_wer": 0.33495736906211937, "step": 123500 }, { "epoch": 20.1, "learning_rate": 1.9660629792788383e-05, "loss": NaN, "step": 123600 }, { "epoch": 20.1, "eval_loss": 0.39406195282936096, "eval_runtime": 7.6836, "eval_samples_per_second": 13.015, "eval_wer": 0.3325213154689403, "step": 123600 }, { "epoch": 20.12, "learning_rate": 1.9595366291401535e-05, "loss": NaN, "step": 123700 }, { "epoch": 20.12, "eval_loss": 0.4256425201892853, "eval_runtime": 8.9263, "eval_samples_per_second": 11.203, "eval_wer": 0.33495736906211937, "step": 123700 }, { "epoch": 20.13, "learning_rate": 1.9530102790014684e-05, "loss": NaN, "step": 123800 }, { "epoch": 20.13, "eval_loss": 0.39307454228401184, "eval_runtime": 7.7688, "eval_samples_per_second": 12.872, "eval_wer": 0.3398294762484775, "step": 123800 }, { "epoch": 20.15, "learning_rate": 1.9464839288627836e-05, "loss": NaN, "step": 123900 }, { "epoch": 20.15, "eval_loss": 0.4074282944202423, "eval_runtime": 7.4446, "eval_samples_per_second": 13.433, "eval_wer": 0.33617539585870887, "step": 123900 }, { "epoch": 20.17, "learning_rate": 1.9399575787240988e-05, "loss": NaN, "step": 124000 }, { "epoch": 20.17, "eval_loss": 0.38621366024017334, "eval_runtime": 8.5491, "eval_samples_per_second": 11.697, "eval_wer": 0.341047503045067, "step": 124000 }, { "epoch": 20.18, "learning_rate": 1.9334312285854136e-05, "loss": NaN, "step": 124100 }, { "epoch": 20.18, "eval_loss": 0.3924228549003601, "eval_runtime": 8.8405, "eval_samples_per_second": 11.312, "eval_wer": 0.34348355663824603, "step": 124100 }, { "epoch": 20.2, "learning_rate": 1.9269048784467285e-05, "loss": NaN, "step": 124200 }, { "epoch": 20.2, "eval_loss": 0.3702751398086548, "eval_runtime": 6.8704, "eval_samples_per_second": 14.555, "eval_wer": 0.3386114494518879, "step": 124200 }, { "epoch": 20.21, "learning_rate": 1.920378528308044e-05, "loss": NaN, "step": 124300 }, { "epoch": 20.21, "eval_loss": 0.4109724760055542, "eval_runtime": 8.6105, "eval_samples_per_second": 11.614, "eval_wer": 0.3568818514007308, "step": 124300 }, { "epoch": 20.23, "learning_rate": 1.913852178169359e-05, "loss": NaN, "step": 124400 }, { "epoch": 20.23, "eval_loss": 0.40841957926750183, "eval_runtime": 7.8666, "eval_samples_per_second": 12.712, "eval_wer": 0.3264311814859927, "step": 124400 }, { "epoch": 20.25, "learning_rate": 1.9073258280306737e-05, "loss": NaN, "step": 124500 }, { "epoch": 20.25, "eval_loss": 0.44555091857910156, "eval_runtime": 8.1778, "eval_samples_per_second": 12.228, "eval_wer": 0.341047503045067, "step": 124500 }, { "epoch": 20.26, "learning_rate": 1.9007994778919892e-05, "loss": NaN, "step": 124600 }, { "epoch": 20.26, "eval_loss": 0.5727394819259644, "eval_runtime": 8.2574, "eval_samples_per_second": 12.11, "eval_wer": 0.3386114494518879, "step": 124600 }, { "epoch": 20.28, "learning_rate": 1.894273127753304e-05, "loss": NaN, "step": 124700 }, { "epoch": 20.28, "eval_loss": 0.43890708684921265, "eval_runtime": 7.5362, "eval_samples_per_second": 13.269, "eval_wer": 0.3507917174177832, "step": 124700 }, { "epoch": 20.3, "learning_rate": 1.887746777614619e-05, "loss": NaN, "step": 124800 }, { "epoch": 20.3, "eval_loss": 0.4767882525920868, "eval_runtime": 9.0744, "eval_samples_per_second": 11.02, "eval_wer": 0.34226552984165654, "step": 124800 }, { "epoch": 20.31, "learning_rate": 1.881220427475934e-05, "loss": NaN, "step": 124900 }, { "epoch": 20.31, "eval_loss": 0.3942064046859741, "eval_runtime": 9.3212, "eval_samples_per_second": 10.728, "eval_wer": 0.3373934226552984, "step": 124900 }, { "epoch": 20.33, "learning_rate": 1.8746940773372493e-05, "loss": NaN, "step": 125000 }, { "epoch": 20.33, "eval_loss": 0.4494655132293701, "eval_runtime": 9.6714, "eval_samples_per_second": 10.34, "eval_wer": 0.3447015834348356, "step": 125000 }, { "epoch": 20.34, "learning_rate": 1.8681677271985642e-05, "loss": NaN, "step": 125100 }, { "epoch": 20.34, "eval_loss": 0.39226436614990234, "eval_runtime": 8.7962, "eval_samples_per_second": 11.369, "eval_wer": 0.32886723507917176, "step": 125100 }, { "epoch": 20.36, "learning_rate": 1.8616413770598794e-05, "loss": NaN, "step": 125200 }, { "epoch": 20.36, "eval_loss": 0.41099902987480164, "eval_runtime": 8.4883, "eval_samples_per_second": 11.781, "eval_wer": 0.3373934226552984, "step": 125200 }, { "epoch": 20.38, "learning_rate": 1.8551150269211946e-05, "loss": NaN, "step": 125300 }, { "epoch": 20.38, "eval_loss": 0.4286768436431885, "eval_runtime": 7.7395, "eval_samples_per_second": 12.921, "eval_wer": 0.341047503045067, "step": 125300 }, { "epoch": 20.39, "learning_rate": 1.8485886767825094e-05, "loss": NaN, "step": 125400 }, { "epoch": 20.39, "eval_loss": 0.4009086489677429, "eval_runtime": 7.1964, "eval_samples_per_second": 13.896, "eval_wer": 0.33495736906211937, "step": 125400 }, { "epoch": 20.41, "learning_rate": 1.8420623266438243e-05, "loss": NaN, "step": 125500 }, { "epoch": 20.41, "eval_loss": 0.40821143984794617, "eval_runtime": 8.3655, "eval_samples_per_second": 11.954, "eval_wer": 0.34226552984165654, "step": 125500 }, { "epoch": 20.43, "learning_rate": 1.8355359765051398e-05, "loss": NaN, "step": 125600 }, { "epoch": 20.43, "eval_loss": 0.4229655861854553, "eval_runtime": 8.8125, "eval_samples_per_second": 11.348, "eval_wer": 0.3568818514007308, "step": 125600 }, { "epoch": 20.44, "learning_rate": 1.8290096263664547e-05, "loss": NaN, "step": 125700 }, { "epoch": 20.44, "eval_loss": 0.45079144835472107, "eval_runtime": 9.8702, "eval_samples_per_second": 10.131, "eval_wer": 0.34348355663824603, "step": 125700 }, { "epoch": 20.46, "learning_rate": 1.8224832762277695e-05, "loss": NaN, "step": 125800 }, { "epoch": 20.46, "eval_loss": 0.42513442039489746, "eval_runtime": 7.4321, "eval_samples_per_second": 13.455, "eval_wer": 0.3313032886723508, "step": 125800 }, { "epoch": 20.47, "learning_rate": 1.8159569260890847e-05, "loss": NaN, "step": 125900 }, { "epoch": 20.47, "eval_loss": 0.4858975112438202, "eval_runtime": 7.8101, "eval_samples_per_second": 12.804, "eval_wer": 0.3568818514007308, "step": 125900 }, { "epoch": 20.49, "learning_rate": 1.8094305759504e-05, "loss": NaN, "step": 126000 }, { "epoch": 20.49, "eval_loss": 0.4102497398853302, "eval_runtime": 9.5076, "eval_samples_per_second": 10.518, "eval_wer": 0.35444579780755175, "step": 126000 }, { "epoch": 20.51, "learning_rate": 1.8029042258117147e-05, "loss": NaN, "step": 126100 }, { "epoch": 20.51, "eval_loss": 0.4684319794178009, "eval_runtime": 7.5644, "eval_samples_per_second": 13.22, "eval_wer": 0.3373934226552984, "step": 126100 }, { "epoch": 20.52, "learning_rate": 1.79637787567303e-05, "loss": NaN, "step": 126200 }, { "epoch": 20.52, "eval_loss": 0.6590189933776855, "eval_runtime": 8.2168, "eval_samples_per_second": 12.17, "eval_wer": 0.35931790499390986, "step": 126200 }, { "epoch": 20.54, "learning_rate": 1.789851525534345e-05, "loss": NaN, "step": 126300 }, { "epoch": 20.54, "eval_loss": 0.4641081988811493, "eval_runtime": 7.7606, "eval_samples_per_second": 12.886, "eval_wer": 0.315468940316687, "step": 126300 }, { "epoch": 20.56, "learning_rate": 1.78332517539566e-05, "loss": NaN, "step": 126400 }, { "epoch": 20.56, "eval_loss": 0.5528498888015747, "eval_runtime": 9.1648, "eval_samples_per_second": 10.911, "eval_wer": 0.3629719853836784, "step": 126400 }, { "epoch": 20.57, "learning_rate": 1.7767988252569752e-05, "loss": NaN, "step": 126500 }, { "epoch": 20.57, "eval_loss": 0.433257132768631, "eval_runtime": 7.6174, "eval_samples_per_second": 13.128, "eval_wer": 0.34348355663824603, "step": 126500 }, { "epoch": 20.59, "learning_rate": 1.7702724751182904e-05, "loss": NaN, "step": 126600 }, { "epoch": 20.59, "eval_loss": 0.3999103307723999, "eval_runtime": 7.888, "eval_samples_per_second": 12.677, "eval_wer": 0.3373934226552984, "step": 126600 }, { "epoch": 20.6, "learning_rate": 1.7637461249796052e-05, "loss": NaN, "step": 126700 }, { "epoch": 20.6, "eval_loss": 0.4195931553840637, "eval_runtime": 7.5791, "eval_samples_per_second": 13.194, "eval_wer": 0.3447015834348356, "step": 126700 }, { "epoch": 20.62, "learning_rate": 1.7572197748409204e-05, "loss": NaN, "step": 126800 }, { "epoch": 20.62, "eval_loss": 0.4389355778694153, "eval_runtime": 6.9812, "eval_samples_per_second": 14.324, "eval_wer": 0.34226552984165654, "step": 126800 }, { "epoch": 20.64, "learning_rate": 1.7506934247022353e-05, "loss": NaN, "step": 126900 }, { "epoch": 20.64, "eval_loss": 0.4806211590766907, "eval_runtime": 9.6568, "eval_samples_per_second": 10.355, "eval_wer": 0.34957369062119364, "step": 126900 }, { "epoch": 20.65, "learning_rate": 1.7441670745635505e-05, "loss": NaN, "step": 127000 }, { "epoch": 20.65, "eval_loss": 0.48015937209129333, "eval_runtime": 9.1133, "eval_samples_per_second": 10.973, "eval_wer": 0.35322777101096225, "step": 127000 }, { "epoch": 20.67, "learning_rate": 1.7376407244248653e-05, "loss": NaN, "step": 127100 }, { "epoch": 20.67, "eval_loss": 0.4087853729724884, "eval_runtime": 7.6535, "eval_samples_per_second": 13.066, "eval_wer": 0.3337393422655298, "step": 127100 }, { "epoch": 20.69, "learning_rate": 1.7311143742861805e-05, "loss": NaN, "step": 127200 }, { "epoch": 20.69, "eval_loss": 0.43684786558151245, "eval_runtime": 8.3464, "eval_samples_per_second": 11.981, "eval_wer": 0.33495736906211937, "step": 127200 }, { "epoch": 20.7, "learning_rate": 1.7245880241474957e-05, "loss": NaN, "step": 127300 }, { "epoch": 20.7, "eval_loss": 0.46926018595695496, "eval_runtime": 9.6189, "eval_samples_per_second": 10.396, "eval_wer": 0.3447015834348356, "step": 127300 }, { "epoch": 20.72, "learning_rate": 1.7180616740088105e-05, "loss": NaN, "step": 127400 }, { "epoch": 20.72, "eval_loss": 0.45676276087760925, "eval_runtime": 9.0225, "eval_samples_per_second": 11.083, "eval_wer": 0.3459196102314251, "step": 127400 }, { "epoch": 20.74, "learning_rate": 1.7115353238701257e-05, "loss": NaN, "step": 127500 }, { "epoch": 20.74, "eval_loss": 0.4165736734867096, "eval_runtime": 8.8912, "eval_samples_per_second": 11.247, "eval_wer": 0.3459196102314251, "step": 127500 }, { "epoch": 20.75, "learning_rate": 1.7050089737314406e-05, "loss": NaN, "step": 127600 }, { "epoch": 20.75, "eval_loss": 0.4191476106643677, "eval_runtime": 8.1249, "eval_samples_per_second": 12.308, "eval_wer": 0.3398294762484775, "step": 127600 }, { "epoch": 20.77, "learning_rate": 1.6984826235927558e-05, "loss": NaN, "step": 127700 }, { "epoch": 20.77, "eval_loss": 0.4200890362262726, "eval_runtime": 7.7999, "eval_samples_per_second": 12.821, "eval_wer": 0.3313032886723508, "step": 127700 }, { "epoch": 20.78, "learning_rate": 1.691956273454071e-05, "loss": NaN, "step": 127800 }, { "epoch": 20.78, "eval_loss": 0.41486749053001404, "eval_runtime": 9.2941, "eval_samples_per_second": 10.76, "eval_wer": 0.34348355663824603, "step": 127800 }, { "epoch": 20.8, "learning_rate": 1.6854299233153858e-05, "loss": NaN, "step": 127900 }, { "epoch": 20.8, "eval_loss": 0.4273871183395386, "eval_runtime": 9.7275, "eval_samples_per_second": 10.28, "eval_wer": 0.3386114494518879, "step": 127900 }, { "epoch": 20.82, "learning_rate": 1.678903573176701e-05, "loss": NaN, "step": 128000 }, { "epoch": 20.82, "eval_loss": 0.44087138772010803, "eval_runtime": 8.9574, "eval_samples_per_second": 11.164, "eval_wer": 0.3447015834348356, "step": 128000 }, { "epoch": 20.83, "learning_rate": 1.6723772230380162e-05, "loss": NaN, "step": 128100 }, { "epoch": 20.83, "eval_loss": 0.3781212270259857, "eval_runtime": 7.5604, "eval_samples_per_second": 13.227, "eval_wer": 0.3325213154689403, "step": 128100 }, { "epoch": 20.85, "learning_rate": 1.665850872899331e-05, "loss": NaN, "step": 128200 }, { "epoch": 20.85, "eval_loss": 0.4753413498401642, "eval_runtime": 8.6899, "eval_samples_per_second": 11.508, "eval_wer": 0.3337393422655298, "step": 128200 }, { "epoch": 20.87, "learning_rate": 1.6593245227606463e-05, "loss": NaN, "step": 128300 }, { "epoch": 20.87, "eval_loss": 0.40558329224586487, "eval_runtime": 7.5404, "eval_samples_per_second": 13.262, "eval_wer": 0.3313032886723508, "step": 128300 }, { "epoch": 20.88, "learning_rate": 1.6527981726219614e-05, "loss": NaN, "step": 128400 }, { "epoch": 20.88, "eval_loss": 0.4515651762485504, "eval_runtime": 8.2888, "eval_samples_per_second": 12.065, "eval_wer": 0.3398294762484775, "step": 128400 }, { "epoch": 20.9, "learning_rate": 1.6462718224832763e-05, "loss": NaN, "step": 128500 }, { "epoch": 20.9, "eval_loss": 0.43877291679382324, "eval_runtime": 7.2241, "eval_samples_per_second": 13.843, "eval_wer": 0.3507917174177832, "step": 128500 }, { "epoch": 20.91, "learning_rate": 1.639745472344591e-05, "loss": NaN, "step": 128600 }, { "epoch": 20.91, "eval_loss": 0.457927405834198, "eval_runtime": 8.7365, "eval_samples_per_second": 11.446, "eval_wer": 0.34348355663824603, "step": 128600 }, { "epoch": 20.93, "learning_rate": 1.6332191222059063e-05, "loss": NaN, "step": 128700 }, { "epoch": 20.93, "eval_loss": 0.40025395154953003, "eval_runtime": 8.0467, "eval_samples_per_second": 12.428, "eval_wer": 0.34348355663824603, "step": 128700 }, { "epoch": 20.95, "learning_rate": 1.6266927720672215e-05, "loss": NaN, "step": 128800 }, { "epoch": 20.95, "eval_loss": 0.5182440280914307, "eval_runtime": 7.1852, "eval_samples_per_second": 13.918, "eval_wer": 0.35444579780755175, "step": 128800 }, { "epoch": 20.96, "learning_rate": 1.6201664219285364e-05, "loss": NaN, "step": 128900 }, { "epoch": 20.96, "eval_loss": 0.4123252034187317, "eval_runtime": 8.1302, "eval_samples_per_second": 12.3, "eval_wer": 0.3386114494518879, "step": 128900 }, { "epoch": 20.98, "learning_rate": 1.6136400717898516e-05, "loss": NaN, "step": 129000 }, { "epoch": 20.98, "eval_loss": 0.4326474070549011, "eval_runtime": 7.6986, "eval_samples_per_second": 12.989, "eval_wer": 0.3398294762484775, "step": 129000 }, { "epoch": 21.0, "learning_rate": 1.6071137216511668e-05, "loss": NaN, "step": 129100 }, { "epoch": 21.0, "eval_loss": 0.4750351011753082, "eval_runtime": 7.5824, "eval_samples_per_second": 13.188, "eval_wer": 0.3373934226552984, "step": 129100 }, { "epoch": 21.01, "learning_rate": 1.6005873715124816e-05, "loss": NaN, "step": 129200 }, { "epoch": 21.01, "eval_loss": 0.4125843942165375, "eval_runtime": 8.0836, "eval_samples_per_second": 12.371, "eval_wer": 0.3386114494518879, "step": 129200 }, { "epoch": 21.03, "learning_rate": 1.5940610213737968e-05, "loss": NaN, "step": 129300 }, { "epoch": 21.03, "eval_loss": 0.4247395396232605, "eval_runtime": 8.0802, "eval_samples_per_second": 12.376, "eval_wer": 0.3373934226552984, "step": 129300 }, { "epoch": 21.04, "learning_rate": 1.587534671235112e-05, "loss": NaN, "step": 129400 }, { "epoch": 21.04, "eval_loss": 0.43337181210517883, "eval_runtime": 7.6212, "eval_samples_per_second": 13.121, "eval_wer": 0.32886723507917176, "step": 129400 }, { "epoch": 21.06, "learning_rate": 1.581008321096427e-05, "loss": NaN, "step": 129500 }, { "epoch": 21.06, "eval_loss": 0.35774993896484375, "eval_runtime": 8.103, "eval_samples_per_second": 12.341, "eval_wer": 0.315468940316687, "step": 129500 }, { "epoch": 21.08, "learning_rate": 1.5744819709577417e-05, "loss": NaN, "step": 129600 }, { "epoch": 21.08, "eval_loss": 0.4800620973110199, "eval_runtime": 8.5222, "eval_samples_per_second": 11.734, "eval_wer": 0.32521315468940315, "step": 129600 }, { "epoch": 21.09, "learning_rate": 1.5679556208190572e-05, "loss": NaN, "step": 129700 }, { "epoch": 21.09, "eval_loss": 0.4503170847892761, "eval_runtime": 8.4578, "eval_samples_per_second": 11.823, "eval_wer": 0.34226552984165654, "step": 129700 }, { "epoch": 21.11, "learning_rate": 1.561429270680372e-05, "loss": NaN, "step": 129800 }, { "epoch": 21.11, "eval_loss": 0.4079561233520508, "eval_runtime": 7.3872, "eval_samples_per_second": 13.537, "eval_wer": 0.3325213154689403, "step": 129800 }, { "epoch": 21.13, "learning_rate": 1.554902920541687e-05, "loss": NaN, "step": 129900 }, { "epoch": 21.13, "eval_loss": 0.44905129075050354, "eval_runtime": 7.1484, "eval_samples_per_second": 13.989, "eval_wer": 0.3398294762484775, "step": 129900 }, { "epoch": 21.14, "learning_rate": 1.5483765704030025e-05, "loss": NaN, "step": 130000 }, { "epoch": 21.14, "eval_loss": 0.4295308291912079, "eval_runtime": 8.0526, "eval_samples_per_second": 12.418, "eval_wer": 0.33617539585870887, "step": 130000 }, { "epoch": 21.16, "learning_rate": 1.5418502202643173e-05, "loss": NaN, "step": 130100 }, { "epoch": 21.16, "eval_loss": 0.3925670385360718, "eval_runtime": 8.4253, "eval_samples_per_second": 11.869, "eval_wer": 0.3325213154689403, "step": 130100 }, { "epoch": 21.17, "learning_rate": 1.5353238701256322e-05, "loss": NaN, "step": 130200 }, { "epoch": 21.17, "eval_loss": 0.46943891048431396, "eval_runtime": 6.9244, "eval_samples_per_second": 14.442, "eval_wer": 0.34957369062119364, "step": 130200 }, { "epoch": 21.19, "learning_rate": 1.5287975199869474e-05, "loss": NaN, "step": 130300 }, { "epoch": 21.19, "eval_loss": 0.3773401975631714, "eval_runtime": 9.0744, "eval_samples_per_second": 11.02, "eval_wer": 0.3471376370280146, "step": 130300 }, { "epoch": 21.21, "learning_rate": 1.5222711698482626e-05, "loss": NaN, "step": 130400 }, { "epoch": 21.21, "eval_loss": 0.4215690493583679, "eval_runtime": 8.1736, "eval_samples_per_second": 12.235, "eval_wer": 0.341047503045067, "step": 130400 }, { "epoch": 21.22, "learning_rate": 1.5157448197095774e-05, "loss": NaN, "step": 130500 }, { "epoch": 21.22, "eval_loss": 0.4928508400917053, "eval_runtime": 8.1815, "eval_samples_per_second": 12.223, "eval_wer": 0.3459196102314251, "step": 130500 }, { "epoch": 21.24, "learning_rate": 1.5092184695708924e-05, "loss": NaN, "step": 130600 }, { "epoch": 21.24, "eval_loss": 0.4258655309677124, "eval_runtime": 8.8623, "eval_samples_per_second": 11.284, "eval_wer": 0.33617539585870887, "step": 130600 }, { "epoch": 21.26, "learning_rate": 1.5026921194322078e-05, "loss": NaN, "step": 130700 }, { "epoch": 21.26, "eval_loss": 0.40194839239120483, "eval_runtime": 8.8628, "eval_samples_per_second": 11.283, "eval_wer": 0.3276492082825822, "step": 130700 }, { "epoch": 21.27, "learning_rate": 1.4961657692935227e-05, "loss": NaN, "step": 130800 }, { "epoch": 21.27, "eval_loss": 0.4380399286746979, "eval_runtime": 8.0782, "eval_samples_per_second": 12.379, "eval_wer": 0.34835566382460414, "step": 130800 }, { "epoch": 21.29, "learning_rate": 1.4896394191548377e-05, "loss": NaN, "step": 130900 }, { "epoch": 21.29, "eval_loss": 0.40339186787605286, "eval_runtime": 9.2102, "eval_samples_per_second": 10.858, "eval_wer": 0.34226552984165654, "step": 130900 }, { "epoch": 21.3, "learning_rate": 1.4831130690161527e-05, "loss": NaN, "step": 131000 }, { "epoch": 21.3, "eval_loss": 0.4713993966579437, "eval_runtime": 8.5421, "eval_samples_per_second": 11.707, "eval_wer": 0.3507917174177832, "step": 131000 }, { "epoch": 21.32, "learning_rate": 1.4765867188774679e-05, "loss": NaN, "step": 131100 }, { "epoch": 21.32, "eval_loss": 0.5234803557395935, "eval_runtime": 7.9161, "eval_samples_per_second": 12.632, "eval_wer": 0.3568818514007308, "step": 131100 }, { "epoch": 21.34, "learning_rate": 1.4700603687387829e-05, "loss": NaN, "step": 131200 }, { "epoch": 21.34, "eval_loss": 0.46438494324684143, "eval_runtime": 9.1223, "eval_samples_per_second": 10.962, "eval_wer": 0.3520097442143727, "step": 131200 }, { "epoch": 21.35, "learning_rate": 1.463534018600098e-05, "loss": NaN, "step": 131300 }, { "epoch": 21.35, "eval_loss": 0.44316136837005615, "eval_runtime": 9.5471, "eval_samples_per_second": 10.474, "eval_wer": 0.3373934226552984, "step": 131300 }, { "epoch": 21.37, "learning_rate": 1.4570076684614131e-05, "loss": NaN, "step": 131400 }, { "epoch": 21.37, "eval_loss": 0.442475825548172, "eval_runtime": 7.1952, "eval_samples_per_second": 13.898, "eval_wer": 0.33617539585870887, "step": 131400 }, { "epoch": 21.39, "learning_rate": 1.4504813183227281e-05, "loss": NaN, "step": 131500 }, { "epoch": 21.39, "eval_loss": 0.5654551982879639, "eval_runtime": 8.1407, "eval_samples_per_second": 12.284, "eval_wer": 0.35322777101096225, "step": 131500 }, { "epoch": 21.4, "learning_rate": 1.443954968184043e-05, "loss": NaN, "step": 131600 }, { "epoch": 21.4, "eval_loss": 0.4513855278491974, "eval_runtime": 8.8967, "eval_samples_per_second": 11.24, "eval_wer": 0.34835566382460414, "step": 131600 }, { "epoch": 21.42, "learning_rate": 1.4374286180453584e-05, "loss": NaN, "step": 131700 }, { "epoch": 21.42, "eval_loss": 0.4416217803955078, "eval_runtime": 9.1103, "eval_samples_per_second": 10.977, "eval_wer": 0.34835566382460414, "step": 131700 }, { "epoch": 21.43, "learning_rate": 1.4309022679066734e-05, "loss": NaN, "step": 131800 }, { "epoch": 21.43, "eval_loss": 0.391195148229599, "eval_runtime": 8.6493, "eval_samples_per_second": 11.562, "eval_wer": 0.3386114494518879, "step": 131800 }, { "epoch": 21.45, "learning_rate": 1.4243759177679882e-05, "loss": NaN, "step": 131900 }, { "epoch": 21.45, "eval_loss": 0.4384614825248718, "eval_runtime": 8.481, "eval_samples_per_second": 11.791, "eval_wer": 0.3447015834348356, "step": 131900 }, { "epoch": 21.47, "learning_rate": 1.4178495676293033e-05, "loss": NaN, "step": 132000 }, { "epoch": 21.47, "eval_loss": 0.42818814516067505, "eval_runtime": 8.6608, "eval_samples_per_second": 11.546, "eval_wer": 0.3386114494518879, "step": 132000 }, { "epoch": 21.48, "learning_rate": 1.4113232174906185e-05, "loss": NaN, "step": 132100 }, { "epoch": 21.48, "eval_loss": 0.4142271876335144, "eval_runtime": 7.784, "eval_samples_per_second": 12.847, "eval_wer": 0.32521315468940315, "step": 132100 }, { "epoch": 21.5, "learning_rate": 1.4047968673519335e-05, "loss": NaN, "step": 132200 }, { "epoch": 21.5, "eval_loss": 0.42976322770118713, "eval_runtime": 11.0885, "eval_samples_per_second": 9.018, "eval_wer": 0.35809987819732036, "step": 132200 }, { "epoch": 21.52, "learning_rate": 1.3982705172132485e-05, "loss": NaN, "step": 132300 }, { "epoch": 21.52, "eval_loss": 0.44189947843551636, "eval_runtime": 8.1376, "eval_samples_per_second": 12.289, "eval_wer": 0.3447015834348356, "step": 132300 }, { "epoch": 21.53, "learning_rate": 1.3917441670745637e-05, "loss": NaN, "step": 132400 }, { "epoch": 21.53, "eval_loss": 0.4482198655605316, "eval_runtime": 8.3756, "eval_samples_per_second": 11.939, "eval_wer": 0.3507917174177832, "step": 132400 }, { "epoch": 21.55, "learning_rate": 1.3852178169358787e-05, "loss": NaN, "step": 132500 }, { "epoch": 21.55, "eval_loss": 0.37959039211273193, "eval_runtime": 7.1877, "eval_samples_per_second": 13.913, "eval_wer": 0.3337393422655298, "step": 132500 }, { "epoch": 21.56, "learning_rate": 1.3786914667971937e-05, "loss": NaN, "step": 132600 }, { "epoch": 21.56, "eval_loss": 0.4015367925167084, "eval_runtime": 7.0749, "eval_samples_per_second": 14.134, "eval_wer": 0.3373934226552984, "step": 132600 }, { "epoch": 21.58, "learning_rate": 1.3721651166585086e-05, "loss": NaN, "step": 132700 }, { "epoch": 21.58, "eval_loss": 0.4340609014034271, "eval_runtime": 10.0027, "eval_samples_per_second": 9.997, "eval_wer": 0.34835566382460414, "step": 132700 }, { "epoch": 21.6, "learning_rate": 1.365638766519824e-05, "loss": NaN, "step": 132800 }, { "epoch": 21.6, "eval_loss": 0.5372726917266846, "eval_runtime": 8.4121, "eval_samples_per_second": 11.888, "eval_wer": 0.33617539585870887, "step": 132800 }, { "epoch": 21.61, "learning_rate": 1.359112416381139e-05, "loss": NaN, "step": 132900 }, { "epoch": 21.61, "eval_loss": 0.39388373494148254, "eval_runtime": 8.9479, "eval_samples_per_second": 11.176, "eval_wer": 0.3264311814859927, "step": 132900 }, { "epoch": 21.63, "learning_rate": 1.3525860662424538e-05, "loss": NaN, "step": 133000 }, { "epoch": 21.63, "eval_loss": 0.44166165590286255, "eval_runtime": 8.2657, "eval_samples_per_second": 12.098, "eval_wer": 0.3471376370280146, "step": 133000 }, { "epoch": 21.65, "learning_rate": 1.3460597161037692e-05, "loss": NaN, "step": 133100 }, { "epoch": 21.65, "eval_loss": 0.41540205478668213, "eval_runtime": 8.1998, "eval_samples_per_second": 12.195, "eval_wer": 0.34348355663824603, "step": 133100 }, { "epoch": 21.66, "learning_rate": 1.339533365965084e-05, "loss": NaN, "step": 133200 }, { "epoch": 21.66, "eval_loss": 0.4051262140274048, "eval_runtime": 7.0885, "eval_samples_per_second": 14.107, "eval_wer": 0.33617539585870887, "step": 133200 }, { "epoch": 21.68, "learning_rate": 1.333007015826399e-05, "loss": NaN, "step": 133300 }, { "epoch": 21.68, "eval_loss": 0.41227516531944275, "eval_runtime": 8.2062, "eval_samples_per_second": 12.186, "eval_wer": 0.3459196102314251, "step": 133300 }, { "epoch": 21.69, "learning_rate": 1.3264806656877144e-05, "loss": NaN, "step": 133400 }, { "epoch": 21.69, "eval_loss": 0.42322754859924316, "eval_runtime": 9.0314, "eval_samples_per_second": 11.073, "eval_wer": 0.3398294762484775, "step": 133400 }, { "epoch": 21.71, "learning_rate": 1.3199543155490293e-05, "loss": NaN, "step": 133500 }, { "epoch": 21.71, "eval_loss": 0.3802301287651062, "eval_runtime": 8.7387, "eval_samples_per_second": 11.443, "eval_wer": 0.3325213154689403, "step": 133500 }, { "epoch": 21.73, "learning_rate": 1.3134279654103443e-05, "loss": NaN, "step": 133600 }, { "epoch": 21.73, "eval_loss": 0.40790998935699463, "eval_runtime": 7.0036, "eval_samples_per_second": 14.278, "eval_wer": 0.3398294762484775, "step": 133600 }, { "epoch": 21.74, "learning_rate": 1.3069016152716593e-05, "loss": NaN, "step": 133700 }, { "epoch": 21.74, "eval_loss": 0.41051357984542847, "eval_runtime": 8.2179, "eval_samples_per_second": 12.168, "eval_wer": 0.341047503045067, "step": 133700 }, { "epoch": 21.76, "learning_rate": 1.3003752651329745e-05, "loss": NaN, "step": 133800 }, { "epoch": 21.76, "eval_loss": 0.40564852952957153, "eval_runtime": 8.5003, "eval_samples_per_second": 11.764, "eval_wer": 0.3325213154689403, "step": 133800 }, { "epoch": 21.78, "learning_rate": 1.2938489149942895e-05, "loss": NaN, "step": 133900 }, { "epoch": 21.78, "eval_loss": 0.4392382800579071, "eval_runtime": 7.6928, "eval_samples_per_second": 12.999, "eval_wer": 0.34835566382460414, "step": 133900 }, { "epoch": 21.79, "learning_rate": 1.2873225648556045e-05, "loss": NaN, "step": 134000 }, { "epoch": 21.79, "eval_loss": 0.3991428017616272, "eval_runtime": 9.3346, "eval_samples_per_second": 10.713, "eval_wer": 0.3386114494518879, "step": 134000 }, { "epoch": 21.81, "learning_rate": 1.2807962147169197e-05, "loss": NaN, "step": 134100 }, { "epoch": 21.81, "eval_loss": 0.4022715389728546, "eval_runtime": 7.981, "eval_samples_per_second": 12.53, "eval_wer": 0.34226552984165654, "step": 134100 }, { "epoch": 21.82, "learning_rate": 1.2742698645782348e-05, "loss": NaN, "step": 134200 }, { "epoch": 21.82, "eval_loss": 0.4230504631996155, "eval_runtime": 8.7343, "eval_samples_per_second": 11.449, "eval_wer": 0.341047503045067, "step": 134200 }, { "epoch": 21.84, "learning_rate": 1.2677435144395496e-05, "loss": NaN, "step": 134300 }, { "epoch": 21.84, "eval_loss": 0.45141318440437317, "eval_runtime": 9.2929, "eval_samples_per_second": 10.761, "eval_wer": 0.3447015834348356, "step": 134300 }, { "epoch": 21.86, "learning_rate": 1.2612171643008646e-05, "loss": NaN, "step": 134400 }, { "epoch": 21.86, "eval_loss": 0.42951327562332153, "eval_runtime": 9.4873, "eval_samples_per_second": 10.54, "eval_wer": 0.31303288672350793, "step": 134400 }, { "epoch": 21.87, "learning_rate": 1.25469081416218e-05, "loss": NaN, "step": 134500 }, { "epoch": 21.87, "eval_loss": 0.46236321330070496, "eval_runtime": 10.0535, "eval_samples_per_second": 9.947, "eval_wer": 0.3337393422655298, "step": 134500 }, { "epoch": 21.89, "learning_rate": 1.2481644640234949e-05, "loss": NaN, "step": 134600 }, { "epoch": 21.89, "eval_loss": 0.49196091294288635, "eval_runtime": 8.3873, "eval_samples_per_second": 11.923, "eval_wer": 0.33495736906211937, "step": 134600 }, { "epoch": 21.91, "learning_rate": 1.24163811388481e-05, "loss": NaN, "step": 134700 }, { "epoch": 21.91, "eval_loss": 0.4672481417655945, "eval_runtime": 9.8356, "eval_samples_per_second": 10.167, "eval_wer": 0.35444579780755175, "step": 134700 }, { "epoch": 21.92, "learning_rate": 1.235111763746125e-05, "loss": NaN, "step": 134800 }, { "epoch": 21.92, "eval_loss": 0.4398852586746216, "eval_runtime": 7.9762, "eval_samples_per_second": 12.537, "eval_wer": 0.35931790499390986, "step": 134800 }, { "epoch": 21.94, "learning_rate": 1.2285854136074401e-05, "loss": NaN, "step": 134900 }, { "epoch": 21.94, "eval_loss": 0.40451163053512573, "eval_runtime": 7.6202, "eval_samples_per_second": 13.123, "eval_wer": 0.3337393422655298, "step": 134900 }, { "epoch": 21.95, "learning_rate": 1.2220590634687551e-05, "loss": NaN, "step": 135000 }, { "epoch": 21.95, "eval_loss": 0.41924548149108887, "eval_runtime": 9.3656, "eval_samples_per_second": 10.677, "eval_wer": 0.34226552984165654, "step": 135000 }, { "epoch": 21.97, "learning_rate": 1.2155327133300701e-05, "loss": NaN, "step": 135100 }, { "epoch": 21.97, "eval_loss": 0.42516928911209106, "eval_runtime": 8.4901, "eval_samples_per_second": 11.778, "eval_wer": 0.3447015834348356, "step": 135100 }, { "epoch": 21.99, "learning_rate": 1.2090063631913853e-05, "loss": NaN, "step": 135200 }, { "epoch": 21.99, "eval_loss": 0.40347903966903687, "eval_runtime": 8.9415, "eval_samples_per_second": 11.184, "eval_wer": 0.33008526187576126, "step": 135200 }, { "epoch": 22.0, "learning_rate": 1.2024800130527003e-05, "loss": NaN, "step": 135300 }, { "epoch": 22.0, "eval_loss": 0.5743076801300049, "eval_runtime": 8.6933, "eval_samples_per_second": 11.503, "eval_wer": 0.3373934226552984, "step": 135300 }, { "epoch": 22.02, "learning_rate": 1.1959536629140154e-05, "loss": NaN, "step": 135400 }, { "epoch": 22.02, "eval_loss": 0.40245911478996277, "eval_runtime": 8.8702, "eval_samples_per_second": 11.274, "eval_wer": 0.32886723507917176, "step": 135400 }, { "epoch": 22.04, "learning_rate": 1.1894273127753304e-05, "loss": NaN, "step": 135500 }, { "epoch": 22.04, "eval_loss": 0.4054236114025116, "eval_runtime": 8.0844, "eval_samples_per_second": 12.369, "eval_wer": 0.33617539585870887, "step": 135500 }, { "epoch": 22.05, "learning_rate": 1.1829009626366456e-05, "loss": NaN, "step": 135600 }, { "epoch": 22.05, "eval_loss": 0.40440499782562256, "eval_runtime": 8.0393, "eval_samples_per_second": 12.439, "eval_wer": 0.33495736906211937, "step": 135600 }, { "epoch": 22.07, "learning_rate": 1.1763746124979606e-05, "loss": NaN, "step": 135700 }, { "epoch": 22.07, "eval_loss": 0.41659045219421387, "eval_runtime": 7.7624, "eval_samples_per_second": 12.883, "eval_wer": 0.35322777101096225, "step": 135700 }, { "epoch": 22.08, "learning_rate": 1.1698482623592756e-05, "loss": NaN, "step": 135800 }, { "epoch": 22.08, "eval_loss": 0.47099122405052185, "eval_runtime": 6.8327, "eval_samples_per_second": 14.635, "eval_wer": 0.341047503045067, "step": 135800 }, { "epoch": 22.1, "learning_rate": 1.1633219122205906e-05, "loss": NaN, "step": 135900 }, { "epoch": 22.1, "eval_loss": 0.4006298780441284, "eval_runtime": 6.5785, "eval_samples_per_second": 15.201, "eval_wer": 0.33008526187576126, "step": 135900 }, { "epoch": 22.12, "learning_rate": 1.1567955620819057e-05, "loss": NaN, "step": 136000 }, { "epoch": 22.12, "eval_loss": 0.47020214796066284, "eval_runtime": 8.3159, "eval_samples_per_second": 12.025, "eval_wer": 0.3471376370280146, "step": 136000 }, { "epoch": 22.13, "learning_rate": 1.1502692119432209e-05, "loss": NaN, "step": 136100 }, { "epoch": 22.13, "eval_loss": 0.43791496753692627, "eval_runtime": 8.3887, "eval_samples_per_second": 11.921, "eval_wer": 0.3471376370280146, "step": 136100 }, { "epoch": 22.15, "learning_rate": 1.1437428618045359e-05, "loss": NaN, "step": 136200 }, { "epoch": 22.15, "eval_loss": 0.4248058795928955, "eval_runtime": 10.0383, "eval_samples_per_second": 9.962, "eval_wer": 0.3447015834348356, "step": 136200 }, { "epoch": 22.17, "learning_rate": 1.1372165116658509e-05, "loss": NaN, "step": 136300 }, { "epoch": 22.17, "eval_loss": 0.40560001134872437, "eval_runtime": 7.8536, "eval_samples_per_second": 12.733, "eval_wer": 0.3325213154689403, "step": 136300 }, { "epoch": 22.18, "learning_rate": 1.1306901615271661e-05, "loss": NaN, "step": 136400 }, { "epoch": 22.18, "eval_loss": 0.41141241788864136, "eval_runtime": 7.712, "eval_samples_per_second": 12.967, "eval_wer": 0.33617539585870887, "step": 136400 }, { "epoch": 22.2, "learning_rate": 1.124163811388481e-05, "loss": NaN, "step": 136500 }, { "epoch": 22.2, "eval_loss": 0.37809231877326965, "eval_runtime": 6.7786, "eval_samples_per_second": 14.752, "eval_wer": 0.3398294762484775, "step": 136500 }, { "epoch": 22.21, "learning_rate": 1.1176374612497961e-05, "loss": NaN, "step": 136600 }, { "epoch": 22.21, "eval_loss": 0.48994365334510803, "eval_runtime": 8.9346, "eval_samples_per_second": 11.192, "eval_wer": 0.3471376370280146, "step": 136600 }, { "epoch": 22.23, "learning_rate": 1.1111111111111112e-05, "loss": NaN, "step": 136700 }, { "epoch": 22.23, "eval_loss": 0.43884292244911194, "eval_runtime": 9.9578, "eval_samples_per_second": 10.042, "eval_wer": 0.3520097442143727, "step": 136700 }, { "epoch": 22.25, "learning_rate": 1.1045847609724262e-05, "loss": NaN, "step": 136800 }, { "epoch": 22.25, "eval_loss": 0.4258538782596588, "eval_runtime": 7.3965, "eval_samples_per_second": 13.52, "eval_wer": 0.3459196102314251, "step": 136800 }, { "epoch": 22.26, "learning_rate": 1.0980584108337414e-05, "loss": NaN, "step": 136900 }, { "epoch": 22.26, "eval_loss": 0.44286561012268066, "eval_runtime": 8.7957, "eval_samples_per_second": 11.369, "eval_wer": 0.3520097442143727, "step": 136900 }, { "epoch": 22.28, "learning_rate": 1.0915320606950562e-05, "loss": NaN, "step": 137000 }, { "epoch": 22.28, "eval_loss": 0.41971367597579956, "eval_runtime": 9.2318, "eval_samples_per_second": 10.832, "eval_wer": 0.35809987819732036, "step": 137000 }, { "epoch": 22.3, "learning_rate": 1.0850057105563714e-05, "loss": NaN, "step": 137100 }, { "epoch": 22.3, "eval_loss": 0.45038101077079773, "eval_runtime": 7.8919, "eval_samples_per_second": 12.671, "eval_wer": 0.3447015834348356, "step": 137100 }, { "epoch": 22.31, "learning_rate": 1.0784793604176864e-05, "loss": NaN, "step": 137200 }, { "epoch": 22.31, "eval_loss": 0.417258620262146, "eval_runtime": 9.4776, "eval_samples_per_second": 10.551, "eval_wer": 0.3459196102314251, "step": 137200 }, { "epoch": 22.33, "learning_rate": 1.0719530102790015e-05, "loss": NaN, "step": 137300 }, { "epoch": 22.33, "eval_loss": 0.40922966599464417, "eval_runtime": 7.7162, "eval_samples_per_second": 12.96, "eval_wer": 0.33008526187576126, "step": 137300 }, { "epoch": 22.35, "learning_rate": 1.0654266601403167e-05, "loss": NaN, "step": 137400 }, { "epoch": 22.35, "eval_loss": 0.42340758442878723, "eval_runtime": 7.7407, "eval_samples_per_second": 12.919, "eval_wer": 0.3459196102314251, "step": 137400 }, { "epoch": 22.36, "learning_rate": 1.0589003100016317e-05, "loss": NaN, "step": 137500 }, { "epoch": 22.36, "eval_loss": 0.43829768896102905, "eval_runtime": 9.0473, "eval_samples_per_second": 11.053, "eval_wer": 0.3471376370280146, "step": 137500 }, { "epoch": 22.38, "learning_rate": 1.0523739598629467e-05, "loss": NaN, "step": 137600 }, { "epoch": 22.38, "eval_loss": 0.4190714955329895, "eval_runtime": 7.2713, "eval_samples_per_second": 13.753, "eval_wer": 0.3373934226552984, "step": 137600 }, { "epoch": 22.39, "learning_rate": 1.0458476097242617e-05, "loss": NaN, "step": 137700 }, { "epoch": 22.39, "eval_loss": 0.38507279753685, "eval_runtime": 8.2207, "eval_samples_per_second": 12.164, "eval_wer": 0.33617539585870887, "step": 137700 }, { "epoch": 22.41, "learning_rate": 1.0393212595855767e-05, "loss": NaN, "step": 137800 }, { "epoch": 22.41, "eval_loss": 0.3674430847167969, "eval_runtime": 9.7115, "eval_samples_per_second": 10.297, "eval_wer": 0.3313032886723508, "step": 137800 }, { "epoch": 22.43, "learning_rate": 1.0327949094468918e-05, "loss": NaN, "step": 137900 }, { "epoch": 22.43, "eval_loss": 0.40191754698753357, "eval_runtime": 7.543, "eval_samples_per_second": 13.257, "eval_wer": 0.33008526187576126, "step": 137900 }, { "epoch": 22.44, "learning_rate": 1.026268559308207e-05, "loss": NaN, "step": 138000 }, { "epoch": 22.44, "eval_loss": 0.4558006525039673, "eval_runtime": 8.3592, "eval_samples_per_second": 11.963, "eval_wer": 0.3507917174177832, "step": 138000 }, { "epoch": 22.46, "learning_rate": 1.019742209169522e-05, "loss": NaN, "step": 138100 }, { "epoch": 22.46, "eval_loss": 0.5849547386169434, "eval_runtime": 8.4615, "eval_samples_per_second": 11.818, "eval_wer": 0.33495736906211937, "step": 138100 }, { "epoch": 22.48, "learning_rate": 1.013215859030837e-05, "loss": NaN, "step": 138200 }, { "epoch": 22.48, "eval_loss": 0.45433205366134644, "eval_runtime": 8.487, "eval_samples_per_second": 11.783, "eval_wer": 0.33008526187576126, "step": 138200 }, { "epoch": 22.49, "learning_rate": 1.0066895088921522e-05, "loss": NaN, "step": 138300 }, { "epoch": 22.49, "eval_loss": 0.420282781124115, "eval_runtime": 9.2501, "eval_samples_per_second": 10.811, "eval_wer": 0.33617539585870887, "step": 138300 }, { "epoch": 22.51, "learning_rate": 1.000163158753467e-05, "loss": NaN, "step": 138400 }, { "epoch": 22.51, "eval_loss": 0.4292939305305481, "eval_runtime": 8.0963, "eval_samples_per_second": 12.351, "eval_wer": 0.3337393422655298, "step": 138400 }, { "epoch": 22.52, "learning_rate": 9.936368086147822e-06, "loss": NaN, "step": 138500 }, { "epoch": 22.52, "eval_loss": 0.4376954138278961, "eval_runtime": 8.5678, "eval_samples_per_second": 11.672, "eval_wer": 0.3093788063337393, "step": 138500 }, { "epoch": 22.54, "learning_rate": 9.871104584760973e-06, "loss": NaN, "step": 138600 }, { "epoch": 22.54, "eval_loss": 0.4139672815799713, "eval_runtime": 8.398, "eval_samples_per_second": 11.908, "eval_wer": 0.3313032886723508, "step": 138600 }, { "epoch": 22.56, "learning_rate": 9.805841083374123e-06, "loss": NaN, "step": 138700 }, { "epoch": 22.56, "eval_loss": 0.4242633581161499, "eval_runtime": 10.5113, "eval_samples_per_second": 9.514, "eval_wer": 0.34835566382460414, "step": 138700 }, { "epoch": 22.57, "learning_rate": 9.740577581987275e-06, "loss": NaN, "step": 138800 }, { "epoch": 22.57, "eval_loss": 0.44767504930496216, "eval_runtime": 7.6566, "eval_samples_per_second": 13.061, "eval_wer": 0.3386114494518879, "step": 138800 }, { "epoch": 22.59, "learning_rate": 9.675314080600425e-06, "loss": NaN, "step": 138900 }, { "epoch": 22.59, "eval_loss": 0.43390411138534546, "eval_runtime": 8.5202, "eval_samples_per_second": 11.737, "eval_wer": 0.341047503045067, "step": 138900 }, { "epoch": 22.61, "learning_rate": 9.610050579213575e-06, "loss": NaN, "step": 139000 }, { "epoch": 22.61, "eval_loss": 0.42713436484336853, "eval_runtime": 7.4028, "eval_samples_per_second": 13.508, "eval_wer": 0.32521315468940315, "step": 139000 }, { "epoch": 22.62, "learning_rate": 9.544787077826727e-06, "loss": NaN, "step": 139100 }, { "epoch": 22.62, "eval_loss": 0.4049948751926422, "eval_runtime": 9.4604, "eval_samples_per_second": 10.57, "eval_wer": 0.3276492082825822, "step": 139100 }, { "epoch": 22.64, "learning_rate": 9.479523576439876e-06, "loss": NaN, "step": 139200 }, { "epoch": 22.64, "eval_loss": 0.4711925983428955, "eval_runtime": 7.5699, "eval_samples_per_second": 13.21, "eval_wer": 0.341047503045067, "step": 139200 }, { "epoch": 22.65, "learning_rate": 9.414260075053028e-06, "loss": NaN, "step": 139300 }, { "epoch": 22.65, "eval_loss": 0.40160369873046875, "eval_runtime": 7.5911, "eval_samples_per_second": 13.173, "eval_wer": 0.32886723507917176, "step": 139300 }, { "epoch": 22.67, "learning_rate": 9.348996573666178e-06, "loss": NaN, "step": 139400 }, { "epoch": 22.67, "eval_loss": 0.45362401008605957, "eval_runtime": 6.8691, "eval_samples_per_second": 14.558, "eval_wer": 0.32886723507917176, "step": 139400 }, { "epoch": 22.69, "learning_rate": 9.283733072279328e-06, "loss": NaN, "step": 139500 }, { "epoch": 22.69, "eval_loss": 0.4383563995361328, "eval_runtime": 9.4025, "eval_samples_per_second": 10.635, "eval_wer": 0.3386114494518879, "step": 139500 }, { "epoch": 22.7, "learning_rate": 9.218469570892478e-06, "loss": NaN, "step": 139600 }, { "epoch": 22.7, "eval_loss": 0.445679634809494, "eval_runtime": 9.7736, "eval_samples_per_second": 10.232, "eval_wer": 0.3386114494518879, "step": 139600 }, { "epoch": 22.72, "learning_rate": 9.15320606950563e-06, "loss": NaN, "step": 139700 }, { "epoch": 22.72, "eval_loss": 0.4067118763923645, "eval_runtime": 7.3892, "eval_samples_per_second": 13.533, "eval_wer": 0.3264311814859927, "step": 139700 }, { "epoch": 22.74, "learning_rate": 9.08794256811878e-06, "loss": NaN, "step": 139800 }, { "epoch": 22.74, "eval_loss": 0.3995942771434784, "eval_runtime": 7.8855, "eval_samples_per_second": 12.681, "eval_wer": 0.3373934226552984, "step": 139800 }, { "epoch": 22.75, "learning_rate": 9.02267906673193e-06, "loss": NaN, "step": 139900 }, { "epoch": 22.75, "eval_loss": 0.39302563667297363, "eval_runtime": 8.6481, "eval_samples_per_second": 11.563, "eval_wer": 0.3398294762484775, "step": 139900 }, { "epoch": 22.77, "learning_rate": 8.95741556534508e-06, "loss": NaN, "step": 140000 }, { "epoch": 22.77, "eval_loss": 0.5054168701171875, "eval_runtime": 8.0714, "eval_samples_per_second": 12.389, "eval_wer": 0.3520097442143727, "step": 140000 }, { "epoch": 22.78, "learning_rate": 8.892152063958231e-06, "loss": NaN, "step": 140100 }, { "epoch": 22.78, "eval_loss": 0.37638041377067566, "eval_runtime": 7.885, "eval_samples_per_second": 12.682, "eval_wer": 0.3325213154689403, "step": 140100 }, { "epoch": 22.8, "learning_rate": 8.826888562571383e-06, "loss": NaN, "step": 140200 }, { "epoch": 22.8, "eval_loss": 0.4191051423549652, "eval_runtime": 8.5703, "eval_samples_per_second": 11.668, "eval_wer": 0.3459196102314251, "step": 140200 }, { "epoch": 22.82, "learning_rate": 8.761625061184533e-06, "loss": NaN, "step": 140300 }, { "epoch": 22.82, "eval_loss": 0.47149497270584106, "eval_runtime": 7.6448, "eval_samples_per_second": 13.081, "eval_wer": 0.3520097442143727, "step": 140300 }, { "epoch": 22.83, "learning_rate": 8.696361559797683e-06, "loss": NaN, "step": 140400 }, { "epoch": 22.83, "eval_loss": 0.4407516419887543, "eval_runtime": 7.1529, "eval_samples_per_second": 13.98, "eval_wer": 0.3386114494518879, "step": 140400 }, { "epoch": 22.85, "learning_rate": 8.631098058410834e-06, "loss": NaN, "step": 140500 }, { "epoch": 22.85, "eval_loss": 0.40118682384490967, "eval_runtime": 8.4283, "eval_samples_per_second": 11.865, "eval_wer": 0.341047503045067, "step": 140500 }, { "epoch": 22.87, "learning_rate": 8.565834557023984e-06, "loss": NaN, "step": 140600 }, { "epoch": 22.87, "eval_loss": 0.4191232919692993, "eval_runtime": 9.0572, "eval_samples_per_second": 11.041, "eval_wer": 0.3459196102314251, "step": 140600 }, { "epoch": 22.88, "learning_rate": 8.500571055637136e-06, "loss": NaN, "step": 140700 }, { "epoch": 22.88, "eval_loss": 0.39035916328430176, "eval_runtime": 8.5729, "eval_samples_per_second": 11.665, "eval_wer": 0.3520097442143727, "step": 140700 }, { "epoch": 22.9, "learning_rate": 8.435307554250286e-06, "loss": NaN, "step": 140800 }, { "epoch": 22.9, "eval_loss": 0.3838728070259094, "eval_runtime": 7.4544, "eval_samples_per_second": 13.415, "eval_wer": 0.32886723507917176, "step": 140800 }, { "epoch": 22.91, "learning_rate": 8.370044052863436e-06, "loss": NaN, "step": 140900 }, { "epoch": 22.91, "eval_loss": 0.4352475702762604, "eval_runtime": 8.9386, "eval_samples_per_second": 11.187, "eval_wer": 0.3520097442143727, "step": 140900 }, { "epoch": 22.93, "learning_rate": 8.304780551476588e-06, "loss": NaN, "step": 141000 }, { "epoch": 22.93, "eval_loss": 0.37819182872772217, "eval_runtime": 8.645, "eval_samples_per_second": 11.567, "eval_wer": 0.3373934226552984, "step": 141000 }, { "epoch": 22.95, "learning_rate": 8.239517050089737e-06, "loss": NaN, "step": 141100 }, { "epoch": 22.95, "eval_loss": 0.3652733266353607, "eval_runtime": 8.9186, "eval_samples_per_second": 11.212, "eval_wer": 0.3471376370280146, "step": 141100 }, { "epoch": 22.96, "learning_rate": 8.174253548702889e-06, "loss": NaN, "step": 141200 }, { "epoch": 22.96, "eval_loss": 0.4218634068965912, "eval_runtime": 7.892, "eval_samples_per_second": 12.671, "eval_wer": 0.34226552984165654, "step": 141200 }, { "epoch": 22.98, "learning_rate": 8.108990047316039e-06, "loss": NaN, "step": 141300 }, { "epoch": 22.98, "eval_loss": 0.40318989753723145, "eval_runtime": 8.686, "eval_samples_per_second": 11.513, "eval_wer": 0.34835566382460414, "step": 141300 }, { "epoch": 23.0, "learning_rate": 8.043726545929189e-06, "loss": NaN, "step": 141400 }, { "epoch": 23.0, "eval_loss": 0.4164011478424072, "eval_runtime": 8.8437, "eval_samples_per_second": 11.307, "eval_wer": 0.34835566382460414, "step": 141400 }, { "epoch": 23.01, "learning_rate": 7.978463044542341e-06, "loss": NaN, "step": 141500 }, { "epoch": 23.01, "eval_loss": 0.4907635450363159, "eval_runtime": 7.8965, "eval_samples_per_second": 12.664, "eval_wer": 0.33617539585870887, "step": 141500 }, { "epoch": 23.03, "learning_rate": 7.913199543155491e-06, "loss": NaN, "step": 141600 }, { "epoch": 23.03, "eval_loss": 0.4023902118206024, "eval_runtime": 8.1256, "eval_samples_per_second": 12.307, "eval_wer": 0.3398294762484775, "step": 141600 }, { "epoch": 23.04, "learning_rate": 7.847936041768641e-06, "loss": NaN, "step": 141700 }, { "epoch": 23.04, "eval_loss": 0.4590035676956177, "eval_runtime": 10.0026, "eval_samples_per_second": 9.997, "eval_wer": 0.3386114494518879, "step": 141700 }, { "epoch": 23.06, "learning_rate": 7.782672540381792e-06, "loss": NaN, "step": 141800 }, { "epoch": 23.06, "eval_loss": 0.4697200655937195, "eval_runtime": 8.4733, "eval_samples_per_second": 11.802, "eval_wer": 0.3276492082825822, "step": 141800 }, { "epoch": 23.08, "learning_rate": 7.717409038994942e-06, "loss": NaN, "step": 141900 }, { "epoch": 23.08, "eval_loss": 0.4211934804916382, "eval_runtime": 8.4528, "eval_samples_per_second": 11.83, "eval_wer": 0.33617539585870887, "step": 141900 }, { "epoch": 23.09, "learning_rate": 7.652145537608094e-06, "loss": NaN, "step": 142000 }, { "epoch": 23.09, "eval_loss": 0.39060890674591064, "eval_runtime": 7.5777, "eval_samples_per_second": 13.197, "eval_wer": 0.3373934226552984, "step": 142000 }, { "epoch": 23.11, "learning_rate": 7.586882036221243e-06, "loss": NaN, "step": 142100 }, { "epoch": 23.11, "eval_loss": 0.37855765223503113, "eval_runtime": 7.3666, "eval_samples_per_second": 13.575, "eval_wer": 0.29963459196102316, "step": 142100 }, { "epoch": 23.13, "learning_rate": 7.521618534834394e-06, "loss": NaN, "step": 142200 }, { "epoch": 23.13, "eval_loss": 0.46709468960762024, "eval_runtime": 7.4759, "eval_samples_per_second": 13.376, "eval_wer": 0.3337393422655298, "step": 142200 }, { "epoch": 23.14, "learning_rate": 7.456355033447544e-06, "loss": NaN, "step": 142300 }, { "epoch": 23.14, "eval_loss": 0.3746023178100586, "eval_runtime": 7.6965, "eval_samples_per_second": 12.993, "eval_wer": 0.3325213154689403, "step": 142300 }, { "epoch": 23.16, "learning_rate": 7.3910915320606955e-06, "loss": NaN, "step": 142400 }, { "epoch": 23.16, "eval_loss": 0.4183931052684784, "eval_runtime": 10.5082, "eval_samples_per_second": 9.516, "eval_wer": 0.33617539585870887, "step": 142400 }, { "epoch": 23.17, "learning_rate": 7.3258280306738465e-06, "loss": NaN, "step": 142500 }, { "epoch": 23.17, "eval_loss": 0.387781023979187, "eval_runtime": 8.2483, "eval_samples_per_second": 12.124, "eval_wer": 0.3337393422655298, "step": 142500 }, { "epoch": 23.19, "learning_rate": 7.260564529286997e-06, "loss": NaN, "step": 142600 }, { "epoch": 23.19, "eval_loss": 0.4201037883758545, "eval_runtime": 9.0845, "eval_samples_per_second": 11.008, "eval_wer": 0.33495736906211937, "step": 142600 }, { "epoch": 23.21, "learning_rate": 7.195301027900148e-06, "loss": NaN, "step": 142700 }, { "epoch": 23.21, "eval_loss": 0.40640342235565186, "eval_runtime": 8.611, "eval_samples_per_second": 11.613, "eval_wer": 0.33495736906211937, "step": 142700 }, { "epoch": 23.22, "learning_rate": 7.130037526513297e-06, "loss": NaN, "step": 142800 }, { "epoch": 23.22, "eval_loss": 0.36859330534935, "eval_runtime": 6.9585, "eval_samples_per_second": 14.371, "eval_wer": 0.33008526187576126, "step": 142800 }, { "epoch": 23.24, "learning_rate": 7.064774025126448e-06, "loss": NaN, "step": 142900 }, { "epoch": 23.24, "eval_loss": 0.5641127824783325, "eval_runtime": 9.3783, "eval_samples_per_second": 10.663, "eval_wer": 0.30572472594397077, "step": 142900 }, { "epoch": 23.26, "learning_rate": 6.9995105237395985e-06, "loss": NaN, "step": 143000 }, { "epoch": 23.26, "eval_loss": 0.390995591878891, "eval_runtime": 9.1316, "eval_samples_per_second": 10.951, "eval_wer": 0.32886723507917176, "step": 143000 }, { "epoch": 23.27, "learning_rate": 6.9342470223527496e-06, "loss": NaN, "step": 143100 }, { "epoch": 23.27, "eval_loss": 0.3884507119655609, "eval_runtime": 7.4684, "eval_samples_per_second": 13.39, "eval_wer": 0.33008526187576126, "step": 143100 }, { "epoch": 23.29, "learning_rate": 6.868983520965901e-06, "loss": NaN, "step": 143200 }, { "epoch": 23.29, "eval_loss": 0.37767794728279114, "eval_runtime": 7.8276, "eval_samples_per_second": 12.775, "eval_wer": 0.3337393422655298, "step": 143200 }, { "epoch": 23.3, "learning_rate": 6.803720019579051e-06, "loss": NaN, "step": 143300 }, { "epoch": 23.3, "eval_loss": 0.39070072770118713, "eval_runtime": 7.9301, "eval_samples_per_second": 12.61, "eval_wer": 0.3373934226552984, "step": 143300 }, { "epoch": 23.32, "learning_rate": 6.738456518192202e-06, "loss": NaN, "step": 143400 }, { "epoch": 23.32, "eval_loss": 0.3968910276889801, "eval_runtime": 8.388, "eval_samples_per_second": 11.922, "eval_wer": 0.33495736906211937, "step": 143400 }, { "epoch": 23.34, "learning_rate": 6.673193016805351e-06, "loss": NaN, "step": 143500 }, { "epoch": 23.34, "eval_loss": 0.55922931432724, "eval_runtime": 8.0437, "eval_samples_per_second": 12.432, "eval_wer": 0.3520097442143727, "step": 143500 }, { "epoch": 23.35, "learning_rate": 6.607929515418502e-06, "loss": NaN, "step": 143600 }, { "epoch": 23.35, "eval_loss": 0.3922981321811676, "eval_runtime": 7.1209, "eval_samples_per_second": 14.043, "eval_wer": 0.3386114494518879, "step": 143600 }, { "epoch": 23.37, "learning_rate": 6.5426660140316534e-06, "loss": NaN, "step": 143700 }, { "epoch": 23.37, "eval_loss": 0.39172208309173584, "eval_runtime": 7.6116, "eval_samples_per_second": 13.138, "eval_wer": 0.3373934226552984, "step": 143700 }, { "epoch": 23.39, "learning_rate": 6.477402512644804e-06, "loss": NaN, "step": 143800 }, { "epoch": 23.39, "eval_loss": 0.4471363127231598, "eval_runtime": 8.7619, "eval_samples_per_second": 11.413, "eval_wer": 0.3373934226552984, "step": 143800 }, { "epoch": 23.4, "learning_rate": 6.412139011257955e-06, "loss": NaN, "step": 143900 }, { "epoch": 23.4, "eval_loss": 0.44637829065322876, "eval_runtime": 7.6648, "eval_samples_per_second": 13.047, "eval_wer": 0.34226552984165654, "step": 143900 }, { "epoch": 23.42, "learning_rate": 6.346875509871104e-06, "loss": NaN, "step": 144000 }, { "epoch": 23.42, "eval_loss": 0.3966550827026367, "eval_runtime": 9.137, "eval_samples_per_second": 10.944, "eval_wer": 0.3373934226552984, "step": 144000 }, { "epoch": 23.43, "learning_rate": 6.281612008484255e-06, "loss": NaN, "step": 144100 }, { "epoch": 23.43, "eval_loss": 0.3890346884727478, "eval_runtime": 6.6729, "eval_samples_per_second": 14.986, "eval_wer": 0.33008526187576126, "step": 144100 }, { "epoch": 23.45, "learning_rate": 6.216348507097406e-06, "loss": NaN, "step": 144200 }, { "epoch": 23.45, "eval_loss": 0.417468786239624, "eval_runtime": 7.6605, "eval_samples_per_second": 13.054, "eval_wer": 0.3337393422655298, "step": 144200 }, { "epoch": 23.47, "learning_rate": 6.1510850057105564e-06, "loss": NaN, "step": 144300 }, { "epoch": 23.47, "eval_loss": 0.47427332401275635, "eval_runtime": 8.9388, "eval_samples_per_second": 11.187, "eval_wer": 0.3264311814859927, "step": 144300 }, { "epoch": 23.48, "learning_rate": 6.085821504323707e-06, "loss": NaN, "step": 144400 }, { "epoch": 23.48, "eval_loss": 0.3865101933479309, "eval_runtime": 7.3321, "eval_samples_per_second": 13.639, "eval_wer": 0.33008526187576126, "step": 144400 }, { "epoch": 23.5, "learning_rate": 6.020558002936858e-06, "loss": NaN, "step": 144500 }, { "epoch": 23.5, "eval_loss": 0.3971826434135437, "eval_runtime": 9.3902, "eval_samples_per_second": 10.649, "eval_wer": 0.3459196102314251, "step": 144500 }, { "epoch": 23.52, "learning_rate": 5.955294501550009e-06, "loss": NaN, "step": 144600 }, { "epoch": 23.52, "eval_loss": 0.5336860418319702, "eval_runtime": 7.7801, "eval_samples_per_second": 12.853, "eval_wer": 0.3276492082825822, "step": 144600 }, { "epoch": 23.53, "learning_rate": 5.890031000163159e-06, "loss": NaN, "step": 144700 }, { "epoch": 23.53, "eval_loss": 0.4055691063404083, "eval_runtime": 7.3304, "eval_samples_per_second": 13.642, "eval_wer": 0.3325213154689403, "step": 144700 }, { "epoch": 23.55, "learning_rate": 5.824767498776309e-06, "loss": NaN, "step": 144800 }, { "epoch": 23.55, "eval_loss": 0.39876997470855713, "eval_runtime": 8.2514, "eval_samples_per_second": 12.119, "eval_wer": 0.3398294762484775, "step": 144800 }, { "epoch": 23.56, "learning_rate": 5.75950399738946e-06, "loss": NaN, "step": 144900 }, { "epoch": 23.56, "eval_loss": 0.46831241250038147, "eval_runtime": 7.8267, "eval_samples_per_second": 12.777, "eval_wer": 0.33495736906211937, "step": 144900 }, { "epoch": 23.58, "learning_rate": 5.6942404960026105e-06, "loss": NaN, "step": 145000 }, { "epoch": 23.58, "eval_loss": 0.402251273393631, "eval_runtime": 8.6896, "eval_samples_per_second": 11.508, "eval_wer": 0.341047503045067, "step": 145000 }, { "epoch": 23.6, "learning_rate": 5.628976994615762e-06, "loss": NaN, "step": 145100 }, { "epoch": 23.6, "eval_loss": 0.42078322172164917, "eval_runtime": 7.0241, "eval_samples_per_second": 14.237, "eval_wer": 0.3386114494518879, "step": 145100 }, { "epoch": 23.61, "learning_rate": 5.563713493228912e-06, "loss": NaN, "step": 145200 }, { "epoch": 23.61, "eval_loss": 0.37739893794059753, "eval_runtime": 7.4681, "eval_samples_per_second": 13.39, "eval_wer": 0.3325213154689403, "step": 145200 }, { "epoch": 23.63, "learning_rate": 5.498449991842063e-06, "loss": NaN, "step": 145300 }, { "epoch": 23.63, "eval_loss": 0.38974130153656006, "eval_runtime": 8.1636, "eval_samples_per_second": 12.249, "eval_wer": 0.3325213154689403, "step": 145300 }, { "epoch": 23.65, "learning_rate": 5.433186490455213e-06, "loss": NaN, "step": 145400 }, { "epoch": 23.65, "eval_loss": 0.42759647965431213, "eval_runtime": 8.6656, "eval_samples_per_second": 11.54, "eval_wer": 0.3447015834348356, "step": 145400 }, { "epoch": 23.66, "learning_rate": 5.367922989068363e-06, "loss": NaN, "step": 145500 }, { "epoch": 23.66, "eval_loss": 0.446329265832901, "eval_runtime": 7.4281, "eval_samples_per_second": 13.462, "eval_wer": 0.3447015834348356, "step": 145500 }, { "epoch": 23.68, "learning_rate": 5.302659487681514e-06, "loss": NaN, "step": 145600 }, { "epoch": 23.68, "eval_loss": 0.4557843804359436, "eval_runtime": 8.6796, "eval_samples_per_second": 11.521, "eval_wer": 0.34957369062119364, "step": 145600 }, { "epoch": 23.69, "learning_rate": 5.2373959862946655e-06, "loss": NaN, "step": 145700 }, { "epoch": 23.69, "eval_loss": 0.42350074648857117, "eval_runtime": 6.9233, "eval_samples_per_second": 14.444, "eval_wer": 0.3313032886723508, "step": 145700 }, { "epoch": 23.71, "learning_rate": 5.172132484907816e-06, "loss": NaN, "step": 145800 }, { "epoch": 23.71, "eval_loss": 0.4503900110721588, "eval_runtime": 9.2067, "eval_samples_per_second": 10.862, "eval_wer": 0.34835566382460414, "step": 145800 }, { "epoch": 23.73, "learning_rate": 5.106868983520966e-06, "loss": NaN, "step": 145900 }, { "epoch": 23.73, "eval_loss": 0.38946789503097534, "eval_runtime": 6.7208, "eval_samples_per_second": 14.879, "eval_wer": 0.32521315468940315, "step": 145900 }, { "epoch": 23.74, "learning_rate": 5.041605482134117e-06, "loss": NaN, "step": 146000 }, { "epoch": 23.74, "eval_loss": 0.42941275238990784, "eval_runtime": 9.2546, "eval_samples_per_second": 10.805, "eval_wer": 0.3276492082825822, "step": 146000 }, { "epoch": 23.76, "learning_rate": 4.976341980747267e-06, "loss": NaN, "step": 146100 }, { "epoch": 23.76, "eval_loss": 0.3988470435142517, "eval_runtime": 8.8515, "eval_samples_per_second": 11.298, "eval_wer": 0.3337393422655298, "step": 146100 }, { "epoch": 23.78, "learning_rate": 4.911078479360418e-06, "loss": NaN, "step": 146200 }, { "epoch": 23.78, "eval_loss": 0.37505969405174255, "eval_runtime": 8.8108, "eval_samples_per_second": 11.35, "eval_wer": 0.3264311814859927, "step": 146200 }, { "epoch": 23.79, "learning_rate": 4.8458149779735685e-06, "loss": NaN, "step": 146300 }, { "epoch": 23.79, "eval_loss": 0.4064733386039734, "eval_runtime": 8.0955, "eval_samples_per_second": 12.353, "eval_wer": 0.33495736906211937, "step": 146300 }, { "epoch": 23.81, "learning_rate": 4.7805514765867196e-06, "loss": NaN, "step": 146400 }, { "epoch": 23.81, "eval_loss": 0.38152438402175903, "eval_runtime": 9.0081, "eval_samples_per_second": 11.101, "eval_wer": 0.3264311814859927, "step": 146400 }, { "epoch": 23.83, "learning_rate": 4.71528797519987e-06, "loss": NaN, "step": 146500 }, { "epoch": 23.83, "eval_loss": 0.4286877512931824, "eval_runtime": 34.8815, "eval_samples_per_second": 2.867, "eval_wer": 0.34957369062119364, "step": 146500 }, { "epoch": 23.84, "learning_rate": 4.65002447381302e-06, "loss": NaN, "step": 146600 }, { "epoch": 23.84, "eval_loss": 0.3909842371940613, "eval_runtime": 6.7922, "eval_samples_per_second": 14.723, "eval_wer": 0.3215590742996346, "step": 146600 }, { "epoch": 23.86, "learning_rate": 4.58476097242617e-06, "loss": NaN, "step": 146700 }, { "epoch": 23.86, "eval_loss": 0.4343806505203247, "eval_runtime": 8.1254, "eval_samples_per_second": 12.307, "eval_wer": 0.33008526187576126, "step": 146700 }, { "epoch": 23.87, "learning_rate": 4.519497471039322e-06, "loss": NaN, "step": 146800 }, { "epoch": 23.87, "eval_loss": 0.38777297735214233, "eval_runtime": 8.5033, "eval_samples_per_second": 11.76, "eval_wer": 0.3313032886723508, "step": 146800 }, { "epoch": 23.89, "learning_rate": 4.454233969652472e-06, "loss": NaN, "step": 146900 }, { "epoch": 23.89, "eval_loss": 0.40899020433425903, "eval_runtime": 7.6862, "eval_samples_per_second": 13.01, "eval_wer": 0.3227771010962241, "step": 146900 }, { "epoch": 23.91, "learning_rate": 4.388970468265623e-06, "loss": NaN, "step": 147000 }, { "epoch": 23.91, "eval_loss": 0.39654624462127686, "eval_runtime": 9.0568, "eval_samples_per_second": 11.041, "eval_wer": 0.3313032886723508, "step": 147000 }, { "epoch": 23.92, "learning_rate": 4.323706966878773e-06, "loss": NaN, "step": 147100 }, { "epoch": 23.92, "eval_loss": 0.5828571915626526, "eval_runtime": 9.0588, "eval_samples_per_second": 11.039, "eval_wer": 0.33617539585870887, "step": 147100 }, { "epoch": 23.94, "learning_rate": 4.258443465491924e-06, "loss": NaN, "step": 147200 }, { "epoch": 23.94, "eval_loss": 0.4280412793159485, "eval_runtime": 8.3581, "eval_samples_per_second": 11.964, "eval_wer": 0.33495736906211937, "step": 147200 }, { "epoch": 23.96, "learning_rate": 4.193179964105074e-06, "loss": NaN, "step": 147300 }, { "epoch": 23.96, "eval_loss": 0.3880465030670166, "eval_runtime": 8.3284, "eval_samples_per_second": 12.007, "eval_wer": 0.3215590742996346, "step": 147300 }, { "epoch": 23.97, "learning_rate": 4.127916462718225e-06, "loss": NaN, "step": 147400 }, { "epoch": 23.97, "eval_loss": 0.4489409923553467, "eval_runtime": 8.5866, "eval_samples_per_second": 11.646, "eval_wer": 0.33617539585870887, "step": 147400 }, { "epoch": 23.99, "learning_rate": 4.062652961331375e-06, "loss": NaN, "step": 147500 }, { "epoch": 23.99, "eval_loss": 0.41607800126075745, "eval_runtime": 8.1254, "eval_samples_per_second": 12.307, "eval_wer": 0.3471376370280146, "step": 147500 }, { "epoch": 24.0, "learning_rate": 3.9973894599445265e-06, "loss": NaN, "step": 147600 }, { "epoch": 24.0, "eval_loss": 0.38375845551490784, "eval_runtime": 8.373, "eval_samples_per_second": 11.943, "eval_wer": 0.3227771010962241, "step": 147600 }, { "epoch": 24.02, "learning_rate": 3.932125958557677e-06, "loss": NaN, "step": 147700 }, { "epoch": 24.02, "eval_loss": 0.4201222360134125, "eval_runtime": 8.7128, "eval_samples_per_second": 11.477, "eval_wer": 0.3447015834348356, "step": 147700 }, { "epoch": 24.04, "learning_rate": 3.866862457170827e-06, "loss": NaN, "step": 147800 }, { "epoch": 24.04, "eval_loss": 0.3707936108112335, "eval_runtime": 8.5162, "eval_samples_per_second": 11.742, "eval_wer": 0.3215590742996346, "step": 147800 }, { "epoch": 24.05, "learning_rate": 3.8015989557839784e-06, "loss": NaN, "step": 147900 }, { "epoch": 24.05, "eval_loss": 0.4147247076034546, "eval_runtime": 7.5178, "eval_samples_per_second": 13.302, "eval_wer": 0.3373934226552984, "step": 147900 }, { "epoch": 24.07, "learning_rate": 3.7363354543971286e-06, "loss": NaN, "step": 148000 }, { "epoch": 24.07, "eval_loss": 0.3992792069911957, "eval_runtime": 8.0681, "eval_samples_per_second": 12.395, "eval_wer": 0.3386114494518879, "step": 148000 }, { "epoch": 24.09, "learning_rate": 3.6710719530102793e-06, "loss": NaN, "step": 148100 }, { "epoch": 24.09, "eval_loss": 0.4286440312862396, "eval_runtime": 6.9843, "eval_samples_per_second": 14.318, "eval_wer": 0.34348355663824603, "step": 148100 }, { "epoch": 24.1, "learning_rate": 3.60580845162343e-06, "loss": NaN, "step": 148200 }, { "epoch": 24.1, "eval_loss": 0.4791194200515747, "eval_runtime": 7.4344, "eval_samples_per_second": 13.451, "eval_wer": 0.3447015834348356, "step": 148200 }, { "epoch": 24.12, "learning_rate": 3.54054495023658e-06, "loss": NaN, "step": 148300 }, { "epoch": 24.12, "eval_loss": 0.3939591348171234, "eval_runtime": 7.3768, "eval_samples_per_second": 13.556, "eval_wer": 0.34348355663824603, "step": 148300 }, { "epoch": 24.13, "learning_rate": 3.4752814488497308e-06, "loss": NaN, "step": 148400 }, { "epoch": 24.13, "eval_loss": 0.4074297249317169, "eval_runtime": 6.9657, "eval_samples_per_second": 14.356, "eval_wer": 0.3337393422655298, "step": 148400 }, { "epoch": 24.15, "learning_rate": 3.410017947462882e-06, "loss": NaN, "step": 148500 }, { "epoch": 24.15, "eval_loss": 0.42010945081710815, "eval_runtime": 7.4953, "eval_samples_per_second": 13.342, "eval_wer": 0.3373934226552984, "step": 148500 }, { "epoch": 24.17, "learning_rate": 3.3447544460760325e-06, "loss": NaN, "step": 148600 }, { "epoch": 24.17, "eval_loss": 0.3944063186645508, "eval_runtime": 8.1881, "eval_samples_per_second": 12.213, "eval_wer": 0.3313032886723508, "step": 148600 }, { "epoch": 24.18, "learning_rate": 3.2794909446891827e-06, "loss": NaN, "step": 148700 }, { "epoch": 24.18, "eval_loss": 0.38928863406181335, "eval_runtime": 9.1121, "eval_samples_per_second": 10.974, "eval_wer": 0.3325213154689403, "step": 148700 }, { "epoch": 24.2, "learning_rate": 3.2142274433023334e-06, "loss": NaN, "step": 148800 }, { "epoch": 24.2, "eval_loss": 0.4040900766849518, "eval_runtime": 7.8824, "eval_samples_per_second": 12.687, "eval_wer": 0.33495736906211937, "step": 148800 }, { "epoch": 24.22, "learning_rate": 3.1489639419154836e-06, "loss": NaN, "step": 148900 }, { "epoch": 24.22, "eval_loss": 0.39032647013664246, "eval_runtime": 6.7307, "eval_samples_per_second": 14.857, "eval_wer": 0.3215590742996346, "step": 148900 }, { "epoch": 24.23, "learning_rate": 3.0837004405286347e-06, "loss": NaN, "step": 149000 }, { "epoch": 24.23, "eval_loss": 0.40411511063575745, "eval_runtime": 8.2756, "eval_samples_per_second": 12.084, "eval_wer": 0.32886723507917176, "step": 149000 }, { "epoch": 24.25, "learning_rate": 3.018436939141785e-06, "loss": NaN, "step": 149100 }, { "epoch": 24.25, "eval_loss": 0.43083474040031433, "eval_runtime": 9.0012, "eval_samples_per_second": 11.11, "eval_wer": 0.3227771010962241, "step": 149100 }, { "epoch": 24.26, "learning_rate": 2.953173437754936e-06, "loss": NaN, "step": 149200 }, { "epoch": 24.26, "eval_loss": 0.3937508463859558, "eval_runtime": 7.7288, "eval_samples_per_second": 12.939, "eval_wer": 0.315468940316687, "step": 149200 }, { "epoch": 24.28, "learning_rate": 2.887909936368086e-06, "loss": NaN, "step": 149300 }, { "epoch": 24.28, "eval_loss": 0.3944269120693207, "eval_runtime": 6.9338, "eval_samples_per_second": 14.422, "eval_wer": 0.32399512789281365, "step": 149300 }, { "epoch": 24.3, "learning_rate": 2.822646434981237e-06, "loss": NaN, "step": 149400 }, { "epoch": 24.3, "eval_loss": 0.5013560652732849, "eval_runtime": 7.8923, "eval_samples_per_second": 12.671, "eval_wer": 0.34957369062119364, "step": 149400 }, { "epoch": 24.31, "learning_rate": 2.7573829335943875e-06, "loss": NaN, "step": 149500 }, { "epoch": 24.31, "eval_loss": 0.39637017250061035, "eval_runtime": 8.1021, "eval_samples_per_second": 12.343, "eval_wer": 0.3325213154689403, "step": 149500 }, { "epoch": 24.33, "learning_rate": 2.692119432207538e-06, "loss": NaN, "step": 149600 }, { "epoch": 24.33, "eval_loss": 0.4175480306148529, "eval_runtime": 8.4026, "eval_samples_per_second": 11.901, "eval_wer": 0.3325213154689403, "step": 149600 }, { "epoch": 24.35, "learning_rate": 2.6268559308206883e-06, "loss": NaN, "step": 149700 }, { "epoch": 24.35, "eval_loss": 0.4383509159088135, "eval_runtime": 8.2617, "eval_samples_per_second": 12.104, "eval_wer": 0.3276492082825822, "step": 149700 }, { "epoch": 24.36, "learning_rate": 2.5615924294338394e-06, "loss": NaN, "step": 149800 }, { "epoch": 24.36, "eval_loss": 0.3883654475212097, "eval_runtime": 7.6932, "eval_samples_per_second": 12.999, "eval_wer": 0.32886723507917176, "step": 149800 }, { "epoch": 24.38, "learning_rate": 2.4963289280469896e-06, "loss": NaN, "step": 149900 }, { "epoch": 24.38, "eval_loss": 0.42128920555114746, "eval_runtime": 7.3824, "eval_samples_per_second": 13.546, "eval_wer": 0.33008526187576126, "step": 149900 }, { "epoch": 24.39, "learning_rate": 2.4310654266601403e-06, "loss": NaN, "step": 150000 }, { "epoch": 24.39, "eval_loss": 0.37016811966896057, "eval_runtime": 7.3966, "eval_samples_per_second": 13.52, "eval_wer": 0.3264311814859927, "step": 150000 }, { "epoch": 24.41, "learning_rate": 2.365801925273291e-06, "loss": NaN, "step": 150100 }, { "epoch": 24.41, "eval_loss": 0.4776330888271332, "eval_runtime": 8.1524, "eval_samples_per_second": 12.266, "eval_wer": 0.3276492082825822, "step": 150100 }, { "epoch": 24.43, "learning_rate": 2.3005384238864416e-06, "loss": NaN, "step": 150200 }, { "epoch": 24.43, "eval_loss": 0.40871936082839966, "eval_runtime": 7.8643, "eval_samples_per_second": 12.716, "eval_wer": 0.3276492082825822, "step": 150200 }, { "epoch": 24.44, "learning_rate": 2.235274922499592e-06, "loss": NaN, "step": 150300 }, { "epoch": 24.44, "eval_loss": 0.4232352375984192, "eval_runtime": 7.5631, "eval_samples_per_second": 13.222, "eval_wer": 0.3325213154689403, "step": 150300 }, { "epoch": 24.46, "learning_rate": 2.170011421112743e-06, "loss": NaN, "step": 150400 }, { "epoch": 24.46, "eval_loss": 0.3953474164009094, "eval_runtime": 8.1896, "eval_samples_per_second": 12.211, "eval_wer": 0.32399512789281365, "step": 150400 }, { "epoch": 24.48, "learning_rate": 2.1047479197258935e-06, "loss": NaN, "step": 150500 }, { "epoch": 24.48, "eval_loss": 0.40007010102272034, "eval_runtime": 8.6682, "eval_samples_per_second": 11.536, "eval_wer": 0.32886723507917176, "step": 150500 }, { "epoch": 24.49, "learning_rate": 2.039484418339044e-06, "loss": NaN, "step": 150600 }, { "epoch": 24.49, "eval_loss": 0.4761078357696533, "eval_runtime": 9.2295, "eval_samples_per_second": 10.835, "eval_wer": 0.32886723507917176, "step": 150600 }, { "epoch": 24.51, "learning_rate": 1.9742209169521948e-06, "loss": NaN, "step": 150700 }, { "epoch": 24.51, "eval_loss": 0.4079989194869995, "eval_runtime": 8.3587, "eval_samples_per_second": 11.964, "eval_wer": 0.32886723507917176, "step": 150700 }, { "epoch": 24.52, "learning_rate": 1.908957415565345e-06, "loss": NaN, "step": 150800 }, { "epoch": 24.52, "eval_loss": 0.3929882049560547, "eval_runtime": 7.1125, "eval_samples_per_second": 14.06, "eval_wer": 0.33617539585870887, "step": 150800 }, { "epoch": 24.54, "learning_rate": 1.8436939141784959e-06, "loss": NaN, "step": 150900 }, { "epoch": 24.54, "eval_loss": 0.44755759835243225, "eval_runtime": 7.8989, "eval_samples_per_second": 12.66, "eval_wer": 0.3373934226552984, "step": 150900 }, { "epoch": 24.56, "learning_rate": 1.7784304127916463e-06, "loss": NaN, "step": 151000 }, { "epoch": 24.56, "eval_loss": 0.3977559208869934, "eval_runtime": 8.7185, "eval_samples_per_second": 11.47, "eval_wer": 0.32886723507917176, "step": 151000 }, { "epoch": 24.57, "learning_rate": 1.713166911404797e-06, "loss": NaN, "step": 151100 }, { "epoch": 24.57, "eval_loss": 0.4052342176437378, "eval_runtime": 7.8682, "eval_samples_per_second": 12.709, "eval_wer": 0.34226552984165654, "step": 151100 }, { "epoch": 24.59, "learning_rate": 1.6479034100179476e-06, "loss": NaN, "step": 151200 }, { "epoch": 24.59, "eval_loss": 0.4712124168872833, "eval_runtime": 8.3125, "eval_samples_per_second": 12.03, "eval_wer": 0.34226552984165654, "step": 151200 }, { "epoch": 24.61, "learning_rate": 1.5826399086310982e-06, "loss": NaN, "step": 151300 }, { "epoch": 24.61, "eval_loss": 0.3818945288658142, "eval_runtime": 7.968, "eval_samples_per_second": 12.55, "eval_wer": 0.33495736906211937, "step": 151300 }, { "epoch": 24.62, "learning_rate": 1.5173764072442489e-06, "loss": NaN, "step": 151400 }, { "epoch": 24.62, "eval_loss": 0.44341355562210083, "eval_runtime": 8.224, "eval_samples_per_second": 12.16, "eval_wer": 0.341047503045067, "step": 151400 }, { "epoch": 24.64, "learning_rate": 1.4521129058573993e-06, "loss": NaN, "step": 151500 }, { "epoch": 24.64, "eval_loss": 0.4101918041706085, "eval_runtime": 6.9383, "eval_samples_per_second": 14.413, "eval_wer": 0.3215590742996346, "step": 151500 }, { "epoch": 24.65, "learning_rate": 1.38684940447055e-06, "loss": NaN, "step": 151600 }, { "epoch": 24.65, "eval_loss": 0.39534106850624084, "eval_runtime": 8.9247, "eval_samples_per_second": 11.205, "eval_wer": 0.32886723507917176, "step": 151600 }, { "epoch": 24.67, "learning_rate": 1.3215859030837006e-06, "loss": NaN, "step": 151700 }, { "epoch": 24.67, "eval_loss": 0.3738269805908203, "eval_runtime": 7.6097, "eval_samples_per_second": 13.141, "eval_wer": 0.3264311814859927, "step": 151700 }, { "epoch": 24.69, "learning_rate": 1.256322401696851e-06, "loss": NaN, "step": 151800 }, { "epoch": 24.69, "eval_loss": 0.5128779411315918, "eval_runtime": 8.2012, "eval_samples_per_second": 12.193, "eval_wer": 0.3313032886723508, "step": 151800 }, { "epoch": 24.7, "learning_rate": 1.1910589003100017e-06, "loss": NaN, "step": 151900 }, { "epoch": 24.7, "eval_loss": 0.41557371616363525, "eval_runtime": 10.0221, "eval_samples_per_second": 9.978, "eval_wer": 0.3264311814859927, "step": 151900 }, { "epoch": 24.72, "learning_rate": 1.1257953989231523e-06, "loss": NaN, "step": 152000 }, { "epoch": 24.72, "eval_loss": 0.3804296851158142, "eval_runtime": 6.86, "eval_samples_per_second": 14.577, "eval_wer": 0.3166869671132765, "step": 152000 }, { "epoch": 24.74, "learning_rate": 1.060531897536303e-06, "loss": NaN, "step": 152100 }, { "epoch": 24.74, "eval_loss": 0.37247443199157715, "eval_runtime": 8.5022, "eval_samples_per_second": 11.762, "eval_wer": 0.31790499390986604, "step": 152100 }, { "epoch": 24.75, "learning_rate": 9.952683961494534e-07, "loss": NaN, "step": 152200 }, { "epoch": 24.75, "eval_loss": 0.4154191315174103, "eval_runtime": 7.3705, "eval_samples_per_second": 13.568, "eval_wer": 0.33495736906211937, "step": 152200 }, { "epoch": 24.77, "learning_rate": 9.30004894762604e-07, "loss": NaN, "step": 152300 }, { "epoch": 24.77, "eval_loss": 0.46218574047088623, "eval_runtime": 8.1433, "eval_samples_per_second": 12.28, "eval_wer": 0.34226552984165654, "step": 152300 }, { "epoch": 24.78, "learning_rate": 8.647413933757547e-07, "loss": NaN, "step": 152400 }, { "epoch": 24.78, "eval_loss": 0.39375588297843933, "eval_runtime": 6.9811, "eval_samples_per_second": 14.324, "eval_wer": 0.29963459196102316, "step": 152400 }, { "epoch": 24.8, "learning_rate": 7.994778919889051e-07, "loss": NaN, "step": 152500 }, { "epoch": 24.8, "eval_loss": 0.4095069169998169, "eval_runtime": 7.9503, "eval_samples_per_second": 12.578, "eval_wer": 0.3373934226552984, "step": 152500 }, { "epoch": 24.82, "learning_rate": 7.342143906020558e-07, "loss": NaN, "step": 152600 }, { "epoch": 24.82, "eval_loss": 0.431011438369751, "eval_runtime": 7.7649, "eval_samples_per_second": 12.878, "eval_wer": 0.3313032886723508, "step": 152600 }, { "epoch": 24.83, "learning_rate": 6.689508892152064e-07, "loss": NaN, "step": 152700 }, { "epoch": 24.83, "eval_loss": 0.39817845821380615, "eval_runtime": 6.8105, "eval_samples_per_second": 14.683, "eval_wer": 0.3264311814859927, "step": 152700 }, { "epoch": 24.85, "learning_rate": 6.036873878283571e-07, "loss": NaN, "step": 152800 }, { "epoch": 24.85, "eval_loss": 0.3910774886608124, "eval_runtime": 7.13, "eval_samples_per_second": 14.025, "eval_wer": 0.32034104750304504, "step": 152800 }, { "epoch": 24.87, "learning_rate": 5.384238864415076e-07, "loss": NaN, "step": 152900 }, { "epoch": 24.87, "eval_loss": 0.40002116560935974, "eval_runtime": 7.5393, "eval_samples_per_second": 13.264, "eval_wer": 0.31912302070645554, "step": 152900 }, { "epoch": 24.88, "learning_rate": 4.7316038505465825e-07, "loss": NaN, "step": 153000 }, { "epoch": 24.88, "eval_loss": 0.40296486020088196, "eval_runtime": 9.5006, "eval_samples_per_second": 10.526, "eval_wer": 0.33617539585870887, "step": 153000 }, { "epoch": 24.9, "learning_rate": 4.078968836678088e-07, "loss": NaN, "step": 153100 }, { "epoch": 24.9, "eval_loss": 0.3949245810508728, "eval_runtime": 9.1847, "eval_samples_per_second": 10.888, "eval_wer": 0.3313032886723508, "step": 153100 }, { "epoch": 24.91, "learning_rate": 3.426333822809594e-07, "loss": NaN, "step": 153200 }, { "epoch": 24.91, "eval_loss": 0.43339037895202637, "eval_runtime": 7.6951, "eval_samples_per_second": 12.995, "eval_wer": 0.34348355663824603, "step": 153200 }, { "epoch": 24.93, "learning_rate": 2.7736988089410997e-07, "loss": NaN, "step": 153300 }, { "epoch": 24.93, "eval_loss": 0.439365416765213, "eval_runtime": 6.9543, "eval_samples_per_second": 14.38, "eval_wer": 0.341047503045067, "step": 153300 }, { "epoch": 24.95, "learning_rate": 2.121063795072606e-07, "loss": NaN, "step": 153400 }, { "epoch": 24.95, "eval_loss": 0.4255564510822296, "eval_runtime": 8.4137, "eval_samples_per_second": 11.885, "eval_wer": 0.3373934226552984, "step": 153400 }, { "epoch": 24.96, "learning_rate": 1.4684287812041115e-07, "loss": NaN, "step": 153500 }, { "epoch": 24.96, "eval_loss": 0.3864142894744873, "eval_runtime": 9.5624, "eval_samples_per_second": 10.458, "eval_wer": 0.33008526187576126, "step": 153500 }, { "epoch": 24.98, "learning_rate": 8.157937673356176e-08, "loss": NaN, "step": 153600 }, { "epoch": 24.98, "eval_loss": 0.4688411056995392, "eval_runtime": 7.8079, "eval_samples_per_second": 12.808, "eval_wer": 0.3325213154689403, "step": 153600 }, { "epoch": 25.0, "learning_rate": 1.6315875346712352e-08, "loss": NaN, "step": 153700 }, { "epoch": 25.0, "eval_loss": 0.40519940853118896, "eval_runtime": 8.6405, "eval_samples_per_second": 11.573, "eval_wer": 0.32521315468940315, "step": 153700 }, { "epoch": 25.0, "step": 153725, "total_flos": 7.526023236355262e+20, "train_runtime": 258038.6163, "train_samples_per_second": 0.596 } ], "max_steps": 153725, "num_train_epochs": 25, "total_flos": 7.526023236355262e+20, "trial_name": null, "trial_params": null }