{ "best_metric": null, "best_model_checkpoint": null, "epoch": 4.8, "global_step": 36000, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.01, "learning_rate": 0.0001, "loss": 16.4891, "step": 100 }, { "epoch": 0.01, "eval_loss": 7.453255653381348, "eval_runtime": 17.1907, "eval_samples_per_second": 4.654, "eval_wer": 1.0, "step": 100 }, { "epoch": 0.03, "learning_rate": 9.999555535801592e-05, "loss": 3.6143, "step": 200 }, { "epoch": 0.03, "eval_loss": 3.6875462532043457, "eval_runtime": 17.2862, "eval_samples_per_second": 4.628, "eval_wer": 1.0, "step": 200 }, { "epoch": 0.04, "learning_rate": 9.999111071603183e-05, "loss": 3.0476, "step": 300 }, { "epoch": 0.04, "eval_loss": 3.5380682945251465, "eval_runtime": 17.234, "eval_samples_per_second": 4.642, "eval_wer": 1.0, "step": 300 }, { "epoch": 0.05, "learning_rate": 9.998666607404774e-05, "loss": 3.0296, "step": 400 }, { "epoch": 0.05, "eval_loss": 3.5734219551086426, "eval_runtime": 17.3146, "eval_samples_per_second": 4.62, "eval_wer": 1.0, "step": 400 }, { "epoch": 0.07, "learning_rate": 9.998222143206365e-05, "loss": 3.04, "step": 500 }, { "epoch": 0.07, "eval_loss": 3.5502994060516357, "eval_runtime": 17.3078, "eval_samples_per_second": 4.622, "eval_wer": 1.0, "step": 500 }, { "epoch": 0.08, "learning_rate": 9.997777679007957e-05, "loss": Infinity, "step": 600 }, { "epoch": 0.08, "eval_loss": 3.3948416709899902, "eval_runtime": 17.323, "eval_samples_per_second": 4.618, "eval_wer": 1.0, "step": 600 }, { "epoch": 0.09, "learning_rate": 9.997333214809547e-05, "loss": NaN, "step": 700 }, { "epoch": 0.09, "eval_loss": 3.2798409461975098, "eval_runtime": 17.422, "eval_samples_per_second": 4.592, "eval_wer": 1.0, "step": 700 }, { "epoch": 0.11, "learning_rate": 9.996888750611138e-05, "loss": NaN, "step": 800 }, { "epoch": 0.11, "eval_loss": 3.1693687438964844, "eval_runtime": 17.3276, "eval_samples_per_second": 4.617, "eval_wer": 1.0, "step": 800 }, { "epoch": 0.12, "learning_rate": 9.99644428641273e-05, "loss": NaN, "step": 900 }, { "epoch": 0.12, "eval_loss": 3.0904104709625244, "eval_runtime": 17.3305, "eval_samples_per_second": 4.616, "eval_wer": 1.0, "step": 900 }, { "epoch": 0.13, "learning_rate": 9.995999822214322e-05, "loss": NaN, "step": 1000 }, { "epoch": 0.13, "eval_loss": 2.940812587738037, "eval_runtime": 17.5447, "eval_samples_per_second": 4.56, "eval_wer": 0.9968992248062015, "step": 1000 }, { "epoch": 0.15, "learning_rate": 9.995555358015912e-05, "loss": NaN, "step": 1100 }, { "epoch": 0.15, "eval_loss": 2.078176259994507, "eval_runtime": 17.4887, "eval_samples_per_second": 4.574, "eval_wer": 0.9906976744186047, "step": 1100 }, { "epoch": 0.16, "learning_rate": 9.995110893817503e-05, "loss": NaN, "step": 1200 }, { "epoch": 0.16, "eval_loss": 1.6720739603042603, "eval_runtime": 17.4985, "eval_samples_per_second": 4.572, "eval_wer": 0.9023255813953488, "step": 1200 }, { "epoch": 0.17, "learning_rate": 9.994666429619095e-05, "loss": NaN, "step": 1300 }, { "epoch": 0.17, "eval_loss": 1.5600072145462036, "eval_runtime": 17.6605, "eval_samples_per_second": 4.53, "eval_wer": 0.8635658914728682, "step": 1300 }, { "epoch": 0.19, "learning_rate": 9.994221965420686e-05, "loss": NaN, "step": 1400 }, { "epoch": 0.19, "eval_loss": 1.4188871383666992, "eval_runtime": 17.4862, "eval_samples_per_second": 4.575, "eval_wer": 0.8356589147286821, "step": 1400 }, { "epoch": 0.2, "learning_rate": 9.993777501222276e-05, "loss": NaN, "step": 1500 }, { "epoch": 0.2, "eval_loss": 1.2592538595199585, "eval_runtime": 17.3951, "eval_samples_per_second": 4.599, "eval_wer": 0.7906976744186046, "step": 1500 }, { "epoch": 0.21, "learning_rate": 9.993333037023869e-05, "loss": NaN, "step": 1600 }, { "epoch": 0.21, "eval_loss": 1.1907216310501099, "eval_runtime": 17.4046, "eval_samples_per_second": 4.596, "eval_wer": 0.7565891472868217, "step": 1600 }, { "epoch": 0.23, "learning_rate": 9.99288857282546e-05, "loss": NaN, "step": 1700 }, { "epoch": 0.23, "eval_loss": 1.3044092655181885, "eval_runtime": 17.3968, "eval_samples_per_second": 4.599, "eval_wer": 0.7829457364341085, "step": 1700 }, { "epoch": 0.24, "learning_rate": 9.992444108627051e-05, "loss": NaN, "step": 1800 }, { "epoch": 0.24, "eval_loss": 1.1965358257293701, "eval_runtime": 17.3177, "eval_samples_per_second": 4.62, "eval_wer": 0.7503875968992249, "step": 1800 }, { "epoch": 0.25, "learning_rate": 9.991999644428641e-05, "loss": NaN, "step": 1900 }, { "epoch": 0.25, "eval_loss": 1.1158918142318726, "eval_runtime": 17.4315, "eval_samples_per_second": 4.589, "eval_wer": 0.7007751937984497, "step": 1900 }, { "epoch": 0.27, "learning_rate": 9.991555180230233e-05, "loss": NaN, "step": 2000 }, { "epoch": 0.27, "eval_loss": 1.139773964881897, "eval_runtime": 17.4304, "eval_samples_per_second": 4.59, "eval_wer": 0.7286821705426356, "step": 2000 }, { "epoch": 0.28, "learning_rate": 9.991110716031824e-05, "loss": NaN, "step": 2100 }, { "epoch": 0.28, "eval_loss": 0.9968563318252563, "eval_runtime": 17.3268, "eval_samples_per_second": 4.617, "eval_wer": 0.6821705426356589, "step": 2100 }, { "epoch": 0.29, "learning_rate": 9.990666251833415e-05, "loss": NaN, "step": 2200 }, { "epoch": 0.29, "eval_loss": 0.9753952026367188, "eval_runtime": 17.36, "eval_samples_per_second": 4.608, "eval_wer": 0.6666666666666666, "step": 2200 }, { "epoch": 0.31, "learning_rate": 9.990221787635007e-05, "loss": NaN, "step": 2300 }, { "epoch": 0.31, "eval_loss": 0.9655939340591431, "eval_runtime": 17.3128, "eval_samples_per_second": 4.621, "eval_wer": 0.6651162790697674, "step": 2300 }, { "epoch": 0.32, "learning_rate": 9.989777323436598e-05, "loss": NaN, "step": 2400 }, { "epoch": 0.32, "eval_loss": 0.9793145060539246, "eval_runtime": 17.3154, "eval_samples_per_second": 4.62, "eval_wer": 0.6604651162790698, "step": 2400 }, { "epoch": 0.33, "learning_rate": 9.989332859238189e-05, "loss": NaN, "step": 2500 }, { "epoch": 0.33, "eval_loss": 0.9911659955978394, "eval_runtime": 17.3868, "eval_samples_per_second": 4.601, "eval_wer": 0.6558139534883721, "step": 2500 }, { "epoch": 0.35, "learning_rate": 9.98888839503978e-05, "loss": NaN, "step": 2600 }, { "epoch": 0.35, "eval_loss": 0.9256990551948547, "eval_runtime": 17.3404, "eval_samples_per_second": 4.613, "eval_wer": 0.6713178294573643, "step": 2600 }, { "epoch": 0.36, "learning_rate": 9.988443930841371e-05, "loss": NaN, "step": 2700 }, { "epoch": 0.36, "eval_loss": 0.8806975483894348, "eval_runtime": 17.3516, "eval_samples_per_second": 4.611, "eval_wer": 0.6325581395348837, "step": 2700 }, { "epoch": 0.37, "learning_rate": 9.987999466642962e-05, "loss": NaN, "step": 2800 }, { "epoch": 0.37, "eval_loss": 0.9201020002365112, "eval_runtime": 17.4402, "eval_samples_per_second": 4.587, "eval_wer": 0.6604651162790698, "step": 2800 }, { "epoch": 0.39, "learning_rate": 9.987555002444555e-05, "loss": NaN, "step": 2900 }, { "epoch": 0.39, "eval_loss": 0.8914031982421875, "eval_runtime": 17.3777, "eval_samples_per_second": 4.604, "eval_wer": 0.6248062015503876, "step": 2900 }, { "epoch": 0.4, "learning_rate": 9.987110538246144e-05, "loss": NaN, "step": 3000 }, { "epoch": 0.4, "eval_loss": 0.8329198956489563, "eval_runtime": 17.334, "eval_samples_per_second": 4.615, "eval_wer": 0.6186046511627907, "step": 3000 }, { "epoch": 0.41, "learning_rate": 9.986666074047736e-05, "loss": NaN, "step": 3100 }, { "epoch": 0.41, "eval_loss": 0.8818947672843933, "eval_runtime": 17.4737, "eval_samples_per_second": 4.578, "eval_wer": 0.6248062015503876, "step": 3100 }, { "epoch": 0.43, "learning_rate": 9.986221609849327e-05, "loss": NaN, "step": 3200 }, { "epoch": 0.43, "eval_loss": 0.9315568804740906, "eval_runtime": 17.3225, "eval_samples_per_second": 4.618, "eval_wer": 0.6155038759689923, "step": 3200 }, { "epoch": 0.44, "learning_rate": 9.985777145650919e-05, "loss": NaN, "step": 3300 }, { "epoch": 0.44, "eval_loss": 0.891169548034668, "eval_runtime": 17.3188, "eval_samples_per_second": 4.619, "eval_wer": 0.6062015503875969, "step": 3300 }, { "epoch": 0.45, "learning_rate": 9.985332681452509e-05, "loss": NaN, "step": 3400 }, { "epoch": 0.45, "eval_loss": 0.8204320073127747, "eval_runtime": 17.2776, "eval_samples_per_second": 4.63, "eval_wer": 0.6217054263565891, "step": 3400 }, { "epoch": 0.47, "learning_rate": 9.9848882172541e-05, "loss": NaN, "step": 3500 }, { "epoch": 0.47, "eval_loss": 0.7907635569572449, "eval_runtime": 17.4135, "eval_samples_per_second": 4.594, "eval_wer": 0.6124031007751938, "step": 3500 }, { "epoch": 0.48, "learning_rate": 9.984443753055693e-05, "loss": NaN, "step": 3600 }, { "epoch": 0.48, "eval_loss": 0.7738734483718872, "eval_runtime": 17.2483, "eval_samples_per_second": 4.638, "eval_wer": 0.5922480620155038, "step": 3600 }, { "epoch": 0.49, "learning_rate": 9.983999288857284e-05, "loss": NaN, "step": 3700 }, { "epoch": 0.49, "eval_loss": 0.8443992733955383, "eval_runtime": 17.3843, "eval_samples_per_second": 4.602, "eval_wer": 0.6341085271317829, "step": 3700 }, { "epoch": 0.51, "learning_rate": 9.983554824658873e-05, "loss": NaN, "step": 3800 }, { "epoch": 0.51, "eval_loss": 0.8256866335868835, "eval_runtime": 17.372, "eval_samples_per_second": 4.605, "eval_wer": 0.6031007751937985, "step": 3800 }, { "epoch": 0.52, "learning_rate": 9.983110360460466e-05, "loss": NaN, "step": 3900 }, { "epoch": 0.52, "eval_loss": 0.8002794981002808, "eval_runtime": 17.2749, "eval_samples_per_second": 4.631, "eval_wer": 0.5953488372093023, "step": 3900 }, { "epoch": 0.53, "learning_rate": 9.982665896262057e-05, "loss": NaN, "step": 4000 }, { "epoch": 0.53, "eval_loss": 0.7931162118911743, "eval_runtime": 17.3293, "eval_samples_per_second": 4.616, "eval_wer": 0.5891472868217055, "step": 4000 }, { "epoch": 0.55, "learning_rate": 9.982221432063648e-05, "loss": NaN, "step": 4100 }, { "epoch": 0.55, "eval_loss": 0.7502455711364746, "eval_runtime": 17.2431, "eval_samples_per_second": 4.64, "eval_wer": 0.5751937984496124, "step": 4100 }, { "epoch": 0.56, "learning_rate": 9.981776967865238e-05, "loss": NaN, "step": 4200 }, { "epoch": 0.56, "eval_loss": 0.752181887626648, "eval_runtime": 17.2919, "eval_samples_per_second": 4.626, "eval_wer": 0.5705426356589147, "step": 4200 }, { "epoch": 0.57, "learning_rate": 9.98133250366683e-05, "loss": NaN, "step": 4300 }, { "epoch": 0.57, "eval_loss": 0.8146766424179077, "eval_runtime": 17.3018, "eval_samples_per_second": 4.624, "eval_wer": 0.5767441860465117, "step": 4300 }, { "epoch": 0.59, "learning_rate": 9.980888039468422e-05, "loss": NaN, "step": 4400 }, { "epoch": 0.59, "eval_loss": 0.7647853493690491, "eval_runtime": 17.3393, "eval_samples_per_second": 4.614, "eval_wer": 0.5674418604651162, "step": 4400 }, { "epoch": 0.6, "learning_rate": 9.980443575270013e-05, "loss": NaN, "step": 4500 }, { "epoch": 0.6, "eval_loss": 0.8016502261161804, "eval_runtime": 17.3476, "eval_samples_per_second": 4.612, "eval_wer": 0.5751937984496124, "step": 4500 }, { "epoch": 0.61, "learning_rate": 9.979999111071604e-05, "loss": NaN, "step": 4600 }, { "epoch": 0.61, "eval_loss": 0.779055118560791, "eval_runtime": 17.31, "eval_samples_per_second": 4.622, "eval_wer": 0.5937984496124031, "step": 4600 }, { "epoch": 0.63, "learning_rate": 9.979554646873195e-05, "loss": NaN, "step": 4700 }, { "epoch": 0.63, "eval_loss": 0.7754725813865662, "eval_runtime": 17.4442, "eval_samples_per_second": 4.586, "eval_wer": 0.5705426356589147, "step": 4700 }, { "epoch": 0.64, "learning_rate": 9.979110182674786e-05, "loss": NaN, "step": 4800 }, { "epoch": 0.64, "eval_loss": 0.7565076947212219, "eval_runtime": 17.3494, "eval_samples_per_second": 4.611, "eval_wer": 0.5875968992248062, "step": 4800 }, { "epoch": 0.65, "learning_rate": 9.978665718476377e-05, "loss": NaN, "step": 4900 }, { "epoch": 0.65, "eval_loss": 0.7285895347595215, "eval_runtime": 17.2713, "eval_samples_per_second": 4.632, "eval_wer": 0.5720930232558139, "step": 4900 }, { "epoch": 0.67, "learning_rate": 9.978221254277968e-05, "loss": NaN, "step": 5000 }, { "epoch": 0.67, "eval_loss": 0.7842145562171936, "eval_runtime": 17.3978, "eval_samples_per_second": 4.598, "eval_wer": 0.5782945736434109, "step": 5000 }, { "epoch": 0.68, "learning_rate": 9.97777679007956e-05, "loss": NaN, "step": 5100 }, { "epoch": 0.68, "eval_loss": 0.7423646450042725, "eval_runtime": 17.3779, "eval_samples_per_second": 4.604, "eval_wer": 0.5767441860465117, "step": 5100 }, { "epoch": 0.69, "learning_rate": 9.977332325881152e-05, "loss": NaN, "step": 5200 }, { "epoch": 0.69, "eval_loss": 0.7223240733146667, "eval_runtime": 17.3244, "eval_samples_per_second": 4.618, "eval_wer": 0.5627906976744186, "step": 5200 }, { "epoch": 0.71, "learning_rate": 9.976887861682742e-05, "loss": NaN, "step": 5300 }, { "epoch": 0.71, "eval_loss": 0.8006032705307007, "eval_runtime": 17.3458, "eval_samples_per_second": 4.612, "eval_wer": 0.5767441860465117, "step": 5300 }, { "epoch": 0.72, "learning_rate": 9.976443397484333e-05, "loss": NaN, "step": 5400 }, { "epoch": 0.72, "eval_loss": 0.777060866355896, "eval_runtime": 17.3762, "eval_samples_per_second": 4.604, "eval_wer": 0.5891472868217055, "step": 5400 }, { "epoch": 0.73, "learning_rate": 9.975998933285924e-05, "loss": NaN, "step": 5500 }, { "epoch": 0.73, "eval_loss": 0.8182930946350098, "eval_runtime": 17.3543, "eval_samples_per_second": 4.61, "eval_wer": 0.5488372093023256, "step": 5500 }, { "epoch": 0.75, "learning_rate": 9.975554469087516e-05, "loss": NaN, "step": 5600 }, { "epoch": 0.75, "eval_loss": 0.8928201794624329, "eval_runtime": 17.3737, "eval_samples_per_second": 4.605, "eval_wer": 0.5534883720930233, "step": 5600 }, { "epoch": 0.76, "learning_rate": 9.975110004889106e-05, "loss": NaN, "step": 5700 }, { "epoch": 0.76, "eval_loss": 0.8263363838195801, "eval_runtime": 17.3975, "eval_samples_per_second": 4.598, "eval_wer": 0.57984496124031, "step": 5700 }, { "epoch": 0.77, "learning_rate": 9.974665540690697e-05, "loss": NaN, "step": 5800 }, { "epoch": 0.77, "eval_loss": 0.785165548324585, "eval_runtime": 17.3799, "eval_samples_per_second": 4.603, "eval_wer": 0.5565891472868217, "step": 5800 }, { "epoch": 0.79, "learning_rate": 9.97422107649229e-05, "loss": NaN, "step": 5900 }, { "epoch": 0.79, "eval_loss": 0.7735041379928589, "eval_runtime": 17.2943, "eval_samples_per_second": 4.626, "eval_wer": 0.5488372093023256, "step": 5900 }, { "epoch": 0.8, "learning_rate": 9.973776612293881e-05, "loss": NaN, "step": 6000 }, { "epoch": 0.8, "eval_loss": 0.7752858400344849, "eval_runtime": 17.3964, "eval_samples_per_second": 4.599, "eval_wer": 0.5596899224806201, "step": 6000 }, { "epoch": 0.81, "learning_rate": 9.97333214809547e-05, "loss": NaN, "step": 6100 }, { "epoch": 0.81, "eval_loss": 0.7791776657104492, "eval_runtime": 17.3616, "eval_samples_per_second": 4.608, "eval_wer": 0.5658914728682171, "step": 6100 }, { "epoch": 0.83, "learning_rate": 9.972887683897063e-05, "loss": NaN, "step": 6200 }, { "epoch": 0.83, "eval_loss": 0.9012916684150696, "eval_runtime": 17.2944, "eval_samples_per_second": 4.626, "eval_wer": 0.5612403100775194, "step": 6200 }, { "epoch": 0.84, "learning_rate": 9.972443219698654e-05, "loss": NaN, "step": 6300 }, { "epoch": 0.84, "eval_loss": 0.819232165813446, "eval_runtime": 17.2609, "eval_samples_per_second": 4.635, "eval_wer": 0.5503875968992248, "step": 6300 }, { "epoch": 0.85, "learning_rate": 9.971998755500245e-05, "loss": NaN, "step": 6400 }, { "epoch": 0.85, "eval_loss": 0.7208074331283569, "eval_runtime": 17.342, "eval_samples_per_second": 4.613, "eval_wer": 0.5565891472868217, "step": 6400 }, { "epoch": 0.87, "learning_rate": 9.971554291301835e-05, "loss": NaN, "step": 6500 }, { "epoch": 0.87, "eval_loss": 0.8276127576828003, "eval_runtime": 17.2796, "eval_samples_per_second": 4.63, "eval_wer": 0.5209302325581395, "step": 6500 }, { "epoch": 0.88, "learning_rate": 9.971109827103428e-05, "loss": NaN, "step": 6600 }, { "epoch": 0.88, "eval_loss": 0.6788396835327148, "eval_runtime": 17.3982, "eval_samples_per_second": 4.598, "eval_wer": 0.537984496124031, "step": 6600 }, { "epoch": 0.89, "learning_rate": 9.970665362905019e-05, "loss": NaN, "step": 6700 }, { "epoch": 0.89, "eval_loss": 0.7748047113418579, "eval_runtime": 17.3475, "eval_samples_per_second": 4.612, "eval_wer": 0.5581395348837209, "step": 6700 }, { "epoch": 0.91, "learning_rate": 9.97022089870661e-05, "loss": NaN, "step": 6800 }, { "epoch": 0.91, "eval_loss": 0.728911280632019, "eval_runtime": 17.3832, "eval_samples_per_second": 4.602, "eval_wer": 0.5581395348837209, "step": 6800 }, { "epoch": 0.92, "learning_rate": 9.969776434508201e-05, "loss": NaN, "step": 6900 }, { "epoch": 0.92, "eval_loss": 0.711087703704834, "eval_runtime": 17.3922, "eval_samples_per_second": 4.6, "eval_wer": 0.5674418604651162, "step": 6900 }, { "epoch": 0.93, "learning_rate": 9.969331970309792e-05, "loss": NaN, "step": 7000 }, { "epoch": 0.93, "eval_loss": 0.6784836649894714, "eval_runtime": 17.4107, "eval_samples_per_second": 4.595, "eval_wer": 0.5441860465116279, "step": 7000 }, { "epoch": 0.95, "learning_rate": 9.968887506111383e-05, "loss": NaN, "step": 7100 }, { "epoch": 0.95, "eval_loss": 0.6995629072189331, "eval_runtime": 17.3942, "eval_samples_per_second": 4.599, "eval_wer": 0.5503875968992248, "step": 7100 }, { "epoch": 0.96, "learning_rate": 9.968443041912974e-05, "loss": NaN, "step": 7200 }, { "epoch": 0.96, "eval_loss": 0.7547804713249207, "eval_runtime": 17.3298, "eval_samples_per_second": 4.616, "eval_wer": 0.5519379844961241, "step": 7200 }, { "epoch": 0.97, "learning_rate": 9.967998577714565e-05, "loss": NaN, "step": 7300 }, { "epoch": 0.97, "eval_loss": 0.7266980409622192, "eval_runtime": 17.3345, "eval_samples_per_second": 4.615, "eval_wer": 0.5720930232558139, "step": 7300 }, { "epoch": 0.99, "learning_rate": 9.967554113516157e-05, "loss": NaN, "step": 7400 }, { "epoch": 0.99, "eval_loss": 0.7356825470924377, "eval_runtime": 17.3815, "eval_samples_per_second": 4.603, "eval_wer": 0.5457364341085271, "step": 7400 }, { "epoch": 1.0, "learning_rate": 9.967109649317749e-05, "loss": NaN, "step": 7500 }, { "epoch": 1.0, "eval_loss": 0.6732177734375, "eval_runtime": 17.3666, "eval_samples_per_second": 4.607, "eval_wer": 0.5643410852713179, "step": 7500 }, { "epoch": 1.01, "learning_rate": 9.966665185119339e-05, "loss": NaN, "step": 7600 }, { "epoch": 1.01, "eval_loss": 0.6623905897140503, "eval_runtime": 17.3816, "eval_samples_per_second": 4.603, "eval_wer": 0.5457364341085271, "step": 7600 }, { "epoch": 1.03, "learning_rate": 9.96622072092093e-05, "loss": NaN, "step": 7700 }, { "epoch": 1.03, "eval_loss": 0.6646267175674438, "eval_runtime": 17.3087, "eval_samples_per_second": 4.622, "eval_wer": 0.5255813953488372, "step": 7700 }, { "epoch": 1.04, "learning_rate": 9.965776256722521e-05, "loss": NaN, "step": 7800 }, { "epoch": 1.04, "eval_loss": 0.6843534708023071, "eval_runtime": 17.3598, "eval_samples_per_second": 4.608, "eval_wer": 0.5472868217054263, "step": 7800 }, { "epoch": 1.05, "learning_rate": 9.965331792524114e-05, "loss": NaN, "step": 7900 }, { "epoch": 1.05, "eval_loss": 0.6367862224578857, "eval_runtime": 17.4366, "eval_samples_per_second": 4.588, "eval_wer": 0.5286821705426357, "step": 7900 }, { "epoch": 1.07, "learning_rate": 9.964887328325703e-05, "loss": NaN, "step": 8000 }, { "epoch": 1.07, "eval_loss": 0.6785103678703308, "eval_runtime": 17.4096, "eval_samples_per_second": 4.595, "eval_wer": 0.5596899224806201, "step": 8000 }, { "epoch": 1.08, "learning_rate": 9.964442864127294e-05, "loss": NaN, "step": 8100 }, { "epoch": 1.08, "eval_loss": 0.7153035998344421, "eval_runtime": 17.3734, "eval_samples_per_second": 4.605, "eval_wer": 0.5457364341085271, "step": 8100 }, { "epoch": 1.09, "learning_rate": 9.963998399928887e-05, "loss": NaN, "step": 8200 }, { "epoch": 1.09, "eval_loss": 0.6959100961685181, "eval_runtime": 17.3566, "eval_samples_per_second": 4.609, "eval_wer": 0.5395348837209303, "step": 8200 }, { "epoch": 1.11, "learning_rate": 9.963553935730478e-05, "loss": NaN, "step": 8300 }, { "epoch": 1.11, "eval_loss": 0.6857380270957947, "eval_runtime": 17.3435, "eval_samples_per_second": 4.613, "eval_wer": 0.5317829457364341, "step": 8300 }, { "epoch": 1.12, "learning_rate": 9.963109471532068e-05, "loss": NaN, "step": 8400 }, { "epoch": 1.12, "eval_loss": 0.6444656848907471, "eval_runtime": 17.3941, "eval_samples_per_second": 4.599, "eval_wer": 0.5333333333333333, "step": 8400 }, { "epoch": 1.13, "learning_rate": 9.96266500733366e-05, "loss": NaN, "step": 8500 }, { "epoch": 1.13, "eval_loss": 0.7181092500686646, "eval_runtime": 17.4167, "eval_samples_per_second": 4.593, "eval_wer": 0.5224806201550387, "step": 8500 }, { "epoch": 1.15, "learning_rate": 9.962220543135251e-05, "loss": NaN, "step": 8600 }, { "epoch": 1.15, "eval_loss": 0.7113466262817383, "eval_runtime": 17.4584, "eval_samples_per_second": 4.582, "eval_wer": 0.5333333333333333, "step": 8600 }, { "epoch": 1.16, "learning_rate": 9.961776078936843e-05, "loss": NaN, "step": 8700 }, { "epoch": 1.16, "eval_loss": 0.737747073173523, "eval_runtime": 17.3407, "eval_samples_per_second": 4.613, "eval_wer": 0.5472868217054263, "step": 8700 }, { "epoch": 1.17, "learning_rate": 9.961331614738432e-05, "loss": NaN, "step": 8800 }, { "epoch": 1.17, "eval_loss": 0.7109254598617554, "eval_runtime": 17.4806, "eval_samples_per_second": 4.577, "eval_wer": 0.5534883720930233, "step": 8800 }, { "epoch": 1.19, "learning_rate": 9.960887150540025e-05, "loss": NaN, "step": 8900 }, { "epoch": 1.19, "eval_loss": 0.774544358253479, "eval_runtime": 17.4029, "eval_samples_per_second": 4.597, "eval_wer": 0.5627906976744186, "step": 8900 }, { "epoch": 1.2, "learning_rate": 9.960442686341616e-05, "loss": NaN, "step": 9000 }, { "epoch": 1.2, "eval_loss": 0.7585596442222595, "eval_runtime": 17.4002, "eval_samples_per_second": 4.598, "eval_wer": 0.5317829457364341, "step": 9000 }, { "epoch": 1.21, "learning_rate": 9.959998222143207e-05, "loss": NaN, "step": 9100 }, { "epoch": 1.21, "eval_loss": 0.7920966744422913, "eval_runtime": 17.3362, "eval_samples_per_second": 4.615, "eval_wer": 0.5364341085271318, "step": 9100 }, { "epoch": 1.23, "learning_rate": 9.959553757944798e-05, "loss": NaN, "step": 9200 }, { "epoch": 1.23, "eval_loss": 0.7708950638771057, "eval_runtime": 17.4086, "eval_samples_per_second": 4.595, "eval_wer": 0.5333333333333333, "step": 9200 }, { "epoch": 1.24, "learning_rate": 9.959109293746389e-05, "loss": NaN, "step": 9300 }, { "epoch": 1.24, "eval_loss": 0.6876834630966187, "eval_runtime": 17.378, "eval_samples_per_second": 4.604, "eval_wer": 0.5612403100775194, "step": 9300 }, { "epoch": 1.25, "learning_rate": 9.95866482954798e-05, "loss": NaN, "step": 9400 }, { "epoch": 1.25, "eval_loss": 0.7105833292007446, "eval_runtime": 17.3931, "eval_samples_per_second": 4.6, "eval_wer": 0.5317829457364341, "step": 9400 }, { "epoch": 1.27, "learning_rate": 9.958220365349572e-05, "loss": NaN, "step": 9500 }, { "epoch": 1.27, "eval_loss": 0.7411137819290161, "eval_runtime": 17.4436, "eval_samples_per_second": 4.586, "eval_wer": 0.537984496124031, "step": 9500 }, { "epoch": 1.28, "learning_rate": 9.957775901151163e-05, "loss": NaN, "step": 9600 }, { "epoch": 1.28, "eval_loss": 0.703761875629425, "eval_runtime": 17.4301, "eval_samples_per_second": 4.59, "eval_wer": 0.5302325581395348, "step": 9600 }, { "epoch": 1.29, "learning_rate": 9.957331436952754e-05, "loss": NaN, "step": 9700 }, { "epoch": 1.29, "eval_loss": 0.6908837556838989, "eval_runtime": 17.4234, "eval_samples_per_second": 4.592, "eval_wer": 0.5286821705426357, "step": 9700 }, { "epoch": 1.31, "learning_rate": 9.956886972754345e-05, "loss": NaN, "step": 9800 }, { "epoch": 1.31, "eval_loss": 0.6668051481246948, "eval_runtime": 17.4034, "eval_samples_per_second": 4.597, "eval_wer": 0.5317829457364341, "step": 9800 }, { "epoch": 1.32, "learning_rate": 9.956442508555936e-05, "loss": NaN, "step": 9900 }, { "epoch": 1.32, "eval_loss": 0.7552028894424438, "eval_runtime": 17.4346, "eval_samples_per_second": 4.589, "eval_wer": 0.5426356589147286, "step": 9900 }, { "epoch": 1.33, "learning_rate": 9.955998044357527e-05, "loss": NaN, "step": 10000 }, { "epoch": 1.33, "eval_loss": 0.7529067397117615, "eval_runtime": 17.3764, "eval_samples_per_second": 4.604, "eval_wer": 0.5271317829457365, "step": 10000 }, { "epoch": 1.35, "learning_rate": 9.955553580159118e-05, "loss": NaN, "step": 10100 }, { "epoch": 1.35, "eval_loss": 0.6945570111274719, "eval_runtime": 17.5096, "eval_samples_per_second": 4.569, "eval_wer": 0.5348837209302325, "step": 10100 }, { "epoch": 1.36, "learning_rate": 9.955109115960711e-05, "loss": NaN, "step": 10200 }, { "epoch": 1.36, "eval_loss": 0.7381066679954529, "eval_runtime": 17.3519, "eval_samples_per_second": 4.61, "eval_wer": 0.5271317829457365, "step": 10200 }, { "epoch": 1.37, "learning_rate": 9.9546646517623e-05, "loss": NaN, "step": 10300 }, { "epoch": 1.37, "eval_loss": 0.7733180522918701, "eval_runtime": 17.3513, "eval_samples_per_second": 4.611, "eval_wer": 0.5395348837209303, "step": 10300 }, { "epoch": 1.39, "learning_rate": 9.954220187563892e-05, "loss": NaN, "step": 10400 }, { "epoch": 1.39, "eval_loss": 0.7235101461410522, "eval_runtime": 17.276, "eval_samples_per_second": 4.631, "eval_wer": 0.5162790697674419, "step": 10400 }, { "epoch": 1.4, "learning_rate": 9.953775723365484e-05, "loss": NaN, "step": 10500 }, { "epoch": 1.4, "eval_loss": 0.756510853767395, "eval_runtime": 17.3233, "eval_samples_per_second": 4.618, "eval_wer": 0.5162790697674419, "step": 10500 }, { "epoch": 1.41, "learning_rate": 9.953331259167075e-05, "loss": NaN, "step": 10600 }, { "epoch": 1.41, "eval_loss": 0.7486532330513, "eval_runtime": 17.3251, "eval_samples_per_second": 4.618, "eval_wer": 0.517829457364341, "step": 10600 }, { "epoch": 1.43, "learning_rate": 9.952886794968665e-05, "loss": NaN, "step": 10700 }, { "epoch": 1.43, "eval_loss": 0.8009279370307922, "eval_runtime": 17.3932, "eval_samples_per_second": 4.6, "eval_wer": 0.5333333333333333, "step": 10700 }, { "epoch": 1.44, "learning_rate": 9.952442330770258e-05, "loss": NaN, "step": 10800 }, { "epoch": 1.44, "eval_loss": 0.7493506073951721, "eval_runtime": 17.5083, "eval_samples_per_second": 4.569, "eval_wer": 0.517829457364341, "step": 10800 }, { "epoch": 1.45, "learning_rate": 9.951997866571849e-05, "loss": NaN, "step": 10900 }, { "epoch": 1.45, "eval_loss": 0.6919007301330566, "eval_runtime": 17.3761, "eval_samples_per_second": 4.604, "eval_wer": 0.5209302325581395, "step": 10900 }, { "epoch": 1.47, "learning_rate": 9.95155340237344e-05, "loss": NaN, "step": 11000 }, { "epoch": 1.47, "eval_loss": 0.6828303933143616, "eval_runtime": 17.3932, "eval_samples_per_second": 4.6, "eval_wer": 0.524031007751938, "step": 11000 }, { "epoch": 1.48, "learning_rate": 9.95110893817503e-05, "loss": NaN, "step": 11100 }, { "epoch": 1.48, "eval_loss": 0.6986581683158875, "eval_runtime": 17.3758, "eval_samples_per_second": 4.604, "eval_wer": 0.5348837209302325, "step": 11100 }, { "epoch": 1.49, "learning_rate": 9.950664473976622e-05, "loss": NaN, "step": 11200 }, { "epoch": 1.49, "eval_loss": 0.686642050743103, "eval_runtime": 17.3613, "eval_samples_per_second": 4.608, "eval_wer": 0.5395348837209303, "step": 11200 }, { "epoch": 1.51, "learning_rate": 9.950220009778213e-05, "loss": NaN, "step": 11300 }, { "epoch": 1.51, "eval_loss": 0.6886032223701477, "eval_runtime": 17.3873, "eval_samples_per_second": 4.601, "eval_wer": 0.5023255813953489, "step": 11300 }, { "epoch": 1.52, "learning_rate": 9.949775545579804e-05, "loss": NaN, "step": 11400 }, { "epoch": 1.52, "eval_loss": 0.6399986147880554, "eval_runtime": 17.4574, "eval_samples_per_second": 4.583, "eval_wer": 0.5162790697674419, "step": 11400 }, { "epoch": 1.53, "learning_rate": 9.949331081381395e-05, "loss": NaN, "step": 11500 }, { "epoch": 1.53, "eval_loss": 0.6944009065628052, "eval_runtime": 17.4437, "eval_samples_per_second": 4.586, "eval_wer": 0.4992248062015504, "step": 11500 }, { "epoch": 1.55, "learning_rate": 9.948886617182987e-05, "loss": NaN, "step": 11600 }, { "epoch": 1.55, "eval_loss": 0.7042981386184692, "eval_runtime": 17.4509, "eval_samples_per_second": 4.584, "eval_wer": 0.5069767441860465, "step": 11600 }, { "epoch": 1.56, "learning_rate": 9.948442152984578e-05, "loss": NaN, "step": 11700 }, { "epoch": 1.56, "eval_loss": 0.6655673980712891, "eval_runtime": 17.4233, "eval_samples_per_second": 4.592, "eval_wer": 0.5100775193798449, "step": 11700 }, { "epoch": 1.57, "learning_rate": 9.947997688786169e-05, "loss": NaN, "step": 11800 }, { "epoch": 1.57, "eval_loss": 0.6955547332763672, "eval_runtime": 17.3935, "eval_samples_per_second": 4.599, "eval_wer": 0.5209302325581395, "step": 11800 }, { "epoch": 1.59, "learning_rate": 9.94755322458776e-05, "loss": NaN, "step": 11900 }, { "epoch": 1.59, "eval_loss": 0.7002443075180054, "eval_runtime": 17.4036, "eval_samples_per_second": 4.597, "eval_wer": 0.5193798449612403, "step": 11900 }, { "epoch": 1.6, "learning_rate": 9.947108760389351e-05, "loss": NaN, "step": 12000 }, { "epoch": 1.6, "eval_loss": 0.6780632734298706, "eval_runtime": 17.4488, "eval_samples_per_second": 4.585, "eval_wer": 0.5209302325581395, "step": 12000 }, { "epoch": 1.61, "learning_rate": 9.946664296190942e-05, "loss": NaN, "step": 12100 }, { "epoch": 1.61, "eval_loss": 0.7334409356117249, "eval_runtime": 17.3983, "eval_samples_per_second": 4.598, "eval_wer": 0.5100775193798449, "step": 12100 }, { "epoch": 1.63, "learning_rate": 9.946219831992533e-05, "loss": NaN, "step": 12200 }, { "epoch": 1.63, "eval_loss": 0.7420142889022827, "eval_runtime": 17.4073, "eval_samples_per_second": 4.596, "eval_wer": 0.5224806201550387, "step": 12200 }, { "epoch": 1.64, "learning_rate": 9.945775367794124e-05, "loss": NaN, "step": 12300 }, { "epoch": 1.64, "eval_loss": 0.680244505405426, "eval_runtime": 17.4234, "eval_samples_per_second": 4.592, "eval_wer": 0.5038759689922481, "step": 12300 }, { "epoch": 1.65, "learning_rate": 9.945330903595716e-05, "loss": NaN, "step": 12400 }, { "epoch": 1.65, "eval_loss": 0.7066457867622375, "eval_runtime": 17.4153, "eval_samples_per_second": 4.594, "eval_wer": 0.5209302325581395, "step": 12400 }, { "epoch": 1.67, "learning_rate": 9.944886439397308e-05, "loss": NaN, "step": 12500 }, { "epoch": 1.67, "eval_loss": 0.637787938117981, "eval_runtime": 17.3934, "eval_samples_per_second": 4.599, "eval_wer": 0.5209302325581395, "step": 12500 }, { "epoch": 1.68, "learning_rate": 9.944441975198898e-05, "loss": NaN, "step": 12600 }, { "epoch": 1.68, "eval_loss": 0.6452146768569946, "eval_runtime": 17.4649, "eval_samples_per_second": 4.581, "eval_wer": 0.5054263565891473, "step": 12600 }, { "epoch": 1.69, "learning_rate": 9.943997511000489e-05, "loss": NaN, "step": 12700 }, { "epoch": 1.69, "eval_loss": 0.6308380365371704, "eval_runtime": 17.4706, "eval_samples_per_second": 4.579, "eval_wer": 0.5054263565891473, "step": 12700 }, { "epoch": 1.71, "learning_rate": 9.943553046802081e-05, "loss": NaN, "step": 12800 }, { "epoch": 1.71, "eval_loss": 0.6226298809051514, "eval_runtime": 17.3657, "eval_samples_per_second": 4.607, "eval_wer": 0.5131782945736434, "step": 12800 }, { "epoch": 1.72, "learning_rate": 9.943108582603672e-05, "loss": NaN, "step": 12900 }, { "epoch": 1.72, "eval_loss": 0.6554073095321655, "eval_runtime": 17.4972, "eval_samples_per_second": 4.572, "eval_wer": 0.517829457364341, "step": 12900 }, { "epoch": 1.73, "learning_rate": 9.942664118405262e-05, "loss": NaN, "step": 13000 }, { "epoch": 1.73, "eval_loss": 0.7324713468551636, "eval_runtime": 17.4373, "eval_samples_per_second": 4.588, "eval_wer": 0.5147286821705427, "step": 13000 }, { "epoch": 1.75, "learning_rate": 9.942219654206855e-05, "loss": NaN, "step": 13100 }, { "epoch": 1.75, "eval_loss": 0.6392424702644348, "eval_runtime": 17.4258, "eval_samples_per_second": 4.591, "eval_wer": 0.5085271317829457, "step": 13100 }, { "epoch": 1.76, "learning_rate": 9.941775190008446e-05, "loss": NaN, "step": 13200 }, { "epoch": 1.76, "eval_loss": 0.6548818349838257, "eval_runtime": 17.3702, "eval_samples_per_second": 4.606, "eval_wer": 0.5255813953488372, "step": 13200 }, { "epoch": 1.77, "learning_rate": 9.941330725810037e-05, "loss": NaN, "step": 13300 }, { "epoch": 1.77, "eval_loss": 0.687231183052063, "eval_runtime": 17.3777, "eval_samples_per_second": 4.604, "eval_wer": 0.5023255813953489, "step": 13300 }, { "epoch": 1.79, "learning_rate": 9.940886261611627e-05, "loss": NaN, "step": 13400 }, { "epoch": 1.79, "eval_loss": 0.705328106880188, "eval_runtime": 17.4159, "eval_samples_per_second": 4.594, "eval_wer": 0.517829457364341, "step": 13400 }, { "epoch": 1.8, "learning_rate": 9.940441797413219e-05, "loss": NaN, "step": 13500 }, { "epoch": 1.8, "eval_loss": 0.7033597230911255, "eval_runtime": 17.4035, "eval_samples_per_second": 4.597, "eval_wer": 0.517829457364341, "step": 13500 }, { "epoch": 1.81, "learning_rate": 9.93999733321481e-05, "loss": NaN, "step": 13600 }, { "epoch": 1.81, "eval_loss": 0.7513315081596375, "eval_runtime": 17.4233, "eval_samples_per_second": 4.592, "eval_wer": 0.5193798449612403, "step": 13600 }, { "epoch": 1.83, "learning_rate": 9.939552869016401e-05, "loss": NaN, "step": 13700 }, { "epoch": 1.83, "eval_loss": 0.7186664342880249, "eval_runtime": 17.423, "eval_samples_per_second": 4.592, "eval_wer": 0.5286821705426357, "step": 13700 }, { "epoch": 1.84, "learning_rate": 9.939108404817993e-05, "loss": NaN, "step": 13800 }, { "epoch": 1.84, "eval_loss": 0.7211223840713501, "eval_runtime": 17.3974, "eval_samples_per_second": 4.598, "eval_wer": 0.517829457364341, "step": 13800 }, { "epoch": 1.85, "learning_rate": 9.938663940619584e-05, "loss": NaN, "step": 13900 }, { "epoch": 1.85, "eval_loss": 0.6921149492263794, "eval_runtime": 17.4244, "eval_samples_per_second": 4.591, "eval_wer": 0.5116279069767442, "step": 13900 }, { "epoch": 1.87, "learning_rate": 9.938219476421175e-05, "loss": NaN, "step": 14000 }, { "epoch": 1.87, "eval_loss": 0.8026927709579468, "eval_runtime": 17.4647, "eval_samples_per_second": 4.581, "eval_wer": 0.5317829457364341, "step": 14000 }, { "epoch": 1.88, "learning_rate": 9.937775012222766e-05, "loss": NaN, "step": 14100 }, { "epoch": 1.88, "eval_loss": 0.7409325838088989, "eval_runtime": 17.4438, "eval_samples_per_second": 4.586, "eval_wer": 0.517829457364341, "step": 14100 }, { "epoch": 1.89, "learning_rate": 9.937330548024357e-05, "loss": NaN, "step": 14200 }, { "epoch": 1.89, "eval_loss": 0.6671923995018005, "eval_runtime": 17.3839, "eval_samples_per_second": 4.602, "eval_wer": 0.5085271317829457, "step": 14200 }, { "epoch": 1.91, "learning_rate": 9.936886083825948e-05, "loss": NaN, "step": 14300 }, { "epoch": 1.91, "eval_loss": 0.6567109823226929, "eval_runtime": 17.3915, "eval_samples_per_second": 4.6, "eval_wer": 0.5116279069767442, "step": 14300 }, { "epoch": 1.92, "learning_rate": 9.93644161962754e-05, "loss": NaN, "step": 14400 }, { "epoch": 1.92, "eval_loss": 0.707842230796814, "eval_runtime": 17.4097, "eval_samples_per_second": 4.595, "eval_wer": 0.5038759689922481, "step": 14400 }, { "epoch": 1.93, "learning_rate": 9.93599715542913e-05, "loss": NaN, "step": 14500 }, { "epoch": 1.93, "eval_loss": 0.7037177085876465, "eval_runtime": 17.5565, "eval_samples_per_second": 4.557, "eval_wer": 0.5193798449612403, "step": 14500 }, { "epoch": 1.95, "learning_rate": 9.935552691230722e-05, "loss": NaN, "step": 14600 }, { "epoch": 1.95, "eval_loss": 0.7334758043289185, "eval_runtime": 17.5057, "eval_samples_per_second": 4.57, "eval_wer": 0.5736434108527132, "step": 14600 }, { "epoch": 1.96, "learning_rate": 9.935108227032313e-05, "loss": NaN, "step": 14700 }, { "epoch": 1.96, "eval_loss": 0.6860212087631226, "eval_runtime": 17.4444, "eval_samples_per_second": 4.586, "eval_wer": 0.5224806201550387, "step": 14700 }, { "epoch": 1.97, "learning_rate": 9.934663762833905e-05, "loss": NaN, "step": 14800 }, { "epoch": 1.97, "eval_loss": 0.6953790187835693, "eval_runtime": 17.4429, "eval_samples_per_second": 4.586, "eval_wer": 0.5209302325581395, "step": 14800 }, { "epoch": 1.99, "learning_rate": 9.934219298635495e-05, "loss": NaN, "step": 14900 }, { "epoch": 1.99, "eval_loss": 0.7358990907669067, "eval_runtime": 17.4828, "eval_samples_per_second": 4.576, "eval_wer": 0.5116279069767442, "step": 14900 }, { "epoch": 2.0, "learning_rate": 9.933774834437086e-05, "loss": NaN, "step": 15000 }, { "epoch": 2.0, "eval_loss": 0.6997208595275879, "eval_runtime": 17.4415, "eval_samples_per_second": 4.587, "eval_wer": 0.5271317829457365, "step": 15000 }, { "epoch": 2.01, "learning_rate": 9.933330370238679e-05, "loss": NaN, "step": 15100 }, { "epoch": 2.01, "eval_loss": 0.6580943465232849, "eval_runtime": 17.4313, "eval_samples_per_second": 4.589, "eval_wer": 0.5085271317829457, "step": 15100 }, { "epoch": 2.03, "learning_rate": 9.93288590604027e-05, "loss": NaN, "step": 15200 }, { "epoch": 2.03, "eval_loss": 0.6659531593322754, "eval_runtime": 17.4095, "eval_samples_per_second": 4.595, "eval_wer": 0.5224806201550387, "step": 15200 }, { "epoch": 2.04, "learning_rate": 9.93244144184186e-05, "loss": NaN, "step": 15300 }, { "epoch": 2.04, "eval_loss": 0.7017448544502258, "eval_runtime": 17.4403, "eval_samples_per_second": 4.587, "eval_wer": 0.5224806201550387, "step": 15300 }, { "epoch": 2.05, "learning_rate": 9.931996977643452e-05, "loss": NaN, "step": 15400 }, { "epoch": 2.05, "eval_loss": 0.7005801796913147, "eval_runtime": 17.4039, "eval_samples_per_second": 4.597, "eval_wer": 0.5209302325581395, "step": 15400 }, { "epoch": 2.07, "learning_rate": 9.931552513445043e-05, "loss": NaN, "step": 15500 }, { "epoch": 2.07, "eval_loss": 0.646070659160614, "eval_runtime": 17.377, "eval_samples_per_second": 4.604, "eval_wer": 0.49767441860465117, "step": 15500 }, { "epoch": 2.08, "learning_rate": 9.931108049246634e-05, "loss": NaN, "step": 15600 }, { "epoch": 2.08, "eval_loss": 0.6526376008987427, "eval_runtime": 17.4521, "eval_samples_per_second": 4.584, "eval_wer": 0.5116279069767442, "step": 15600 }, { "epoch": 2.09, "learning_rate": 9.930663585048224e-05, "loss": NaN, "step": 15700 }, { "epoch": 2.09, "eval_loss": 0.7334516644477844, "eval_runtime": 17.501, "eval_samples_per_second": 4.571, "eval_wer": 0.5100775193798449, "step": 15700 }, { "epoch": 2.11, "learning_rate": 9.930219120849816e-05, "loss": NaN, "step": 15800 }, { "epoch": 2.11, "eval_loss": 0.6918967366218567, "eval_runtime": 17.5122, "eval_samples_per_second": 4.568, "eval_wer": 0.5193798449612403, "step": 15800 }, { "epoch": 2.12, "learning_rate": 9.929774656651408e-05, "loss": NaN, "step": 15900 }, { "epoch": 2.12, "eval_loss": 0.6813740730285645, "eval_runtime": 17.4079, "eval_samples_per_second": 4.596, "eval_wer": 0.4883720930232558, "step": 15900 }, { "epoch": 2.13, "learning_rate": 9.929330192452999e-05, "loss": NaN, "step": 16000 }, { "epoch": 2.13, "eval_loss": 0.704567551612854, "eval_runtime": 17.4009, "eval_samples_per_second": 4.597, "eval_wer": 0.5069767441860465, "step": 16000 }, { "epoch": 2.15, "learning_rate": 9.92888572825459e-05, "loss": NaN, "step": 16100 }, { "epoch": 2.15, "eval_loss": 0.7084250450134277, "eval_runtime": 17.3953, "eval_samples_per_second": 4.599, "eval_wer": 0.524031007751938, "step": 16100 }, { "epoch": 2.16, "learning_rate": 9.928441264056181e-05, "loss": NaN, "step": 16200 }, { "epoch": 2.16, "eval_loss": 0.7336726188659668, "eval_runtime": 17.5249, "eval_samples_per_second": 4.565, "eval_wer": 0.5317829457364341, "step": 16200 }, { "epoch": 2.17, "learning_rate": 9.927996799857772e-05, "loss": NaN, "step": 16300 }, { "epoch": 2.17, "eval_loss": 0.7087512016296387, "eval_runtime": 17.4343, "eval_samples_per_second": 4.589, "eval_wer": 0.5069767441860465, "step": 16300 }, { "epoch": 2.19, "learning_rate": 9.927552335659363e-05, "loss": NaN, "step": 16400 }, { "epoch": 2.19, "eval_loss": 0.7270997166633606, "eval_runtime": 17.4461, "eval_samples_per_second": 4.586, "eval_wer": 0.5100775193798449, "step": 16400 }, { "epoch": 2.2, "learning_rate": 9.927107871460954e-05, "loss": NaN, "step": 16500 }, { "epoch": 2.2, "eval_loss": 0.7297137379646301, "eval_runtime": 17.3651, "eval_samples_per_second": 4.607, "eval_wer": 0.5131782945736434, "step": 16500 }, { "epoch": 2.21, "learning_rate": 9.926663407262545e-05, "loss": NaN, "step": 16600 }, { "epoch": 2.21, "eval_loss": 0.7396950125694275, "eval_runtime": 17.4544, "eval_samples_per_second": 4.583, "eval_wer": 0.5193798449612403, "step": 16600 }, { "epoch": 2.23, "learning_rate": 9.926218943064137e-05, "loss": NaN, "step": 16700 }, { "epoch": 2.23, "eval_loss": 0.6693302392959595, "eval_runtime": 17.4093, "eval_samples_per_second": 4.595, "eval_wer": 0.5147286821705427, "step": 16700 }, { "epoch": 2.24, "learning_rate": 9.925774478865728e-05, "loss": NaN, "step": 16800 }, { "epoch": 2.24, "eval_loss": 0.681401252746582, "eval_runtime": 17.4358, "eval_samples_per_second": 4.588, "eval_wer": 0.5193798449612403, "step": 16800 }, { "epoch": 2.25, "learning_rate": 9.925330014667319e-05, "loss": NaN, "step": 16900 }, { "epoch": 2.25, "eval_loss": 0.6969695687294006, "eval_runtime": 17.4628, "eval_samples_per_second": 4.581, "eval_wer": 0.5085271317829457, "step": 16900 }, { "epoch": 2.27, "learning_rate": 9.92488555046891e-05, "loss": NaN, "step": 17000 }, { "epoch": 2.27, "eval_loss": 0.7665321826934814, "eval_runtime": 17.4427, "eval_samples_per_second": 4.586, "eval_wer": 0.5007751937984496, "step": 17000 }, { "epoch": 2.28, "learning_rate": 9.924441086270502e-05, "loss": NaN, "step": 17100 }, { "epoch": 2.28, "eval_loss": 0.6652202606201172, "eval_runtime": 17.3856, "eval_samples_per_second": 4.602, "eval_wer": 0.5100775193798449, "step": 17100 }, { "epoch": 2.29, "learning_rate": 9.923996622072092e-05, "loss": NaN, "step": 17200 }, { "epoch": 2.29, "eval_loss": 0.6718670129776001, "eval_runtime": 17.5534, "eval_samples_per_second": 4.558, "eval_wer": 0.4930232558139535, "step": 17200 }, { "epoch": 2.31, "learning_rate": 9.923552157873683e-05, "loss": NaN, "step": 17300 }, { "epoch": 2.31, "eval_loss": 0.7141027450561523, "eval_runtime": 17.3511, "eval_samples_per_second": 4.611, "eval_wer": 0.49612403100775193, "step": 17300 }, { "epoch": 2.32, "learning_rate": 9.923107693675276e-05, "loss": NaN, "step": 17400 }, { "epoch": 2.32, "eval_loss": 0.69825279712677, "eval_runtime": 17.3767, "eval_samples_per_second": 4.604, "eval_wer": 0.5054263565891473, "step": 17400 }, { "epoch": 2.33, "learning_rate": 9.922663229476867e-05, "loss": NaN, "step": 17500 }, { "epoch": 2.33, "eval_loss": 0.7104494571685791, "eval_runtime": 17.4248, "eval_samples_per_second": 4.591, "eval_wer": 0.5054263565891473, "step": 17500 }, { "epoch": 2.35, "learning_rate": 9.922218765278457e-05, "loss": NaN, "step": 17600 }, { "epoch": 2.35, "eval_loss": 0.7555495500564575, "eval_runtime": 17.4089, "eval_samples_per_second": 4.595, "eval_wer": 0.5054263565891473, "step": 17600 }, { "epoch": 2.36, "learning_rate": 9.921774301080049e-05, "loss": NaN, "step": 17700 }, { "epoch": 2.36, "eval_loss": 0.7753702998161316, "eval_runtime": 17.5354, "eval_samples_per_second": 4.562, "eval_wer": 0.5131782945736434, "step": 17700 }, { "epoch": 2.37, "learning_rate": 9.92132983688164e-05, "loss": NaN, "step": 17800 }, { "epoch": 2.37, "eval_loss": 0.7617055177688599, "eval_runtime": 17.6842, "eval_samples_per_second": 4.524, "eval_wer": 0.49612403100775193, "step": 17800 }, { "epoch": 2.39, "learning_rate": 9.92088537268323e-05, "loss": NaN, "step": 17900 }, { "epoch": 2.39, "eval_loss": 0.8150382041931152, "eval_runtime": 17.4098, "eval_samples_per_second": 4.595, "eval_wer": 0.4945736434108527, "step": 17900 }, { "epoch": 2.4, "learning_rate": 9.920440908484821e-05, "loss": NaN, "step": 18000 }, { "epoch": 2.4, "eval_loss": 0.8014766573905945, "eval_runtime": 17.5133, "eval_samples_per_second": 4.568, "eval_wer": 0.49767441860465117, "step": 18000 }, { "epoch": 2.41, "learning_rate": 9.919996444286414e-05, "loss": NaN, "step": 18100 }, { "epoch": 2.41, "eval_loss": 0.6994240283966064, "eval_runtime": 17.5258, "eval_samples_per_second": 4.565, "eval_wer": 0.5038759689922481, "step": 18100 }, { "epoch": 2.43, "learning_rate": 9.919551980088005e-05, "loss": NaN, "step": 18200 }, { "epoch": 2.43, "eval_loss": 0.7259965538978577, "eval_runtime": 17.5442, "eval_samples_per_second": 4.56, "eval_wer": 0.5162790697674419, "step": 18200 }, { "epoch": 2.44, "learning_rate": 9.919107515889595e-05, "loss": NaN, "step": 18300 }, { "epoch": 2.44, "eval_loss": 0.7805743217468262, "eval_runtime": 17.6196, "eval_samples_per_second": 4.54, "eval_wer": 0.4945736434108527, "step": 18300 }, { "epoch": 2.45, "learning_rate": 9.918663051691187e-05, "loss": NaN, "step": 18400 }, { "epoch": 2.45, "eval_loss": 0.7654392123222351, "eval_runtime": 17.5555, "eval_samples_per_second": 4.557, "eval_wer": 0.4992248062015504, "step": 18400 }, { "epoch": 2.47, "learning_rate": 9.918218587492778e-05, "loss": NaN, "step": 18500 }, { "epoch": 2.47, "eval_loss": 0.7141100168228149, "eval_runtime": 17.5057, "eval_samples_per_second": 4.57, "eval_wer": 0.49767441860465117, "step": 18500 }, { "epoch": 2.48, "learning_rate": 9.917774123294369e-05, "loss": NaN, "step": 18600 }, { "epoch": 2.48, "eval_loss": 0.6688128113746643, "eval_runtime": 17.4377, "eval_samples_per_second": 4.588, "eval_wer": 0.49147286821705427, "step": 18600 }, { "epoch": 2.49, "learning_rate": 9.91732965909596e-05, "loss": NaN, "step": 18700 }, { "epoch": 2.49, "eval_loss": 0.6818010807037354, "eval_runtime": 17.3635, "eval_samples_per_second": 4.607, "eval_wer": 0.5038759689922481, "step": 18700 }, { "epoch": 2.51, "learning_rate": 9.916885194897552e-05, "loss": NaN, "step": 18800 }, { "epoch": 2.51, "eval_loss": 0.6905618906021118, "eval_runtime": 17.4231, "eval_samples_per_second": 4.592, "eval_wer": 0.5193798449612403, "step": 18800 }, { "epoch": 2.52, "learning_rate": 9.916440730699143e-05, "loss": NaN, "step": 18900 }, { "epoch": 2.52, "eval_loss": 0.646501362323761, "eval_runtime": 17.4802, "eval_samples_per_second": 4.577, "eval_wer": 0.5271317829457365, "step": 18900 }, { "epoch": 2.53, "learning_rate": 9.915996266500734e-05, "loss": NaN, "step": 19000 }, { "epoch": 2.53, "eval_loss": 0.6760914325714111, "eval_runtime": 17.5136, "eval_samples_per_second": 4.568, "eval_wer": 0.5209302325581395, "step": 19000 }, { "epoch": 2.55, "learning_rate": 9.915551802302325e-05, "loss": NaN, "step": 19100 }, { "epoch": 2.55, "eval_loss": 0.7431942224502563, "eval_runtime": 17.3946, "eval_samples_per_second": 4.599, "eval_wer": 0.5116279069767442, "step": 19100 }, { "epoch": 2.56, "learning_rate": 9.915107338103916e-05, "loss": NaN, "step": 19200 }, { "epoch": 2.56, "eval_loss": 0.7671061754226685, "eval_runtime": 17.5834, "eval_samples_per_second": 4.55, "eval_wer": 0.5054263565891473, "step": 19200 }, { "epoch": 2.57, "learning_rate": 9.914662873905507e-05, "loss": NaN, "step": 19300 }, { "epoch": 2.57, "eval_loss": 0.7126530408859253, "eval_runtime": 17.5901, "eval_samples_per_second": 4.548, "eval_wer": 0.4868217054263566, "step": 19300 }, { "epoch": 2.59, "learning_rate": 9.914218409707098e-05, "loss": NaN, "step": 19400 }, { "epoch": 2.59, "eval_loss": 0.727730929851532, "eval_runtime": 17.6577, "eval_samples_per_second": 4.531, "eval_wer": 0.5085271317829457, "step": 19400 }, { "epoch": 2.6, "learning_rate": 9.91377394550869e-05, "loss": NaN, "step": 19500 }, { "epoch": 2.6, "eval_loss": 0.6788039207458496, "eval_runtime": 17.6112, "eval_samples_per_second": 4.543, "eval_wer": 0.48992248062015503, "step": 19500 }, { "epoch": 2.61, "learning_rate": 9.91332948131028e-05, "loss": NaN, "step": 19600 }, { "epoch": 2.61, "eval_loss": 0.6633437871932983, "eval_runtime": 17.6623, "eval_samples_per_second": 4.529, "eval_wer": 0.4821705426356589, "step": 19600 }, { "epoch": 2.63, "learning_rate": 9.912885017111873e-05, "loss": NaN, "step": 19700 }, { "epoch": 2.63, "eval_loss": 0.630849301815033, "eval_runtime": 17.4181, "eval_samples_per_second": 4.593, "eval_wer": 0.4728682170542636, "step": 19700 }, { "epoch": 2.64, "learning_rate": 9.912440552913463e-05, "loss": NaN, "step": 19800 }, { "epoch": 2.64, "eval_loss": 0.6438859701156616, "eval_runtime": 17.5582, "eval_samples_per_second": 4.556, "eval_wer": 0.48992248062015503, "step": 19800 }, { "epoch": 2.65, "learning_rate": 9.911996088715054e-05, "loss": NaN, "step": 19900 }, { "epoch": 2.65, "eval_loss": 0.6492059826850891, "eval_runtime": 17.5321, "eval_samples_per_second": 4.563, "eval_wer": 0.4868217054263566, "step": 19900 }, { "epoch": 2.67, "learning_rate": 9.911551624516646e-05, "loss": NaN, "step": 20000 }, { "epoch": 2.67, "eval_loss": 0.6646106839179993, "eval_runtime": 17.4882, "eval_samples_per_second": 4.575, "eval_wer": 0.48372093023255813, "step": 20000 }, { "epoch": 2.68, "learning_rate": 9.911107160318237e-05, "loss": NaN, "step": 20100 }, { "epoch": 2.68, "eval_loss": 0.6617286801338196, "eval_runtime": 17.4701, "eval_samples_per_second": 4.579, "eval_wer": 0.48372093023255813, "step": 20100 }, { "epoch": 2.69, "learning_rate": 9.910662696119827e-05, "loss": NaN, "step": 20200 }, { "epoch": 2.69, "eval_loss": 0.6755768060684204, "eval_runtime": 17.5213, "eval_samples_per_second": 4.566, "eval_wer": 0.4806201550387597, "step": 20200 }, { "epoch": 2.71, "learning_rate": 9.910218231921418e-05, "loss": NaN, "step": 20300 }, { "epoch": 2.71, "eval_loss": 0.633080005645752, "eval_runtime": 17.4548, "eval_samples_per_second": 4.583, "eval_wer": 0.5069767441860465, "step": 20300 }, { "epoch": 2.72, "learning_rate": 9.909773767723011e-05, "loss": NaN, "step": 20400 }, { "epoch": 2.72, "eval_loss": 0.665341317653656, "eval_runtime": 17.6885, "eval_samples_per_second": 4.523, "eval_wer": 0.5193798449612403, "step": 20400 }, { "epoch": 2.73, "learning_rate": 9.909329303524602e-05, "loss": NaN, "step": 20500 }, { "epoch": 2.73, "eval_loss": 0.6483832597732544, "eval_runtime": 17.6251, "eval_samples_per_second": 4.539, "eval_wer": 0.475968992248062, "step": 20500 }, { "epoch": 2.75, "learning_rate": 9.908884839326192e-05, "loss": NaN, "step": 20600 }, { "epoch": 2.75, "eval_loss": 0.6416093111038208, "eval_runtime": 17.5412, "eval_samples_per_second": 4.561, "eval_wer": 0.4496124031007752, "step": 20600 }, { "epoch": 2.76, "learning_rate": 9.908440375127784e-05, "loss": NaN, "step": 20700 }, { "epoch": 2.76, "eval_loss": 0.6763391494750977, "eval_runtime": 17.5193, "eval_samples_per_second": 4.566, "eval_wer": 0.4806201550387597, "step": 20700 }, { "epoch": 2.77, "learning_rate": 9.907995910929375e-05, "loss": NaN, "step": 20800 }, { "epoch": 2.77, "eval_loss": 0.654536783695221, "eval_runtime": 17.4594, "eval_samples_per_second": 4.582, "eval_wer": 0.4930232558139535, "step": 20800 }, { "epoch": 2.79, "learning_rate": 9.907551446730966e-05, "loss": NaN, "step": 20900 }, { "epoch": 2.79, "eval_loss": 0.6497390866279602, "eval_runtime": 17.4598, "eval_samples_per_second": 4.582, "eval_wer": 0.4883720930232558, "step": 20900 }, { "epoch": 2.8, "learning_rate": 9.907106982532558e-05, "loss": NaN, "step": 21000 }, { "epoch": 2.8, "eval_loss": 0.7144044041633606, "eval_runtime": 17.4935, "eval_samples_per_second": 4.573, "eval_wer": 0.4930232558139535, "step": 21000 }, { "epoch": 2.81, "learning_rate": 9.906662518334149e-05, "loss": NaN, "step": 21100 }, { "epoch": 2.81, "eval_loss": 0.6466220021247864, "eval_runtime": 17.5042, "eval_samples_per_second": 4.57, "eval_wer": 0.49767441860465117, "step": 21100 }, { "epoch": 2.83, "learning_rate": 9.90621805413574e-05, "loss": NaN, "step": 21200 }, { "epoch": 2.83, "eval_loss": 0.6383641362190247, "eval_runtime": 17.5022, "eval_samples_per_second": 4.571, "eval_wer": 0.4945736434108527, "step": 21200 }, { "epoch": 2.84, "learning_rate": 9.905773589937331e-05, "loss": NaN, "step": 21300 }, { "epoch": 2.84, "eval_loss": 0.6846612691879272, "eval_runtime": 17.4796, "eval_samples_per_second": 4.577, "eval_wer": 0.48527131782945737, "step": 21300 }, { "epoch": 2.85, "learning_rate": 9.905329125738922e-05, "loss": NaN, "step": 21400 }, { "epoch": 2.85, "eval_loss": 0.65887850522995, "eval_runtime": 17.6832, "eval_samples_per_second": 4.524, "eval_wer": 0.5038759689922481, "step": 21400 }, { "epoch": 2.87, "learning_rate": 9.904884661540513e-05, "loss": NaN, "step": 21500 }, { "epoch": 2.87, "eval_loss": 0.7195907831192017, "eval_runtime": 17.5562, "eval_samples_per_second": 4.557, "eval_wer": 0.5131782945736434, "step": 21500 }, { "epoch": 2.88, "learning_rate": 9.904440197342104e-05, "loss": NaN, "step": 21600 }, { "epoch": 2.88, "eval_loss": 0.6677905321121216, "eval_runtime": 17.6786, "eval_samples_per_second": 4.525, "eval_wer": 0.5147286821705427, "step": 21600 }, { "epoch": 2.89, "learning_rate": 9.903995733143695e-05, "loss": NaN, "step": 21700 }, { "epoch": 2.89, "eval_loss": 0.6715782880783081, "eval_runtime": 17.5941, "eval_samples_per_second": 4.547, "eval_wer": 0.49612403100775193, "step": 21700 }, { "epoch": 2.91, "learning_rate": 9.903551268945287e-05, "loss": NaN, "step": 21800 }, { "epoch": 2.91, "eval_loss": 0.6809279918670654, "eval_runtime": 17.4894, "eval_samples_per_second": 4.574, "eval_wer": 0.49612403100775193, "step": 21800 }, { "epoch": 2.92, "learning_rate": 9.903106804746878e-05, "loss": NaN, "step": 21900 }, { "epoch": 2.92, "eval_loss": 0.7200478911399841, "eval_runtime": 17.4913, "eval_samples_per_second": 4.574, "eval_wer": 0.5054263565891473, "step": 21900 }, { "epoch": 2.93, "learning_rate": 9.90266234054847e-05, "loss": NaN, "step": 22000 }, { "epoch": 2.93, "eval_loss": 0.7086242437362671, "eval_runtime": 17.7177, "eval_samples_per_second": 4.515, "eval_wer": 0.5131782945736434, "step": 22000 }, { "epoch": 2.95, "learning_rate": 9.90221787635006e-05, "loss": NaN, "step": 22100 }, { "epoch": 2.95, "eval_loss": 0.7738662958145142, "eval_runtime": 17.5778, "eval_samples_per_second": 4.551, "eval_wer": 0.4930232558139535, "step": 22100 }, { "epoch": 2.96, "learning_rate": 9.901773412151651e-05, "loss": NaN, "step": 22200 }, { "epoch": 2.96, "eval_loss": 0.719960629940033, "eval_runtime": 17.7048, "eval_samples_per_second": 4.519, "eval_wer": 0.5100775193798449, "step": 22200 }, { "epoch": 2.97, "learning_rate": 9.901328947953244e-05, "loss": NaN, "step": 22300 }, { "epoch": 2.97, "eval_loss": 0.6674638986587524, "eval_runtime": 17.7977, "eval_samples_per_second": 4.495, "eval_wer": 0.5100775193798449, "step": 22300 }, { "epoch": 2.99, "learning_rate": 9.900884483754835e-05, "loss": NaN, "step": 22400 }, { "epoch": 2.99, "eval_loss": 0.6668637990951538, "eval_runtime": 17.6814, "eval_samples_per_second": 4.525, "eval_wer": 0.49767441860465117, "step": 22400 }, { "epoch": 3.0, "learning_rate": 9.900440019556424e-05, "loss": NaN, "step": 22500 }, { "epoch": 3.0, "eval_loss": 0.7027889490127563, "eval_runtime": 17.5701, "eval_samples_per_second": 4.553, "eval_wer": 0.5317829457364341, "step": 22500 }, { "epoch": 3.01, "learning_rate": 9.899995555358016e-05, "loss": NaN, "step": 22600 }, { "epoch": 3.01, "eval_loss": 0.7082899212837219, "eval_runtime": 17.636, "eval_samples_per_second": 4.536, "eval_wer": 0.5100775193798449, "step": 22600 }, { "epoch": 3.03, "learning_rate": 9.899551091159608e-05, "loss": NaN, "step": 22700 }, { "epoch": 3.03, "eval_loss": 0.690900981426239, "eval_runtime": 17.5784, "eval_samples_per_second": 4.551, "eval_wer": 0.5147286821705427, "step": 22700 }, { "epoch": 3.04, "learning_rate": 9.899106626961199e-05, "loss": NaN, "step": 22800 }, { "epoch": 3.04, "eval_loss": 0.6628085374832153, "eval_runtime": 17.7779, "eval_samples_per_second": 4.5, "eval_wer": 0.5116279069767442, "step": 22800 }, { "epoch": 3.05, "learning_rate": 9.898662162762789e-05, "loss": NaN, "step": 22900 }, { "epoch": 3.05, "eval_loss": 0.7275087833404541, "eval_runtime": 17.8126, "eval_samples_per_second": 4.491, "eval_wer": 0.49767441860465117, "step": 22900 }, { "epoch": 3.07, "learning_rate": 9.898217698564381e-05, "loss": NaN, "step": 23000 }, { "epoch": 3.07, "eval_loss": 0.7226203680038452, "eval_runtime": 17.6988, "eval_samples_per_second": 4.52, "eval_wer": 0.48527131782945737, "step": 23000 }, { "epoch": 3.08, "learning_rate": 9.897773234365973e-05, "loss": NaN, "step": 23100 }, { "epoch": 3.08, "eval_loss": 0.6935572028160095, "eval_runtime": 17.7653, "eval_samples_per_second": 4.503, "eval_wer": 0.4883720930232558, "step": 23100 }, { "epoch": 3.09, "learning_rate": 9.897328770167564e-05, "loss": NaN, "step": 23200 }, { "epoch": 3.09, "eval_loss": 0.7608216404914856, "eval_runtime": 17.8167, "eval_samples_per_second": 4.49, "eval_wer": 0.5193798449612403, "step": 23200 }, { "epoch": 3.11, "learning_rate": 9.896884305969155e-05, "loss": NaN, "step": 23300 }, { "epoch": 3.11, "eval_loss": 0.8762000203132629, "eval_runtime": 17.7039, "eval_samples_per_second": 4.519, "eval_wer": 0.48992248062015503, "step": 23300 }, { "epoch": 3.12, "learning_rate": 9.896439841770746e-05, "loss": NaN, "step": 23400 }, { "epoch": 3.12, "eval_loss": 0.8612931370735168, "eval_runtime": 17.6357, "eval_samples_per_second": 4.536, "eval_wer": 0.524031007751938, "step": 23400 }, { "epoch": 3.13, "learning_rate": 9.895995377572337e-05, "loss": NaN, "step": 23500 }, { "epoch": 3.13, "eval_loss": 0.6559737920761108, "eval_runtime": 17.6948, "eval_samples_per_second": 4.521, "eval_wer": 0.49767441860465117, "step": 23500 }, { "epoch": 3.15, "learning_rate": 9.895550913373928e-05, "loss": NaN, "step": 23600 }, { "epoch": 3.15, "eval_loss": 0.7084537148475647, "eval_runtime": 17.6392, "eval_samples_per_second": 4.535, "eval_wer": 0.4930232558139535, "step": 23600 }, { "epoch": 3.16, "learning_rate": 9.895106449175519e-05, "loss": NaN, "step": 23700 }, { "epoch": 3.16, "eval_loss": 0.6912034749984741, "eval_runtime": 17.7427, "eval_samples_per_second": 4.509, "eval_wer": 0.49147286821705427, "step": 23700 }, { "epoch": 3.17, "learning_rate": 9.89466198497711e-05, "loss": NaN, "step": 23800 }, { "epoch": 3.17, "eval_loss": 0.7391806840896606, "eval_runtime": 17.7803, "eval_samples_per_second": 4.499, "eval_wer": 0.48372093023255813, "step": 23800 }, { "epoch": 3.19, "learning_rate": 9.894217520778702e-05, "loss": NaN, "step": 23900 }, { "epoch": 3.19, "eval_loss": 0.7380479574203491, "eval_runtime": 17.7057, "eval_samples_per_second": 4.518, "eval_wer": 0.5007751937984496, "step": 23900 }, { "epoch": 3.2, "learning_rate": 9.893773056580293e-05, "loss": NaN, "step": 24000 }, { "epoch": 3.2, "eval_loss": 0.6259809732437134, "eval_runtime": 17.7735, "eval_samples_per_second": 4.501, "eval_wer": 0.5054263565891473, "step": 24000 }, { "epoch": 3.21, "learning_rate": 9.893328592381884e-05, "loss": NaN, "step": 24100 }, { "epoch": 3.21, "eval_loss": 0.6884532570838928, "eval_runtime": 17.6673, "eval_samples_per_second": 4.528, "eval_wer": 0.4868217054263566, "step": 24100 }, { "epoch": 3.23, "learning_rate": 9.892884128183475e-05, "loss": NaN, "step": 24200 }, { "epoch": 3.23, "eval_loss": 0.693473219871521, "eval_runtime": 17.7372, "eval_samples_per_second": 4.51, "eval_wer": 0.5116279069767442, "step": 24200 }, { "epoch": 3.24, "learning_rate": 9.892439663985067e-05, "loss": NaN, "step": 24300 }, { "epoch": 3.24, "eval_loss": 0.6742721199989319, "eval_runtime": 17.6443, "eval_samples_per_second": 4.534, "eval_wer": 0.5116279069767442, "step": 24300 }, { "epoch": 3.25, "learning_rate": 9.891995199786657e-05, "loss": NaN, "step": 24400 }, { "epoch": 3.25, "eval_loss": 0.7249454259872437, "eval_runtime": 17.6261, "eval_samples_per_second": 4.539, "eval_wer": 0.5162790697674419, "step": 24400 }, { "epoch": 3.27, "learning_rate": 9.891550735588248e-05, "loss": NaN, "step": 24500 }, { "epoch": 3.27, "eval_loss": 0.6982861757278442, "eval_runtime": 17.6565, "eval_samples_per_second": 4.531, "eval_wer": 0.5162790697674419, "step": 24500 }, { "epoch": 3.28, "learning_rate": 9.89110627138984e-05, "loss": NaN, "step": 24600 }, { "epoch": 3.28, "eval_loss": 0.6899422407150269, "eval_runtime": 17.8327, "eval_samples_per_second": 4.486, "eval_wer": 0.5147286821705427, "step": 24600 }, { "epoch": 3.29, "learning_rate": 9.890661807191432e-05, "loss": NaN, "step": 24700 }, { "epoch": 3.29, "eval_loss": 0.7489897012710571, "eval_runtime": 17.7463, "eval_samples_per_second": 4.508, "eval_wer": 0.5116279069767442, "step": 24700 }, { "epoch": 3.31, "learning_rate": 9.890217342993022e-05, "loss": NaN, "step": 24800 }, { "epoch": 3.31, "eval_loss": 0.6491571664810181, "eval_runtime": 17.9426, "eval_samples_per_second": 4.459, "eval_wer": 0.4992248062015504, "step": 24800 }, { "epoch": 3.32, "learning_rate": 9.889772878794613e-05, "loss": NaN, "step": 24900 }, { "epoch": 3.32, "eval_loss": 0.6521108150482178, "eval_runtime": 17.6592, "eval_samples_per_second": 4.53, "eval_wer": 0.48372093023255813, "step": 24900 }, { "epoch": 3.33, "learning_rate": 9.889328414596205e-05, "loss": NaN, "step": 25000 }, { "epoch": 3.33, "eval_loss": 0.6570430397987366, "eval_runtime": 17.7233, "eval_samples_per_second": 4.514, "eval_wer": 0.49612403100775193, "step": 25000 }, { "epoch": 3.35, "learning_rate": 9.888883950397796e-05, "loss": NaN, "step": 25100 }, { "epoch": 3.35, "eval_loss": 0.6758342385292053, "eval_runtime": 18.0274, "eval_samples_per_second": 4.438, "eval_wer": 0.49612403100775193, "step": 25100 }, { "epoch": 3.36, "learning_rate": 9.888439486199386e-05, "loss": NaN, "step": 25200 }, { "epoch": 3.36, "eval_loss": 0.6588055491447449, "eval_runtime": 17.7155, "eval_samples_per_second": 4.516, "eval_wer": 0.4883720930232558, "step": 25200 }, { "epoch": 3.37, "learning_rate": 9.887995022000979e-05, "loss": NaN, "step": 25300 }, { "epoch": 3.37, "eval_loss": 0.6541072130203247, "eval_runtime": 17.6533, "eval_samples_per_second": 4.532, "eval_wer": 0.5023255813953489, "step": 25300 }, { "epoch": 3.39, "learning_rate": 9.88755055780257e-05, "loss": NaN, "step": 25400 }, { "epoch": 3.39, "eval_loss": 0.7445347309112549, "eval_runtime": 17.8422, "eval_samples_per_second": 4.484, "eval_wer": 0.537984496124031, "step": 25400 }, { "epoch": 3.4, "learning_rate": 9.887106093604161e-05, "loss": NaN, "step": 25500 }, { "epoch": 3.4, "eval_loss": 0.6562886238098145, "eval_runtime": 18.0886, "eval_samples_per_second": 4.423, "eval_wer": 0.5023255813953489, "step": 25500 }, { "epoch": 3.41, "learning_rate": 9.886661629405752e-05, "loss": NaN, "step": 25600 }, { "epoch": 3.41, "eval_loss": 0.6530973315238953, "eval_runtime": 17.8674, "eval_samples_per_second": 4.477, "eval_wer": 0.5023255813953489, "step": 25600 }, { "epoch": 3.43, "learning_rate": 9.886217165207343e-05, "loss": NaN, "step": 25700 }, { "epoch": 3.43, "eval_loss": 0.700346827507019, "eval_runtime": 17.7178, "eval_samples_per_second": 4.515, "eval_wer": 0.5348837209302325, "step": 25700 }, { "epoch": 3.44, "learning_rate": 9.885772701008934e-05, "loss": NaN, "step": 25800 }, { "epoch": 3.44, "eval_loss": 0.7025777697563171, "eval_runtime": 17.7283, "eval_samples_per_second": 4.513, "eval_wer": 0.5116279069767442, "step": 25800 }, { "epoch": 3.45, "learning_rate": 9.885328236810525e-05, "loss": NaN, "step": 25900 }, { "epoch": 3.45, "eval_loss": 0.6949543356895447, "eval_runtime": 17.8409, "eval_samples_per_second": 4.484, "eval_wer": 0.4945736434108527, "step": 25900 }, { "epoch": 3.47, "learning_rate": 9.884883772612116e-05, "loss": NaN, "step": 26000 }, { "epoch": 3.47, "eval_loss": 0.6976181268692017, "eval_runtime": 17.7292, "eval_samples_per_second": 4.512, "eval_wer": 0.5271317829457365, "step": 26000 }, { "epoch": 3.48, "learning_rate": 9.884439308413708e-05, "loss": NaN, "step": 26100 }, { "epoch": 3.48, "eval_loss": 0.776595950126648, "eval_runtime": 17.6407, "eval_samples_per_second": 4.535, "eval_wer": 0.5023255813953489, "step": 26100 }, { "epoch": 3.49, "learning_rate": 9.883994844215299e-05, "loss": NaN, "step": 26200 }, { "epoch": 3.49, "eval_loss": 0.7193652987480164, "eval_runtime": 17.7195, "eval_samples_per_second": 4.515, "eval_wer": 0.48992248062015503, "step": 26200 }, { "epoch": 3.51, "learning_rate": 9.88355038001689e-05, "loss": NaN, "step": 26300 }, { "epoch": 3.51, "eval_loss": 0.7061530351638794, "eval_runtime": 17.6793, "eval_samples_per_second": 4.525, "eval_wer": 0.49147286821705427, "step": 26300 }, { "epoch": 3.52, "learning_rate": 9.883105915818481e-05, "loss": NaN, "step": 26400 }, { "epoch": 3.52, "eval_loss": 0.7101202011108398, "eval_runtime": 17.6388, "eval_samples_per_second": 4.535, "eval_wer": 0.5147286821705427, "step": 26400 }, { "epoch": 3.53, "learning_rate": 9.882661451620072e-05, "loss": NaN, "step": 26500 }, { "epoch": 3.53, "eval_loss": 0.7322906255722046, "eval_runtime": 17.5209, "eval_samples_per_second": 4.566, "eval_wer": 0.5100775193798449, "step": 26500 }, { "epoch": 3.55, "learning_rate": 9.882216987421665e-05, "loss": NaN, "step": 26600 }, { "epoch": 3.55, "eval_loss": 0.759114682674408, "eval_runtime": 17.7065, "eval_samples_per_second": 4.518, "eval_wer": 0.49767441860465117, "step": 26600 }, { "epoch": 3.56, "learning_rate": 9.881772523223254e-05, "loss": NaN, "step": 26700 }, { "epoch": 3.56, "eval_loss": 0.8165428042411804, "eval_runtime": 17.7222, "eval_samples_per_second": 4.514, "eval_wer": 0.5147286821705427, "step": 26700 }, { "epoch": 3.57, "learning_rate": 9.881328059024845e-05, "loss": NaN, "step": 26800 }, { "epoch": 3.57, "eval_loss": 0.7161229252815247, "eval_runtime": 17.8272, "eval_samples_per_second": 4.488, "eval_wer": 0.48992248062015503, "step": 26800 }, { "epoch": 3.59, "learning_rate": 9.880883594826437e-05, "loss": NaN, "step": 26900 }, { "epoch": 3.59, "eval_loss": 0.738871693611145, "eval_runtime": 17.6582, "eval_samples_per_second": 4.53, "eval_wer": 0.49767441860465117, "step": 26900 }, { "epoch": 3.6, "learning_rate": 9.880439130628029e-05, "loss": NaN, "step": 27000 }, { "epoch": 3.6, "eval_loss": 0.6424237489700317, "eval_runtime": 17.8001, "eval_samples_per_second": 4.494, "eval_wer": 0.475968992248062, "step": 27000 }, { "epoch": 3.61, "learning_rate": 9.879994666429619e-05, "loss": NaN, "step": 27100 }, { "epoch": 3.61, "eval_loss": 0.7210354208946228, "eval_runtime": 17.9075, "eval_samples_per_second": 4.467, "eval_wer": 0.4868217054263566, "step": 27100 }, { "epoch": 3.63, "learning_rate": 9.87955020223121e-05, "loss": NaN, "step": 27200 }, { "epoch": 3.63, "eval_loss": 0.684795081615448, "eval_runtime": 17.8466, "eval_samples_per_second": 4.483, "eval_wer": 0.5038759689922481, "step": 27200 }, { "epoch": 3.64, "learning_rate": 9.879105738032802e-05, "loss": NaN, "step": 27300 }, { "epoch": 3.64, "eval_loss": 0.6793242692947388, "eval_runtime": 17.9938, "eval_samples_per_second": 4.446, "eval_wer": 0.5116279069767442, "step": 27300 }, { "epoch": 3.65, "learning_rate": 9.878661273834394e-05, "loss": NaN, "step": 27400 }, { "epoch": 3.65, "eval_loss": 0.7072234749794006, "eval_runtime": 17.7391, "eval_samples_per_second": 4.51, "eval_wer": 0.49767441860465117, "step": 27400 }, { "epoch": 3.67, "learning_rate": 9.878216809635983e-05, "loss": NaN, "step": 27500 }, { "epoch": 3.67, "eval_loss": 0.794607400894165, "eval_runtime": 17.713, "eval_samples_per_second": 4.516, "eval_wer": 0.5224806201550387, "step": 27500 }, { "epoch": 3.68, "learning_rate": 9.877772345437576e-05, "loss": NaN, "step": 27600 }, { "epoch": 3.68, "eval_loss": 0.7146335244178772, "eval_runtime": 17.8755, "eval_samples_per_second": 4.475, "eval_wer": 0.5162790697674419, "step": 27600 }, { "epoch": 3.69, "learning_rate": 9.877327881239167e-05, "loss": NaN, "step": 27700 }, { "epoch": 3.69, "eval_loss": 0.7817438244819641, "eval_runtime": 17.78, "eval_samples_per_second": 4.499, "eval_wer": 0.5054263565891473, "step": 27700 }, { "epoch": 3.71, "learning_rate": 9.876883417040758e-05, "loss": NaN, "step": 27800 }, { "epoch": 3.71, "eval_loss": 0.7325385808944702, "eval_runtime": 17.8427, "eval_samples_per_second": 4.484, "eval_wer": 0.5100775193798449, "step": 27800 }, { "epoch": 3.72, "learning_rate": 9.876438952842349e-05, "loss": NaN, "step": 27900 }, { "epoch": 3.72, "eval_loss": 0.8487836718559265, "eval_runtime": 17.8001, "eval_samples_per_second": 4.494, "eval_wer": 0.5007751937984496, "step": 27900 }, { "epoch": 3.73, "learning_rate": 9.87599448864394e-05, "loss": NaN, "step": 28000 }, { "epoch": 3.73, "eval_loss": 0.8588669896125793, "eval_runtime": 17.9789, "eval_samples_per_second": 4.45, "eval_wer": 0.5023255813953489, "step": 28000 }, { "epoch": 3.75, "learning_rate": 9.875550024445531e-05, "loss": NaN, "step": 28100 }, { "epoch": 3.75, "eval_loss": 0.8295779228210449, "eval_runtime": 17.7403, "eval_samples_per_second": 4.51, "eval_wer": 0.48527131782945737, "step": 28100 }, { "epoch": 3.76, "learning_rate": 9.875105560247123e-05, "loss": NaN, "step": 28200 }, { "epoch": 3.76, "eval_loss": 0.6985501646995544, "eval_runtime": 17.5929, "eval_samples_per_second": 4.547, "eval_wer": 0.5147286821705427, "step": 28200 }, { "epoch": 3.77, "learning_rate": 9.874661096048714e-05, "loss": NaN, "step": 28300 }, { "epoch": 3.77, "eval_loss": 0.8200405240058899, "eval_runtime": 17.9213, "eval_samples_per_second": 4.464, "eval_wer": 0.5193798449612403, "step": 28300 }, { "epoch": 3.79, "learning_rate": 9.874216631850305e-05, "loss": NaN, "step": 28400 }, { "epoch": 3.79, "eval_loss": 0.8269991874694824, "eval_runtime": 17.6268, "eval_samples_per_second": 4.539, "eval_wer": 0.5069767441860465, "step": 28400 }, { "epoch": 3.8, "learning_rate": 9.873772167651896e-05, "loss": NaN, "step": 28500 }, { "epoch": 3.8, "eval_loss": 0.8213759660720825, "eval_runtime": 17.9751, "eval_samples_per_second": 4.451, "eval_wer": 0.5302325581395348, "step": 28500 }, { "epoch": 3.81, "learning_rate": 9.873327703453487e-05, "loss": NaN, "step": 28600 }, { "epoch": 3.81, "eval_loss": 0.6891577243804932, "eval_runtime": 17.7686, "eval_samples_per_second": 4.502, "eval_wer": 0.5100775193798449, "step": 28600 }, { "epoch": 3.83, "learning_rate": 9.872883239255078e-05, "loss": NaN, "step": 28700 }, { "epoch": 3.83, "eval_loss": 0.6482048034667969, "eval_runtime": 17.6883, "eval_samples_per_second": 4.523, "eval_wer": 0.4868217054263566, "step": 28700 }, { "epoch": 3.84, "learning_rate": 9.87243877505667e-05, "loss": NaN, "step": 28800 }, { "epoch": 3.84, "eval_loss": 0.7204601168632507, "eval_runtime": 17.5891, "eval_samples_per_second": 4.548, "eval_wer": 0.517829457364341, "step": 28800 }, { "epoch": 3.85, "learning_rate": 9.871994310858262e-05, "loss": NaN, "step": 28900 }, { "epoch": 3.85, "eval_loss": 0.723224937915802, "eval_runtime": 17.7967, "eval_samples_per_second": 4.495, "eval_wer": 0.5069767441860465, "step": 28900 }, { "epoch": 3.87, "learning_rate": 9.871549846659852e-05, "loss": NaN, "step": 29000 }, { "epoch": 3.87, "eval_loss": 0.6662874221801758, "eval_runtime": 17.7906, "eval_samples_per_second": 4.497, "eval_wer": 0.475968992248062, "step": 29000 }, { "epoch": 3.88, "learning_rate": 9.871105382461443e-05, "loss": NaN, "step": 29100 }, { "epoch": 3.88, "eval_loss": 0.6662710905075073, "eval_runtime": 17.8296, "eval_samples_per_second": 4.487, "eval_wer": 0.4945736434108527, "step": 29100 }, { "epoch": 3.89, "learning_rate": 9.870660918263034e-05, "loss": NaN, "step": 29200 }, { "epoch": 3.89, "eval_loss": 0.7283247709274292, "eval_runtime": 17.8161, "eval_samples_per_second": 4.49, "eval_wer": 0.48992248062015503, "step": 29200 }, { "epoch": 3.91, "learning_rate": 9.870216454064626e-05, "loss": NaN, "step": 29300 }, { "epoch": 3.91, "eval_loss": 0.7031872868537903, "eval_runtime": 17.7282, "eval_samples_per_second": 4.513, "eval_wer": 0.5085271317829457, "step": 29300 }, { "epoch": 3.92, "learning_rate": 9.869771989866216e-05, "loss": NaN, "step": 29400 }, { "epoch": 3.92, "eval_loss": 0.6514617204666138, "eval_runtime": 17.7963, "eval_samples_per_second": 4.495, "eval_wer": 0.4883720930232558, "step": 29400 }, { "epoch": 3.93, "learning_rate": 9.869327525667807e-05, "loss": NaN, "step": 29500 }, { "epoch": 3.93, "eval_loss": 0.6518000364303589, "eval_runtime": 17.8676, "eval_samples_per_second": 4.477, "eval_wer": 0.47131782945736433, "step": 29500 }, { "epoch": 3.95, "learning_rate": 9.8688830614694e-05, "loss": NaN, "step": 29600 }, { "epoch": 3.95, "eval_loss": 0.7044751048088074, "eval_runtime": 17.8213, "eval_samples_per_second": 4.489, "eval_wer": 0.4868217054263566, "step": 29600 }, { "epoch": 3.96, "learning_rate": 9.868438597270991e-05, "loss": NaN, "step": 29700 }, { "epoch": 3.96, "eval_loss": 0.7028575539588928, "eval_runtime": 17.7101, "eval_samples_per_second": 4.517, "eval_wer": 0.4930232558139535, "step": 29700 }, { "epoch": 3.97, "learning_rate": 9.86799413307258e-05, "loss": NaN, "step": 29800 }, { "epoch": 3.97, "eval_loss": 0.735122799873352, "eval_runtime": 17.5395, "eval_samples_per_second": 4.561, "eval_wer": 0.4945736434108527, "step": 29800 }, { "epoch": 3.99, "learning_rate": 9.867549668874173e-05, "loss": NaN, "step": 29900 }, { "epoch": 3.99, "eval_loss": 0.7852219939231873, "eval_runtime": 17.5067, "eval_samples_per_second": 4.57, "eval_wer": 0.4868217054263566, "step": 29900 }, { "epoch": 4.0, "learning_rate": 9.867105204675764e-05, "loss": NaN, "step": 30000 }, { "epoch": 4.0, "eval_loss": 0.7610275149345398, "eval_runtime": 17.6453, "eval_samples_per_second": 4.534, "eval_wer": 0.5023255813953489, "step": 30000 }, { "epoch": 4.01, "learning_rate": 9.866660740477355e-05, "loss": NaN, "step": 30100 }, { "epoch": 4.01, "eval_loss": 0.8094395399093628, "eval_runtime": 17.7642, "eval_samples_per_second": 4.503, "eval_wer": 0.4806201550387597, "step": 30100 }, { "epoch": 4.03, "learning_rate": 9.866216276278946e-05, "loss": NaN, "step": 30200 }, { "epoch": 4.03, "eval_loss": 0.8135471343994141, "eval_runtime": 17.6874, "eval_samples_per_second": 4.523, "eval_wer": 0.4992248062015504, "step": 30200 }, { "epoch": 4.04, "learning_rate": 9.865771812080538e-05, "loss": NaN, "step": 30300 }, { "epoch": 4.04, "eval_loss": 0.7297781109809875, "eval_runtime": 17.539, "eval_samples_per_second": 4.561, "eval_wer": 0.49767441860465117, "step": 30300 }, { "epoch": 4.05, "learning_rate": 9.865327347882129e-05, "loss": NaN, "step": 30400 }, { "epoch": 4.05, "eval_loss": 0.7608882784843445, "eval_runtime": 17.6916, "eval_samples_per_second": 4.522, "eval_wer": 0.5007751937984496, "step": 30400 }, { "epoch": 4.07, "learning_rate": 9.86488288368372e-05, "loss": NaN, "step": 30500 }, { "epoch": 4.07, "eval_loss": 0.7042602300643921, "eval_runtime": 17.6883, "eval_samples_per_second": 4.523, "eval_wer": 0.5100775193798449, "step": 30500 }, { "epoch": 4.08, "learning_rate": 9.864438419485311e-05, "loss": NaN, "step": 30600 }, { "epoch": 4.08, "eval_loss": 0.6467885971069336, "eval_runtime": 17.6906, "eval_samples_per_second": 4.522, "eval_wer": 0.47751937984496123, "step": 30600 }, { "epoch": 4.09, "learning_rate": 9.863993955286902e-05, "loss": NaN, "step": 30700 }, { "epoch": 4.09, "eval_loss": 0.7081225514411926, "eval_runtime": 17.6982, "eval_samples_per_second": 4.52, "eval_wer": 0.4992248062015504, "step": 30700 }, { "epoch": 4.11, "learning_rate": 9.863549491088493e-05, "loss": NaN, "step": 30800 }, { "epoch": 4.11, "eval_loss": 0.6654272675514221, "eval_runtime": 17.5676, "eval_samples_per_second": 4.554, "eval_wer": 0.48372093023255813, "step": 30800 }, { "epoch": 4.12, "learning_rate": 9.863105026890084e-05, "loss": NaN, "step": 30900 }, { "epoch": 4.12, "eval_loss": 0.6897600889205933, "eval_runtime": 17.7155, "eval_samples_per_second": 4.516, "eval_wer": 0.48527131782945737, "step": 30900 }, { "epoch": 4.13, "learning_rate": 9.862660562691675e-05, "loss": NaN, "step": 31000 }, { "epoch": 4.13, "eval_loss": 0.629447340965271, "eval_runtime": 17.7496, "eval_samples_per_second": 4.507, "eval_wer": 0.4728682170542636, "step": 31000 }, { "epoch": 4.15, "learning_rate": 9.862216098493267e-05, "loss": NaN, "step": 31100 }, { "epoch": 4.15, "eval_loss": 0.637413501739502, "eval_runtime": 17.659, "eval_samples_per_second": 4.53, "eval_wer": 0.48372093023255813, "step": 31100 }, { "epoch": 4.16, "learning_rate": 9.861771634294859e-05, "loss": NaN, "step": 31200 }, { "epoch": 4.16, "eval_loss": 0.6577144861221313, "eval_runtime": 17.6907, "eval_samples_per_second": 4.522, "eval_wer": 0.4883720930232558, "step": 31200 }, { "epoch": 4.17, "learning_rate": 9.861327170096449e-05, "loss": NaN, "step": 31300 }, { "epoch": 4.17, "eval_loss": 0.7151761054992676, "eval_runtime": 17.836, "eval_samples_per_second": 4.485, "eval_wer": 0.4883720930232558, "step": 31300 }, { "epoch": 4.19, "learning_rate": 9.86088270589804e-05, "loss": NaN, "step": 31400 }, { "epoch": 4.19, "eval_loss": 0.7481046915054321, "eval_runtime": 17.7063, "eval_samples_per_second": 4.518, "eval_wer": 0.49147286821705427, "step": 31400 }, { "epoch": 4.2, "learning_rate": 9.860438241699631e-05, "loss": NaN, "step": 31500 }, { "epoch": 4.2, "eval_loss": 0.7165336608886719, "eval_runtime": 17.7286, "eval_samples_per_second": 4.512, "eval_wer": 0.48992248062015503, "step": 31500 }, { "epoch": 4.21, "learning_rate": 9.859993777501224e-05, "loss": NaN, "step": 31600 }, { "epoch": 4.21, "eval_loss": 0.7002926468849182, "eval_runtime": 17.6498, "eval_samples_per_second": 4.533, "eval_wer": 0.5007751937984496, "step": 31600 }, { "epoch": 4.23, "learning_rate": 9.859549313302813e-05, "loss": NaN, "step": 31700 }, { "epoch": 4.23, "eval_loss": 0.6786822080612183, "eval_runtime": 17.5909, "eval_samples_per_second": 4.548, "eval_wer": 0.4806201550387597, "step": 31700 }, { "epoch": 4.24, "learning_rate": 9.859104849104404e-05, "loss": NaN, "step": 31800 }, { "epoch": 4.24, "eval_loss": 0.7046242952346802, "eval_runtime": 17.6497, "eval_samples_per_second": 4.533, "eval_wer": 0.4821705426356589, "step": 31800 }, { "epoch": 4.25, "learning_rate": 9.858660384905997e-05, "loss": NaN, "step": 31900 }, { "epoch": 4.25, "eval_loss": 0.747069776058197, "eval_runtime": 17.7298, "eval_samples_per_second": 4.512, "eval_wer": 0.5224806201550387, "step": 31900 }, { "epoch": 4.27, "learning_rate": 9.858215920707588e-05, "loss": NaN, "step": 32000 }, { "epoch": 4.27, "eval_loss": 0.676543116569519, "eval_runtime": 17.7787, "eval_samples_per_second": 4.5, "eval_wer": 0.4945736434108527, "step": 32000 }, { "epoch": 4.28, "learning_rate": 9.857771456509178e-05, "loss": NaN, "step": 32100 }, { "epoch": 4.28, "eval_loss": 0.6780596971511841, "eval_runtime": 17.7101, "eval_samples_per_second": 4.517, "eval_wer": 0.5147286821705427, "step": 32100 }, { "epoch": 4.29, "learning_rate": 9.85732699231077e-05, "loss": NaN, "step": 32200 }, { "epoch": 4.29, "eval_loss": 0.7229406237602234, "eval_runtime": 17.6392, "eval_samples_per_second": 4.535, "eval_wer": 0.5085271317829457, "step": 32200 }, { "epoch": 4.31, "learning_rate": 9.856882528112361e-05, "loss": NaN, "step": 32300 }, { "epoch": 4.31, "eval_loss": 0.7299832105636597, "eval_runtime": 17.6718, "eval_samples_per_second": 4.527, "eval_wer": 0.5069767441860465, "step": 32300 }, { "epoch": 4.32, "learning_rate": 9.856438063913952e-05, "loss": NaN, "step": 32400 }, { "epoch": 4.32, "eval_loss": 0.6965775489807129, "eval_runtime": 17.7649, "eval_samples_per_second": 4.503, "eval_wer": 0.4930232558139535, "step": 32400 }, { "epoch": 4.33, "learning_rate": 9.855993599715544e-05, "loss": NaN, "step": 32500 }, { "epoch": 4.33, "eval_loss": 0.6707865595817566, "eval_runtime": 17.5045, "eval_samples_per_second": 4.57, "eval_wer": 0.4945736434108527, "step": 32500 }, { "epoch": 4.35, "learning_rate": 9.855549135517135e-05, "loss": NaN, "step": 32600 }, { "epoch": 4.35, "eval_loss": 0.6962494254112244, "eval_runtime": 17.5191, "eval_samples_per_second": 4.566, "eval_wer": 0.49612403100775193, "step": 32600 }, { "epoch": 4.36, "learning_rate": 9.855104671318726e-05, "loss": NaN, "step": 32700 }, { "epoch": 4.36, "eval_loss": 0.7435300350189209, "eval_runtime": 17.5234, "eval_samples_per_second": 4.565, "eval_wer": 0.4806201550387597, "step": 32700 }, { "epoch": 4.37, "learning_rate": 9.854660207120317e-05, "loss": NaN, "step": 32800 }, { "epoch": 4.37, "eval_loss": 0.8106309771537781, "eval_runtime": 17.5548, "eval_samples_per_second": 4.557, "eval_wer": 0.475968992248062, "step": 32800 }, { "epoch": 4.39, "learning_rate": 9.854215742921908e-05, "loss": NaN, "step": 32900 }, { "epoch": 4.39, "eval_loss": 0.7216034531593323, "eval_runtime": 17.5922, "eval_samples_per_second": 4.547, "eval_wer": 0.4635658914728682, "step": 32900 }, { "epoch": 4.4, "learning_rate": 9.853771278723499e-05, "loss": NaN, "step": 33000 }, { "epoch": 4.4, "eval_loss": 0.7068824172019958, "eval_runtime": 17.4424, "eval_samples_per_second": 4.587, "eval_wer": 0.4806201550387597, "step": 33000 }, { "epoch": 4.41, "learning_rate": 9.85332681452509e-05, "loss": NaN, "step": 33100 }, { "epoch": 4.41, "eval_loss": 0.6770612001419067, "eval_runtime": 17.5754, "eval_samples_per_second": 4.552, "eval_wer": 0.4821705426356589, "step": 33100 }, { "epoch": 4.43, "learning_rate": 9.852882350326681e-05, "loss": NaN, "step": 33200 }, { "epoch": 4.43, "eval_loss": 0.7043319940567017, "eval_runtime": 17.5764, "eval_samples_per_second": 4.552, "eval_wer": 0.48372093023255813, "step": 33200 }, { "epoch": 4.44, "learning_rate": 9.852437886128273e-05, "loss": NaN, "step": 33300 }, { "epoch": 4.44, "eval_loss": 0.7157676815986633, "eval_runtime": 17.5258, "eval_samples_per_second": 4.565, "eval_wer": 0.4992248062015504, "step": 33300 }, { "epoch": 4.45, "learning_rate": 9.851993421929864e-05, "loss": NaN, "step": 33400 }, { "epoch": 4.45, "eval_loss": 0.622586190700531, "eval_runtime": 17.5815, "eval_samples_per_second": 4.55, "eval_wer": 0.4635658914728682, "step": 33400 }, { "epoch": 4.47, "learning_rate": 9.851548957731456e-05, "loss": NaN, "step": 33500 }, { "epoch": 4.47, "eval_loss": 0.656098484992981, "eval_runtime": 17.501, "eval_samples_per_second": 4.571, "eval_wer": 0.4635658914728682, "step": 33500 }, { "epoch": 4.48, "learning_rate": 9.851104493533046e-05, "loss": NaN, "step": 33600 }, { "epoch": 4.48, "eval_loss": 0.6705238223075867, "eval_runtime": 17.5581, "eval_samples_per_second": 4.556, "eval_wer": 0.47131782945736433, "step": 33600 }, { "epoch": 4.49, "learning_rate": 9.850660029334637e-05, "loss": NaN, "step": 33700 }, { "epoch": 4.49, "eval_loss": 0.6990655660629272, "eval_runtime": 17.553, "eval_samples_per_second": 4.558, "eval_wer": 0.4728682170542636, "step": 33700 }, { "epoch": 4.51, "learning_rate": 9.850215565136228e-05, "loss": NaN, "step": 33800 }, { "epoch": 4.51, "eval_loss": 0.6776248216629028, "eval_runtime": 17.5252, "eval_samples_per_second": 4.565, "eval_wer": 0.47131782945736433, "step": 33800 }, { "epoch": 4.52, "learning_rate": 9.849771100937821e-05, "loss": NaN, "step": 33900 }, { "epoch": 4.52, "eval_loss": 0.6578621864318848, "eval_runtime": 17.5632, "eval_samples_per_second": 4.555, "eval_wer": 0.4728682170542636, "step": 33900 }, { "epoch": 4.53, "learning_rate": 9.84932663673941e-05, "loss": NaN, "step": 34000 }, { "epoch": 4.53, "eval_loss": 0.6970942616462708, "eval_runtime": 17.555, "eval_samples_per_second": 4.557, "eval_wer": 0.4868217054263566, "step": 34000 }, { "epoch": 4.55, "learning_rate": 9.848882172541002e-05, "loss": NaN, "step": 34100 }, { "epoch": 4.55, "eval_loss": 0.6826914548873901, "eval_runtime": 17.5393, "eval_samples_per_second": 4.561, "eval_wer": 0.5069767441860465, "step": 34100 }, { "epoch": 4.56, "learning_rate": 9.848437708342594e-05, "loss": NaN, "step": 34200 }, { "epoch": 4.56, "eval_loss": 0.6816051602363586, "eval_runtime": 17.5537, "eval_samples_per_second": 4.557, "eval_wer": 0.4728682170542636, "step": 34200 }, { "epoch": 4.57, "learning_rate": 9.847993244144185e-05, "loss": NaN, "step": 34300 }, { "epoch": 4.57, "eval_loss": 0.7528648972511292, "eval_runtime": 17.5699, "eval_samples_per_second": 4.553, "eval_wer": 0.49612403100775193, "step": 34300 }, { "epoch": 4.59, "learning_rate": 9.847548779945775e-05, "loss": NaN, "step": 34400 }, { "epoch": 4.59, "eval_loss": 0.6876388788223267, "eval_runtime": 17.4887, "eval_samples_per_second": 4.574, "eval_wer": 0.5085271317829457, "step": 34400 }, { "epoch": 4.6, "learning_rate": 9.847104315747367e-05, "loss": NaN, "step": 34500 }, { "epoch": 4.6, "eval_loss": 0.7198226451873779, "eval_runtime": 17.4698, "eval_samples_per_second": 4.579, "eval_wer": 0.5069767441860465, "step": 34500 }, { "epoch": 4.61, "learning_rate": 9.846659851548959e-05, "loss": NaN, "step": 34600 }, { "epoch": 4.61, "eval_loss": 0.7185400724411011, "eval_runtime": 17.5466, "eval_samples_per_second": 4.559, "eval_wer": 0.47751937984496123, "step": 34600 }, { "epoch": 4.63, "learning_rate": 9.84621538735055e-05, "loss": NaN, "step": 34700 }, { "epoch": 4.63, "eval_loss": 0.7706559896469116, "eval_runtime": 17.5053, "eval_samples_per_second": 4.57, "eval_wer": 0.5069767441860465, "step": 34700 }, { "epoch": 4.64, "learning_rate": 9.845770923152141e-05, "loss": NaN, "step": 34800 }, { "epoch": 4.64, "eval_loss": 0.8254127502441406, "eval_runtime": 17.5689, "eval_samples_per_second": 4.553, "eval_wer": 0.4945736434108527, "step": 34800 }, { "epoch": 4.65, "learning_rate": 9.845326458953732e-05, "loss": NaN, "step": 34900 }, { "epoch": 4.65, "eval_loss": 0.8003772497177124, "eval_runtime": 17.4204, "eval_samples_per_second": 4.592, "eval_wer": 0.4883720930232558, "step": 34900 }, { "epoch": 4.67, "learning_rate": 9.844881994755323e-05, "loss": NaN, "step": 35000 }, { "epoch": 4.67, "eval_loss": 0.6992226839065552, "eval_runtime": 17.4907, "eval_samples_per_second": 4.574, "eval_wer": 0.5085271317829457, "step": 35000 }, { "epoch": 4.68, "learning_rate": 9.844437530556914e-05, "loss": NaN, "step": 35100 }, { "epoch": 4.68, "eval_loss": 0.7514958381652832, "eval_runtime": 17.4878, "eval_samples_per_second": 4.575, "eval_wer": 0.49612403100775193, "step": 35100 }, { "epoch": 4.69, "learning_rate": 9.843993066358505e-05, "loss": NaN, "step": 35200 }, { "epoch": 4.69, "eval_loss": 0.7265327572822571, "eval_runtime": 17.4636, "eval_samples_per_second": 4.581, "eval_wer": 0.4682170542635659, "step": 35200 }, { "epoch": 4.71, "learning_rate": 9.843548602160096e-05, "loss": NaN, "step": 35300 }, { "epoch": 4.71, "eval_loss": 0.7364674806594849, "eval_runtime": 17.5101, "eval_samples_per_second": 4.569, "eval_wer": 0.47751937984496123, "step": 35300 }, { "epoch": 4.72, "learning_rate": 9.843104137961688e-05, "loss": NaN, "step": 35400 }, { "epoch": 4.72, "eval_loss": 0.6975224018096924, "eval_runtime": 17.4555, "eval_samples_per_second": 4.583, "eval_wer": 0.47751937984496123, "step": 35400 }, { "epoch": 4.73, "learning_rate": 9.842659673763279e-05, "loss": NaN, "step": 35500 }, { "epoch": 4.73, "eval_loss": 0.6800852417945862, "eval_runtime": 17.5482, "eval_samples_per_second": 4.559, "eval_wer": 0.4868217054263566, "step": 35500 }, { "epoch": 4.75, "learning_rate": 9.84221520956487e-05, "loss": NaN, "step": 35600 }, { "epoch": 4.75, "eval_loss": 0.7129591703414917, "eval_runtime": 17.5425, "eval_samples_per_second": 4.56, "eval_wer": 0.4992248062015504, "step": 35600 }, { "epoch": 4.76, "learning_rate": 9.841770745366461e-05, "loss": NaN, "step": 35700 }, { "epoch": 4.76, "eval_loss": 0.7202149033546448, "eval_runtime": 17.5335, "eval_samples_per_second": 4.563, "eval_wer": 0.4930232558139535, "step": 35700 }, { "epoch": 4.77, "learning_rate": 9.841326281168053e-05, "loss": NaN, "step": 35800 }, { "epoch": 4.77, "eval_loss": 0.6712242960929871, "eval_runtime": 17.5011, "eval_samples_per_second": 4.571, "eval_wer": 0.48527131782945737, "step": 35800 }, { "epoch": 4.79, "learning_rate": 9.840881816969643e-05, "loss": NaN, "step": 35900 }, { "epoch": 4.79, "eval_loss": 0.8096708059310913, "eval_runtime": 17.5196, "eval_samples_per_second": 4.566, "eval_wer": 0.49147286821705427, "step": 35900 }, { "epoch": 4.8, "learning_rate": 9.840437352771234e-05, "loss": NaN, "step": 36000 }, { "epoch": 4.8, "eval_loss": 0.6871185898780823, "eval_runtime": 17.4561, "eval_samples_per_second": 4.583, "eval_wer": 0.47751937984496123, "step": 36000 } ], "max_steps": 2250000, "num_train_epochs": 300, "total_flos": 2.3169703440557314e+19, "trial_name": null, "trial_params": null }