{ "best_metric": null, "best_model_checkpoint": null, "epoch": 14.999946469675072, "global_step": 140100, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.01, "eval_loss": 3.625196695327759, "eval_runtime": 48.6485, "eval_samples_per_second": 41.666, "eval_steps_per_second": 5.221, "eval_wer": 1.0, "step": 100 }, { "epoch": 0.02, "eval_loss": 3.190624713897705, "eval_runtime": 48.8326, "eval_samples_per_second": 41.509, "eval_steps_per_second": 5.201, "eval_wer": 1.0, "step": 200 }, { "epoch": 0.03, "eval_loss": 3.108981132507324, "eval_runtime": 48.8211, "eval_samples_per_second": 41.519, "eval_steps_per_second": 5.203, "eval_wer": 1.0, "step": 300 }, { "epoch": 0.04, "eval_loss": 1.8795998096466064, "eval_runtime": 48.7588, "eval_samples_per_second": 41.572, "eval_steps_per_second": 5.209, "eval_wer": 0.9954865499187578, "step": 400 }, { "epoch": 0.05, "learning_rate": 0.00029759999999999997, "loss": 6.2575, "step": 500 }, { "epoch": 0.05, "eval_loss": 1.3514989614486694, "eval_runtime": 48.9732, "eval_samples_per_second": 41.39, "eval_steps_per_second": 5.187, "eval_wer": 0.9057591623036649, "step": 500 }, { "epoch": 0.06, "eval_loss": 1.1209492683410645, "eval_runtime": 48.2472, "eval_samples_per_second": 42.013, "eval_steps_per_second": 5.265, "eval_wer": 0.8328218089907926, "step": 600 }, { "epoch": 0.07, "eval_loss": 1.1404383182525635, "eval_runtime": 48.9274, "eval_samples_per_second": 41.429, "eval_steps_per_second": 5.191, "eval_wer": 0.8309261599566709, "step": 700 }, { "epoch": 0.09, "eval_loss": 1.0599348545074463, "eval_runtime": 48.4506, "eval_samples_per_second": 41.836, "eval_steps_per_second": 5.242, "eval_wer": 0.8021303484383463, "step": 800 }, { "epoch": 0.1, "eval_loss": 0.9901070594787598, "eval_runtime": 48.6803, "eval_samples_per_second": 41.639, "eval_steps_per_second": 5.218, "eval_wer": 0.8335439610037912, "step": 900 }, { "epoch": 0.11, "learning_rate": 0.0002989340974212034, "loss": 0.7737, "step": 1000 }, { "epoch": 0.11, "eval_loss": 0.884602963924408, "eval_runtime": 48.4241, "eval_samples_per_second": 41.859, "eval_steps_per_second": 5.245, "eval_wer": 0.7400252753204549, "step": 1000 }, { "epoch": 0.12, "eval_loss": 0.9971189498901367, "eval_runtime": 48.5998, "eval_samples_per_second": 41.708, "eval_steps_per_second": 5.226, "eval_wer": 0.7820003610760065, "step": 1100 }, { "epoch": 0.13, "eval_loss": 0.8665233850479126, "eval_runtime": 48.3232, "eval_samples_per_second": 41.947, "eval_steps_per_second": 5.256, "eval_wer": 0.7123126918216285, "step": 1200 }, { "epoch": 0.14, "eval_loss": 0.8489500284194946, "eval_runtime": 48.8631, "eval_samples_per_second": 41.483, "eval_steps_per_second": 5.198, "eval_wer": 0.736595053258711, "step": 1300 }, { "epoch": 0.15, "eval_loss": 0.8249963521957397, "eval_runtime": 48.6019, "eval_samples_per_second": 41.706, "eval_steps_per_second": 5.226, "eval_wer": 0.6764758981765662, "step": 1400 }, { "epoch": 0.16, "learning_rate": 0.00029785959885386817, "loss": 0.6183, "step": 1500 }, { "epoch": 0.16, "eval_loss": 0.8290594220161438, "eval_runtime": 48.6721, "eval_samples_per_second": 41.646, "eval_steps_per_second": 5.219, "eval_wer": 0.6965156165372811, "step": 1500 }, { "epoch": 0.17, "eval_loss": 0.7945746779441833, "eval_runtime": 48.366, "eval_samples_per_second": 41.91, "eval_steps_per_second": 5.252, "eval_wer": 0.682253114280556, "step": 1600 }, { "epoch": 0.18, "eval_loss": 0.8239201903343201, "eval_runtime": 49.119, "eval_samples_per_second": 41.267, "eval_steps_per_second": 5.171, "eval_wer": 0.6893843654089186, "step": 1700 }, { "epoch": 0.19, "eval_loss": 0.828230082988739, "eval_runtime": 48.821, "eval_samples_per_second": 41.519, "eval_steps_per_second": 5.203, "eval_wer": 0.6796353132334356, "step": 1800 }, { "epoch": 0.2, "eval_loss": 0.764546275138855, "eval_runtime": 49.1104, "eval_samples_per_second": 41.274, "eval_steps_per_second": 5.172, "eval_wer": 0.6518324607329843, "step": 1900 }, { "epoch": 0.21, "learning_rate": 0.0002967851002865329, "loss": 0.561, "step": 2000 }, { "epoch": 0.21, "eval_loss": 0.7530480623245239, "eval_runtime": 48.5997, "eval_samples_per_second": 41.708, "eval_steps_per_second": 5.226, "eval_wer": 0.6366672684600109, "step": 2000 }, { "epoch": 0.22, "eval_loss": 0.7295656800270081, "eval_runtime": 48.6615, "eval_samples_per_second": 41.655, "eval_steps_per_second": 5.22, "eval_wer": 0.617710778118794, "step": 2100 }, { "epoch": 0.24, "eval_loss": 0.7527036070823669, "eval_runtime": 48.4283, "eval_samples_per_second": 41.856, "eval_steps_per_second": 5.245, "eval_wer": 0.6498465426972377, "step": 2200 }, { "epoch": 0.25, "eval_loss": 0.7209727764129639, "eval_runtime": 48.8209, "eval_samples_per_second": 41.519, "eval_steps_per_second": 5.203, "eval_wer": 0.6316122043690197, "step": 2300 }, { "epoch": 0.26, "eval_loss": 0.7938166856765747, "eval_runtime": 48.2216, "eval_samples_per_second": 42.035, "eval_steps_per_second": 5.267, "eval_wer": 0.6756634771619426, "step": 2400 }, { "epoch": 0.27, "learning_rate": 0.00029571060171919766, "loss": 0.5402, "step": 2500 }, { "epoch": 0.27, "eval_loss": 0.7485235929489136, "eval_runtime": 48.3609, "eval_samples_per_second": 41.914, "eval_steps_per_second": 5.252, "eval_wer": 0.6372088824697599, "step": 2500 }, { "epoch": 0.28, "eval_loss": 0.7146492004394531, "eval_runtime": 48.3522, "eval_samples_per_second": 41.922, "eval_steps_per_second": 5.253, "eval_wer": 0.6132875970391768, "step": 2600 }, { "epoch": 0.29, "eval_loss": 0.7308168411254883, "eval_runtime": 48.4029, "eval_samples_per_second": 41.878, "eval_steps_per_second": 5.248, "eval_wer": 0.6625744719263404, "step": 2700 }, { "epoch": 0.3, "eval_loss": 0.7078224420547485, "eval_runtime": 48.7403, "eval_samples_per_second": 41.588, "eval_steps_per_second": 5.211, "eval_wer": 0.594872720707709, "step": 2800 }, { "epoch": 0.31, "eval_loss": 0.7679122090339661, "eval_runtime": 48.4081, "eval_samples_per_second": 41.873, "eval_steps_per_second": 5.247, "eval_wer": 0.6372991514713847, "step": 2900 }, { "epoch": 0.32, "learning_rate": 0.0002946361031518624, "loss": 0.5303, "step": 3000 }, { "epoch": 0.32, "eval_loss": 0.72626131772995, "eval_runtime": 48.7452, "eval_samples_per_second": 41.584, "eval_steps_per_second": 5.211, "eval_wer": 0.6502076187037371, "step": 3000 }, { "epoch": 0.33, "eval_loss": 0.6612817049026489, "eval_runtime": 48.9995, "eval_samples_per_second": 41.368, "eval_steps_per_second": 5.184, "eval_wer": 0.584582054522477, "step": 3100 }, { "epoch": 0.34, "eval_loss": 0.6783962249755859, "eval_runtime": 48.6023, "eval_samples_per_second": 41.706, "eval_steps_per_second": 5.226, "eval_wer": 0.578263224408738, "step": 3200 }, { "epoch": 0.35, "eval_loss": 0.6908129453659058, "eval_runtime": 48.5922, "eval_samples_per_second": 41.715, "eval_steps_per_second": 5.227, "eval_wer": 0.5833182884997292, "step": 3300 }, { "epoch": 0.36, "eval_loss": 0.6595033407211304, "eval_runtime": 48.473, "eval_samples_per_second": 41.817, "eval_steps_per_second": 5.24, "eval_wer": 0.5825961364867305, "step": 3400 }, { "epoch": 0.37, "learning_rate": 0.0002935616045845272, "loss": 0.503, "step": 3500 }, { "epoch": 0.37, "eval_loss": 0.6716800928115845, "eval_runtime": 48.6209, "eval_samples_per_second": 41.69, "eval_steps_per_second": 5.224, "eval_wer": 0.5937894926882109, "step": 3500 }, { "epoch": 0.39, "eval_loss": 0.6937839984893799, "eval_runtime": 48.9232, "eval_samples_per_second": 41.432, "eval_steps_per_second": 5.192, "eval_wer": 0.5790756454233617, "step": 3600 }, { "epoch": 0.4, "eval_loss": 0.667679488658905, "eval_runtime": 48.3286, "eval_samples_per_second": 41.942, "eval_steps_per_second": 5.256, "eval_wer": 0.6051633868929409, "step": 3700 }, { "epoch": 0.41, "eval_loss": 0.65436190366745, "eval_runtime": 48.7685, "eval_samples_per_second": 41.564, "eval_steps_per_second": 5.208, "eval_wer": 0.555425166997653, "step": 3800 }, { "epoch": 0.42, "eval_loss": 0.6514427661895752, "eval_runtime": 48.532, "eval_samples_per_second": 41.766, "eval_steps_per_second": 5.234, "eval_wer": 0.5727568153096226, "step": 3900 }, { "epoch": 0.43, "learning_rate": 0.00029248710601719195, "loss": 0.4959, "step": 4000 }, { "epoch": 0.43, "eval_loss": 0.6847020983695984, "eval_runtime": 48.5364, "eval_samples_per_second": 41.763, "eval_steps_per_second": 5.233, "eval_wer": 0.6187940061382922, "step": 4000 }, { "epoch": 0.44, "eval_loss": 0.6626438498497009, "eval_runtime": 48.3485, "eval_samples_per_second": 41.925, "eval_steps_per_second": 5.254, "eval_wer": 0.5869290485647228, "step": 4100 }, { "epoch": 0.45, "eval_loss": 0.6669931411743164, "eval_runtime": 48.5641, "eval_samples_per_second": 41.739, "eval_steps_per_second": 5.23, "eval_wer": 0.5699584762592526, "step": 4200 }, { "epoch": 0.46, "eval_loss": 0.6595851182937622, "eval_runtime": 48.6164, "eval_samples_per_second": 41.694, "eval_steps_per_second": 5.225, "eval_wer": 0.584582054522477, "step": 4300 }, { "epoch": 0.47, "eval_loss": 0.6522601246833801, "eval_runtime": 48.5548, "eval_samples_per_second": 41.747, "eval_steps_per_second": 5.231, "eval_wer": 0.5467593428416682, "step": 4400 }, { "epoch": 0.48, "learning_rate": 0.0002914126074498567, "loss": 0.4824, "step": 4500 }, { "epoch": 0.48, "eval_loss": 0.6391969919204712, "eval_runtime": 48.4793, "eval_samples_per_second": 41.812, "eval_steps_per_second": 5.239, "eval_wer": 0.5687849792381297, "step": 4500 }, { "epoch": 0.49, "eval_loss": 0.6561304926872253, "eval_runtime": 48.7756, "eval_samples_per_second": 41.558, "eval_steps_per_second": 5.208, "eval_wer": 0.5686947102365048, "step": 4600 }, { "epoch": 0.5, "eval_loss": 0.6697142124176025, "eval_runtime": 48.9375, "eval_samples_per_second": 41.42, "eval_steps_per_second": 5.19, "eval_wer": 0.581693446470482, "step": 4700 }, { "epoch": 0.51, "eval_loss": 0.6348330974578857, "eval_runtime": 49.0519, "eval_samples_per_second": 41.324, "eval_steps_per_second": 5.178, "eval_wer": 0.5608413070951436, "step": 4800 }, { "epoch": 0.52, "eval_loss": 0.656074047088623, "eval_runtime": 48.3379, "eval_samples_per_second": 41.934, "eval_steps_per_second": 5.255, "eval_wer": 0.5600288860805199, "step": 4900 }, { "epoch": 0.54, "learning_rate": 0.00029033810888252145, "loss": 0.4714, "step": 5000 }, { "epoch": 0.54, "eval_loss": 0.652241051197052, "eval_runtime": 48.5527, "eval_samples_per_second": 41.748, "eval_steps_per_second": 5.231, "eval_wer": 0.6180718541252934, "step": 5000 }, { "epoch": 0.55, "eval_loss": 0.6857942938804626, "eval_runtime": 48.4567, "eval_samples_per_second": 41.831, "eval_steps_per_second": 5.242, "eval_wer": 0.5920743816573388, "step": 5100 }, { "epoch": 0.56, "eval_loss": 0.6706011891365051, "eval_runtime": 48.9061, "eval_samples_per_second": 41.447, "eval_steps_per_second": 5.194, "eval_wer": 0.5497382198952879, "step": 5200 }, { "epoch": 0.57, "eval_loss": 0.7122880220413208, "eval_runtime": 49.0884, "eval_samples_per_second": 41.293, "eval_steps_per_second": 5.174, "eval_wer": 0.5768189203827405, "step": 5300 }, { "epoch": 0.58, "eval_loss": 0.659943699836731, "eval_runtime": 49.0325, "eval_samples_per_second": 41.34, "eval_steps_per_second": 5.18, "eval_wer": 0.6100379129806824, "step": 5400 }, { "epoch": 0.59, "learning_rate": 0.00028926361031518625, "loss": 0.471, "step": 5500 }, { "epoch": 0.59, "eval_loss": 0.6421207785606384, "eval_runtime": 48.992, "eval_samples_per_second": 41.374, "eval_steps_per_second": 5.185, "eval_wer": 0.5625564181260155, "step": 5500 }, { "epoch": 0.6, "eval_loss": 0.6395331621170044, "eval_runtime": 48.7511, "eval_samples_per_second": 41.579, "eval_steps_per_second": 5.21, "eval_wer": 0.5752843473551182, "step": 5600 }, { "epoch": 0.61, "eval_loss": 0.6788127422332764, "eval_runtime": 48.7567, "eval_samples_per_second": 41.574, "eval_steps_per_second": 5.21, "eval_wer": 0.5481133778660408, "step": 5700 }, { "epoch": 0.62, "eval_loss": 0.6385824084281921, "eval_runtime": 48.9331, "eval_samples_per_second": 41.424, "eval_steps_per_second": 5.191, "eval_wer": 0.5516338689294097, "step": 5800 }, { "epoch": 0.63, "eval_loss": 0.6694206595420837, "eval_runtime": 48.8182, "eval_samples_per_second": 41.521, "eval_steps_per_second": 5.203, "eval_wer": 0.5912619606427153, "step": 5900 }, { "epoch": 0.64, "learning_rate": 0.000288189111747851, "loss": 0.4707, "step": 6000 }, { "epoch": 0.64, "eval_loss": 0.6250674724578857, "eval_runtime": 48.8318, "eval_samples_per_second": 41.51, "eval_steps_per_second": 5.202, "eval_wer": 0.5698682072576278, "step": 6000 }, { "epoch": 0.65, "eval_loss": 0.6243389844894409, "eval_runtime": 48.6735, "eval_samples_per_second": 41.645, "eval_steps_per_second": 5.218, "eval_wer": 0.5566889330204008, "step": 6100 }, { "epoch": 0.66, "eval_loss": 0.6645160913467407, "eval_runtime": 48.8686, "eval_samples_per_second": 41.479, "eval_steps_per_second": 5.198, "eval_wer": 0.5629174941325149, "step": 6200 }, { "epoch": 0.67, "eval_loss": 0.6295756101608276, "eval_runtime": 49.1221, "eval_samples_per_second": 41.265, "eval_steps_per_second": 5.171, "eval_wer": 0.5895468496118433, "step": 6300 }, { "epoch": 0.69, "eval_loss": 0.6077612042427063, "eval_runtime": 48.8377, "eval_samples_per_second": 41.505, "eval_steps_per_second": 5.201, "eval_wer": 0.518324607329843, "step": 6400 }, { "epoch": 0.7, "learning_rate": 0.00028711461318051574, "loss": 0.4632, "step": 6500 }, { "epoch": 0.7, "eval_loss": 0.6269996762275696, "eval_runtime": 48.7596, "eval_samples_per_second": 41.571, "eval_steps_per_second": 5.209, "eval_wer": 0.5619245351146416, "step": 6500 }, { "epoch": 0.71, "eval_loss": 0.6050315499305725, "eval_runtime": 49.3099, "eval_samples_per_second": 41.107, "eval_steps_per_second": 5.151, "eval_wer": 0.5335800686044412, "step": 6600 }, { "epoch": 0.72, "eval_loss": 0.6185252666473389, "eval_runtime": 49.0917, "eval_samples_per_second": 41.29, "eval_steps_per_second": 5.174, "eval_wer": 0.5448636938075465, "step": 6700 }, { "epoch": 0.73, "eval_loss": 0.6281481385231018, "eval_runtime": 48.533, "eval_samples_per_second": 41.765, "eval_steps_per_second": 5.234, "eval_wer": 0.5645423361617621, "step": 6800 }, { "epoch": 0.74, "eval_loss": 0.5876803398132324, "eval_runtime": 48.7707, "eval_samples_per_second": 41.562, "eval_steps_per_second": 5.208, "eval_wer": 0.5083950171511104, "step": 6900 }, { "epoch": 0.75, "learning_rate": 0.0002860401146131805, "loss": 0.4514, "step": 7000 }, { "epoch": 0.75, "eval_loss": 0.6199076175689697, "eval_runtime": 49.1573, "eval_samples_per_second": 41.235, "eval_steps_per_second": 5.167, "eval_wer": 0.5402599747246796, "step": 7000 }, { "epoch": 0.76, "eval_loss": 0.6293303966522217, "eval_runtime": 48.9241, "eval_samples_per_second": 41.432, "eval_steps_per_second": 5.192, "eval_wer": 0.5275320454955769, "step": 7100 }, { "epoch": 0.77, "eval_loss": 0.6289793848991394, "eval_runtime": 49.1249, "eval_samples_per_second": 41.262, "eval_steps_per_second": 5.17, "eval_wer": 0.5446831558042968, "step": 7200 }, { "epoch": 0.78, "eval_loss": 0.613017737865448, "eval_runtime": 48.9639, "eval_samples_per_second": 41.398, "eval_steps_per_second": 5.187, "eval_wer": 0.5372810976710598, "step": 7300 }, { "epoch": 0.79, "eval_loss": 0.6137964129447937, "eval_runtime": 49.0353, "eval_samples_per_second": 41.338, "eval_steps_per_second": 5.18, "eval_wer": 0.5285250045134501, "step": 7400 }, { "epoch": 0.8, "learning_rate": 0.00028496561604584523, "loss": 0.4457, "step": 7500 }, { "epoch": 0.8, "eval_loss": 0.6040118336677551, "eval_runtime": 48.8487, "eval_samples_per_second": 41.495, "eval_steps_per_second": 5.2, "eval_wer": 0.5259072034663297, "step": 7500 }, { "epoch": 0.81, "eval_loss": 0.622002363204956, "eval_runtime": 48.8408, "eval_samples_per_second": 41.502, "eval_steps_per_second": 5.201, "eval_wer": 0.56860444123488, "step": 7600 }, { "epoch": 0.82, "eval_loss": 0.5914533734321594, "eval_runtime": 48.6432, "eval_samples_per_second": 41.671, "eval_steps_per_second": 5.222, "eval_wer": 0.5164289582957212, "step": 7700 }, { "epoch": 0.84, "eval_loss": 0.6269855499267578, "eval_runtime": 48.6798, "eval_samples_per_second": 41.639, "eval_steps_per_second": 5.218, "eval_wer": 0.5288860805199495, "step": 7800 }, { "epoch": 0.85, "eval_loss": 0.6224400997161865, "eval_runtime": 48.9678, "eval_samples_per_second": 41.395, "eval_steps_per_second": 5.187, "eval_wer": 0.55145333092616, "step": 7900 }, { "epoch": 0.86, "learning_rate": 0.00028389111747851003, "loss": 0.4458, "step": 8000 }, { "epoch": 0.86, "eval_loss": 0.6161192059516907, "eval_runtime": 48.8802, "eval_samples_per_second": 41.469, "eval_steps_per_second": 5.196, "eval_wer": 0.5323163025816935, "step": 8000 }, { "epoch": 0.87, "eval_loss": 0.5826652646064758, "eval_runtime": 48.8638, "eval_samples_per_second": 41.483, "eval_steps_per_second": 5.198, "eval_wer": 0.5121863152193536, "step": 8100 }, { "epoch": 0.88, "eval_loss": 0.6067497730255127, "eval_runtime": 48.7237, "eval_samples_per_second": 41.602, "eval_steps_per_second": 5.213, "eval_wer": 0.5202202563639646, "step": 8200 }, { "epoch": 0.89, "eval_loss": 0.6086713671684265, "eval_runtime": 49.0772, "eval_samples_per_second": 41.302, "eval_steps_per_second": 5.176, "eval_wer": 0.5192272973460913, "step": 8300 }, { "epoch": 0.9, "eval_loss": 0.6859478950500488, "eval_runtime": 48.6001, "eval_samples_per_second": 41.708, "eval_steps_per_second": 5.226, "eval_wer": 0.5796172594331107, "step": 8400 }, { "epoch": 0.91, "learning_rate": 0.0002828187679083094, "loss": 0.4409, "step": 8500 }, { "epoch": 0.91, "eval_loss": 0.6179741621017456, "eval_runtime": 48.6105, "eval_samples_per_second": 41.699, "eval_steps_per_second": 5.225, "eval_wer": 0.5130890052356021, "step": 8500 }, { "epoch": 0.92, "eval_loss": 0.5945226550102234, "eval_runtime": 49.073, "eval_samples_per_second": 41.306, "eval_steps_per_second": 5.176, "eval_wer": 0.49476439790575916, "step": 8600 }, { "epoch": 0.93, "eval_loss": 0.5967476963996887, "eval_runtime": 49.0045, "eval_samples_per_second": 41.364, "eval_steps_per_second": 5.183, "eval_wer": 0.553168441957032, "step": 8700 }, { "epoch": 0.94, "eval_loss": 0.5770399570465088, "eval_runtime": 48.7028, "eval_samples_per_second": 41.62, "eval_steps_per_second": 5.215, "eval_wer": 0.4961184329301318, "step": 8800 }, { "epoch": 0.95, "eval_loss": 0.5808792114257812, "eval_runtime": 48.8469, "eval_samples_per_second": 41.497, "eval_steps_per_second": 5.2, "eval_wer": 0.5203105253655894, "step": 8900 }, { "epoch": 0.96, "learning_rate": 0.00028174426934097417, "loss": 0.4305, "step": 9000 }, { "epoch": 0.96, "eval_loss": 0.5804657936096191, "eval_runtime": 49.9542, "eval_samples_per_second": 40.577, "eval_steps_per_second": 5.085, "eval_wer": 0.5038815670698682, "step": 9000 }, { "epoch": 0.97, "eval_loss": 0.5873450040817261, "eval_runtime": 48.5365, "eval_samples_per_second": 41.762, "eval_steps_per_second": 5.233, "eval_wer": 0.5187759523379671, "step": 9100 }, { "epoch": 0.98, "eval_loss": 0.6276754140853882, "eval_runtime": 48.6742, "eval_samples_per_second": 41.644, "eval_steps_per_second": 5.218, "eval_wer": 0.5516338689294097, "step": 9200 }, { "epoch": 1.0, "eval_loss": 0.5726681351661682, "eval_runtime": 48.9081, "eval_samples_per_second": 41.445, "eval_steps_per_second": 5.193, "eval_wer": 0.5052356020942408, "step": 9300 }, { "epoch": 1.01, "eval_loss": 0.5858115553855896, "eval_runtime": 48.4967, "eval_samples_per_second": 41.797, "eval_steps_per_second": 5.237, "eval_wer": 0.5122765842209785, "step": 9400 }, { "epoch": 1.02, "learning_rate": 0.0002806719197707736, "loss": 0.4264, "step": 9500 }, { "epoch": 1.02, "eval_loss": 0.5691950917243958, "eval_runtime": 48.3307, "eval_samples_per_second": 41.94, "eval_steps_per_second": 5.255, "eval_wer": 0.49684058494313055, "step": 9500 }, { "epoch": 1.03, "eval_loss": 0.5954357981681824, "eval_runtime": 48.3796, "eval_samples_per_second": 41.898, "eval_steps_per_second": 5.25, "eval_wer": 0.5117349702112295, "step": 9600 }, { "epoch": 1.04, "eval_loss": 0.5903880000114441, "eval_runtime": 48.2992, "eval_samples_per_second": 41.968, "eval_steps_per_second": 5.259, "eval_wer": 0.5075825961364867, "step": 9700 }, { "epoch": 1.05, "eval_loss": 0.6046377420425415, "eval_runtime": 48.5859, "eval_samples_per_second": 41.72, "eval_steps_per_second": 5.228, "eval_wer": 0.5101101281819823, "step": 9800 }, { "epoch": 1.06, "eval_loss": 0.5616235136985779, "eval_runtime": 48.5046, "eval_samples_per_second": 41.79, "eval_steps_per_second": 5.237, "eval_wer": 0.492597941866763, "step": 9900 }, { "epoch": 1.07, "learning_rate": 0.00027959742120343837, "loss": 0.4176, "step": 10000 }, { "epoch": 1.07, "eval_loss": 0.5971259474754333, "eval_runtime": 48.5096, "eval_samples_per_second": 41.786, "eval_steps_per_second": 5.236, "eval_wer": 0.5368297526629355, "step": 10000 }, { "epoch": 1.08, "eval_loss": 0.5706018805503845, "eval_runtime": 48.1561, "eval_samples_per_second": 42.092, "eval_steps_per_second": 5.275, "eval_wer": 0.4940422458927604, "step": 10100 }, { "epoch": 1.09, "eval_loss": 0.5612200498580933, "eval_runtime": 48.0575, "eval_samples_per_second": 42.179, "eval_steps_per_second": 5.285, "eval_wer": 0.5032496840584944, "step": 10200 }, { "epoch": 1.1, "eval_loss": 0.5671827793121338, "eval_runtime": 48.4862, "eval_samples_per_second": 41.806, "eval_steps_per_second": 5.239, "eval_wer": 0.4944033218992598, "step": 10300 }, { "epoch": 1.11, "eval_loss": 0.5915140509605408, "eval_runtime": 48.186, "eval_samples_per_second": 42.066, "eval_steps_per_second": 5.271, "eval_wer": 0.5218450983932118, "step": 10400 }, { "epoch": 1.12, "learning_rate": 0.00027852292263610317, "loss": 0.4033, "step": 10500 }, { "epoch": 1.12, "eval_loss": 0.5705661177635193, "eval_runtime": 48.5793, "eval_samples_per_second": 41.726, "eval_steps_per_second": 5.229, "eval_wer": 0.505145333092616, "step": 10500 }, { "epoch": 1.13, "eval_loss": 0.56607985496521, "eval_runtime": 48.4918, "eval_samples_per_second": 41.801, "eval_steps_per_second": 5.238, "eval_wer": 0.4934103628813865, "step": 10600 }, { "epoch": 1.15, "eval_loss": 0.5724338889122009, "eval_runtime": 48.2921, "eval_samples_per_second": 41.974, "eval_steps_per_second": 5.26, "eval_wer": 0.49025094782451706, "step": 10700 }, { "epoch": 1.16, "eval_loss": 0.5792076587677002, "eval_runtime": 48.2324, "eval_samples_per_second": 42.026, "eval_steps_per_second": 5.266, "eval_wer": 0.49395197689113557, "step": 10800 }, { "epoch": 1.17, "eval_loss": 0.5744290351867676, "eval_runtime": 48.5673, "eval_samples_per_second": 41.736, "eval_steps_per_second": 5.23, "eval_wer": 0.49106336883914065, "step": 10900 }, { "epoch": 1.18, "learning_rate": 0.00027744842406876786, "loss": 0.392, "step": 11000 }, { "epoch": 1.18, "eval_loss": 0.5767287015914917, "eval_runtime": 48.5934, "eval_samples_per_second": 41.714, "eval_steps_per_second": 5.227, "eval_wer": 0.5161581512908467, "step": 11000 }, { "epoch": 1.19, "eval_loss": 0.5588058829307556, "eval_runtime": 48.5001, "eval_samples_per_second": 41.794, "eval_steps_per_second": 5.237, "eval_wer": 0.4834807727026539, "step": 11100 }, { "epoch": 1.2, "eval_loss": 0.5609337687492371, "eval_runtime": 48.6478, "eval_samples_per_second": 41.667, "eval_steps_per_second": 5.221, "eval_wer": 0.4922368658602636, "step": 11200 }, { "epoch": 1.21, "eval_loss": 0.5889888405799866, "eval_runtime": 48.4613, "eval_samples_per_second": 41.827, "eval_steps_per_second": 5.241, "eval_wer": 0.49142444484564, "step": 11300 }, { "epoch": 1.22, "eval_loss": 0.5525108575820923, "eval_runtime": 48.6323, "eval_samples_per_second": 41.68, "eval_steps_per_second": 5.223, "eval_wer": 0.489709333814768, "step": 11400 }, { "epoch": 1.23, "learning_rate": 0.0002763739255014326, "loss": 0.387, "step": 11500 }, { "epoch": 1.23, "eval_loss": 0.5704483389854431, "eval_runtime": 48.2001, "eval_samples_per_second": 42.054, "eval_steps_per_second": 5.27, "eval_wer": 0.5050550640909911, "step": 11500 }, { "epoch": 1.24, "eval_loss": 0.5538840889930725, "eval_runtime": 48.397, "eval_samples_per_second": 41.883, "eval_steps_per_second": 5.248, "eval_wer": 0.5013540350243726, "step": 11600 }, { "epoch": 1.25, "eval_loss": 0.5473034381866455, "eval_runtime": 48.5532, "eval_samples_per_second": 41.748, "eval_steps_per_second": 5.231, "eval_wer": 0.48817476078714567, "step": 11700 }, { "epoch": 1.26, "eval_loss": 0.5661569237709045, "eval_runtime": 48.3301, "eval_samples_per_second": 41.941, "eval_steps_per_second": 5.256, "eval_wer": 0.5003610760064994, "step": 11800 }, { "epoch": 1.27, "eval_loss": 0.5784680247306824, "eval_runtime": 48.4292, "eval_samples_per_second": 41.855, "eval_steps_per_second": 5.245, "eval_wer": 0.5220256363964615, "step": 11900 }, { "epoch": 1.28, "learning_rate": 0.0002752994269340974, "loss": 0.3956, "step": 12000 }, { "epoch": 1.28, "eval_loss": 0.5989814400672913, "eval_runtime": 48.3584, "eval_samples_per_second": 41.916, "eval_steps_per_second": 5.252, "eval_wer": 0.5113738942047301, "step": 12000 }, { "epoch": 1.3, "eval_loss": 0.549746036529541, "eval_runtime": 48.5897, "eval_samples_per_second": 41.717, "eval_steps_per_second": 5.227, "eval_wer": 0.4895287958115183, "step": 12100 }, { "epoch": 1.31, "eval_loss": 0.5537735819816589, "eval_runtime": 48.5304, "eval_samples_per_second": 41.768, "eval_steps_per_second": 5.234, "eval_wer": 0.4895287958115183, "step": 12200 }, { "epoch": 1.32, "eval_loss": 0.5651851296424866, "eval_runtime": 48.2022, "eval_samples_per_second": 42.052, "eval_steps_per_second": 5.269, "eval_wer": 0.4913341758440152, "step": 12300 }, { "epoch": 1.33, "eval_loss": 0.5682100057601929, "eval_runtime": 48.2298, "eval_samples_per_second": 42.028, "eval_steps_per_second": 5.266, "eval_wer": 0.5128181982307276, "step": 12400 }, { "epoch": 1.34, "learning_rate": 0.00027422492836676215, "loss": 0.4043, "step": 12500 }, { "epoch": 1.34, "eval_loss": 0.5829596519470215, "eval_runtime": 48.3024, "eval_samples_per_second": 41.965, "eval_steps_per_second": 5.259, "eval_wer": 0.49990973099837516, "step": 12500 }, { "epoch": 1.35, "eval_loss": 0.5685592889785767, "eval_runtime": 48.5496, "eval_samples_per_second": 41.751, "eval_steps_per_second": 5.232, "eval_wer": 0.4864596497562737, "step": 12600 }, { "epoch": 1.36, "eval_loss": 0.5688390135765076, "eval_runtime": 48.1792, "eval_samples_per_second": 42.072, "eval_steps_per_second": 5.272, "eval_wer": 0.49368116988626104, "step": 12700 }, { "epoch": 1.37, "eval_loss": 0.575319230556488, "eval_runtime": 48.6663, "eval_samples_per_second": 41.651, "eval_steps_per_second": 5.219, "eval_wer": 0.503430222061744, "step": 12800 }, { "epoch": 1.38, "eval_loss": 0.5897743701934814, "eval_runtime": 48.6109, "eval_samples_per_second": 41.698, "eval_steps_per_second": 5.225, "eval_wer": 0.48654991875789855, "step": 12900 }, { "epoch": 1.39, "learning_rate": 0.0002731504297994269, "loss": 0.3997, "step": 13000 }, { "epoch": 1.39, "eval_loss": 0.5723254680633545, "eval_runtime": 48.325, "eval_samples_per_second": 41.945, "eval_steps_per_second": 5.256, "eval_wer": 0.4962989709333815, "step": 13000 }, { "epoch": 1.4, "eval_loss": 0.5766825675964355, "eval_runtime": 48.386, "eval_samples_per_second": 41.892, "eval_steps_per_second": 5.249, "eval_wer": 0.4985556959740025, "step": 13100 }, { "epoch": 1.41, "eval_loss": 0.5959895849227905, "eval_runtime": 48.351, "eval_samples_per_second": 41.923, "eval_steps_per_second": 5.253, "eval_wer": 0.5083950171511104, "step": 13200 }, { "epoch": 1.42, "eval_loss": 0.5859235525131226, "eval_runtime": 49.246, "eval_samples_per_second": 41.161, "eval_steps_per_second": 5.158, "eval_wer": 0.5095685141722333, "step": 13300 }, { "epoch": 1.43, "eval_loss": 0.5490578413009644, "eval_runtime": 48.6297, "eval_samples_per_second": 41.682, "eval_steps_per_second": 5.223, "eval_wer": 0.4784257086116628, "step": 13400 }, { "epoch": 1.45, "learning_rate": 0.00027207593123209164, "loss": 0.3997, "step": 13500 }, { "epoch": 1.45, "eval_loss": 0.5636021494865417, "eval_runtime": 48.4175, "eval_samples_per_second": 41.865, "eval_steps_per_second": 5.246, "eval_wer": 0.5048745260877414, "step": 13500 }, { "epoch": 1.46, "eval_loss": 0.5667489767074585, "eval_runtime": 48.7553, "eval_samples_per_second": 41.575, "eval_steps_per_second": 5.21, "eval_wer": 0.470843112475176, "step": 13600 }, { "epoch": 1.47, "eval_loss": 0.5757395029067993, "eval_runtime": 48.5863, "eval_samples_per_second": 41.72, "eval_steps_per_second": 5.228, "eval_wer": 0.4861888427513992, "step": 13700 }, { "epoch": 1.48, "eval_loss": 0.5444319844245911, "eval_runtime": 48.6276, "eval_samples_per_second": 41.684, "eval_steps_per_second": 5.223, "eval_wer": 0.48158512366853223, "step": 13800 }, { "epoch": 1.49, "eval_loss": 0.5556561350822449, "eval_runtime": 48.6386, "eval_samples_per_second": 41.675, "eval_steps_per_second": 5.222, "eval_wer": 0.4792381296262863, "step": 13900 }, { "epoch": 1.5, "learning_rate": 0.00027100143266475644, "loss": 0.3954, "step": 14000 }, { "epoch": 1.5, "eval_loss": 0.5437420010566711, "eval_runtime": 48.3246, "eval_samples_per_second": 41.946, "eval_steps_per_second": 5.256, "eval_wer": 0.48095324065715833, "step": 14000 }, { "epoch": 1.51, "eval_loss": 0.5488930940628052, "eval_runtime": 48.1775, "eval_samples_per_second": 42.074, "eval_steps_per_second": 5.272, "eval_wer": 0.46741289041343204, "step": 14100 }, { "epoch": 1.52, "eval_loss": 0.541516900062561, "eval_runtime": 48.22, "eval_samples_per_second": 42.037, "eval_steps_per_second": 5.268, "eval_wer": 0.46741289041343204, "step": 14200 }, { "epoch": 1.53, "eval_loss": 0.5481301546096802, "eval_runtime": 49.0132, "eval_samples_per_second": 41.356, "eval_steps_per_second": 5.182, "eval_wer": 0.4901606788228922, "step": 14300 }, { "epoch": 1.54, "eval_loss": 0.547429621219635, "eval_runtime": 48.9783, "eval_samples_per_second": 41.386, "eval_steps_per_second": 5.186, "eval_wer": 0.4763495215742914, "step": 14400 }, { "epoch": 1.55, "learning_rate": 0.0002699269340974212, "loss": 0.3814, "step": 14500 }, { "epoch": 1.55, "eval_loss": 0.5588225722312927, "eval_runtime": 48.3905, "eval_samples_per_second": 41.888, "eval_steps_per_second": 5.249, "eval_wer": 0.4730998375157971, "step": 14500 }, { "epoch": 1.56, "eval_loss": 0.5745720267295837, "eval_runtime": 48.5865, "eval_samples_per_second": 41.719, "eval_steps_per_second": 5.228, "eval_wer": 0.48203646867665645, "step": 14600 }, { "epoch": 1.57, "eval_loss": 0.5675551891326904, "eval_runtime": 48.3999, "eval_samples_per_second": 41.88, "eval_steps_per_second": 5.248, "eval_wer": 0.48835529879039535, "step": 14700 }, { "epoch": 1.58, "eval_loss": 0.5494562387466431, "eval_runtime": 48.3296, "eval_samples_per_second": 41.941, "eval_steps_per_second": 5.256, "eval_wer": 0.47111391948005055, "step": 14800 }, { "epoch": 1.6, "eval_loss": 0.556481659412384, "eval_runtime": 48.4994, "eval_samples_per_second": 41.794, "eval_steps_per_second": 5.237, "eval_wer": 0.4782451706084131, "step": 14900 }, { "epoch": 1.61, "learning_rate": 0.0002688545845272206, "loss": 0.3877, "step": 15000 }, { "epoch": 1.61, "eval_loss": 0.5670508742332458, "eval_runtime": 48.5206, "eval_samples_per_second": 41.776, "eval_steps_per_second": 5.235, "eval_wer": 0.5135403502437264, "step": 15000 }, { "epoch": 1.62, "eval_loss": 0.5511665344238281, "eval_runtime": 48.5022, "eval_samples_per_second": 41.792, "eval_steps_per_second": 5.237, "eval_wer": 0.4868207257627731, "step": 15100 }, { "epoch": 1.63, "eval_loss": 0.5683439373970032, "eval_runtime": 48.7471, "eval_samples_per_second": 41.582, "eval_steps_per_second": 5.211, "eval_wer": 0.4649756273695613, "step": 15200 }, { "epoch": 1.64, "eval_loss": 0.5426750183105469, "eval_runtime": 48.8663, "eval_samples_per_second": 41.481, "eval_steps_per_second": 5.198, "eval_wer": 0.47174580249142445, "step": 15300 }, { "epoch": 1.65, "eval_loss": 0.5519290566444397, "eval_runtime": 48.7168, "eval_samples_per_second": 41.608, "eval_steps_per_second": 5.214, "eval_wer": 0.4650658963711861, "step": 15400 }, { "epoch": 1.66, "learning_rate": 0.0002677800859598854, "loss": 0.387, "step": 15500 }, { "epoch": 1.66, "eval_loss": 0.532715916633606, "eval_runtime": 48.8241, "eval_samples_per_second": 41.516, "eval_steps_per_second": 5.202, "eval_wer": 0.44556779202022023, "step": 15500 }, { "epoch": 1.67, "eval_loss": 0.5371445417404175, "eval_runtime": 48.9886, "eval_samples_per_second": 41.377, "eval_steps_per_second": 5.185, "eval_wer": 0.4673226214118072, "step": 15600 }, { "epoch": 1.68, "eval_loss": 0.5337085127830505, "eval_runtime": 48.4513, "eval_samples_per_second": 41.836, "eval_steps_per_second": 5.242, "eval_wer": 0.47048203646867665, "step": 15700 }, { "epoch": 1.69, "eval_loss": 0.5606207847595215, "eval_runtime": 48.5238, "eval_samples_per_second": 41.773, "eval_steps_per_second": 5.235, "eval_wer": 0.4991875789853764, "step": 15800 }, { "epoch": 1.7, "eval_loss": 0.5253767967224121, "eval_runtime": 48.1837, "eval_samples_per_second": 42.068, "eval_steps_per_second": 5.271, "eval_wer": 0.46127459830294276, "step": 15900 }, { "epoch": 1.71, "learning_rate": 0.00026670558739255013, "loss": 0.3877, "step": 16000 }, { "epoch": 1.71, "eval_loss": 0.5618729591369629, "eval_runtime": 48.4128, "eval_samples_per_second": 41.869, "eval_steps_per_second": 5.247, "eval_wer": 0.48817476078714567, "step": 16000 }, { "epoch": 1.72, "eval_loss": 0.5212122797966003, "eval_runtime": 48.591, "eval_samples_per_second": 41.716, "eval_steps_per_second": 5.227, "eval_wer": 0.4560389962087019, "step": 16100 }, { "epoch": 1.73, "eval_loss": 0.536945641040802, "eval_runtime": 48.7143, "eval_samples_per_second": 41.61, "eval_steps_per_second": 5.214, "eval_wer": 0.4695793464524282, "step": 16200 }, { "epoch": 1.75, "eval_loss": 0.5391582250595093, "eval_runtime": 48.284, "eval_samples_per_second": 41.981, "eval_steps_per_second": 5.261, "eval_wer": 0.46768369741830657, "step": 16300 }, { "epoch": 1.76, "eval_loss": 0.535341739654541, "eval_runtime": 48.3278, "eval_samples_per_second": 41.943, "eval_steps_per_second": 5.256, "eval_wer": 0.4768008665824156, "step": 16400 }, { "epoch": 1.77, "learning_rate": 0.0002656310888252149, "loss": 0.3739, "step": 16500 }, { "epoch": 1.77, "eval_loss": 0.5435373187065125, "eval_runtime": 48.2949, "eval_samples_per_second": 41.971, "eval_steps_per_second": 5.259, "eval_wer": 0.47770355659866404, "step": 16500 }, { "epoch": 1.78, "eval_loss": 0.5342755317687988, "eval_runtime": 48.4704, "eval_samples_per_second": 41.819, "eval_steps_per_second": 5.24, "eval_wer": 0.4884455677920202, "step": 16600 }, { "epoch": 1.79, "eval_loss": 0.5309295058250427, "eval_runtime": 48.3519, "eval_samples_per_second": 41.922, "eval_steps_per_second": 5.253, "eval_wer": 0.4942227838960101, "step": 16700 }, { "epoch": 1.8, "eval_loss": 0.5372947454452515, "eval_runtime": 48.1794, "eval_samples_per_second": 42.072, "eval_steps_per_second": 5.272, "eval_wer": 0.4727387615092977, "step": 16800 }, { "epoch": 1.81, "eval_loss": 0.5549677610397339, "eval_runtime": 48.1603, "eval_samples_per_second": 42.089, "eval_steps_per_second": 5.274, "eval_wer": 0.468586387434555, "step": 16900 }, { "epoch": 1.82, "learning_rate": 0.0002645565902578796, "loss": 0.3884, "step": 17000 }, { "epoch": 1.82, "eval_loss": 0.5485758185386658, "eval_runtime": 48.2605, "eval_samples_per_second": 42.001, "eval_steps_per_second": 5.263, "eval_wer": 0.4825780826864055, "step": 17000 }, { "epoch": 1.83, "eval_loss": 0.5507860779762268, "eval_runtime": 48.2489, "eval_samples_per_second": 42.011, "eval_steps_per_second": 5.264, "eval_wer": 0.4861888427513992, "step": 17100 }, { "epoch": 1.84, "eval_loss": 0.5423179864883423, "eval_runtime": 48.238, "eval_samples_per_second": 42.021, "eval_steps_per_second": 5.266, "eval_wer": 0.48546669073840043, "step": 17200 }, { "epoch": 1.85, "eval_loss": 0.5478358864784241, "eval_runtime": 48.2249, "eval_samples_per_second": 42.032, "eval_steps_per_second": 5.267, "eval_wer": 0.47300956851417225, "step": 17300 }, { "epoch": 1.86, "eval_loss": 0.5437774062156677, "eval_runtime": 48.3875, "eval_samples_per_second": 41.891, "eval_steps_per_second": 5.249, "eval_wer": 0.4937714388878859, "step": 17400 }, { "epoch": 1.87, "learning_rate": 0.0002634820916905444, "loss": 0.3842, "step": 17500 }, { "epoch": 1.87, "eval_loss": 0.5570672750473022, "eval_runtime": 48.3857, "eval_samples_per_second": 41.893, "eval_steps_per_second": 5.249, "eval_wer": 0.4817656616717819, "step": 17500 }, { "epoch": 1.88, "eval_loss": 0.5401641130447388, "eval_runtime": 48.625, "eval_samples_per_second": 41.686, "eval_steps_per_second": 5.224, "eval_wer": 0.4752662935547933, "step": 17600 }, { "epoch": 1.9, "eval_loss": 0.5679250955581665, "eval_runtime": 48.1534, "eval_samples_per_second": 42.095, "eval_steps_per_second": 5.275, "eval_wer": 0.48266835168803035, "step": 17700 }, { "epoch": 1.91, "eval_loss": 0.5385044813156128, "eval_runtime": 49.0923, "eval_samples_per_second": 41.29, "eval_steps_per_second": 5.174, "eval_wer": 0.46416320635493774, "step": 17800 }, { "epoch": 1.92, "eval_loss": 0.5519374012947083, "eval_runtime": 48.6773, "eval_samples_per_second": 41.642, "eval_steps_per_second": 5.218, "eval_wer": 0.4942227838960101, "step": 17900 }, { "epoch": 1.93, "learning_rate": 0.00026240759312320917, "loss": 0.3953, "step": 18000 }, { "epoch": 1.93, "eval_loss": 0.5559102892875671, "eval_runtime": 48.5742, "eval_samples_per_second": 41.73, "eval_steps_per_second": 5.229, "eval_wer": 0.47454414154179453, "step": 18000 }, { "epoch": 1.94, "eval_loss": 0.5656890869140625, "eval_runtime": 48.6283, "eval_samples_per_second": 41.684, "eval_steps_per_second": 5.223, "eval_wer": 0.4962989709333815, "step": 18100 }, { "epoch": 1.95, "eval_loss": 0.5296332836151123, "eval_runtime": 48.245, "eval_samples_per_second": 42.015, "eval_steps_per_second": 5.265, "eval_wer": 0.46416320635493774, "step": 18200 }, { "epoch": 1.96, "eval_loss": 0.5529346466064453, "eval_runtime": 48.1639, "eval_samples_per_second": 42.085, "eval_steps_per_second": 5.274, "eval_wer": 0.4907022928326413, "step": 18300 }, { "epoch": 1.97, "eval_loss": 0.5379639267921448, "eval_runtime": 48.3399, "eval_samples_per_second": 41.932, "eval_steps_per_second": 5.254, "eval_wer": 0.4536017331648312, "step": 18400 }, { "epoch": 1.98, "learning_rate": 0.00026133524355300856, "loss": 0.3745, "step": 18500 }, { "epoch": 1.98, "eval_loss": 0.5275648832321167, "eval_runtime": 48.1451, "eval_samples_per_second": 42.102, "eval_steps_per_second": 5.276, "eval_wer": 0.4677739664199314, "step": 18500 }, { "epoch": 1.99, "eval_loss": 0.5544295310974121, "eval_runtime": 48.5316, "eval_samples_per_second": 41.767, "eval_steps_per_second": 5.234, "eval_wer": 0.4853764217367756, "step": 18600 }, { "epoch": 2.0, "eval_loss": 0.5195306539535522, "eval_runtime": 48.7173, "eval_samples_per_second": 41.607, "eval_steps_per_second": 5.214, "eval_wer": 0.45351146416320637, "step": 18700 }, { "epoch": 2.01, "eval_loss": 0.5165307521820068, "eval_runtime": 49.0261, "eval_samples_per_second": 41.345, "eval_steps_per_second": 5.181, "eval_wer": 0.46353132334356384, "step": 18800 }, { "epoch": 2.02, "eval_loss": 0.5062076449394226, "eval_runtime": 49.107, "eval_samples_per_second": 41.277, "eval_steps_per_second": 5.172, "eval_wer": 0.4431305289763495, "step": 18900 }, { "epoch": 2.03, "learning_rate": 0.00026026074498567336, "loss": 0.3538, "step": 19000 }, { "epoch": 2.03, "eval_loss": 0.5254501104354858, "eval_runtime": 55.2719, "eval_samples_per_second": 36.673, "eval_steps_per_second": 4.595, "eval_wer": 0.4508936631160859, "step": 19000 }, { "epoch": 2.04, "eval_loss": 0.5124872326850891, "eval_runtime": 48.7773, "eval_samples_per_second": 41.556, "eval_steps_per_second": 5.207, "eval_wer": 0.45116447012096045, "step": 19100 }, { "epoch": 2.06, "eval_loss": 0.510496973991394, "eval_runtime": 49.0354, "eval_samples_per_second": 41.337, "eval_steps_per_second": 5.18, "eval_wer": 0.45035204910633686, "step": 19200 }, { "epoch": 2.07, "eval_loss": 0.5000460147857666, "eval_runtime": 48.7939, "eval_samples_per_second": 41.542, "eval_steps_per_second": 5.206, "eval_wer": 0.44899801408196427, "step": 19300 }, { "epoch": 2.08, "eval_loss": 0.5149863362312317, "eval_runtime": 48.7295, "eval_samples_per_second": 41.597, "eval_steps_per_second": 5.212, "eval_wer": 0.45197689113558404, "step": 19400 }, { "epoch": 2.09, "learning_rate": 0.0002591862464183381, "loss": 0.356, "step": 19500 }, { "epoch": 2.09, "eval_loss": 0.5052781701087952, "eval_runtime": 48.7825, "eval_samples_per_second": 41.552, "eval_steps_per_second": 5.207, "eval_wer": 0.43825600288860805, "step": 19500 }, { "epoch": 2.1, "eval_loss": 0.5084646344184875, "eval_runtime": 48.8304, "eval_samples_per_second": 41.511, "eval_steps_per_second": 5.202, "eval_wer": 0.44168622495035204, "step": 19600 }, { "epoch": 2.11, "eval_loss": 0.5229296088218689, "eval_runtime": 49.9067, "eval_samples_per_second": 40.616, "eval_steps_per_second": 5.089, "eval_wer": 0.44899801408196427, "step": 19700 }, { "epoch": 2.12, "eval_loss": 0.5325890183448792, "eval_runtime": 49.0157, "eval_samples_per_second": 41.354, "eval_steps_per_second": 5.182, "eval_wer": 0.44917855208521396, "step": 19800 }, { "epoch": 2.13, "eval_loss": 0.5138561725616455, "eval_runtime": 48.4503, "eval_samples_per_second": 41.837, "eval_steps_per_second": 5.242, "eval_wer": 0.4490882830835891, "step": 19900 }, { "epoch": 2.14, "learning_rate": 0.00025811174785100285, "loss": 0.3474, "step": 20000 }, { "epoch": 2.14, "eval_loss": 0.5133703351020813, "eval_runtime": 48.4371, "eval_samples_per_second": 41.848, "eval_steps_per_second": 5.244, "eval_wer": 0.43843654089185774, "step": 20000 }, { "epoch": 2.15, "eval_loss": 0.5498203635215759, "eval_runtime": 49.0522, "eval_samples_per_second": 41.323, "eval_steps_per_second": 5.178, "eval_wer": 0.46064271529156886, "step": 20100 }, { "epoch": 2.16, "eval_loss": 0.532422661781311, "eval_runtime": 49.1671, "eval_samples_per_second": 41.227, "eval_steps_per_second": 5.166, "eval_wer": 0.4539628091713306, "step": 20200 }, { "epoch": 2.17, "eval_loss": 0.5338008999824524, "eval_runtime": 48.8328, "eval_samples_per_second": 41.509, "eval_steps_per_second": 5.201, "eval_wer": 0.4547752301859541, "step": 20300 }, { "epoch": 2.18, "eval_loss": 0.5075809955596924, "eval_runtime": 49.1135, "eval_samples_per_second": 41.272, "eval_steps_per_second": 5.172, "eval_wer": 0.4424986459649756, "step": 20400 }, { "epoch": 2.19, "learning_rate": 0.0002570393982808023, "loss": 0.345, "step": 20500 }, { "epoch": 2.19, "eval_loss": 0.5252628326416016, "eval_runtime": 48.651, "eval_samples_per_second": 41.664, "eval_steps_per_second": 5.221, "eval_wer": 0.4549557681892038, "step": 20500 }, { "epoch": 2.21, "eval_loss": 0.5125060677528381, "eval_runtime": 48.9394, "eval_samples_per_second": 41.419, "eval_steps_per_second": 5.19, "eval_wer": 0.4618162123126918, "step": 20600 }, { "epoch": 2.22, "eval_loss": 0.5170891284942627, "eval_runtime": 48.4981, "eval_samples_per_second": 41.795, "eval_steps_per_second": 5.237, "eval_wer": 0.44872720707708974, "step": 20700 }, { "epoch": 2.23, "eval_loss": 0.5232036113739014, "eval_runtime": 50.0089, "eval_samples_per_second": 40.533, "eval_steps_per_second": 5.079, "eval_wer": 0.4463802130348438, "step": 20800 }, { "epoch": 2.24, "eval_loss": 0.5297756195068359, "eval_runtime": 49.4494, "eval_samples_per_second": 40.991, "eval_steps_per_second": 5.137, "eval_wer": 0.45883733525907205, "step": 20900 }, { "epoch": 2.25, "learning_rate": 0.000255964899713467, "loss": 0.341, "step": 21000 }, { "epoch": 2.25, "eval_loss": 0.5342200994491577, "eval_runtime": 48.7244, "eval_samples_per_second": 41.601, "eval_steps_per_second": 5.213, "eval_wer": 0.45757356923632425, "step": 21000 }, { "epoch": 2.26, "eval_loss": 0.5514694452285767, "eval_runtime": 48.4433, "eval_samples_per_second": 41.843, "eval_steps_per_second": 5.243, "eval_wer": 0.4677739664199314, "step": 21100 }, { "epoch": 2.27, "eval_loss": 0.5041313767433167, "eval_runtime": 48.8996, "eval_samples_per_second": 41.452, "eval_steps_per_second": 5.194, "eval_wer": 0.44953962809171333, "step": 21200 }, { "epoch": 2.28, "eval_loss": 0.5169302821159363, "eval_runtime": 48.8222, "eval_samples_per_second": 41.518, "eval_steps_per_second": 5.203, "eval_wer": 0.44728290305109225, "step": 21300 }, { "epoch": 2.29, "eval_loss": 0.522724449634552, "eval_runtime": 48.6369, "eval_samples_per_second": 41.676, "eval_steps_per_second": 5.222, "eval_wer": 0.44935909008846364, "step": 21400 }, { "epoch": 2.3, "learning_rate": 0.0002548904011461318, "loss": 0.354, "step": 21500 }, { "epoch": 2.3, "eval_loss": 0.5213791131973267, "eval_runtime": 48.5544, "eval_samples_per_second": 41.747, "eval_steps_per_second": 5.231, "eval_wer": 0.44583859902509476, "step": 21500 }, { "epoch": 2.31, "eval_loss": 0.5303418636322021, "eval_runtime": 49.529, "eval_samples_per_second": 40.925, "eval_steps_per_second": 5.128, "eval_wer": 0.4587470662574472, "step": 21600 }, { "epoch": 2.32, "eval_loss": 0.5236622095108032, "eval_runtime": 48.9492, "eval_samples_per_second": 41.41, "eval_steps_per_second": 5.189, "eval_wer": 0.45974002527532043, "step": 21700 }, { "epoch": 2.33, "eval_loss": 0.5067057013511658, "eval_runtime": 49.3403, "eval_samples_per_second": 41.082, "eval_steps_per_second": 5.148, "eval_wer": 0.44601913702834445, "step": 21800 }, { "epoch": 2.34, "eval_loss": 0.5117440819740295, "eval_runtime": 48.9443, "eval_samples_per_second": 41.414, "eval_steps_per_second": 5.19, "eval_wer": 0.4560389962087019, "step": 21900 }, { "epoch": 2.36, "learning_rate": 0.00025381590257879654, "loss": 0.3333, "step": 22000 }, { "epoch": 2.36, "eval_loss": 0.5104334950447083, "eval_runtime": 49.2332, "eval_samples_per_second": 41.171, "eval_steps_per_second": 5.159, "eval_wer": 0.43590900884636213, "step": 22000 }, { "epoch": 2.37, "eval_loss": 0.5325857996940613, "eval_runtime": 48.7968, "eval_samples_per_second": 41.54, "eval_steps_per_second": 5.205, "eval_wer": 0.46786423542155625, "step": 22100 }, { "epoch": 2.38, "eval_loss": 0.509769082069397, "eval_runtime": 49.5392, "eval_samples_per_second": 40.917, "eval_steps_per_second": 5.127, "eval_wer": 0.45098393211771076, "step": 22200 }, { "epoch": 2.39, "eval_loss": 0.5043946504592896, "eval_runtime": 49.0673, "eval_samples_per_second": 41.311, "eval_steps_per_second": 5.177, "eval_wer": 0.44448456400072217, "step": 22300 }, { "epoch": 2.4, "eval_loss": 0.5219407677650452, "eval_runtime": 49.3521, "eval_samples_per_second": 41.072, "eval_steps_per_second": 5.147, "eval_wer": 0.4489077450803394, "step": 22400 }, { "epoch": 2.41, "learning_rate": 0.0002527414040114613, "loss": 0.3514, "step": 22500 }, { "epoch": 2.41, "eval_loss": 0.4986798167228699, "eval_runtime": 48.8881, "eval_samples_per_second": 41.462, "eval_steps_per_second": 5.196, "eval_wer": 0.4433110669795992, "step": 22500 }, { "epoch": 2.42, "eval_loss": 0.5008650422096252, "eval_runtime": 48.9214, "eval_samples_per_second": 41.434, "eval_steps_per_second": 5.192, "eval_wer": 0.4338328218089908, "step": 22600 }, { "epoch": 2.43, "eval_loss": 0.5252286195755005, "eval_runtime": 48.9441, "eval_samples_per_second": 41.415, "eval_steps_per_second": 5.19, "eval_wer": 0.44439429499909733, "step": 22700 }, { "epoch": 2.44, "eval_loss": 0.4861030876636505, "eval_runtime": 49.1509, "eval_samples_per_second": 41.24, "eval_steps_per_second": 5.168, "eval_wer": 0.42688210868387794, "step": 22800 }, { "epoch": 2.45, "eval_loss": 0.5156984925270081, "eval_runtime": 48.9934, "eval_samples_per_second": 41.373, "eval_steps_per_second": 5.184, "eval_wer": 0.44213756995847625, "step": 22900 }, { "epoch": 2.46, "learning_rate": 0.00025166690544412603, "loss": 0.3444, "step": 23000 }, { "epoch": 2.46, "eval_loss": 0.5277285575866699, "eval_runtime": 49.0393, "eval_samples_per_second": 41.334, "eval_steps_per_second": 5.18, "eval_wer": 0.44258891496660047, "step": 23000 }, { "epoch": 2.47, "eval_loss": 0.5213038325309753, "eval_runtime": 48.8044, "eval_samples_per_second": 41.533, "eval_steps_per_second": 5.204, "eval_wer": 0.43780465788048384, "step": 23100 }, { "epoch": 2.48, "eval_loss": 0.5172164440155029, "eval_runtime": 48.9505, "eval_samples_per_second": 41.409, "eval_steps_per_second": 5.189, "eval_wer": 0.4481855930673407, "step": 23200 }, { "epoch": 2.49, "eval_loss": 0.51420658826828, "eval_runtime": 49.0092, "eval_samples_per_second": 41.36, "eval_steps_per_second": 5.183, "eval_wer": 0.43762411987723415, "step": 23300 }, { "epoch": 2.51, "eval_loss": 0.5044341087341309, "eval_runtime": 48.7967, "eval_samples_per_second": 41.54, "eval_steps_per_second": 5.205, "eval_wer": 0.4230908106156346, "step": 23400 }, { "epoch": 2.52, "learning_rate": 0.0002505924068767908, "loss": 0.3536, "step": 23500 }, { "epoch": 2.52, "eval_loss": 0.5267765522003174, "eval_runtime": 49.0223, "eval_samples_per_second": 41.349, "eval_steps_per_second": 5.181, "eval_wer": 0.44962989709333817, "step": 23500 }, { "epoch": 2.53, "eval_loss": 0.5175958871841431, "eval_runtime": 48.8831, "eval_samples_per_second": 41.466, "eval_steps_per_second": 5.196, "eval_wer": 0.432569055786243, "step": 23600 }, { "epoch": 2.54, "eval_loss": 0.5031694173812866, "eval_runtime": 48.7866, "eval_samples_per_second": 41.548, "eval_steps_per_second": 5.206, "eval_wer": 0.42959017873262323, "step": 23700 }, { "epoch": 2.55, "eval_loss": 0.5210540890693665, "eval_runtime": 49.2301, "eval_samples_per_second": 41.174, "eval_steps_per_second": 5.159, "eval_wer": 0.44601913702834445, "step": 23800 }, { "epoch": 2.56, "eval_loss": 0.5092755556106567, "eval_runtime": 48.5206, "eval_samples_per_second": 41.776, "eval_steps_per_second": 5.235, "eval_wer": 0.4378949268821087, "step": 23900 }, { "epoch": 2.57, "learning_rate": 0.00024952005730659023, "loss": 0.337, "step": 24000 }, { "epoch": 2.57, "eval_loss": 0.49896007776260376, "eval_runtime": 48.9304, "eval_samples_per_second": 41.426, "eval_steps_per_second": 5.191, "eval_wer": 0.4311247517602455, "step": 24000 }, { "epoch": 2.58, "eval_loss": 0.49622592329978943, "eval_runtime": 48.829, "eval_samples_per_second": 41.512, "eval_steps_per_second": 5.202, "eval_wer": 0.43293013179274237, "step": 24100 }, { "epoch": 2.59, "eval_loss": 0.5032628178596497, "eval_runtime": 48.9877, "eval_samples_per_second": 41.378, "eval_steps_per_second": 5.185, "eval_wer": 0.4288680267196245, "step": 24200 }, { "epoch": 2.6, "eval_loss": 0.5260281562805176, "eval_runtime": 48.83, "eval_samples_per_second": 41.511, "eval_steps_per_second": 5.202, "eval_wer": 0.4534211951615815, "step": 24300 }, { "epoch": 2.61, "eval_loss": 0.5309225916862488, "eval_runtime": 48.8251, "eval_samples_per_second": 41.516, "eval_steps_per_second": 5.202, "eval_wer": 0.4441234879942228, "step": 24400 }, { "epoch": 2.62, "learning_rate": 0.000248445558739255, "loss": 0.3393, "step": 24500 }, { "epoch": 2.62, "eval_loss": 0.5131687521934509, "eval_runtime": 48.6954, "eval_samples_per_second": 41.626, "eval_steps_per_second": 5.216, "eval_wer": 0.43455497382198954, "step": 24500 }, { "epoch": 2.63, "eval_loss": 0.5188684463500977, "eval_runtime": 48.6759, "eval_samples_per_second": 41.643, "eval_steps_per_second": 5.218, "eval_wer": 0.42327134861888427, "step": 24600 }, { "epoch": 2.64, "eval_loss": 0.5074316263198853, "eval_runtime": 48.5643, "eval_samples_per_second": 41.738, "eval_steps_per_second": 5.23, "eval_wer": 0.432569055786243, "step": 24700 }, { "epoch": 2.66, "eval_loss": 0.5110915899276733, "eval_runtime": 48.9356, "eval_samples_per_second": 41.422, "eval_steps_per_second": 5.19, "eval_wer": 0.4254378046578805, "step": 24800 }, { "epoch": 2.67, "eval_loss": 0.4932540953159332, "eval_runtime": 49.84, "eval_samples_per_second": 40.67, "eval_steps_per_second": 5.096, "eval_wer": 0.4254378046578805, "step": 24900 }, { "epoch": 2.68, "learning_rate": 0.0002473710601719197, "loss": 0.3334, "step": 25000 }, { "epoch": 2.68, "eval_loss": 0.5045706629753113, "eval_runtime": 48.7805, "eval_samples_per_second": 41.553, "eval_steps_per_second": 5.207, "eval_wer": 0.44069326593247876, "step": 25000 }, { "epoch": 2.69, "eval_loss": 0.500957190990448, "eval_runtime": 48.5639, "eval_samples_per_second": 41.739, "eval_steps_per_second": 5.23, "eval_wer": 0.4404224589276043, "step": 25100 }, { "epoch": 2.7, "eval_loss": 0.5044623017311096, "eval_runtime": 48.5838, "eval_samples_per_second": 41.722, "eval_steps_per_second": 5.228, "eval_wer": 0.42363242462538364, "step": 25200 }, { "epoch": 2.71, "eval_loss": 0.4938253164291382, "eval_runtime": 49.0033, "eval_samples_per_second": 41.365, "eval_steps_per_second": 5.183, "eval_wer": 0.43049286874887166, "step": 25300 }, { "epoch": 2.72, "eval_loss": 0.5020812153816223, "eval_runtime": 48.9392, "eval_samples_per_second": 41.419, "eval_steps_per_second": 5.19, "eval_wer": 0.4383462718902329, "step": 25400 }, { "epoch": 2.73, "learning_rate": 0.0002462965616045845, "loss": 0.3366, "step": 25500 }, { "epoch": 2.73, "eval_loss": 0.4953358471393585, "eval_runtime": 48.8378, "eval_samples_per_second": 41.505, "eval_steps_per_second": 5.201, "eval_wer": 0.42020220256363966, "step": 25500 }, { "epoch": 2.74, "eval_loss": 0.4984549880027771, "eval_runtime": 48.6616, "eval_samples_per_second": 41.655, "eval_steps_per_second": 5.22, "eval_wer": 0.4338328218089908, "step": 25600 }, { "epoch": 2.75, "eval_loss": 0.4765419065952301, "eval_runtime": 48.8911, "eval_samples_per_second": 41.46, "eval_steps_per_second": 5.195, "eval_wer": 0.4161400974905218, "step": 25700 }, { "epoch": 2.76, "eval_loss": 0.4873102903366089, "eval_runtime": 49.0181, "eval_samples_per_second": 41.352, "eval_steps_per_second": 5.182, "eval_wer": 0.42922910272612386, "step": 25800 }, { "epoch": 2.77, "eval_loss": 0.49981385469436646, "eval_runtime": 48.989, "eval_samples_per_second": 41.377, "eval_steps_per_second": 5.185, "eval_wer": 0.41893843654089186, "step": 25900 }, { "epoch": 2.78, "learning_rate": 0.0002452242120343839, "loss": 0.3359, "step": 26000 }, { "epoch": 2.78, "eval_loss": 0.49909472465515137, "eval_runtime": 49.0099, "eval_samples_per_second": 41.359, "eval_steps_per_second": 5.183, "eval_wer": 0.4248059216465066, "step": 26000 }, { "epoch": 2.79, "eval_loss": 0.5011939406394958, "eval_runtime": 49.1474, "eval_samples_per_second": 41.243, "eval_steps_per_second": 5.168, "eval_wer": 0.43067340675212135, "step": 26100 }, { "epoch": 2.81, "eval_loss": 0.5080650448799133, "eval_runtime": 48.8435, "eval_samples_per_second": 41.5, "eval_steps_per_second": 5.2, "eval_wer": 0.4151471384726485, "step": 26200 }, { "epoch": 2.82, "eval_loss": 0.4996890127658844, "eval_runtime": 48.7317, "eval_samples_per_second": 41.595, "eval_steps_per_second": 5.212, "eval_wer": 0.43049286874887166, "step": 26300 }, { "epoch": 2.83, "eval_loss": 0.49694108963012695, "eval_runtime": 49.1204, "eval_samples_per_second": 41.266, "eval_steps_per_second": 5.171, "eval_wer": 0.43022206174399713, "step": 26400 }, { "epoch": 2.84, "learning_rate": 0.0002441497134670487, "loss": 0.3396, "step": 26500 }, { "epoch": 2.84, "eval_loss": 0.478350967168808, "eval_runtime": 48.8451, "eval_samples_per_second": 41.499, "eval_steps_per_second": 5.2, "eval_wer": 0.4270626466871276, "step": 26500 }, { "epoch": 2.85, "eval_loss": 0.4804205298423767, "eval_runtime": 48.7331, "eval_samples_per_second": 41.594, "eval_steps_per_second": 5.212, "eval_wer": 0.414876331467774, "step": 26600 }, { "epoch": 2.86, "eval_loss": 0.48998621106147766, "eval_runtime": 49.5501, "eval_samples_per_second": 40.908, "eval_steps_per_second": 5.126, "eval_wer": 0.4192092435457664, "step": 26700 }, { "epoch": 2.87, "eval_loss": 0.5043953061103821, "eval_runtime": 49.2804, "eval_samples_per_second": 41.132, "eval_steps_per_second": 5.154, "eval_wer": 0.43247878678461815, "step": 26800 }, { "epoch": 2.88, "eval_loss": 0.4934612512588501, "eval_runtime": 48.9475, "eval_samples_per_second": 41.412, "eval_steps_per_second": 5.189, "eval_wer": 0.43762411987723415, "step": 26900 }, { "epoch": 2.89, "learning_rate": 0.00024307521489971343, "loss": 0.3356, "step": 27000 }, { "epoch": 2.89, "eval_loss": 0.5006960034370422, "eval_runtime": 48.7024, "eval_samples_per_second": 41.62, "eval_steps_per_second": 5.215, "eval_wer": 0.42688210868387794, "step": 27000 }, { "epoch": 2.9, "eval_loss": 0.48872122168540955, "eval_runtime": 48.7611, "eval_samples_per_second": 41.57, "eval_steps_per_second": 5.209, "eval_wer": 0.4177649395197689, "step": 27100 }, { "epoch": 2.91, "eval_loss": 0.47697293758392334, "eval_runtime": 48.9744, "eval_samples_per_second": 41.389, "eval_steps_per_second": 5.186, "eval_wer": 0.4169525185051453, "step": 27200 }, { "epoch": 2.92, "eval_loss": 0.48469677567481995, "eval_runtime": 48.5931, "eval_samples_per_second": 41.714, "eval_steps_per_second": 5.227, "eval_wer": 0.4166817115002708, "step": 27300 }, { "epoch": 2.93, "eval_loss": 0.4861487150192261, "eval_runtime": 49.0078, "eval_samples_per_second": 41.361, "eval_steps_per_second": 5.183, "eval_wer": 0.4138833724499007, "step": 27400 }, { "epoch": 2.94, "learning_rate": 0.00024200071633237818, "loss": 0.3395, "step": 27500 }, { "epoch": 2.94, "eval_loss": 0.4975493848323822, "eval_runtime": 48.6597, "eval_samples_per_second": 41.657, "eval_steps_per_second": 5.22, "eval_wer": 0.429138833724499, "step": 27500 }, { "epoch": 2.95, "eval_loss": 0.5055610537528992, "eval_runtime": 51.3239, "eval_samples_per_second": 39.494, "eval_steps_per_second": 4.949, "eval_wer": 0.44710236504784256, "step": 27600 }, { "epoch": 2.97, "eval_loss": 0.5111228823661804, "eval_runtime": 50.7513, "eval_samples_per_second": 39.94, "eval_steps_per_second": 5.005, "eval_wer": 0.4375338508756093, "step": 27700 }, { "epoch": 2.98, "eval_loss": 0.5326820611953735, "eval_runtime": 48.8673, "eval_samples_per_second": 41.48, "eval_steps_per_second": 5.198, "eval_wer": 0.4576638382379491, "step": 27800 }, { "epoch": 2.99, "eval_loss": 0.506744384765625, "eval_runtime": 49.0908, "eval_samples_per_second": 41.291, "eval_steps_per_second": 5.174, "eval_wer": 0.43933923090810617, "step": 27900 }, { "epoch": 3.0, "learning_rate": 0.00024092836676217763, "loss": 0.3332, "step": 28000 }, { "epoch": 3.0, "eval_loss": 0.48983654379844666, "eval_runtime": 48.9912, "eval_samples_per_second": 41.375, "eval_steps_per_second": 5.185, "eval_wer": 0.41875789853764217, "step": 28000 }, { "epoch": 3.01, "eval_loss": 0.4790142774581909, "eval_runtime": 48.9473, "eval_samples_per_second": 41.412, "eval_steps_per_second": 5.189, "eval_wer": 0.40927965336703376, "step": 28100 }, { "epoch": 3.02, "eval_loss": 0.48284170031547546, "eval_runtime": 49.4292, "eval_samples_per_second": 41.008, "eval_steps_per_second": 5.139, "eval_wer": 0.42020220256363966, "step": 28200 }, { "epoch": 3.03, "eval_loss": 0.48360347747802734, "eval_runtime": 48.8613, "eval_samples_per_second": 41.485, "eval_steps_per_second": 5.198, "eval_wer": 0.41460552446289944, "step": 28300 }, { "epoch": 3.04, "eval_loss": 0.49010956287384033, "eval_runtime": 49.2751, "eval_samples_per_second": 41.136, "eval_steps_per_second": 5.155, "eval_wer": 0.4241740386351327, "step": 28400 }, { "epoch": 3.05, "learning_rate": 0.00023985386819484238, "loss": 0.2984, "step": 28500 }, { "epoch": 3.05, "eval_loss": 0.47723203897476196, "eval_runtime": 49.0961, "eval_samples_per_second": 41.286, "eval_steps_per_second": 5.174, "eval_wer": 0.41180718541252936, "step": 28500 }, { "epoch": 3.06, "eval_loss": 0.5054998397827148, "eval_runtime": 49.4055, "eval_samples_per_second": 41.028, "eval_steps_per_second": 5.141, "eval_wer": 0.4212854305831378, "step": 28600 }, { "epoch": 3.07, "eval_loss": 0.4910781979560852, "eval_runtime": 49.1346, "eval_samples_per_second": 41.254, "eval_steps_per_second": 5.169, "eval_wer": 0.4100018053800325, "step": 28700 }, { "epoch": 3.08, "eval_loss": 0.47373151779174805, "eval_runtime": 49.1679, "eval_samples_per_second": 41.226, "eval_steps_per_second": 5.166, "eval_wer": 0.4087380393572847, "step": 28800 }, { "epoch": 3.09, "eval_loss": 0.49302175641059875, "eval_runtime": 48.9528, "eval_samples_per_second": 41.407, "eval_steps_per_second": 5.189, "eval_wer": 0.4216465065896371, "step": 28900 }, { "epoch": 3.1, "learning_rate": 0.00023877936962750715, "loss": 0.3056, "step": 29000 }, { "epoch": 3.1, "eval_loss": 0.47357192635536194, "eval_runtime": 49.4511, "eval_samples_per_second": 40.99, "eval_steps_per_second": 5.136, "eval_wer": 0.41090449539628093, "step": 29000 }, { "epoch": 3.12, "eval_loss": 0.4862995743751526, "eval_runtime": 49.3674, "eval_samples_per_second": 41.059, "eval_steps_per_second": 5.145, "eval_wer": 0.4058494313052898, "step": 29100 }, { "epoch": 3.13, "eval_loss": 0.47840672731399536, "eval_runtime": 50.0693, "eval_samples_per_second": 40.484, "eval_steps_per_second": 5.073, "eval_wer": 0.4183968225311428, "step": 29200 }, { "epoch": 3.14, "eval_loss": 0.49233099818229675, "eval_runtime": 49.5351, "eval_samples_per_second": 40.921, "eval_steps_per_second": 5.128, "eval_wer": 0.423993500631883, "step": 29300 }, { "epoch": 3.15, "eval_loss": 0.4845847189426422, "eval_runtime": 49.6836, "eval_samples_per_second": 40.798, "eval_steps_per_second": 5.112, "eval_wer": 0.42263946560751037, "step": 29400 }, { "epoch": 3.16, "learning_rate": 0.0002377048710601719, "loss": 0.2995, "step": 29500 }, { "epoch": 3.16, "eval_loss": 0.4829016923904419, "eval_runtime": 48.9864, "eval_samples_per_second": 41.379, "eval_steps_per_second": 5.185, "eval_wer": 0.408557501354035, "step": 29500 }, { "epoch": 3.17, "eval_loss": 0.4933793544769287, "eval_runtime": 49.2945, "eval_samples_per_second": 41.12, "eval_steps_per_second": 5.153, "eval_wer": 0.423993500631883, "step": 29600 }, { "epoch": 3.18, "eval_loss": 0.48932012915611267, "eval_runtime": 49.1056, "eval_samples_per_second": 41.278, "eval_steps_per_second": 5.173, "eval_wer": 0.41523740747427335, "step": 29700 }, { "epoch": 3.19, "eval_loss": 0.47299858927726746, "eval_runtime": 48.9953, "eval_samples_per_second": 41.371, "eval_steps_per_second": 5.184, "eval_wer": 0.4227297346091352, "step": 29800 }, { "epoch": 3.2, "eval_loss": 0.5027060508728027, "eval_runtime": 50.4849, "eval_samples_per_second": 40.151, "eval_steps_per_second": 5.031, "eval_wer": 0.4330204007943672, "step": 29900 }, { "epoch": 3.21, "learning_rate": 0.00023663037249283664, "loss": 0.2926, "step": 30000 }, { "epoch": 3.21, "eval_loss": 0.4902673363685608, "eval_runtime": 107.9623, "eval_samples_per_second": 18.775, "eval_steps_per_second": 2.353, "eval_wer": 0.41117530240115546, "step": 30000 }, { "epoch": 3.22, "eval_loss": 0.49610400199890137, "eval_runtime": 50.4886, "eval_samples_per_second": 40.148, "eval_steps_per_second": 5.031, "eval_wer": 0.41568875248239756, "step": 30100 }, { "epoch": 3.23, "eval_loss": 0.4980136454105377, "eval_runtime": 51.2384, "eval_samples_per_second": 39.56, "eval_steps_per_second": 4.957, "eval_wer": 0.42688210868387794, "step": 30200 }, { "epoch": 3.24, "eval_loss": 0.48962903022766113, "eval_runtime": 50.3961, "eval_samples_per_second": 40.221, "eval_steps_per_second": 5.04, "eval_wer": 0.4126196064271529, "step": 30300 }, { "epoch": 3.25, "eval_loss": 0.47261691093444824, "eval_runtime": 50.6222, "eval_samples_per_second": 40.042, "eval_steps_per_second": 5.018, "eval_wer": 0.40621050731178915, "step": 30400 }, { "epoch": 3.27, "learning_rate": 0.00023555587392550141, "loss": 0.301, "step": 30500 }, { "epoch": 3.27, "eval_loss": 0.47325438261032104, "eval_runtime": 50.4878, "eval_samples_per_second": 40.148, "eval_steps_per_second": 5.031, "eval_wer": 0.39853764217367754, "step": 30500 }, { "epoch": 3.28, "eval_loss": 0.47721266746520996, "eval_runtime": 50.584, "eval_samples_per_second": 40.072, "eval_steps_per_second": 5.021, "eval_wer": 0.4046759342841668, "step": 30600 }, { "epoch": 3.29, "eval_loss": 0.48059606552124023, "eval_runtime": 50.9656, "eval_samples_per_second": 39.772, "eval_steps_per_second": 4.984, "eval_wer": 0.40819642534753564, "step": 30700 }, { "epoch": 3.3, "eval_loss": 0.4683433771133423, "eval_runtime": 50.2652, "eval_samples_per_second": 40.326, "eval_steps_per_second": 5.053, "eval_wer": 0.40106517421917315, "step": 30800 }, { "epoch": 3.31, "eval_loss": 0.4774733781814575, "eval_runtime": 50.7544, "eval_samples_per_second": 39.937, "eval_steps_per_second": 5.004, "eval_wer": 0.4079256183426611, "step": 30900 }, { "epoch": 3.32, "learning_rate": 0.00023448352435530084, "loss": 0.2933, "step": 31000 }, { "epoch": 3.32, "eval_loss": 0.47292542457580566, "eval_runtime": 49.9791, "eval_samples_per_second": 40.557, "eval_steps_per_second": 5.082, "eval_wer": 0.4082866943491605, "step": 31000 }, { "epoch": 3.33, "eval_loss": 0.4628405272960663, "eval_runtime": 49.7388, "eval_samples_per_second": 40.753, "eval_steps_per_second": 5.107, "eval_wer": 0.4016067882289222, "step": 31100 }, { "epoch": 3.34, "eval_loss": 0.475334107875824, "eval_runtime": 49.8991, "eval_samples_per_second": 40.622, "eval_steps_per_second": 5.09, "eval_wer": 0.4192092435457664, "step": 31200 }, { "epoch": 3.35, "eval_loss": 0.46871381998062134, "eval_runtime": 50.0989, "eval_samples_per_second": 40.46, "eval_steps_per_second": 5.07, "eval_wer": 0.41848709153276764, "step": 31300 }, { "epoch": 3.36, "eval_loss": 0.4805503487586975, "eval_runtime": 50.1378, "eval_samples_per_second": 40.429, "eval_steps_per_second": 5.066, "eval_wer": 0.4106336883914064, "step": 31400 }, { "epoch": 3.37, "learning_rate": 0.0002334090257879656, "loss": 0.2957, "step": 31500 }, { "epoch": 3.37, "eval_loss": 0.48885583877563477, "eval_runtime": 49.7773, "eval_samples_per_second": 40.721, "eval_steps_per_second": 5.103, "eval_wer": 0.423993500631883, "step": 31500 }, { "epoch": 3.38, "eval_loss": 0.48816147446632385, "eval_runtime": 49.8971, "eval_samples_per_second": 40.624, "eval_steps_per_second": 5.09, "eval_wer": 0.4182162845278931, "step": 31600 }, { "epoch": 3.39, "eval_loss": 0.4797750413417816, "eval_runtime": 49.755, "eval_samples_per_second": 40.74, "eval_steps_per_second": 5.105, "eval_wer": 0.4162303664921466, "step": 31700 }, { "epoch": 3.4, "eval_loss": 0.47179311513900757, "eval_runtime": 49.9097, "eval_samples_per_second": 40.613, "eval_steps_per_second": 5.089, "eval_wer": 0.4108142263946561, "step": 31800 }, { "epoch": 3.42, "eval_loss": 0.4685176610946655, "eval_runtime": 49.6497, "eval_samples_per_second": 40.826, "eval_steps_per_second": 5.116, "eval_wer": 0.41009207438165735, "step": 31900 }, { "epoch": 3.43, "learning_rate": 0.00023233452722063035, "loss": 0.3039, "step": 32000 }, { "epoch": 3.43, "eval_loss": 0.4815961420536041, "eval_runtime": 49.8792, "eval_samples_per_second": 40.638, "eval_steps_per_second": 5.092, "eval_wer": 0.418848167539267, "step": 32000 }, { "epoch": 3.44, "eval_loss": 0.48744821548461914, "eval_runtime": 49.9648, "eval_samples_per_second": 40.569, "eval_steps_per_second": 5.084, "eval_wer": 0.4138833724499007, "step": 32100 }, { "epoch": 3.45, "eval_loss": 0.4899212718009949, "eval_runtime": 50.0433, "eval_samples_per_second": 40.505, "eval_steps_per_second": 5.076, "eval_wer": 0.41153637840765483, "step": 32200 }, { "epoch": 3.46, "eval_loss": 0.4851779043674469, "eval_runtime": 49.6408, "eval_samples_per_second": 40.833, "eval_steps_per_second": 5.117, "eval_wer": 0.4180357465246434, "step": 32300 }, { "epoch": 3.47, "eval_loss": 0.5073689222335815, "eval_runtime": 50.1621, "eval_samples_per_second": 40.409, "eval_steps_per_second": 5.064, "eval_wer": 0.4128904134320274, "step": 32400 }, { "epoch": 3.48, "learning_rate": 0.0002312600286532951, "loss": 0.3006, "step": 32500 }, { "epoch": 3.48, "eval_loss": 0.4837365448474884, "eval_runtime": 49.6611, "eval_samples_per_second": 40.817, "eval_steps_per_second": 5.115, "eval_wer": 0.40756454233616174, "step": 32500 }, { "epoch": 3.49, "eval_loss": 0.49273020029067993, "eval_runtime": 50.0235, "eval_samples_per_second": 40.521, "eval_steps_per_second": 5.078, "eval_wer": 0.4098212673767828, "step": 32600 }, { "epoch": 3.5, "eval_loss": 0.49989503622055054, "eval_runtime": 50.1352, "eval_samples_per_second": 40.431, "eval_steps_per_second": 5.066, "eval_wer": 0.41722332551001984, "step": 32700 }, { "epoch": 3.51, "eval_loss": 0.47733768820762634, "eval_runtime": 50.118, "eval_samples_per_second": 40.445, "eval_steps_per_second": 5.068, "eval_wer": 0.41938978154901607, "step": 32800 }, { "epoch": 3.52, "eval_loss": 0.4858909845352173, "eval_runtime": 49.9497, "eval_samples_per_second": 40.581, "eval_steps_per_second": 5.085, "eval_wer": 0.40575916230366493, "step": 32900 }, { "epoch": 3.53, "learning_rate": 0.00023018553008595987, "loss": 0.3089, "step": 33000 }, { "epoch": 3.53, "eval_loss": 0.47827592492103577, "eval_runtime": 50.8869, "eval_samples_per_second": 39.833, "eval_steps_per_second": 4.991, "eval_wer": 0.4103628813865319, "step": 33000 }, { "epoch": 3.54, "eval_loss": 0.46217525005340576, "eval_runtime": 49.9647, "eval_samples_per_second": 40.569, "eval_steps_per_second": 5.084, "eval_wer": 0.4019678642354216, "step": 33100 }, { "epoch": 3.55, "eval_loss": 0.4839652180671692, "eval_runtime": 50.4824, "eval_samples_per_second": 40.153, "eval_steps_per_second": 5.031, "eval_wer": 0.4064813143166637, "step": 33200 }, { "epoch": 3.57, "eval_loss": 0.47563862800598145, "eval_runtime": 50.0519, "eval_samples_per_second": 40.498, "eval_steps_per_second": 5.075, "eval_wer": 0.42408376963350786, "step": 33300 }, { "epoch": 3.58, "eval_loss": 0.4830974340438843, "eval_runtime": 50.2796, "eval_samples_per_second": 40.315, "eval_steps_per_second": 5.052, "eval_wer": 0.41704278750677015, "step": 33400 }, { "epoch": 3.59, "learning_rate": 0.00022911103151862462, "loss": 0.3061, "step": 33500 }, { "epoch": 3.59, "eval_loss": 0.47941431403160095, "eval_runtime": 49.7111, "eval_samples_per_second": 40.776, "eval_steps_per_second": 5.11, "eval_wer": 0.4067521213215382, "step": 33500 }, { "epoch": 3.6, "eval_loss": 0.47304731607437134, "eval_runtime": 50.0694, "eval_samples_per_second": 40.484, "eval_steps_per_second": 5.073, "eval_wer": 0.40368297526629354, "step": 33600 }, { "epoch": 3.61, "eval_loss": 0.4808448851108551, "eval_runtime": 49.8945, "eval_samples_per_second": 40.626, "eval_steps_per_second": 5.091, "eval_wer": 0.41379310344827586, "step": 33700 }, { "epoch": 3.62, "eval_loss": 0.4924474060535431, "eval_runtime": 50.3079, "eval_samples_per_second": 40.292, "eval_steps_per_second": 5.049, "eval_wer": 0.4248059216465066, "step": 33800 }, { "epoch": 3.63, "eval_loss": 0.4748767614364624, "eval_runtime": 49.9339, "eval_samples_per_second": 40.594, "eval_steps_per_second": 5.087, "eval_wer": 0.41117530240115546, "step": 33900 }, { "epoch": 3.64, "learning_rate": 0.0002280365329512894, "loss": 0.3047, "step": 34000 }, { "epoch": 3.64, "eval_loss": 0.49240487813949585, "eval_runtime": 50.046, "eval_samples_per_second": 40.503, "eval_steps_per_second": 5.075, "eval_wer": 0.432569055786243, "step": 34000 }, { "epoch": 3.65, "eval_loss": 0.4745273292064667, "eval_runtime": 49.8993, "eval_samples_per_second": 40.622, "eval_steps_per_second": 5.09, "eval_wer": 0.4103628813865319, "step": 34100 }, { "epoch": 3.66, "eval_loss": 0.4759696125984192, "eval_runtime": 50.0617, "eval_samples_per_second": 40.49, "eval_steps_per_second": 5.074, "eval_wer": 0.4122585304206535, "step": 34200 }, { "epoch": 3.67, "eval_loss": 0.47877970337867737, "eval_runtime": 49.9144, "eval_samples_per_second": 40.61, "eval_steps_per_second": 5.089, "eval_wer": 0.4065715833182885, "step": 34300 }, { "epoch": 3.68, "eval_loss": 0.4626765549182892, "eval_runtime": 50.4559, "eval_samples_per_second": 40.174, "eval_steps_per_second": 5.034, "eval_wer": 0.4157790214840224, "step": 34400 }, { "epoch": 3.69, "learning_rate": 0.00022696203438395414, "loss": 0.3042, "step": 34500 }, { "epoch": 3.69, "eval_loss": 0.4974145293235779, "eval_runtime": 49.7345, "eval_samples_per_second": 40.756, "eval_steps_per_second": 5.107, "eval_wer": 0.4130709514352771, "step": 34500 }, { "epoch": 3.7, "eval_loss": 0.4593214988708496, "eval_runtime": 49.9902, "eval_samples_per_second": 40.548, "eval_steps_per_second": 5.081, "eval_wer": 0.406300776313414, "step": 34600 }, { "epoch": 3.72, "eval_loss": 0.4549331068992615, "eval_runtime": 49.7975, "eval_samples_per_second": 40.705, "eval_steps_per_second": 5.101, "eval_wer": 0.3927604260696877, "step": 34700 }, { "epoch": 3.73, "eval_loss": 0.4690437614917755, "eval_runtime": 50.7669, "eval_samples_per_second": 39.928, "eval_steps_per_second": 5.003, "eval_wer": 0.3897815490160679, "step": 34800 }, { "epoch": 3.74, "eval_loss": 0.4559744596481323, "eval_runtime": 49.4008, "eval_samples_per_second": 41.032, "eval_steps_per_second": 5.142, "eval_wer": 0.4007040982126738, "step": 34900 }, { "epoch": 3.75, "learning_rate": 0.0002258875358166189, "loss": 0.2963, "step": 35000 }, { "epoch": 3.75, "eval_loss": 0.46059346199035645, "eval_runtime": 49.637, "eval_samples_per_second": 40.836, "eval_steps_per_second": 5.117, "eval_wer": 0.39591984112655715, "step": 35000 }, { "epoch": 3.76, "eval_loss": 0.4762277901172638, "eval_runtime": 50.0278, "eval_samples_per_second": 40.517, "eval_steps_per_second": 5.077, "eval_wer": 0.4056688933020401, "step": 35100 }, { "epoch": 3.77, "eval_loss": 0.4749699831008911, "eval_runtime": 49.7739, "eval_samples_per_second": 40.724, "eval_steps_per_second": 5.103, "eval_wer": 0.403412168261419, "step": 35200 }, { "epoch": 3.78, "eval_loss": 0.47716274857521057, "eval_runtime": 49.6995, "eval_samples_per_second": 40.785, "eval_steps_per_second": 5.111, "eval_wer": 0.41144610940603, "step": 35300 }, { "epoch": 3.79, "eval_loss": 0.4668501615524292, "eval_runtime": 49.7899, "eval_samples_per_second": 40.711, "eval_steps_per_second": 5.101, "eval_wer": 0.3995306011915508, "step": 35400 }, { "epoch": 3.8, "learning_rate": 0.00022481518624641833, "loss": 0.3012, "step": 35500 }, { "epoch": 3.8, "eval_loss": 0.47086089849472046, "eval_runtime": 49.7381, "eval_samples_per_second": 40.753, "eval_steps_per_second": 5.107, "eval_wer": 0.40900884636215923, "step": 35500 }, { "epoch": 3.81, "eval_loss": 0.47223708033561707, "eval_runtime": 49.8147, "eval_samples_per_second": 40.691, "eval_steps_per_second": 5.099, "eval_wer": 0.41234879942227837, "step": 35600 }, { "epoch": 3.82, "eval_loss": 0.49128904938697815, "eval_runtime": 50.3648, "eval_samples_per_second": 40.246, "eval_steps_per_second": 5.043, "eval_wer": 0.41650117349702115, "step": 35700 }, { "epoch": 3.83, "eval_loss": 0.48138895630836487, "eval_runtime": 51.0291, "eval_samples_per_second": 39.722, "eval_steps_per_second": 4.978, "eval_wer": 0.406300776313414, "step": 35800 }, { "epoch": 3.84, "eval_loss": 0.4868621230125427, "eval_runtime": 49.5664, "eval_samples_per_second": 40.895, "eval_steps_per_second": 5.124, "eval_wer": 0.417133056508395, "step": 35900 }, { "epoch": 3.85, "learning_rate": 0.00022374068767908305, "loss": 0.3015, "step": 36000 }, { "epoch": 3.85, "eval_loss": 0.4791094660758972, "eval_runtime": 50.1246, "eval_samples_per_second": 40.439, "eval_steps_per_second": 5.067, "eval_wer": 0.4059397003069146, "step": 36000 }, { "epoch": 3.87, "eval_loss": 0.45353808999061584, "eval_runtime": 49.889, "eval_samples_per_second": 40.63, "eval_steps_per_second": 5.091, "eval_wer": 0.3976349521574291, "step": 36100 }, { "epoch": 3.88, "eval_loss": 0.4706454575061798, "eval_runtime": 50.016, "eval_samples_per_second": 40.527, "eval_steps_per_second": 5.078, "eval_wer": 0.40088463621592346, "step": 36200 }, { "epoch": 3.89, "eval_loss": 0.4678768217563629, "eval_runtime": 49.8077, "eval_samples_per_second": 40.697, "eval_steps_per_second": 5.1, "eval_wer": 0.40124571222242283, "step": 36300 }, { "epoch": 3.9, "eval_loss": 0.4735689163208008, "eval_runtime": 50.0515, "eval_samples_per_second": 40.498, "eval_steps_per_second": 5.075, "eval_wer": 0.40964072937353313, "step": 36400 }, { "epoch": 3.91, "learning_rate": 0.00022266618911174783, "loss": 0.2965, "step": 36500 }, { "epoch": 3.91, "eval_loss": 0.4755512475967407, "eval_runtime": 49.592, "eval_samples_per_second": 40.874, "eval_steps_per_second": 5.122, "eval_wer": 0.4106336883914064, "step": 36500 }, { "epoch": 3.92, "eval_loss": 0.4669349789619446, "eval_runtime": 50.1764, "eval_samples_per_second": 40.397, "eval_steps_per_second": 5.062, "eval_wer": 0.40846723235241017, "step": 36600 }, { "epoch": 3.93, "eval_loss": 0.47956836223602295, "eval_runtime": 49.6711, "eval_samples_per_second": 40.808, "eval_steps_per_second": 5.114, "eval_wer": 0.40539808629716556, "step": 36700 }, { "epoch": 3.94, "eval_loss": 0.4583274722099304, "eval_runtime": 49.5945, "eval_samples_per_second": 40.871, "eval_steps_per_second": 5.122, "eval_wer": 0.39321177107781186, "step": 36800 }, { "epoch": 3.95, "eval_loss": 0.4429765045642853, "eval_runtime": 49.6156, "eval_samples_per_second": 40.854, "eval_steps_per_second": 5.119, "eval_wer": 0.3969128001444304, "step": 36900 }, { "epoch": 3.96, "learning_rate": 0.00022159169054441257, "loss": 0.2993, "step": 37000 }, { "epoch": 3.96, "eval_loss": 0.45601701736450195, "eval_runtime": 50.1949, "eval_samples_per_second": 40.383, "eval_steps_per_second": 5.06, "eval_wer": 0.39140639104531505, "step": 37000 }, { "epoch": 3.97, "eval_loss": 0.4738839864730835, "eval_runtime": 49.7611, "eval_samples_per_second": 40.735, "eval_steps_per_second": 5.104, "eval_wer": 0.4001624842029247, "step": 37100 }, { "epoch": 3.98, "eval_loss": 0.45979049801826477, "eval_runtime": 50.036, "eval_samples_per_second": 40.511, "eval_steps_per_second": 5.076, "eval_wer": 0.39122585304206536, "step": 37200 }, { "epoch": 3.99, "eval_loss": 0.46073099970817566, "eval_runtime": 49.9116, "eval_samples_per_second": 40.612, "eval_steps_per_second": 5.089, "eval_wer": 0.3906842390323163, "step": 37300 }, { "epoch": 4.0, "eval_loss": 0.4708978235721588, "eval_runtime": 50.1501, "eval_samples_per_second": 40.419, "eval_steps_per_second": 5.065, "eval_wer": 0.3986279111753024, "step": 37400 }, { "epoch": 4.01, "learning_rate": 0.000220519340974212, "loss": 0.2886, "step": 37500 }, { "epoch": 4.01, "eval_loss": 0.46422716975212097, "eval_runtime": 49.9196, "eval_samples_per_second": 40.605, "eval_steps_per_second": 5.088, "eval_wer": 0.40666185231991336, "step": 37500 }, { "epoch": 4.03, "eval_loss": 0.4683905839920044, "eval_runtime": 50.3714, "eval_samples_per_second": 40.241, "eval_steps_per_second": 5.043, "eval_wer": 0.3984473731720527, "step": 37600 }, { "epoch": 4.04, "eval_loss": 0.4689880311489105, "eval_runtime": 50.2882, "eval_samples_per_second": 40.308, "eval_steps_per_second": 5.051, "eval_wer": 0.39790575916230364, "step": 37700 }, { "epoch": 4.05, "eval_loss": 0.47223958373069763, "eval_runtime": 50.6582, "eval_samples_per_second": 40.013, "eval_steps_per_second": 5.014, "eval_wer": 0.3979960281639285, "step": 37800 }, { "epoch": 4.06, "eval_loss": 0.47339245676994324, "eval_runtime": 50.5606, "eval_samples_per_second": 40.091, "eval_steps_per_second": 5.024, "eval_wer": 0.39267015706806285, "step": 37900 }, { "epoch": 4.07, "learning_rate": 0.00021944484240687677, "loss": 0.2534, "step": 38000 }, { "epoch": 4.07, "eval_loss": 0.4724343717098236, "eval_runtime": 51.0309, "eval_samples_per_second": 39.721, "eval_steps_per_second": 4.977, "eval_wer": 0.39880844917855207, "step": 38000 }, { "epoch": 4.08, "eval_loss": 0.4664517343044281, "eval_runtime": 51.1346, "eval_samples_per_second": 39.641, "eval_steps_per_second": 4.967, "eval_wer": 0.3986279111753024, "step": 38100 }, { "epoch": 4.09, "eval_loss": 0.4658842086791992, "eval_runtime": 50.3243, "eval_samples_per_second": 40.279, "eval_steps_per_second": 5.047, "eval_wer": 0.4035927062646687, "step": 38200 }, { "epoch": 4.1, "eval_loss": 0.469433456659317, "eval_runtime": 49.619, "eval_samples_per_second": 40.851, "eval_steps_per_second": 5.119, "eval_wer": 0.3951976891135584, "step": 38300 }, { "epoch": 4.11, "eval_loss": 0.47190093994140625, "eval_runtime": 49.7683, "eval_samples_per_second": 40.729, "eval_steps_per_second": 5.104, "eval_wer": 0.38905939700306913, "step": 38400 }, { "epoch": 4.12, "learning_rate": 0.0002183703438395415, "loss": 0.2596, "step": 38500 }, { "epoch": 4.12, "eval_loss": 0.46866583824157715, "eval_runtime": 50.0111, "eval_samples_per_second": 40.531, "eval_steps_per_second": 5.079, "eval_wer": 0.399440332189926, "step": 38500 }, { "epoch": 4.13, "eval_loss": 0.47052884101867676, "eval_runtime": 49.7745, "eval_samples_per_second": 40.724, "eval_steps_per_second": 5.103, "eval_wer": 0.39032316302581693, "step": 38600 }, { "epoch": 4.14, "eval_loss": 0.460104376077652, "eval_runtime": 49.9336, "eval_samples_per_second": 40.594, "eval_steps_per_second": 5.087, "eval_wer": 0.3974544141541795, "step": 38700 }, { "epoch": 4.15, "eval_loss": 0.4666154384613037, "eval_runtime": 50.032, "eval_samples_per_second": 40.514, "eval_steps_per_second": 5.077, "eval_wer": 0.3970933381476801, "step": 38800 }, { "epoch": 4.16, "eval_loss": 0.4772312641143799, "eval_runtime": 49.9053, "eval_samples_per_second": 40.617, "eval_steps_per_second": 5.09, "eval_wer": 0.3892399350063188, "step": 38900 }, { "epoch": 4.18, "learning_rate": 0.00021729799426934096, "loss": 0.2643, "step": 39000 }, { "epoch": 4.18, "eval_loss": 0.48102715611457825, "eval_runtime": 49.7263, "eval_samples_per_second": 40.763, "eval_steps_per_second": 5.108, "eval_wer": 0.4071131973280376, "step": 39000 }, { "epoch": 4.19, "eval_loss": 0.49802666902542114, "eval_runtime": 49.6686, "eval_samples_per_second": 40.81, "eval_steps_per_second": 5.114, "eval_wer": 0.4166817115002708, "step": 39100 }, { "epoch": 4.2, "eval_loss": 0.4657323956489563, "eval_runtime": 49.7618, "eval_samples_per_second": 40.734, "eval_steps_per_second": 5.104, "eval_wer": 0.39962087019317566, "step": 39200 }, { "epoch": 4.21, "eval_loss": 0.48691385984420776, "eval_runtime": 49.7124, "eval_samples_per_second": 40.775, "eval_steps_per_second": 5.109, "eval_wer": 0.4001624842029247, "step": 39300 }, { "epoch": 4.22, "eval_loss": 0.46561890840530396, "eval_runtime": 49.9565, "eval_samples_per_second": 40.575, "eval_steps_per_second": 5.084, "eval_wer": 0.3913161220436902, "step": 39400 }, { "epoch": 4.23, "learning_rate": 0.0002162234957020057, "loss": 0.265, "step": 39500 }, { "epoch": 4.23, "eval_loss": 0.47198420763015747, "eval_runtime": 49.854, "eval_samples_per_second": 40.659, "eval_steps_per_second": 5.095, "eval_wer": 0.3947463441054342, "step": 39500 }, { "epoch": 4.24, "eval_loss": 0.4710632562637329, "eval_runtime": 50.0216, "eval_samples_per_second": 40.523, "eval_steps_per_second": 5.078, "eval_wer": 0.39700306914605527, "step": 39600 }, { "epoch": 4.25, "eval_loss": 0.46885937452316284, "eval_runtime": 50.8629, "eval_samples_per_second": 39.852, "eval_steps_per_second": 4.994, "eval_wer": 0.3933020400794367, "step": 39700 }, { "epoch": 4.26, "eval_loss": 0.47284629940986633, "eval_runtime": 50.0447, "eval_samples_per_second": 40.504, "eval_steps_per_second": 5.075, "eval_wer": 0.40169705723054705, "step": 39800 }, { "epoch": 4.27, "eval_loss": 0.46733906865119934, "eval_runtime": 49.6974, "eval_samples_per_second": 40.787, "eval_steps_per_second": 5.111, "eval_wer": 0.3847264849250767, "step": 39900 }, { "epoch": 4.28, "learning_rate": 0.00021514899713467045, "loss": 0.2644, "step": 40000 }, { "epoch": 4.28, "eval_loss": 0.46359318494796753, "eval_runtime": 49.5988, "eval_samples_per_second": 40.868, "eval_steps_per_second": 5.121, "eval_wer": 0.396010110128182, "step": 40000 }, { "epoch": 4.29, "eval_loss": 0.46991944313049316, "eval_runtime": 50.3998, "eval_samples_per_second": 40.218, "eval_steps_per_second": 5.04, "eval_wer": 0.38644159595594874, "step": 40100 }, { "epoch": 4.3, "eval_loss": 0.4580465257167816, "eval_runtime": 49.4799, "eval_samples_per_second": 40.966, "eval_steps_per_second": 5.133, "eval_wer": 0.387434554973822, "step": 40200 }, { "epoch": 4.31, "eval_loss": 0.47626662254333496, "eval_runtime": 49.6505, "eval_samples_per_second": 40.825, "eval_steps_per_second": 5.116, "eval_wer": 0.39510742011193356, "step": 40300 }, { "epoch": 4.33, "eval_loss": 0.47517192363739014, "eval_runtime": 49.3981, "eval_samples_per_second": 41.034, "eval_steps_per_second": 5.142, "eval_wer": 0.4140639104531504, "step": 40400 }, { "epoch": 4.34, "learning_rate": 0.00021407449856733523, "loss": 0.2633, "step": 40500 }, { "epoch": 4.34, "eval_loss": 0.49175700545310974, "eval_runtime": 49.6012, "eval_samples_per_second": 40.866, "eval_steps_per_second": 5.121, "eval_wer": 0.39935006318830113, "step": 40500 }, { "epoch": 4.35, "eval_loss": 0.4782505929470062, "eval_runtime": 49.7601, "eval_samples_per_second": 40.735, "eval_steps_per_second": 5.104, "eval_wer": 0.4025997472467954, "step": 40600 }, { "epoch": 4.36, "eval_loss": 0.4738580286502838, "eval_runtime": 50.9085, "eval_samples_per_second": 39.817, "eval_steps_per_second": 4.989, "eval_wer": 0.403412168261419, "step": 40700 }, { "epoch": 4.37, "eval_loss": 0.47499799728393555, "eval_runtime": 49.9805, "eval_samples_per_second": 40.556, "eval_steps_per_second": 5.082, "eval_wer": 0.39998194619967503, "step": 40800 }, { "epoch": 4.38, "eval_loss": 0.46082910895347595, "eval_runtime": 49.827, "eval_samples_per_second": 40.681, "eval_steps_per_second": 5.098, "eval_wer": 0.39429499909731, "step": 40900 }, { "epoch": 4.39, "learning_rate": 0.00021299999999999997, "loss": 0.2679, "step": 41000 }, { "epoch": 4.39, "eval_loss": 0.46146294474601746, "eval_runtime": 49.5199, "eval_samples_per_second": 40.933, "eval_steps_per_second": 5.129, "eval_wer": 0.389149666004694, "step": 41000 }, { "epoch": 4.4, "eval_loss": 0.47296470403671265, "eval_runtime": 49.5896, "eval_samples_per_second": 40.875, "eval_steps_per_second": 5.122, "eval_wer": 0.3984473731720527, "step": 41100 }, { "epoch": 4.41, "eval_loss": 0.47276759147644043, "eval_runtime": 49.8499, "eval_samples_per_second": 40.662, "eval_steps_per_second": 5.095, "eval_wer": 0.40106517421917315, "step": 41200 }, { "epoch": 4.42, "eval_loss": 0.46751782298088074, "eval_runtime": 49.7874, "eval_samples_per_second": 40.713, "eval_steps_per_second": 5.102, "eval_wer": 0.39321177107781186, "step": 41300 }, { "epoch": 4.43, "eval_loss": 0.46617743372917175, "eval_runtime": 50.1545, "eval_samples_per_second": 40.415, "eval_steps_per_second": 5.064, "eval_wer": 0.39285069507131254, "step": 41400 }, { "epoch": 4.44, "learning_rate": 0.00021192550143266475, "loss": 0.2682, "step": 41500 }, { "epoch": 4.44, "eval_loss": 0.44897398352622986, "eval_runtime": 50.9668, "eval_samples_per_second": 39.771, "eval_steps_per_second": 4.984, "eval_wer": 0.38373352590720344, "step": 41500 }, { "epoch": 4.45, "eval_loss": 0.46106940507888794, "eval_runtime": 49.9064, "eval_samples_per_second": 40.616, "eval_steps_per_second": 5.09, "eval_wer": 0.3838237949088283, "step": 41600 }, { "epoch": 4.46, "eval_loss": 0.46049293875694275, "eval_runtime": 49.6932, "eval_samples_per_second": 40.79, "eval_steps_per_second": 5.111, "eval_wer": 0.39447553710055966, "step": 41700 }, { "epoch": 4.48, "eval_loss": 0.4730290472507477, "eval_runtime": 49.4559, "eval_samples_per_second": 40.986, "eval_steps_per_second": 5.136, "eval_wer": 0.39384365408918576, "step": 41800 }, { "epoch": 4.49, "eval_loss": 0.4566921293735504, "eval_runtime": 49.6481, "eval_samples_per_second": 40.827, "eval_steps_per_second": 5.116, "eval_wer": 0.387434554973822, "step": 41900 }, { "epoch": 4.5, "learning_rate": 0.0002108510028653295, "loss": 0.2658, "step": 42000 }, { "epoch": 4.5, "eval_loss": 0.47149142622947693, "eval_runtime": 49.8048, "eval_samples_per_second": 40.699, "eval_steps_per_second": 5.1, "eval_wer": 0.38689294096407295, "step": 42000 }, { "epoch": 4.51, "eval_loss": 0.45138201117515564, "eval_runtime": 50.5648, "eval_samples_per_second": 40.087, "eval_steps_per_second": 5.023, "eval_wer": 0.3832821808990793, "step": 42100 }, { "epoch": 4.52, "eval_loss": 0.46020662784576416, "eval_runtime": 49.6896, "eval_samples_per_second": 40.793, "eval_steps_per_second": 5.112, "eval_wer": 0.3897815490160679, "step": 42200 }, { "epoch": 4.53, "eval_loss": 0.4846310615539551, "eval_runtime": 49.7205, "eval_samples_per_second": 40.768, "eval_steps_per_second": 5.109, "eval_wer": 0.4022386712402961, "step": 42300 }, { "epoch": 4.54, "eval_loss": 0.44736534357070923, "eval_runtime": 49.9456, "eval_samples_per_second": 40.584, "eval_steps_per_second": 5.086, "eval_wer": 0.3810254558584582, "step": 42400 }, { "epoch": 4.55, "learning_rate": 0.00020977650429799427, "loss": 0.2676, "step": 42500 }, { "epoch": 4.55, "eval_loss": 0.4513036608695984, "eval_runtime": 49.7727, "eval_samples_per_second": 40.725, "eval_steps_per_second": 5.103, "eval_wer": 0.3820184148763315, "step": 42500 }, { "epoch": 4.56, "eval_loss": 0.4588390588760376, "eval_runtime": 49.7619, "eval_samples_per_second": 40.734, "eval_steps_per_second": 5.104, "eval_wer": 0.3927604260696877, "step": 42600 }, { "epoch": 4.57, "eval_loss": 0.4601156413555145, "eval_runtime": 49.7259, "eval_samples_per_second": 40.763, "eval_steps_per_second": 5.108, "eval_wer": 0.3894204730095685, "step": 42700 }, { "epoch": 4.58, "eval_loss": 0.45155754685401917, "eval_runtime": 49.7075, "eval_samples_per_second": 40.779, "eval_steps_per_second": 5.11, "eval_wer": 0.37922007582596134, "step": 42800 }, { "epoch": 4.59, "eval_loss": 0.4481757581233978, "eval_runtime": 49.8315, "eval_samples_per_second": 40.677, "eval_steps_per_second": 5.097, "eval_wer": 0.38481675392670156, "step": 42900 }, { "epoch": 4.6, "learning_rate": 0.000208702005730659, "loss": 0.2693, "step": 43000 }, { "epoch": 4.6, "eval_loss": 0.4695383310317993, "eval_runtime": 50.2493, "eval_samples_per_second": 40.339, "eval_steps_per_second": 5.055, "eval_wer": 0.4007943672142986, "step": 43000 }, { "epoch": 4.61, "eval_loss": 0.45803362131118774, "eval_runtime": 50.1652, "eval_samples_per_second": 40.407, "eval_steps_per_second": 5.063, "eval_wer": 0.38707347896732264, "step": 43100 }, { "epoch": 4.63, "eval_loss": 0.44191282987594604, "eval_runtime": 49.9048, "eval_samples_per_second": 40.617, "eval_steps_per_second": 5.09, "eval_wer": 0.38571944394295, "step": 43200 }, { "epoch": 4.64, "eval_loss": 0.45340240001678467, "eval_runtime": 51.1795, "eval_samples_per_second": 39.606, "eval_steps_per_second": 4.963, "eval_wer": 0.3795811518324607, "step": 43300 }, { "epoch": 4.65, "eval_loss": 0.4532068073749542, "eval_runtime": 49.8489, "eval_samples_per_second": 40.663, "eval_steps_per_second": 5.095, "eval_wer": 0.38562917494132515, "step": 43400 }, { "epoch": 4.66, "learning_rate": 0.00020762750716332376, "loss": 0.2641, "step": 43500 }, { "epoch": 4.66, "eval_loss": 0.442064106464386, "eval_runtime": 49.9503, "eval_samples_per_second": 40.58, "eval_steps_per_second": 5.085, "eval_wer": 0.38093518685683336, "step": 43500 }, { "epoch": 4.67, "eval_loss": 0.44000962376594543, "eval_runtime": 50.1474, "eval_samples_per_second": 40.421, "eval_steps_per_second": 5.065, "eval_wer": 0.38436540891857734, "step": 43600 }, { "epoch": 4.68, "eval_loss": 0.45147180557250977, "eval_runtime": 49.9827, "eval_samples_per_second": 40.554, "eval_steps_per_second": 5.082, "eval_wer": 0.3832821808990793, "step": 43700 }, { "epoch": 4.69, "eval_loss": 0.4462360143661499, "eval_runtime": 50.1109, "eval_samples_per_second": 40.45, "eval_steps_per_second": 5.069, "eval_wer": 0.3807546488535837, "step": 43800 }, { "epoch": 4.7, "eval_loss": 0.47406265139579773, "eval_runtime": 50.0121, "eval_samples_per_second": 40.53, "eval_steps_per_second": 5.079, "eval_wer": 0.392579888066438, "step": 43900 }, { "epoch": 4.71, "learning_rate": 0.0002065551575931232, "loss": 0.2626, "step": 44000 }, { "epoch": 4.71, "eval_loss": 0.4542163014411926, "eval_runtime": 50.5956, "eval_samples_per_second": 40.063, "eval_steps_per_second": 5.02, "eval_wer": 0.393121502076187, "step": 44000 }, { "epoch": 4.72, "eval_loss": 0.4554780125617981, "eval_runtime": 49.9867, "eval_samples_per_second": 40.551, "eval_steps_per_second": 5.081, "eval_wer": 0.38851778299332007, "step": 44100 }, { "epoch": 4.73, "eval_loss": 0.45047158002853394, "eval_runtime": 50.0094, "eval_samples_per_second": 40.532, "eval_steps_per_second": 5.079, "eval_wer": 0.38454594692182703, "step": 44200 }, { "epoch": 4.74, "eval_loss": 0.45926421880722046, "eval_runtime": 49.6573, "eval_samples_per_second": 40.82, "eval_steps_per_second": 5.115, "eval_wer": 0.38707347896732264, "step": 44300 }, { "epoch": 4.75, "eval_loss": 0.43586495518684387, "eval_runtime": 50.2993, "eval_samples_per_second": 40.299, "eval_steps_per_second": 5.05, "eval_wer": 0.38301137389420475, "step": 44400 }, { "epoch": 4.76, "learning_rate": 0.00020548280802292263, "loss": 0.2648, "step": 44500 }, { "epoch": 4.76, "eval_loss": 0.43868881464004517, "eval_runtime": 49.9728, "eval_samples_per_second": 40.562, "eval_steps_per_second": 5.083, "eval_wer": 0.3736233977252212, "step": 44500 }, { "epoch": 4.78, "eval_loss": 0.45290684700012207, "eval_runtime": 49.8631, "eval_samples_per_second": 40.651, "eval_steps_per_second": 5.094, "eval_wer": 0.38066437985195883, "step": 44600 }, { "epoch": 4.79, "eval_loss": 0.45659151673316956, "eval_runtime": 50.0989, "eval_samples_per_second": 40.46, "eval_steps_per_second": 5.07, "eval_wer": 0.38373352590720344, "step": 44700 }, { "epoch": 4.8, "eval_loss": 0.45571401715278625, "eval_runtime": 50.5772, "eval_samples_per_second": 40.077, "eval_steps_per_second": 5.022, "eval_wer": 0.40666185231991336, "step": 44800 }, { "epoch": 4.81, "eval_loss": 0.4609202742576599, "eval_runtime": 50.0904, "eval_samples_per_second": 40.467, "eval_steps_per_second": 5.071, "eval_wer": 0.38517782993320093, "step": 44900 }, { "epoch": 4.82, "learning_rate": 0.00020440830945558735, "loss": 0.2603, "step": 45000 }, { "epoch": 4.82, "eval_loss": 0.46665722131729126, "eval_runtime": 49.8766, "eval_samples_per_second": 40.64, "eval_steps_per_second": 5.093, "eval_wer": 0.4005235602094241, "step": 45000 }, { "epoch": 4.83, "eval_loss": 0.46655377745628357, "eval_runtime": 49.8776, "eval_samples_per_second": 40.639, "eval_steps_per_second": 5.092, "eval_wer": 0.3836432569055786, "step": 45100 }, { "epoch": 4.84, "eval_loss": 0.47749215364456177, "eval_runtime": 49.9, "eval_samples_per_second": 40.621, "eval_steps_per_second": 5.09, "eval_wer": 0.3945658061021845, "step": 45200 }, { "epoch": 4.85, "eval_loss": 0.4701036810874939, "eval_runtime": 50.0063, "eval_samples_per_second": 40.535, "eval_steps_per_second": 5.079, "eval_wer": 0.39248961906481317, "step": 45300 }, { "epoch": 4.86, "eval_loss": 0.4578703045845032, "eval_runtime": 50.0708, "eval_samples_per_second": 40.483, "eval_steps_per_second": 5.073, "eval_wer": 0.38887885899981944, "step": 45400 }, { "epoch": 4.87, "learning_rate": 0.00020333381088825215, "loss": 0.2626, "step": 45500 }, { "epoch": 4.87, "eval_loss": 0.4515564739704132, "eval_runtime": 49.915, "eval_samples_per_second": 40.609, "eval_steps_per_second": 5.089, "eval_wer": 0.38842751399169523, "step": 45500 }, { "epoch": 4.88, "eval_loss": 0.46054086089134216, "eval_runtime": 49.7949, "eval_samples_per_second": 40.707, "eval_steps_per_second": 5.101, "eval_wer": 0.3877956309803214, "step": 45600 }, { "epoch": 4.89, "eval_loss": 0.4576418101787567, "eval_runtime": 50.3057, "eval_samples_per_second": 40.294, "eval_steps_per_second": 5.049, "eval_wer": 0.3802130348438346, "step": 45700 }, { "epoch": 4.9, "eval_loss": 0.45533105731010437, "eval_runtime": 49.7254, "eval_samples_per_second": 40.764, "eval_steps_per_second": 5.108, "eval_wer": 0.37804657880483844, "step": 45800 }, { "epoch": 4.91, "eval_loss": 0.4335707724094391, "eval_runtime": 50.3097, "eval_samples_per_second": 40.29, "eval_steps_per_second": 5.049, "eval_wer": 0.3752482397544683, "step": 45900 }, { "epoch": 4.93, "learning_rate": 0.00020225931232091687, "loss": 0.2602, "step": 46000 }, { "epoch": 4.93, "eval_loss": 0.44188374280929565, "eval_runtime": 49.9873, "eval_samples_per_second": 40.55, "eval_steps_per_second": 5.081, "eval_wer": 0.3880664379851959, "step": 46000 }, { "epoch": 4.94, "eval_loss": 0.46014997363090515, "eval_runtime": 50.4086, "eval_samples_per_second": 40.211, "eval_steps_per_second": 5.039, "eval_wer": 0.3842751399169525, "step": 46100 }, { "epoch": 4.95, "eval_loss": 0.44370460510253906, "eval_runtime": 49.8698, "eval_samples_per_second": 40.646, "eval_steps_per_second": 5.093, "eval_wer": 0.3956490341216826, "step": 46200 }, { "epoch": 4.96, "eval_loss": 0.4524065852165222, "eval_runtime": 50.044, "eval_samples_per_second": 40.504, "eval_steps_per_second": 5.076, "eval_wer": 0.38436540891857734, "step": 46300 }, { "epoch": 4.97, "eval_loss": 0.4709448218345642, "eval_runtime": 49.8637, "eval_samples_per_second": 40.651, "eval_steps_per_second": 5.094, "eval_wer": 0.4031413612565445, "step": 46400 }, { "epoch": 4.98, "learning_rate": 0.00020118481375358164, "loss": 0.2609, "step": 46500 }, { "epoch": 4.98, "eval_loss": 0.45001140236854553, "eval_runtime": 50.2152, "eval_samples_per_second": 40.366, "eval_steps_per_second": 5.058, "eval_wer": 0.3871637479689475, "step": 46500 }, { "epoch": 4.99, "eval_loss": 0.43656888604164124, "eval_runtime": 49.6836, "eval_samples_per_second": 40.798, "eval_steps_per_second": 5.112, "eval_wer": 0.3846362159234519, "step": 46600 }, { "epoch": 5.0, "eval_loss": 0.46530061960220337, "eval_runtime": 49.7235, "eval_samples_per_second": 40.765, "eval_steps_per_second": 5.108, "eval_wer": 0.38842751399169523, "step": 46700 }, { "epoch": 5.01, "eval_loss": 0.4602296054363251, "eval_runtime": 50.5077, "eval_samples_per_second": 40.133, "eval_steps_per_second": 5.029, "eval_wer": 0.39321177107781186, "step": 46800 }, { "epoch": 5.02, "eval_loss": 0.4668322801589966, "eval_runtime": 50.0245, "eval_samples_per_second": 40.52, "eval_steps_per_second": 5.078, "eval_wer": 0.3853583679364506, "step": 46900 }, { "epoch": 5.03, "learning_rate": 0.00020011031518624639, "loss": 0.2472, "step": 47000 }, { "epoch": 5.03, "eval_loss": 0.4615883529186249, "eval_runtime": 50.0103, "eval_samples_per_second": 40.532, "eval_steps_per_second": 5.079, "eval_wer": 0.389149666004694, "step": 47000 }, { "epoch": 5.04, "eval_loss": 0.4542787969112396, "eval_runtime": 50.2585, "eval_samples_per_second": 40.331, "eval_steps_per_second": 5.054, "eval_wer": 0.38355298790395376, "step": 47100 }, { "epoch": 5.05, "eval_loss": 0.4526177644729614, "eval_runtime": 50.0483, "eval_samples_per_second": 40.501, "eval_steps_per_second": 5.075, "eval_wer": 0.38219895287958117, "step": 47200 }, { "epoch": 5.06, "eval_loss": 0.45387881994247437, "eval_runtime": 50.0828, "eval_samples_per_second": 40.473, "eval_steps_per_second": 5.072, "eval_wer": 0.37407474273334534, "step": 47300 }, { "epoch": 5.07, "eval_loss": 0.4776493310928345, "eval_runtime": 49.8454, "eval_samples_per_second": 40.666, "eval_steps_per_second": 5.096, "eval_wer": 0.3818378768730818, "step": 47400 }, { "epoch": 5.09, "learning_rate": 0.0001990379656160458, "loss": 0.2278, "step": 47500 }, { "epoch": 5.09, "eval_loss": 0.47709885239601135, "eval_runtime": 51.1106, "eval_samples_per_second": 39.659, "eval_steps_per_second": 4.97, "eval_wer": 0.37940061382921103, "step": 47500 }, { "epoch": 5.1, "eval_loss": 0.46624356508255005, "eval_runtime": 49.8637, "eval_samples_per_second": 40.651, "eval_steps_per_second": 5.094, "eval_wer": 0.3831016428958296, "step": 47600 }, { "epoch": 5.11, "eval_loss": 0.45577922463417053, "eval_runtime": 49.9202, "eval_samples_per_second": 40.605, "eval_steps_per_second": 5.088, "eval_wer": 0.4032316302581693, "step": 47700 }, { "epoch": 5.12, "eval_loss": 0.4903823733329773, "eval_runtime": 50.3451, "eval_samples_per_second": 40.262, "eval_steps_per_second": 5.045, "eval_wer": 0.3917674670518144, "step": 47800 }, { "epoch": 5.13, "eval_loss": 0.4764585494995117, "eval_runtime": 50.0404, "eval_samples_per_second": 40.507, "eval_steps_per_second": 5.076, "eval_wer": 0.3889691280014443, "step": 47900 }, { "epoch": 5.14, "learning_rate": 0.00019796346704871058, "loss": 0.2311, "step": 48000 }, { "epoch": 5.14, "eval_loss": 0.4673701822757721, "eval_runtime": 49.7968, "eval_samples_per_second": 40.705, "eval_steps_per_second": 5.101, "eval_wer": 0.38824697598844554, "step": 48000 }, { "epoch": 5.15, "eval_loss": 0.460916131734848, "eval_runtime": 49.6923, "eval_samples_per_second": 40.791, "eval_steps_per_second": 5.111, "eval_wer": 0.39465607510380935, "step": 48100 }, { "epoch": 5.16, "eval_loss": 0.4587761163711548, "eval_runtime": 49.8661, "eval_samples_per_second": 40.649, "eval_steps_per_second": 5.094, "eval_wer": 0.38373352590720344, "step": 48200 }, { "epoch": 5.17, "eval_loss": 0.48272979259490967, "eval_runtime": 49.3238, "eval_samples_per_second": 41.096, "eval_steps_per_second": 5.15, "eval_wer": 0.3844556779202022, "step": 48300 }, { "epoch": 5.18, "eval_loss": 0.4711352288722992, "eval_runtime": 49.1004, "eval_samples_per_second": 41.283, "eval_steps_per_second": 5.173, "eval_wer": 0.38391406391045313, "step": 48400 }, { "epoch": 5.19, "learning_rate": 0.00019689111747851, "loss": 0.229, "step": 48500 }, { "epoch": 5.19, "eval_loss": 0.45826002955436707, "eval_runtime": 48.9232, "eval_samples_per_second": 41.432, "eval_steps_per_second": 5.192, "eval_wer": 0.3872540169705723, "step": 48500 }, { "epoch": 5.2, "eval_loss": 0.47996604442596436, "eval_runtime": 48.7886, "eval_samples_per_second": 41.547, "eval_steps_per_second": 5.206, "eval_wer": 0.38580971294457483, "step": 48600 }, { "epoch": 5.21, "eval_loss": 0.46112576127052307, "eval_runtime": 48.9997, "eval_samples_per_second": 41.368, "eval_steps_per_second": 5.184, "eval_wer": 0.38003249684058493, "step": 48700 }, { "epoch": 5.22, "eval_loss": 0.45038747787475586, "eval_runtime": 48.9685, "eval_samples_per_second": 41.394, "eval_steps_per_second": 5.187, "eval_wer": 0.38887885899981944, "step": 48800 }, { "epoch": 5.24, "eval_loss": 0.45691677927970886, "eval_runtime": 49.0298, "eval_samples_per_second": 41.342, "eval_steps_per_second": 5.181, "eval_wer": 0.3760606607690919, "step": 48900 }, { "epoch": 5.25, "learning_rate": 0.00019581661891117478, "loss": 0.2313, "step": 49000 }, { "epoch": 5.25, "eval_loss": 0.47323185205459595, "eval_runtime": 48.7503, "eval_samples_per_second": 41.579, "eval_steps_per_second": 5.21, "eval_wer": 0.3914966600469399, "step": 49000 }, { "epoch": 5.26, "eval_loss": 0.4727950692176819, "eval_runtime": 49.3693, "eval_samples_per_second": 41.058, "eval_steps_per_second": 5.145, "eval_wer": 0.38319191189745444, "step": 49100 }, { "epoch": 5.27, "eval_loss": 0.4667152464389801, "eval_runtime": 48.9142, "eval_samples_per_second": 41.44, "eval_steps_per_second": 5.193, "eval_wer": 0.3814768008665824, "step": 49200 }, { "epoch": 5.28, "eval_loss": 0.49122875928878784, "eval_runtime": 49.9108, "eval_samples_per_second": 40.612, "eval_steps_per_second": 5.089, "eval_wer": 0.38562917494132515, "step": 49300 }, { "epoch": 5.29, "eval_loss": 0.47898349165916443, "eval_runtime": 48.5465, "eval_samples_per_second": 41.754, "eval_steps_per_second": 5.232, "eval_wer": 0.3945658061021845, "step": 49400 }, { "epoch": 5.3, "learning_rate": 0.00019474212034383952, "loss": 0.2266, "step": 49500 }, { "epoch": 5.3, "eval_loss": 0.4596710801124573, "eval_runtime": 49.2944, "eval_samples_per_second": 41.12, "eval_steps_per_second": 5.153, "eval_wer": 0.3763314677739664, "step": 49500 }, { "epoch": 5.31, "eval_loss": 0.45802178978919983, "eval_runtime": 49.1967, "eval_samples_per_second": 41.202, "eval_steps_per_second": 5.163, "eval_wer": 0.3777757717999639, "step": 49600 }, { "epoch": 5.32, "eval_loss": 0.4439472556114197, "eval_runtime": 48.6894, "eval_samples_per_second": 41.631, "eval_steps_per_second": 5.217, "eval_wer": 0.37208882469759885, "step": 49700 }, { "epoch": 5.33, "eval_loss": 0.46113863587379456, "eval_runtime": 48.9061, "eval_samples_per_second": 41.447, "eval_steps_per_second": 5.194, "eval_wer": 0.37037371366672683, "step": 49800 }, { "epoch": 5.34, "eval_loss": 0.45986300706863403, "eval_runtime": 49.0073, "eval_samples_per_second": 41.361, "eval_steps_per_second": 5.183, "eval_wer": 0.3768730817837155, "step": 49900 }, { "epoch": 5.35, "learning_rate": 0.00019366762177650427, "loss": 0.235, "step": 50000 }, { "epoch": 5.35, "eval_loss": 0.45431894063949585, "eval_runtime": 49.0294, "eval_samples_per_second": 41.343, "eval_steps_per_second": 5.181, "eval_wer": 0.3808449178552085, "step": 50000 }, { "epoch": 5.36, "eval_loss": 0.45549678802490234, "eval_runtime": 49.0356, "eval_samples_per_second": 41.337, "eval_steps_per_second": 5.18, "eval_wer": 0.3773244267918397, "step": 50100 }, { "epoch": 5.37, "eval_loss": 0.45248955488204956, "eval_runtime": 48.9938, "eval_samples_per_second": 41.373, "eval_steps_per_second": 5.184, "eval_wer": 0.3814768008665824, "step": 50200 }, { "epoch": 5.39, "eval_loss": 0.45570600032806396, "eval_runtime": 48.9527, "eval_samples_per_second": 41.407, "eval_steps_per_second": 5.189, "eval_wer": 0.3813865318649576, "step": 50300 }, { "epoch": 5.4, "eval_loss": 0.46039825677871704, "eval_runtime": 48.6359, "eval_samples_per_second": 41.677, "eval_steps_per_second": 5.222, "eval_wer": 0.375428777757718, "step": 50400 }, { "epoch": 5.41, "learning_rate": 0.00019259312320916904, "loss": 0.2299, "step": 50500 }, { "epoch": 5.41, "eval_loss": 0.4657667875289917, "eval_runtime": 49.1397, "eval_samples_per_second": 41.25, "eval_steps_per_second": 5.169, "eval_wer": 0.3769633507853403, "step": 50500 }, { "epoch": 5.42, "eval_loss": 0.4657803177833557, "eval_runtime": 49.0879, "eval_samples_per_second": 41.293, "eval_steps_per_second": 5.174, "eval_wer": 0.38842751399169523, "step": 50600 }, { "epoch": 5.43, "eval_loss": 0.4701368510723114, "eval_runtime": 48.9419, "eval_samples_per_second": 41.416, "eval_steps_per_second": 5.19, "eval_wer": 0.3919480050550641, "step": 50700 }, { "epoch": 5.44, "eval_loss": 0.4495311677455902, "eval_runtime": 48.8139, "eval_samples_per_second": 41.525, "eval_steps_per_second": 5.203, "eval_wer": 0.3818378768730818, "step": 50800 }, { "epoch": 5.45, "eval_loss": 0.47025540471076965, "eval_runtime": 48.7211, "eval_samples_per_second": 41.604, "eval_steps_per_second": 5.213, "eval_wer": 0.3886080519949449, "step": 50900 }, { "epoch": 5.46, "learning_rate": 0.0001915186246418338, "loss": 0.2307, "step": 51000 }, { "epoch": 5.46, "eval_loss": 0.4395087659358978, "eval_runtime": 48.5097, "eval_samples_per_second": 41.785, "eval_steps_per_second": 5.236, "eval_wer": 0.37425528073659503, "step": 51000 }, { "epoch": 5.47, "eval_loss": 0.44871771335601807, "eval_runtime": 48.9604, "eval_samples_per_second": 41.401, "eval_steps_per_second": 5.188, "eval_wer": 0.3750677017512186, "step": 51100 }, { "epoch": 5.48, "eval_loss": 0.4355129301548004, "eval_runtime": 49.0556, "eval_samples_per_second": 41.32, "eval_steps_per_second": 5.178, "eval_wer": 0.3732623217187218, "step": 51200 }, { "epoch": 5.49, "eval_loss": 0.4622361958026886, "eval_runtime": 48.6307, "eval_samples_per_second": 41.681, "eval_steps_per_second": 5.223, "eval_wer": 0.38111572486008305, "step": 51300 }, { "epoch": 5.5, "eval_loss": 0.44426313042640686, "eval_runtime": 49.0933, "eval_samples_per_second": 41.289, "eval_steps_per_second": 5.174, "eval_wer": 0.3801227658422098, "step": 51400 }, { "epoch": 5.51, "learning_rate": 0.00019044412607449856, "loss": 0.2383, "step": 51500 }, { "epoch": 5.51, "eval_loss": 0.4410970211029053, "eval_runtime": 48.6889, "eval_samples_per_second": 41.632, "eval_steps_per_second": 5.217, "eval_wer": 0.3743455497382199, "step": 51500 }, { "epoch": 5.52, "eval_loss": 0.4437633454799652, "eval_runtime": 49.0805, "eval_samples_per_second": 41.3, "eval_steps_per_second": 5.175, "eval_wer": 0.3777757717999639, "step": 51600 }, { "epoch": 5.54, "eval_loss": 0.45590972900390625, "eval_runtime": 48.7252, "eval_samples_per_second": 41.601, "eval_steps_per_second": 5.213, "eval_wer": 0.3784076548113378, "step": 51700 }, { "epoch": 5.55, "eval_loss": 0.43089374899864197, "eval_runtime": 49.0544, "eval_samples_per_second": 41.322, "eval_steps_per_second": 5.178, "eval_wer": 0.3655894565806102, "step": 51800 }, { "epoch": 5.56, "eval_loss": 0.4454806447029114, "eval_runtime": 50.091, "eval_samples_per_second": 40.466, "eval_steps_per_second": 5.071, "eval_wer": 0.3660408015887344, "step": 51900 }, { "epoch": 5.57, "learning_rate": 0.0001893696275071633, "loss": 0.23, "step": 52000 }, { "epoch": 5.57, "eval_loss": 0.4435708224773407, "eval_runtime": 48.8139, "eval_samples_per_second": 41.525, "eval_steps_per_second": 5.203, "eval_wer": 0.3598122404766203, "step": 52000 }, { "epoch": 5.58, "eval_loss": 0.43444132804870605, "eval_runtime": 48.9776, "eval_samples_per_second": 41.386, "eval_steps_per_second": 5.186, "eval_wer": 0.3684780646326052, "step": 52100 }, { "epoch": 5.59, "eval_loss": 0.42824628949165344, "eval_runtime": 49.2816, "eval_samples_per_second": 41.131, "eval_steps_per_second": 5.154, "eval_wer": 0.36901967864235424, "step": 52200 }, { "epoch": 5.6, "eval_loss": 0.44636350870132446, "eval_runtime": 49.2151, "eval_samples_per_second": 41.187, "eval_steps_per_second": 5.161, "eval_wer": 0.38003249684058493, "step": 52300 }, { "epoch": 5.61, "eval_loss": 0.4458146393299103, "eval_runtime": 48.8414, "eval_samples_per_second": 41.502, "eval_steps_per_second": 5.201, "eval_wer": 0.390864777035566, "step": 52400 }, { "epoch": 5.62, "learning_rate": 0.00018829512893982808, "loss": 0.2305, "step": 52500 }, { "epoch": 5.62, "eval_loss": 0.448255330324173, "eval_runtime": 49.3278, "eval_samples_per_second": 41.092, "eval_steps_per_second": 5.149, "eval_wer": 0.3756093157609677, "step": 52500 }, { "epoch": 5.63, "eval_loss": 0.4547184705734253, "eval_runtime": 49.758, "eval_samples_per_second": 40.737, "eval_steps_per_second": 5.105, "eval_wer": 0.37849792381296266, "step": 52600 }, { "epoch": 5.64, "eval_loss": 0.46712735295295715, "eval_runtime": 48.8295, "eval_samples_per_second": 41.512, "eval_steps_per_second": 5.202, "eval_wer": 0.3820184148763315, "step": 52700 }, { "epoch": 5.65, "eval_loss": 0.4449251890182495, "eval_runtime": 51.0114, "eval_samples_per_second": 39.736, "eval_steps_per_second": 4.979, "eval_wer": 0.3657699945838599, "step": 52800 }, { "epoch": 5.66, "eval_loss": 0.45962706208229065, "eval_runtime": 48.8671, "eval_samples_per_second": 41.48, "eval_steps_per_second": 5.198, "eval_wer": 0.37163747968947464, "step": 52900 }, { "epoch": 5.67, "learning_rate": 0.0001872227793696275, "loss": 0.2237, "step": 53000 }, { "epoch": 5.67, "eval_loss": 0.4399178624153137, "eval_runtime": 48.9657, "eval_samples_per_second": 41.396, "eval_steps_per_second": 5.187, "eval_wer": 0.36694349160498285, "step": 53000 }, { "epoch": 5.69, "eval_loss": 0.44098395109176636, "eval_runtime": 50.1368, "eval_samples_per_second": 40.429, "eval_steps_per_second": 5.066, "eval_wer": 0.37190828669434917, "step": 53100 }, { "epoch": 5.7, "eval_loss": 0.45740246772766113, "eval_runtime": 48.7603, "eval_samples_per_second": 41.571, "eval_steps_per_second": 5.209, "eval_wer": 0.3618884275139917, "step": 53200 }, { "epoch": 5.71, "eval_loss": 0.44431784749031067, "eval_runtime": 48.9893, "eval_samples_per_second": 41.376, "eval_steps_per_second": 5.185, "eval_wer": 0.36901967864235424, "step": 53300 }, { "epoch": 5.72, "eval_loss": 0.4380861818790436, "eval_runtime": 49.01, "eval_samples_per_second": 41.359, "eval_steps_per_second": 5.183, "eval_wer": 0.36775591261960644, "step": 53400 }, { "epoch": 5.73, "learning_rate": 0.00018614828080229225, "loss": 0.2337, "step": 53500 }, { "epoch": 5.73, "eval_loss": 0.44900110363960266, "eval_runtime": 49.3359, "eval_samples_per_second": 41.086, "eval_steps_per_second": 5.148, "eval_wer": 0.3687488716374797, "step": 53500 }, { "epoch": 5.74, "eval_loss": 0.4427066743373871, "eval_runtime": 49.2278, "eval_samples_per_second": 41.176, "eval_steps_per_second": 5.16, "eval_wer": 0.37515797075284346, "step": 53600 }, { "epoch": 5.75, "eval_loss": 0.4423009157180786, "eval_runtime": 49.2643, "eval_samples_per_second": 41.145, "eval_steps_per_second": 5.156, "eval_wer": 0.38580971294457483, "step": 53700 }, { "epoch": 5.76, "eval_loss": 0.4701789617538452, "eval_runtime": 49.1364, "eval_samples_per_second": 41.253, "eval_steps_per_second": 5.169, "eval_wer": 0.3824697598844557, "step": 53800 }, { "epoch": 5.77, "eval_loss": 0.4724409580230713, "eval_runtime": 49.3384, "eval_samples_per_second": 41.084, "eval_steps_per_second": 5.148, "eval_wer": 0.38003249684058493, "step": 53900 }, { "epoch": 5.78, "learning_rate": 0.00018507378223495702, "loss": 0.23, "step": 54000 }, { "epoch": 5.78, "eval_loss": 0.44759470224380493, "eval_runtime": 49.0243, "eval_samples_per_second": 41.347, "eval_steps_per_second": 5.181, "eval_wer": 0.3826502978877054, "step": 54000 }, { "epoch": 5.79, "eval_loss": 0.4508274793624878, "eval_runtime": 48.7547, "eval_samples_per_second": 41.575, "eval_steps_per_second": 5.21, "eval_wer": 0.39185773605343927, "step": 54100 }, { "epoch": 5.8, "eval_loss": 0.45642468333244324, "eval_runtime": 49.1232, "eval_samples_per_second": 41.264, "eval_steps_per_second": 5.171, "eval_wer": 0.37876873081783713, "step": 54200 }, { "epoch": 5.81, "eval_loss": 0.46016448736190796, "eval_runtime": 48.8959, "eval_samples_per_second": 41.455, "eval_steps_per_second": 5.195, "eval_wer": 0.3887885899981946, "step": 54300 }, { "epoch": 5.82, "eval_loss": 0.4537946581840515, "eval_runtime": 49.0323, "eval_samples_per_second": 41.34, "eval_steps_per_second": 5.18, "eval_wer": 0.37317205271709697, "step": 54400 }, { "epoch": 5.84, "learning_rate": 0.00018399928366762177, "loss": 0.2334, "step": 54500 }, { "epoch": 5.84, "eval_loss": 0.4499867558479309, "eval_runtime": 48.5461, "eval_samples_per_second": 41.754, "eval_steps_per_second": 5.232, "eval_wer": 0.3807546488535837, "step": 54500 }, { "epoch": 5.85, "eval_loss": 0.44750362634658813, "eval_runtime": 48.962, "eval_samples_per_second": 41.399, "eval_steps_per_second": 5.188, "eval_wer": 0.3704639826683517, "step": 54600 }, { "epoch": 5.86, "eval_loss": 0.4414827823638916, "eval_runtime": 48.6484, "eval_samples_per_second": 41.666, "eval_steps_per_second": 5.221, "eval_wer": 0.37723415779021485, "step": 54700 }, { "epoch": 5.87, "eval_loss": 0.4515135586261749, "eval_runtime": 48.8475, "eval_samples_per_second": 41.497, "eval_steps_per_second": 5.2, "eval_wer": 0.37705361978696517, "step": 54800 }, { "epoch": 5.88, "eval_loss": 0.44104623794555664, "eval_runtime": 48.6499, "eval_samples_per_second": 41.665, "eval_steps_per_second": 5.221, "eval_wer": 0.3676656436179816, "step": 54900 }, { "epoch": 5.89, "learning_rate": 0.00018292693409742116, "loss": 0.2259, "step": 55000 }, { "epoch": 5.89, "eval_loss": 0.45551472902297974, "eval_runtime": 48.9097, "eval_samples_per_second": 41.444, "eval_steps_per_second": 5.193, "eval_wer": 0.37019317566347715, "step": 55000 }, { "epoch": 5.9, "eval_loss": 0.4508730471134186, "eval_runtime": 48.4437, "eval_samples_per_second": 41.842, "eval_steps_per_second": 5.243, "eval_wer": 0.3894204730095685, "step": 55100 }, { "epoch": 5.91, "eval_loss": 0.4472365379333496, "eval_runtime": 48.759, "eval_samples_per_second": 41.572, "eval_steps_per_second": 5.209, "eval_wer": 0.3692002166456039, "step": 55200 }, { "epoch": 5.92, "eval_loss": 0.44380319118499756, "eval_runtime": 48.6197, "eval_samples_per_second": 41.691, "eval_steps_per_second": 5.224, "eval_wer": 0.375428777757718, "step": 55300 }, { "epoch": 5.93, "eval_loss": 0.4398874044418335, "eval_runtime": 48.7782, "eval_samples_per_second": 41.555, "eval_steps_per_second": 5.207, "eval_wer": 0.3698320996569778, "step": 55400 }, { "epoch": 5.94, "learning_rate": 0.00018185243553008596, "loss": 0.2289, "step": 55500 }, { "epoch": 5.94, "eval_loss": 0.44961434602737427, "eval_runtime": 50.0268, "eval_samples_per_second": 40.518, "eval_steps_per_second": 5.077, "eval_wer": 0.37533850875609315, "step": 55500 }, { "epoch": 5.95, "eval_loss": 0.4505833685398102, "eval_runtime": 51.0999, "eval_samples_per_second": 39.667, "eval_steps_per_second": 4.971, "eval_wer": 0.3752482397544683, "step": 55600 }, { "epoch": 5.96, "eval_loss": 0.448152095079422, "eval_runtime": 49.8088, "eval_samples_per_second": 40.696, "eval_steps_per_second": 5.1, "eval_wer": 0.37660227477884095, "step": 55700 }, { "epoch": 5.97, "eval_loss": 0.4415203630924225, "eval_runtime": 50.6483, "eval_samples_per_second": 40.021, "eval_steps_per_second": 5.015, "eval_wer": 0.37723415779021485, "step": 55800 }, { "epoch": 5.98, "eval_loss": 0.44465985894203186, "eval_runtime": 49.654, "eval_samples_per_second": 40.822, "eval_steps_per_second": 5.115, "eval_wer": 0.3749774327495938, "step": 55900 }, { "epoch": 6.0, "learning_rate": 0.00018078008595988536, "loss": 0.2281, "step": 56000 }, { "epoch": 6.0, "eval_loss": 0.45663803815841675, "eval_runtime": 49.5628, "eval_samples_per_second": 40.898, "eval_steps_per_second": 5.125, "eval_wer": 0.38418487091532766, "step": 56000 }, { "epoch": 6.01, "eval_loss": 0.4693831205368042, "eval_runtime": 50.0809, "eval_samples_per_second": 40.475, "eval_steps_per_second": 5.072, "eval_wer": 0.37741469579346454, "step": 56100 }, { "epoch": 6.02, "eval_loss": 0.4454186260700226, "eval_runtime": 50.0614, "eval_samples_per_second": 40.49, "eval_steps_per_second": 5.074, "eval_wer": 0.37876873081783713, "step": 56200 }, { "epoch": 6.03, "eval_loss": 0.467598557472229, "eval_runtime": 50.2364, "eval_samples_per_second": 40.349, "eval_steps_per_second": 5.056, "eval_wer": 0.3718180176927243, "step": 56300 }, { "epoch": 6.04, "eval_loss": 0.46499374508857727, "eval_runtime": 50.1973, "eval_samples_per_second": 40.381, "eval_steps_per_second": 5.06, "eval_wer": 0.3750677017512186, "step": 56400 }, { "epoch": 6.05, "learning_rate": 0.00017970558739255016, "loss": 0.1979, "step": 56500 }, { "epoch": 6.05, "eval_loss": 0.4601166844367981, "eval_runtime": 49.9764, "eval_samples_per_second": 40.559, "eval_steps_per_second": 5.082, "eval_wer": 0.3765120057772161, "step": 56500 }, { "epoch": 6.06, "eval_loss": 0.4647436738014221, "eval_runtime": 50.0745, "eval_samples_per_second": 40.48, "eval_steps_per_second": 5.072, "eval_wer": 0.384004332912078, "step": 56600 }, { "epoch": 6.07, "eval_loss": 0.4781748950481415, "eval_runtime": 50.0517, "eval_samples_per_second": 40.498, "eval_steps_per_second": 5.075, "eval_wer": 0.3756093157609677, "step": 56700 }, { "epoch": 6.08, "eval_loss": 0.4708513617515564, "eval_runtime": 49.8736, "eval_samples_per_second": 40.643, "eval_steps_per_second": 5.093, "eval_wer": 0.3736233977252212, "step": 56800 }, { "epoch": 6.09, "eval_loss": 0.4707356095314026, "eval_runtime": 50.2175, "eval_samples_per_second": 40.364, "eval_steps_per_second": 5.058, "eval_wer": 0.37335259072034666, "step": 56900 }, { "epoch": 6.1, "learning_rate": 0.00017863108882521487, "loss": 0.1923, "step": 57000 }, { "epoch": 6.1, "eval_loss": 0.4704015254974365, "eval_runtime": 50.2985, "eval_samples_per_second": 40.299, "eval_steps_per_second": 5.05, "eval_wer": 0.3750677017512186, "step": 57000 }, { "epoch": 6.11, "eval_loss": 0.4542071223258972, "eval_runtime": 49.8684, "eval_samples_per_second": 40.647, "eval_steps_per_second": 5.093, "eval_wer": 0.37208882469759885, "step": 57100 }, { "epoch": 6.12, "eval_loss": 0.45417317748069763, "eval_runtime": 51.0162, "eval_samples_per_second": 39.732, "eval_steps_per_second": 4.979, "eval_wer": 0.37353312872359634, "step": 57200 }, { "epoch": 6.13, "eval_loss": 0.4587162435054779, "eval_runtime": 49.7221, "eval_samples_per_second": 40.767, "eval_steps_per_second": 5.108, "eval_wer": 0.3803935728470843, "step": 57300 }, { "epoch": 6.15, "eval_loss": 0.4428020715713501, "eval_runtime": 50.0675, "eval_samples_per_second": 40.485, "eval_steps_per_second": 5.073, "eval_wer": 0.3687488716374797, "step": 57400 }, { "epoch": 6.16, "learning_rate": 0.00017755659025787962, "loss": 0.2012, "step": 57500 }, { "epoch": 6.16, "eval_loss": 0.4456498920917511, "eval_runtime": 50.0097, "eval_samples_per_second": 40.532, "eval_steps_per_second": 5.079, "eval_wer": 0.3747968947463441, "step": 57500 }, { "epoch": 6.17, "eval_loss": 0.45776355266571045, "eval_runtime": 50.0851, "eval_samples_per_second": 40.471, "eval_steps_per_second": 5.071, "eval_wer": 0.37615092977071674, "step": 57600 }, { "epoch": 6.18, "eval_loss": 0.4699217975139618, "eval_runtime": 50.0917, "eval_samples_per_second": 40.466, "eval_steps_per_second": 5.071, "eval_wer": 0.3721790936992237, "step": 57700 }, { "epoch": 6.19, "eval_loss": 0.44986045360565186, "eval_runtime": 50.1466, "eval_samples_per_second": 40.422, "eval_steps_per_second": 5.065, "eval_wer": 0.3756093157609677, "step": 57800 }, { "epoch": 6.2, "eval_loss": 0.46329542994499207, "eval_runtime": 49.6477, "eval_samples_per_second": 40.828, "eval_steps_per_second": 5.116, "eval_wer": 0.36802671962448097, "step": 57900 }, { "epoch": 6.21, "learning_rate": 0.0001764820916905444, "loss": 0.1951, "step": 58000 }, { "epoch": 6.21, "eval_loss": 0.45481452345848083, "eval_runtime": 50.2015, "eval_samples_per_second": 40.377, "eval_steps_per_second": 5.06, "eval_wer": 0.3711861346813504, "step": 58000 }, { "epoch": 6.22, "eval_loss": 0.4520038366317749, "eval_runtime": 50.0272, "eval_samples_per_second": 40.518, "eval_steps_per_second": 5.077, "eval_wer": 0.3758801227658422, "step": 58100 }, { "epoch": 6.23, "eval_loss": 0.4458475410938263, "eval_runtime": 50.0331, "eval_samples_per_second": 40.513, "eval_steps_per_second": 5.077, "eval_wer": 0.36161762050911717, "step": 58200 }, { "epoch": 6.24, "eval_loss": 0.43071892857551575, "eval_runtime": 50.4559, "eval_samples_per_second": 40.174, "eval_steps_per_second": 5.034, "eval_wer": 0.36369380754648856, "step": 58300 }, { "epoch": 6.25, "eval_loss": 0.45458078384399414, "eval_runtime": 50.2084, "eval_samples_per_second": 40.372, "eval_steps_per_second": 5.059, "eval_wer": 0.3620689655172414, "step": 58400 }, { "epoch": 6.26, "learning_rate": 0.00017540759312320914, "loss": 0.1967, "step": 58500 }, { "epoch": 6.26, "eval_loss": 0.4458640217781067, "eval_runtime": 50.4951, "eval_samples_per_second": 40.143, "eval_steps_per_second": 5.03, "eval_wer": 0.3623397725221159, "step": 58500 }, { "epoch": 6.27, "eval_loss": 0.45346349477767944, "eval_runtime": 50.6118, "eval_samples_per_second": 40.05, "eval_steps_per_second": 5.019, "eval_wer": 0.36901967864235424, "step": 58600 }, { "epoch": 6.28, "eval_loss": 0.4573749899864197, "eval_runtime": 50.4308, "eval_samples_per_second": 40.194, "eval_steps_per_second": 5.037, "eval_wer": 0.37714388878859, "step": 58700 }, { "epoch": 6.3, "eval_loss": 0.44925975799560547, "eval_runtime": 50.8786, "eval_samples_per_second": 39.84, "eval_steps_per_second": 4.992, "eval_wer": 0.3744358187398447, "step": 58800 }, { "epoch": 6.31, "eval_loss": 0.44936132431030273, "eval_runtime": 50.0403, "eval_samples_per_second": 40.507, "eval_steps_per_second": 5.076, "eval_wer": 0.3768730817837155, "step": 58900 }, { "epoch": 6.32, "learning_rate": 0.0001743330945558739, "loss": 0.1998, "step": 59000 }, { "epoch": 6.32, "eval_loss": 0.45291775465011597, "eval_runtime": 50.0663, "eval_samples_per_second": 40.486, "eval_steps_per_second": 5.073, "eval_wer": 0.36441595955948725, "step": 59000 }, { "epoch": 6.33, "eval_loss": 0.44164779782295227, "eval_runtime": 50.3619, "eval_samples_per_second": 40.249, "eval_steps_per_second": 5.043, "eval_wer": 0.3662213395919841, "step": 59100 }, { "epoch": 6.34, "eval_loss": 0.44675391912460327, "eval_runtime": 50.2818, "eval_samples_per_second": 40.313, "eval_steps_per_second": 5.052, "eval_wer": 0.37849792381296266, "step": 59200 }, { "epoch": 6.35, "eval_loss": 0.43772903084754944, "eval_runtime": 51.8248, "eval_samples_per_second": 39.113, "eval_steps_per_second": 4.901, "eval_wer": 0.3664018775952338, "step": 59300 }, { "epoch": 6.36, "eval_loss": 0.46470198035240173, "eval_runtime": 49.603, "eval_samples_per_second": 40.865, "eval_steps_per_second": 5.121, "eval_wer": 0.37551904675934283, "step": 59400 }, { "epoch": 6.37, "learning_rate": 0.00017325859598853866, "loss": 0.2009, "step": 59500 }, { "epoch": 6.37, "eval_loss": 0.46995046734809875, "eval_runtime": 49.547, "eval_samples_per_second": 40.911, "eval_steps_per_second": 5.126, "eval_wer": 0.38237949088283085, "step": 59500 }, { "epoch": 6.38, "eval_loss": 0.448755145072937, "eval_runtime": 49.6968, "eval_samples_per_second": 40.787, "eval_steps_per_second": 5.111, "eval_wer": 0.3684780646326052, "step": 59600 }, { "epoch": 6.39, "eval_loss": 0.4649437665939331, "eval_runtime": 49.5562, "eval_samples_per_second": 40.903, "eval_steps_per_second": 5.125, "eval_wer": 0.3803935728470843, "step": 59700 }, { "epoch": 6.4, "eval_loss": 0.4388504922389984, "eval_runtime": 49.9037, "eval_samples_per_second": 40.618, "eval_steps_per_second": 5.09, "eval_wer": 0.3689294096407294, "step": 59800 }, { "epoch": 6.41, "eval_loss": 0.4456236958503723, "eval_runtime": 49.5129, "eval_samples_per_second": 40.939, "eval_steps_per_second": 5.13, "eval_wer": 0.353132334356382, "step": 59900 }, { "epoch": 6.42, "learning_rate": 0.00017218409742120343, "loss": 0.2007, "step": 60000 }, { "epoch": 6.42, "eval_loss": 0.45720431208610535, "eval_runtime": 49.5962, "eval_samples_per_second": 40.87, "eval_steps_per_second": 5.121, "eval_wer": 0.3657699945838599, "step": 60000 }, { "epoch": 6.43, "eval_loss": 0.44642525911331177, "eval_runtime": 49.5448, "eval_samples_per_second": 40.912, "eval_steps_per_second": 5.127, "eval_wer": 0.366853222603358, "step": 60100 }, { "epoch": 6.45, "eval_loss": 0.46656882762908936, "eval_runtime": 49.5603, "eval_samples_per_second": 40.9, "eval_steps_per_second": 5.125, "eval_wer": 0.3710958656797256, "step": 60200 }, { "epoch": 6.46, "eval_loss": 0.4399396777153015, "eval_runtime": 49.6905, "eval_samples_per_second": 40.793, "eval_steps_per_second": 5.112, "eval_wer": 0.3659505325871096, "step": 60300 }, { "epoch": 6.47, "eval_loss": 0.44454124569892883, "eval_runtime": 49.5472, "eval_samples_per_second": 40.91, "eval_steps_per_second": 5.126, "eval_wer": 0.36306192453511466, "step": 60400 }, { "epoch": 6.48, "learning_rate": 0.00017111174785100285, "loss": 0.2005, "step": 60500 }, { "epoch": 6.48, "eval_loss": 0.4450042247772217, "eval_runtime": 49.7013, "eval_samples_per_second": 40.784, "eval_steps_per_second": 5.111, "eval_wer": 0.3620689655172414, "step": 60500 }, { "epoch": 6.49, "eval_loss": 0.4346451163291931, "eval_runtime": 49.7485, "eval_samples_per_second": 40.745, "eval_steps_per_second": 5.106, "eval_wer": 0.35710417042787507, "step": 60600 }, { "epoch": 6.5, "eval_loss": 0.43582871556282043, "eval_runtime": 49.5116, "eval_samples_per_second": 40.94, "eval_steps_per_second": 5.13, "eval_wer": 0.35809712944574834, "step": 60700 }, { "epoch": 6.51, "eval_loss": 0.43437883257865906, "eval_runtime": 49.4394, "eval_samples_per_second": 41.0, "eval_steps_per_second": 5.138, "eval_wer": 0.36459649756273693, "step": 60800 }, { "epoch": 6.52, "eval_loss": 0.4377478063106537, "eval_runtime": 49.4072, "eval_samples_per_second": 41.026, "eval_steps_per_second": 5.141, "eval_wer": 0.3620689655172414, "step": 60900 }, { "epoch": 6.53, "learning_rate": 0.0001700372492836676, "loss": 0.2038, "step": 61000 }, { "epoch": 6.53, "eval_loss": 0.42619436979293823, "eval_runtime": 49.2219, "eval_samples_per_second": 41.181, "eval_steps_per_second": 5.16, "eval_wer": 0.3570139014262502, "step": 61000 }, { "epoch": 6.54, "eval_loss": 0.4269231855869293, "eval_runtime": 49.1941, "eval_samples_per_second": 41.204, "eval_steps_per_second": 5.163, "eval_wer": 0.3614370825058675, "step": 61100 }, { "epoch": 6.55, "eval_loss": 0.42971500754356384, "eval_runtime": 49.2417, "eval_samples_per_second": 41.164, "eval_steps_per_second": 5.158, "eval_wer": 0.35918035746524646, "step": 61200 }, { "epoch": 6.56, "eval_loss": 0.4432744085788727, "eval_runtime": 49.2842, "eval_samples_per_second": 41.129, "eval_steps_per_second": 5.154, "eval_wer": 0.36820725762773066, "step": 61300 }, { "epoch": 6.57, "eval_loss": 0.44737276434898376, "eval_runtime": 49.0666, "eval_samples_per_second": 41.311, "eval_steps_per_second": 5.177, "eval_wer": 0.36441595955948725, "step": 61400 }, { "epoch": 6.58, "learning_rate": 0.00016896275071633237, "loss": 0.199, "step": 61500 }, { "epoch": 6.58, "eval_loss": 0.44639796018600464, "eval_runtime": 49.2396, "eval_samples_per_second": 41.166, "eval_steps_per_second": 5.158, "eval_wer": 0.3678461816212313, "step": 61500 }, { "epoch": 6.6, "eval_loss": 0.43974536657333374, "eval_runtime": 50.0219, "eval_samples_per_second": 40.522, "eval_steps_per_second": 5.078, "eval_wer": 0.35620148041162664, "step": 61600 }, { "epoch": 6.61, "eval_loss": 0.4415305256843567, "eval_runtime": 49.2213, "eval_samples_per_second": 41.181, "eval_steps_per_second": 5.16, "eval_wer": 0.36116627550099295, "step": 61700 }, { "epoch": 6.62, "eval_loss": 0.4362453520298004, "eval_runtime": 49.2548, "eval_samples_per_second": 41.153, "eval_steps_per_second": 5.157, "eval_wer": 0.36008304748149483, "step": 61800 }, { "epoch": 6.63, "eval_loss": 0.44418972730636597, "eval_runtime": 49.1447, "eval_samples_per_second": 41.246, "eval_steps_per_second": 5.168, "eval_wer": 0.3623397725221159, "step": 61900 }, { "epoch": 6.64, "learning_rate": 0.00016788825214899712, "loss": 0.1995, "step": 62000 }, { "epoch": 6.64, "eval_loss": 0.45579132437705994, "eval_runtime": 49.0853, "eval_samples_per_second": 41.295, "eval_steps_per_second": 5.175, "eval_wer": 0.3662213395919841, "step": 62000 }, { "epoch": 6.65, "eval_loss": 0.44767463207244873, "eval_runtime": 49.0065, "eval_samples_per_second": 41.362, "eval_steps_per_second": 5.183, "eval_wer": 0.3646867665643618, "step": 62100 }, { "epoch": 6.66, "eval_loss": 0.4542370140552521, "eval_runtime": 49.7999, "eval_samples_per_second": 40.703, "eval_steps_per_second": 5.1, "eval_wer": 0.3699223686586026, "step": 62200 }, { "epoch": 6.67, "eval_loss": 0.4411347508430481, "eval_runtime": 49.1039, "eval_samples_per_second": 41.28, "eval_steps_per_second": 5.173, "eval_wer": 0.36324246253836434, "step": 62300 }, { "epoch": 6.68, "eval_loss": 0.44079679250717163, "eval_runtime": 48.9326, "eval_samples_per_second": 41.424, "eval_steps_per_second": 5.191, "eval_wer": 0.3657699945838599, "step": 62400 }, { "epoch": 6.69, "learning_rate": 0.00016681590257879654, "loss": 0.2014, "step": 62500 }, { "epoch": 6.69, "eval_loss": 0.4426039755344391, "eval_runtime": 50.1246, "eval_samples_per_second": 40.439, "eval_steps_per_second": 5.067, "eval_wer": 0.36910994764397903, "step": 62500 }, { "epoch": 6.7, "eval_loss": 0.42458194494247437, "eval_runtime": 49.2003, "eval_samples_per_second": 41.199, "eval_steps_per_second": 5.163, "eval_wer": 0.3645062285611121, "step": 62600 }, { "epoch": 6.71, "eval_loss": 0.4466419219970703, "eval_runtime": 49.1925, "eval_samples_per_second": 41.205, "eval_steps_per_second": 5.163, "eval_wer": 0.36757537461635675, "step": 62700 }, { "epoch": 6.72, "eval_loss": 0.4493255913257599, "eval_runtime": 49.3043, "eval_samples_per_second": 41.112, "eval_steps_per_second": 5.152, "eval_wer": 0.356562556418126, "step": 62800 }, { "epoch": 6.73, "eval_loss": 0.43360260128974915, "eval_runtime": 49.2395, "eval_samples_per_second": 41.166, "eval_steps_per_second": 5.158, "eval_wer": 0.3620689655172414, "step": 62900 }, { "epoch": 6.75, "learning_rate": 0.00016574140401146131, "loss": 0.2015, "step": 63000 }, { "epoch": 6.75, "eval_loss": 0.4367372393608093, "eval_runtime": 49.3894, "eval_samples_per_second": 41.041, "eval_steps_per_second": 5.143, "eval_wer": 0.36035385448636936, "step": 63000 }, { "epoch": 6.76, "eval_loss": 0.4424467086791992, "eval_runtime": 50.5332, "eval_samples_per_second": 40.112, "eval_steps_per_second": 5.026, "eval_wer": 0.375428777757718, "step": 63100 }, { "epoch": 6.77, "eval_loss": 0.46792829036712646, "eval_runtime": 49.3356, "eval_samples_per_second": 41.086, "eval_steps_per_second": 5.148, "eval_wer": 0.3732623217187218, "step": 63200 }, { "epoch": 6.78, "eval_loss": 0.4482695758342743, "eval_runtime": 49.3364, "eval_samples_per_second": 41.085, "eval_steps_per_second": 5.148, "eval_wer": 0.37515797075284346, "step": 63300 }, { "epoch": 6.79, "eval_loss": 0.47460225224494934, "eval_runtime": 49.3305, "eval_samples_per_second": 41.09, "eval_steps_per_second": 5.149, "eval_wer": 0.38219895287958117, "step": 63400 }, { "epoch": 6.8, "learning_rate": 0.00016466690544412606, "loss": 0.2048, "step": 63500 }, { "epoch": 6.8, "eval_loss": 0.4340318739414215, "eval_runtime": 49.2, "eval_samples_per_second": 41.199, "eval_steps_per_second": 5.163, "eval_wer": 0.3730817837154721, "step": 63500 }, { "epoch": 6.81, "eval_loss": 0.4346422851085663, "eval_runtime": 49.239, "eval_samples_per_second": 41.167, "eval_steps_per_second": 5.159, "eval_wer": 0.36306192453511466, "step": 63600 }, { "epoch": 6.82, "eval_loss": 0.452511727809906, "eval_runtime": 49.0618, "eval_samples_per_second": 41.315, "eval_steps_per_second": 5.177, "eval_wer": 0.36802671962448097, "step": 63700 }, { "epoch": 6.83, "eval_loss": 0.4359569549560547, "eval_runtime": 49.4157, "eval_samples_per_second": 41.019, "eval_steps_per_second": 5.14, "eval_wer": 0.36405488355298793, "step": 63800 }, { "epoch": 6.84, "eval_loss": 0.42985743284225464, "eval_runtime": 49.1072, "eval_samples_per_second": 41.277, "eval_steps_per_second": 5.172, "eval_wer": 0.3557501354035024, "step": 63900 }, { "epoch": 6.85, "learning_rate": 0.00016359240687679083, "loss": 0.2017, "step": 64000 }, { "epoch": 6.85, "eval_loss": 0.43702712655067444, "eval_runtime": 49.7634, "eval_samples_per_second": 40.733, "eval_steps_per_second": 5.104, "eval_wer": 0.3533128723596317, "step": 64000 }, { "epoch": 6.86, "eval_loss": 0.4292781352996826, "eval_runtime": 49.4279, "eval_samples_per_second": 41.009, "eval_steps_per_second": 5.139, "eval_wer": 0.361707889510742, "step": 64100 }, { "epoch": 6.87, "eval_loss": 0.443094402551651, "eval_runtime": 49.4116, "eval_samples_per_second": 41.023, "eval_steps_per_second": 5.14, "eval_wer": 0.3660408015887344, "step": 64200 }, { "epoch": 6.88, "eval_loss": 0.4362151026725769, "eval_runtime": 48.7406, "eval_samples_per_second": 41.588, "eval_steps_per_second": 5.211, "eval_wer": 0.36883914063910456, "step": 64300 }, { "epoch": 6.9, "eval_loss": 0.4507463276386261, "eval_runtime": 49.1068, "eval_samples_per_second": 41.277, "eval_steps_per_second": 5.172, "eval_wer": 0.3647770355659866, "step": 64400 }, { "epoch": 6.91, "learning_rate": 0.00016251790830945558, "loss": 0.2045, "step": 64500 }, { "epoch": 6.91, "eval_loss": 0.44388145208358765, "eval_runtime": 48.9274, "eval_samples_per_second": 41.429, "eval_steps_per_second": 5.191, "eval_wer": 0.3612565445026178, "step": 64500 }, { "epoch": 6.92, "eval_loss": 0.4249202013015747, "eval_runtime": 50.6467, "eval_samples_per_second": 40.022, "eval_steps_per_second": 5.015, "eval_wer": 0.3493410362881387, "step": 64600 }, { "epoch": 6.93, "eval_loss": 0.436200350522995, "eval_runtime": 48.8605, "eval_samples_per_second": 41.485, "eval_steps_per_second": 5.198, "eval_wer": 0.36116627550099295, "step": 64700 }, { "epoch": 6.94, "eval_loss": 0.4335877299308777, "eval_runtime": 49.1047, "eval_samples_per_second": 41.279, "eval_steps_per_second": 5.173, "eval_wer": 0.3584582054522477, "step": 64800 }, { "epoch": 6.95, "eval_loss": 0.4387299120426178, "eval_runtime": 49.1708, "eval_samples_per_second": 41.224, "eval_steps_per_second": 5.166, "eval_wer": 0.35683336342300054, "step": 64900 }, { "epoch": 6.96, "learning_rate": 0.000161445558739255, "loss": 0.1977, "step": 65000 }, { "epoch": 6.96, "eval_loss": 0.43134012818336487, "eval_runtime": 49.5932, "eval_samples_per_second": 40.873, "eval_steps_per_second": 5.122, "eval_wer": 0.35421556237588014, "step": 65000 }, { "epoch": 6.97, "eval_loss": 0.42868292331695557, "eval_runtime": 49.0964, "eval_samples_per_second": 41.286, "eval_steps_per_second": 5.173, "eval_wer": 0.35520852139375336, "step": 65100 }, { "epoch": 6.98, "eval_loss": 0.4371795654296875, "eval_runtime": 49.0695, "eval_samples_per_second": 41.309, "eval_steps_per_second": 5.176, "eval_wer": 0.3586387434554974, "step": 65200 }, { "epoch": 6.99, "eval_loss": 0.43784716725349426, "eval_runtime": 48.9834, "eval_samples_per_second": 41.381, "eval_steps_per_second": 5.185, "eval_wer": 0.36288138653186497, "step": 65300 }, { "epoch": 7.0, "eval_loss": 0.4518013298511505, "eval_runtime": 49.3743, "eval_samples_per_second": 41.054, "eval_steps_per_second": 5.144, "eval_wer": 0.3639646145513631, "step": 65400 }, { "epoch": 7.01, "learning_rate": 0.00016037106017191977, "loss": 0.1971, "step": 65500 }, { "epoch": 7.01, "eval_loss": 0.44795140624046326, "eval_runtime": 48.9935, "eval_samples_per_second": 41.373, "eval_steps_per_second": 5.184, "eval_wer": 0.3556598664018776, "step": 65500 }, { "epoch": 7.02, "eval_loss": 0.452963650226593, "eval_runtime": 49.4173, "eval_samples_per_second": 41.018, "eval_steps_per_second": 5.14, "eval_wer": 0.35602094240837695, "step": 65600 }, { "epoch": 7.03, "eval_loss": 0.4580971300601959, "eval_runtime": 50.065, "eval_samples_per_second": 40.487, "eval_steps_per_second": 5.073, "eval_wer": 0.3581873984473732, "step": 65700 }, { "epoch": 7.04, "eval_loss": 0.44924312829971313, "eval_runtime": 49.1382, "eval_samples_per_second": 41.251, "eval_steps_per_second": 5.169, "eval_wer": 0.354305831377505, "step": 65800 }, { "epoch": 7.06, "eval_loss": 0.44480279088020325, "eval_runtime": 49.2997, "eval_samples_per_second": 41.116, "eval_steps_per_second": 5.152, "eval_wer": 0.3608051994944936, "step": 65900 }, { "epoch": 7.07, "learning_rate": 0.0001592965616045845, "loss": 0.1672, "step": 66000 }, { "epoch": 7.07, "eval_loss": 0.4469369351863861, "eval_runtime": 49.2087, "eval_samples_per_second": 41.192, "eval_steps_per_second": 5.162, "eval_wer": 0.354305831377505, "step": 66000 }, { "epoch": 7.08, "eval_loss": 0.42615774273872375, "eval_runtime": 49.8244, "eval_samples_per_second": 40.683, "eval_steps_per_second": 5.098, "eval_wer": 0.3487994222783896, "step": 66100 }, { "epoch": 7.09, "eval_loss": 0.4289032220840454, "eval_runtime": 49.6551, "eval_samples_per_second": 40.822, "eval_steps_per_second": 5.115, "eval_wer": 0.3570139014262502, "step": 66200 }, { "epoch": 7.1, "eval_loss": 0.4455362558364868, "eval_runtime": 49.8614, "eval_samples_per_second": 40.653, "eval_steps_per_second": 5.094, "eval_wer": 0.3544863693807547, "step": 66300 }, { "epoch": 7.11, "eval_loss": 0.4449104070663452, "eval_runtime": 49.8819, "eval_samples_per_second": 40.636, "eval_steps_per_second": 5.092, "eval_wer": 0.3562917494132515, "step": 66400 }, { "epoch": 7.12, "learning_rate": 0.0001582220630372493, "loss": 0.169, "step": 66500 }, { "epoch": 7.12, "eval_loss": 0.4554521143436432, "eval_runtime": 49.8243, "eval_samples_per_second": 40.683, "eval_steps_per_second": 5.098, "eval_wer": 0.35647228741650117, "step": 66500 }, { "epoch": 7.13, "eval_loss": 0.443204402923584, "eval_runtime": 50.0734, "eval_samples_per_second": 40.481, "eval_steps_per_second": 5.073, "eval_wer": 0.3655894565806102, "step": 66600 }, { "epoch": 7.14, "eval_loss": 0.4398520588874817, "eval_runtime": 49.6006, "eval_samples_per_second": 40.866, "eval_steps_per_second": 5.121, "eval_wer": 0.36098573749774326, "step": 66700 }, { "epoch": 7.15, "eval_loss": 0.4383464753627777, "eval_runtime": 49.6217, "eval_samples_per_second": 40.849, "eval_steps_per_second": 5.119, "eval_wer": 0.35538905939700305, "step": 66800 }, { "epoch": 7.16, "eval_loss": 0.43758177757263184, "eval_runtime": 50.6011, "eval_samples_per_second": 40.058, "eval_steps_per_second": 5.02, "eval_wer": 0.35358367936450624, "step": 66900 }, { "epoch": 7.17, "learning_rate": 0.0001571497134670487, "loss": 0.1724, "step": 67000 }, { "epoch": 7.17, "eval_loss": 0.4382694363594055, "eval_runtime": 49.755, "eval_samples_per_second": 40.74, "eval_steps_per_second": 5.105, "eval_wer": 0.3571944394294999, "step": 67000 }, { "epoch": 7.18, "eval_loss": 0.4452250301837921, "eval_runtime": 49.6952, "eval_samples_per_second": 40.789, "eval_steps_per_second": 5.111, "eval_wer": 0.3534934103628814, "step": 67100 }, { "epoch": 7.19, "eval_loss": 0.4610207974910736, "eval_runtime": 50.0238, "eval_samples_per_second": 40.521, "eval_steps_per_second": 5.078, "eval_wer": 0.36676295360173317, "step": 67200 }, { "epoch": 7.21, "eval_loss": 0.45337799191474915, "eval_runtime": 49.5531, "eval_samples_per_second": 40.906, "eval_steps_per_second": 5.126, "eval_wer": 0.3545766383823795, "step": 67300 }, { "epoch": 7.22, "eval_loss": 0.450591504573822, "eval_runtime": 49.4218, "eval_samples_per_second": 41.014, "eval_steps_per_second": 5.139, "eval_wer": 0.3604441234879942, "step": 67400 }, { "epoch": 7.23, "learning_rate": 0.0001560773638968481, "loss": 0.1729, "step": 67500 }, { "epoch": 7.23, "eval_loss": 0.4463426470756531, "eval_runtime": 49.5524, "eval_samples_per_second": 40.906, "eval_steps_per_second": 5.126, "eval_wer": 0.35069507131251126, "step": 67500 }, { "epoch": 7.24, "eval_loss": 0.44396212697029114, "eval_runtime": 49.687, "eval_samples_per_second": 40.795, "eval_steps_per_second": 5.112, "eval_wer": 0.3629716555334898, "step": 67600 }, { "epoch": 7.25, "eval_loss": 0.4361093044281006, "eval_runtime": 50.0356, "eval_samples_per_second": 40.511, "eval_steps_per_second": 5.076, "eval_wer": 0.3550279833905037, "step": 67700 }, { "epoch": 7.26, "eval_loss": 0.4397481679916382, "eval_runtime": 49.5204, "eval_samples_per_second": 40.933, "eval_steps_per_second": 5.129, "eval_wer": 0.3643256905578624, "step": 67800 }, { "epoch": 7.27, "eval_loss": 0.43276941776275635, "eval_runtime": 49.9383, "eval_samples_per_second": 40.59, "eval_steps_per_second": 5.086, "eval_wer": 0.3547571763856292, "step": 67900 }, { "epoch": 7.28, "learning_rate": 0.00015500286532951288, "loss": 0.1736, "step": 68000 }, { "epoch": 7.28, "eval_loss": 0.45456382632255554, "eval_runtime": 49.2784, "eval_samples_per_second": 41.134, "eval_steps_per_second": 5.154, "eval_wer": 0.3614370825058675, "step": 68000 }, { "epoch": 7.29, "eval_loss": 0.45059072971343994, "eval_runtime": 49.8297, "eval_samples_per_second": 40.679, "eval_steps_per_second": 5.097, "eval_wer": 0.35584040440512726, "step": 68100 }, { "epoch": 7.3, "eval_loss": 0.4360811114311218, "eval_runtime": 49.6076, "eval_samples_per_second": 40.861, "eval_steps_per_second": 5.12, "eval_wer": 0.35132695432388517, "step": 68200 }, { "epoch": 7.31, "eval_loss": 0.4222584366798401, "eval_runtime": 49.813, "eval_samples_per_second": 40.692, "eval_steps_per_second": 5.099, "eval_wer": 0.3499729192995126, "step": 68300 }, { "epoch": 7.32, "eval_loss": 0.4474307596683502, "eval_runtime": 49.5259, "eval_samples_per_second": 40.928, "eval_steps_per_second": 5.129, "eval_wer": 0.34970211229463805, "step": 68400 }, { "epoch": 7.33, "learning_rate": 0.00015392836676217763, "loss": 0.1733, "step": 68500 }, { "epoch": 7.33, "eval_loss": 0.4303099513053894, "eval_runtime": 49.5599, "eval_samples_per_second": 40.9, "eval_steps_per_second": 5.125, "eval_wer": 0.35493771438887883, "step": 68500 }, { "epoch": 7.34, "eval_loss": 0.42649605870246887, "eval_runtime": 49.6335, "eval_samples_per_second": 40.839, "eval_steps_per_second": 5.118, "eval_wer": 0.3483480772702654, "step": 68600 }, { "epoch": 7.36, "eval_loss": 0.43393298983573914, "eval_runtime": 50.0205, "eval_samples_per_second": 40.523, "eval_steps_per_second": 5.078, "eval_wer": 0.3557501354035024, "step": 68700 }, { "epoch": 7.37, "eval_loss": 0.4266127347946167, "eval_runtime": 50.1516, "eval_samples_per_second": 40.417, "eval_steps_per_second": 5.065, "eval_wer": 0.34907022928326414, "step": 68800 }, { "epoch": 7.38, "eval_loss": 0.44230374693870544, "eval_runtime": 49.8261, "eval_samples_per_second": 40.681, "eval_steps_per_second": 5.098, "eval_wer": 0.35647228741650117, "step": 68900 }, { "epoch": 7.39, "learning_rate": 0.00015285386819484238, "loss": 0.1764, "step": 69000 }, { "epoch": 7.39, "eval_loss": 0.44104790687561035, "eval_runtime": 49.6079, "eval_samples_per_second": 40.86, "eval_steps_per_second": 5.12, "eval_wer": 0.35538905939700305, "step": 69000 }, { "epoch": 7.4, "eval_loss": 0.44824397563934326, "eval_runtime": 49.4864, "eval_samples_per_second": 40.961, "eval_steps_per_second": 5.133, "eval_wer": 0.370283444665102, "step": 69100 }, { "epoch": 7.41, "eval_loss": 0.4479742646217346, "eval_runtime": 49.5287, "eval_samples_per_second": 40.926, "eval_steps_per_second": 5.128, "eval_wer": 0.36405488355298793, "step": 69200 }, { "epoch": 7.42, "eval_loss": 0.4361330270767212, "eval_runtime": 49.8379, "eval_samples_per_second": 40.672, "eval_steps_per_second": 5.097, "eval_wer": 0.3499729192995126, "step": 69300 }, { "epoch": 7.43, "eval_loss": 0.4399217963218689, "eval_runtime": 50.0303, "eval_samples_per_second": 40.515, "eval_steps_per_second": 5.077, "eval_wer": 0.36324246253836434, "step": 69400 }, { "epoch": 7.44, "learning_rate": 0.00015177936962750715, "loss": 0.1711, "step": 69500 }, { "epoch": 7.44, "eval_loss": 0.43825072050094604, "eval_runtime": 50.1866, "eval_samples_per_second": 40.389, "eval_steps_per_second": 5.061, "eval_wer": 0.3590900884636216, "step": 69500 }, { "epoch": 7.45, "eval_loss": 0.45228099822998047, "eval_runtime": 49.884, "eval_samples_per_second": 40.634, "eval_steps_per_second": 5.092, "eval_wer": 0.3636035385448637, "step": 69600 }, { "epoch": 7.46, "eval_loss": 0.438789963722229, "eval_runtime": 49.7132, "eval_samples_per_second": 40.774, "eval_steps_per_second": 5.109, "eval_wer": 0.35024372630438705, "step": 69700 }, { "epoch": 7.47, "eval_loss": 0.430462509393692, "eval_runtime": 49.7445, "eval_samples_per_second": 40.748, "eval_steps_per_second": 5.106, "eval_wer": 0.35647228741650117, "step": 69800 }, { "epoch": 7.48, "eval_loss": 0.4289742410182953, "eval_runtime": 49.8969, "eval_samples_per_second": 40.624, "eval_steps_per_second": 5.09, "eval_wer": 0.35376421736775593, "step": 69900 }, { "epoch": 7.49, "learning_rate": 0.0001507048710601719, "loss": 0.1748, "step": 70000 }, { "epoch": 7.49, "eval_loss": 0.435860276222229, "eval_runtime": 49.6706, "eval_samples_per_second": 40.809, "eval_steps_per_second": 5.114, "eval_wer": 0.3511464163206355, "step": 70000 }, { "epoch": 7.51, "eval_loss": 0.4314829707145691, "eval_runtime": 49.5429, "eval_samples_per_second": 40.914, "eval_steps_per_second": 5.127, "eval_wer": 0.3460010832280195, "step": 70100 }, { "epoch": 7.52, "eval_loss": 0.42675673961639404, "eval_runtime": 49.8146, "eval_samples_per_second": 40.691, "eval_steps_per_second": 5.099, "eval_wer": 0.3554793283986279, "step": 70200 }, { "epoch": 7.53, "eval_loss": 0.42668795585632324, "eval_runtime": 49.5577, "eval_samples_per_second": 40.902, "eval_steps_per_second": 5.125, "eval_wer": 0.34554973821989526, "step": 70300 }, { "epoch": 7.54, "eval_loss": 0.43592557311058044, "eval_runtime": 49.9069, "eval_samples_per_second": 40.616, "eval_steps_per_second": 5.089, "eval_wer": 0.35168803033038454, "step": 70400 }, { "epoch": 7.55, "learning_rate": 0.00014963037249283667, "loss": 0.1739, "step": 70500 }, { "epoch": 7.55, "eval_loss": 0.4299277067184448, "eval_runtime": 49.4302, "eval_samples_per_second": 41.007, "eval_steps_per_second": 5.139, "eval_wer": 0.34907022928326414, "step": 70500 }, { "epoch": 7.56, "eval_loss": 0.4423278570175171, "eval_runtime": 50.5024, "eval_samples_per_second": 40.137, "eval_steps_per_second": 5.029, "eval_wer": 0.3409460191370283, "step": 70600 }, { "epoch": 7.57, "eval_loss": 0.425134539604187, "eval_runtime": 49.993, "eval_samples_per_second": 40.546, "eval_steps_per_second": 5.081, "eval_wer": 0.34202924715652644, "step": 70700 }, { "epoch": 7.58, "eval_loss": 0.4300227463245392, "eval_runtime": 49.8429, "eval_samples_per_second": 40.668, "eval_steps_per_second": 5.096, "eval_wer": 0.34139736414515254, "step": 70800 }, { "epoch": 7.59, "eval_loss": 0.43489590287208557, "eval_runtime": 49.9603, "eval_samples_per_second": 40.572, "eval_steps_per_second": 5.084, "eval_wer": 0.3422097851597761, "step": 70900 }, { "epoch": 7.6, "learning_rate": 0.0001485558739255014, "loss": 0.1763, "step": 71000 }, { "epoch": 7.6, "eval_loss": 0.432796835899353, "eval_runtime": 49.7256, "eval_samples_per_second": 40.764, "eval_steps_per_second": 5.108, "eval_wer": 0.34184870915327675, "step": 71000 }, { "epoch": 7.61, "eval_loss": 0.4312654137611389, "eval_runtime": 49.7843, "eval_samples_per_second": 40.716, "eval_steps_per_second": 5.102, "eval_wer": 0.34518866221339595, "step": 71100 }, { "epoch": 7.62, "eval_loss": 0.42399337887763977, "eval_runtime": 49.7353, "eval_samples_per_second": 40.756, "eval_steps_per_second": 5.107, "eval_wer": 0.35340314136125656, "step": 71200 }, { "epoch": 7.63, "eval_loss": 0.42743441462516785, "eval_runtime": 49.616, "eval_samples_per_second": 40.854, "eval_steps_per_second": 5.119, "eval_wer": 0.34744538725401697, "step": 71300 }, { "epoch": 7.64, "eval_loss": 0.43036043643951416, "eval_runtime": 49.8989, "eval_samples_per_second": 40.622, "eval_steps_per_second": 5.09, "eval_wer": 0.3467232352410182, "step": 71400 }, { "epoch": 7.66, "learning_rate": 0.00014748137535816616, "loss": 0.171, "step": 71500 }, { "epoch": 7.66, "eval_loss": 0.43307775259017944, "eval_runtime": 49.8783, "eval_samples_per_second": 40.639, "eval_steps_per_second": 5.092, "eval_wer": 0.3509658783173858, "step": 71500 }, { "epoch": 7.67, "eval_loss": 0.42630788683891296, "eval_runtime": 49.6005, "eval_samples_per_second": 40.866, "eval_steps_per_second": 5.121, "eval_wer": 0.34780646326051634, "step": 71600 }, { "epoch": 7.68, "eval_loss": 0.4301213026046753, "eval_runtime": 49.8474, "eval_samples_per_second": 40.664, "eval_steps_per_second": 5.096, "eval_wer": 0.34473731720527173, "step": 71700 }, { "epoch": 7.69, "eval_loss": 0.40457987785339355, "eval_runtime": 49.7536, "eval_samples_per_second": 40.741, "eval_steps_per_second": 5.105, "eval_wer": 0.34518866221339595, "step": 71800 }, { "epoch": 7.7, "eval_loss": 0.42995375394821167, "eval_runtime": 50.5859, "eval_samples_per_second": 40.07, "eval_steps_per_second": 5.021, "eval_wer": 0.35277125834988265, "step": 71900 }, { "epoch": 7.71, "learning_rate": 0.00014641117478510026, "loss": 0.1792, "step": 72000 }, { "epoch": 7.71, "eval_loss": 0.42525142431259155, "eval_runtime": 49.9158, "eval_samples_per_second": 40.608, "eval_steps_per_second": 5.089, "eval_wer": 0.349160498284889, "step": 72000 }, { "epoch": 7.72, "eval_loss": 0.4295995533466339, "eval_runtime": 50.2083, "eval_samples_per_second": 40.372, "eval_steps_per_second": 5.059, "eval_wer": 0.34907022928326414, "step": 72100 }, { "epoch": 7.73, "eval_loss": 0.4117787778377533, "eval_runtime": 50.1254, "eval_samples_per_second": 40.439, "eval_steps_per_second": 5.067, "eval_wer": 0.3450983932117711, "step": 72200 }, { "epoch": 7.74, "eval_loss": 0.4347759485244751, "eval_runtime": 49.7417, "eval_samples_per_second": 40.751, "eval_steps_per_second": 5.106, "eval_wer": 0.3345369200216646, "step": 72300 }, { "epoch": 7.75, "eval_loss": 0.4282897412776947, "eval_runtime": 49.9268, "eval_samples_per_second": 40.599, "eval_steps_per_second": 5.087, "eval_wer": 0.34473731720527173, "step": 72400 }, { "epoch": 7.76, "learning_rate": 0.00014533667621776503, "loss": 0.1801, "step": 72500 }, { "epoch": 7.76, "eval_loss": 0.423183798789978, "eval_runtime": 50.0273, "eval_samples_per_second": 40.518, "eval_steps_per_second": 5.077, "eval_wer": 0.3449178552085214, "step": 72500 }, { "epoch": 7.77, "eval_loss": 0.4490908980369568, "eval_runtime": 49.8341, "eval_samples_per_second": 40.675, "eval_steps_per_second": 5.097, "eval_wer": 0.34861888427513993, "step": 72600 }, { "epoch": 7.78, "eval_loss": 0.42611071467399597, "eval_runtime": 49.9659, "eval_samples_per_second": 40.568, "eval_steps_per_second": 5.083, "eval_wer": 0.33426611301679005, "step": 72700 }, { "epoch": 7.79, "eval_loss": 0.43815183639526367, "eval_runtime": 49.9365, "eval_samples_per_second": 40.592, "eval_steps_per_second": 5.086, "eval_wer": 0.34554973821989526, "step": 72800 }, { "epoch": 7.81, "eval_loss": 0.43009382486343384, "eval_runtime": 49.5744, "eval_samples_per_second": 40.888, "eval_steps_per_second": 5.124, "eval_wer": 0.3414876331467774, "step": 72900 }, { "epoch": 7.82, "learning_rate": 0.00014426432664756445, "loss": 0.1731, "step": 73000 }, { "epoch": 7.82, "eval_loss": 0.42360547184944153, "eval_runtime": 50.0488, "eval_samples_per_second": 40.5, "eval_steps_per_second": 5.075, "eval_wer": 0.3438346271890233, "step": 73000 }, { "epoch": 7.83, "eval_loss": 0.42565011978149414, "eval_runtime": 49.9316, "eval_samples_per_second": 40.596, "eval_steps_per_second": 5.087, "eval_wer": 0.3419389781549016, "step": 73100 }, { "epoch": 7.84, "eval_loss": 0.4367884397506714, "eval_runtime": 49.8253, "eval_samples_per_second": 40.682, "eval_steps_per_second": 5.098, "eval_wer": 0.34103628813865317, "step": 73200 }, { "epoch": 7.85, "eval_loss": 0.4206501841545105, "eval_runtime": 49.6241, "eval_samples_per_second": 40.847, "eval_steps_per_second": 5.118, "eval_wer": 0.3397725221159054, "step": 73300 }, { "epoch": 7.86, "eval_loss": 0.4118278920650482, "eval_runtime": 49.7109, "eval_samples_per_second": 40.776, "eval_steps_per_second": 5.11, "eval_wer": 0.3417584401516519, "step": 73400 }, { "epoch": 7.87, "learning_rate": 0.00014318982808022923, "loss": 0.1748, "step": 73500 }, { "epoch": 7.87, "eval_loss": 0.4357281029224396, "eval_runtime": 49.9503, "eval_samples_per_second": 40.58, "eval_steps_per_second": 5.085, "eval_wer": 0.34293193717277487, "step": 73500 }, { "epoch": 7.88, "eval_loss": 0.4276559054851532, "eval_runtime": 49.4295, "eval_samples_per_second": 41.008, "eval_steps_per_second": 5.139, "eval_wer": 0.34518866221339595, "step": 73600 }, { "epoch": 7.89, "eval_loss": 0.4172598719596863, "eval_runtime": 51.6349, "eval_samples_per_second": 39.256, "eval_steps_per_second": 4.919, "eval_wer": 0.34762592525726665, "step": 73700 }, { "epoch": 7.9, "eval_loss": 0.41912218928337097, "eval_runtime": 49.7354, "eval_samples_per_second": 40.756, "eval_steps_per_second": 5.107, "eval_wer": 0.34780646326051634, "step": 73800 }, { "epoch": 7.91, "eval_loss": 0.4197118282318115, "eval_runtime": 49.7715, "eval_samples_per_second": 40.726, "eval_steps_per_second": 5.103, "eval_wer": 0.34573027622314495, "step": 73900 }, { "epoch": 7.92, "learning_rate": 0.00014211532951289397, "loss": 0.1745, "step": 74000 }, { "epoch": 7.92, "eval_loss": 0.4197350740432739, "eval_runtime": 50.0166, "eval_samples_per_second": 40.527, "eval_steps_per_second": 5.078, "eval_wer": 0.34356382018414877, "step": 74000 }, { "epoch": 7.93, "eval_loss": 0.4252673089504242, "eval_runtime": 49.9578, "eval_samples_per_second": 40.574, "eval_steps_per_second": 5.084, "eval_wer": 0.3512366853222603, "step": 74100 }, { "epoch": 7.94, "eval_loss": 0.4216529130935669, "eval_runtime": 49.7253, "eval_samples_per_second": 40.764, "eval_steps_per_second": 5.108, "eval_wer": 0.346271890232894, "step": 74200 }, { "epoch": 7.95, "eval_loss": 0.4305253326892853, "eval_runtime": 50.2727, "eval_samples_per_second": 40.32, "eval_steps_per_second": 5.052, "eval_wer": 0.3472648492507673, "step": 74300 }, { "epoch": 7.97, "eval_loss": 0.42150747776031494, "eval_runtime": 49.8232, "eval_samples_per_second": 40.684, "eval_steps_per_second": 5.098, "eval_wer": 0.35069507131251126, "step": 74400 }, { "epoch": 7.98, "learning_rate": 0.00014104083094555872, "loss": 0.1743, "step": 74500 }, { "epoch": 7.98, "eval_loss": 0.41268059611320496, "eval_runtime": 50.0689, "eval_samples_per_second": 40.484, "eval_steps_per_second": 5.073, "eval_wer": 0.34076548113377864, "step": 74500 }, { "epoch": 7.99, "eval_loss": 0.419066846370697, "eval_runtime": 49.8664, "eval_samples_per_second": 40.649, "eval_steps_per_second": 5.094, "eval_wer": 0.34681350424264307, "step": 74600 }, { "epoch": 8.0, "eval_loss": 0.43805456161499023, "eval_runtime": 49.856, "eval_samples_per_second": 40.657, "eval_steps_per_second": 5.095, "eval_wer": 0.34907022928326414, "step": 74700 }, { "epoch": 8.01, "eval_loss": 0.45096319913864136, "eval_runtime": 50.647, "eval_samples_per_second": 40.022, "eval_steps_per_second": 5.015, "eval_wer": 0.3477161942588915, "step": 74800 }, { "epoch": 8.02, "eval_loss": 0.4481862485408783, "eval_runtime": 50.0491, "eval_samples_per_second": 40.5, "eval_steps_per_second": 5.075, "eval_wer": 0.3470843112475176, "step": 74900 }, { "epoch": 8.03, "learning_rate": 0.0001399663323782235, "loss": 0.1588, "step": 75000 }, { "epoch": 8.03, "eval_loss": 0.4470798671245575, "eval_runtime": 50.1478, "eval_samples_per_second": 40.421, "eval_steps_per_second": 5.065, "eval_wer": 0.3430222061743997, "step": 75000 }, { "epoch": 8.04, "eval_loss": 0.4295661449432373, "eval_runtime": 49.994, "eval_samples_per_second": 40.545, "eval_steps_per_second": 5.081, "eval_wer": 0.3393211771077812, "step": 75100 }, { "epoch": 8.05, "eval_loss": 0.4479615390300751, "eval_runtime": 50.1363, "eval_samples_per_second": 40.43, "eval_steps_per_second": 5.066, "eval_wer": 0.3397725221159054, "step": 75200 }, { "epoch": 8.06, "eval_loss": 0.43022599816322327, "eval_runtime": 49.9468, "eval_samples_per_second": 40.583, "eval_steps_per_second": 5.085, "eval_wer": 0.34518866221339595, "step": 75300 }, { "epoch": 8.07, "eval_loss": 0.44102075695991516, "eval_runtime": 49.7515, "eval_samples_per_second": 40.742, "eval_steps_per_second": 5.105, "eval_wer": 0.34311247517602456, "step": 75400 }, { "epoch": 8.08, "learning_rate": 0.00013889183381088824, "loss": 0.144, "step": 75500 }, { "epoch": 8.08, "eval_loss": 0.426250696182251, "eval_runtime": 49.7571, "eval_samples_per_second": 40.738, "eval_steps_per_second": 5.105, "eval_wer": 0.34554973821989526, "step": 75500 }, { "epoch": 8.09, "eval_loss": 0.4522950053215027, "eval_runtime": 50.1232, "eval_samples_per_second": 40.44, "eval_steps_per_second": 5.068, "eval_wer": 0.34952157429138836, "step": 75600 }, { "epoch": 8.1, "eval_loss": 0.4454551041126251, "eval_runtime": 50.0404, "eval_samples_per_second": 40.507, "eval_steps_per_second": 5.076, "eval_wer": 0.3511464163206355, "step": 75700 }, { "epoch": 8.12, "eval_loss": 0.43785789608955383, "eval_runtime": 50.0138, "eval_samples_per_second": 40.529, "eval_steps_per_second": 5.079, "eval_wer": 0.3444665102003972, "step": 75800 }, { "epoch": 8.13, "eval_loss": 0.4417654275894165, "eval_runtime": 49.6684, "eval_samples_per_second": 40.811, "eval_steps_per_second": 5.114, "eval_wer": 0.341126557140278, "step": 75900 }, { "epoch": 8.14, "learning_rate": 0.00013781733524355298, "loss": 0.1483, "step": 76000 }, { "epoch": 8.14, "eval_loss": 0.4490506649017334, "eval_runtime": 49.753, "eval_samples_per_second": 40.741, "eval_steps_per_second": 5.105, "eval_wer": 0.346271890232894, "step": 76000 }, { "epoch": 8.15, "eval_loss": 0.43855246901512146, "eval_runtime": 49.593, "eval_samples_per_second": 40.873, "eval_steps_per_second": 5.122, "eval_wer": 0.3467232352410182, "step": 76100 }, { "epoch": 8.16, "eval_loss": 0.43268758058547974, "eval_runtime": 49.787, "eval_samples_per_second": 40.713, "eval_steps_per_second": 5.102, "eval_wer": 0.3524101823433833, "step": 76200 }, { "epoch": 8.17, "eval_loss": 0.4359542727470398, "eval_runtime": 49.6772, "eval_samples_per_second": 40.803, "eval_steps_per_second": 5.113, "eval_wer": 0.36134681350424264, "step": 76300 }, { "epoch": 8.18, "eval_loss": 0.4352158308029175, "eval_runtime": 49.6241, "eval_samples_per_second": 40.847, "eval_steps_per_second": 5.118, "eval_wer": 0.3497923812962629, "step": 76400 }, { "epoch": 8.19, "learning_rate": 0.00013674498567335243, "loss": 0.1541, "step": 76500 }, { "epoch": 8.19, "eval_loss": 0.43757787346839905, "eval_runtime": 49.5023, "eval_samples_per_second": 40.948, "eval_steps_per_second": 5.131, "eval_wer": 0.34139736414515254, "step": 76500 }, { "epoch": 8.2, "eval_loss": 0.4408476650714874, "eval_runtime": 49.9235, "eval_samples_per_second": 40.602, "eval_steps_per_second": 5.088, "eval_wer": 0.34636215923451885, "step": 76600 }, { "epoch": 8.21, "eval_loss": 0.44147056341171265, "eval_runtime": 50.6402, "eval_samples_per_second": 40.027, "eval_steps_per_second": 5.016, "eval_wer": 0.3444665102003972, "step": 76700 }, { "epoch": 8.22, "eval_loss": 0.44549474120140076, "eval_runtime": 49.8586, "eval_samples_per_second": 40.655, "eval_steps_per_second": 5.094, "eval_wer": 0.3481675392670157, "step": 76800 }, { "epoch": 8.23, "eval_loss": 0.45420777797698975, "eval_runtime": 50.7469, "eval_samples_per_second": 39.943, "eval_steps_per_second": 5.005, "eval_wer": 0.3414876331467774, "step": 76900 }, { "epoch": 8.24, "learning_rate": 0.00013567048710601718, "loss": 0.1479, "step": 77000 }, { "epoch": 8.24, "eval_loss": 0.44616568088531494, "eval_runtime": 49.6192, "eval_samples_per_second": 40.851, "eval_steps_per_second": 5.119, "eval_wer": 0.3425708611662755, "step": 77000 }, { "epoch": 8.25, "eval_loss": 0.4459743797779083, "eval_runtime": 49.6132, "eval_samples_per_second": 40.856, "eval_steps_per_second": 5.12, "eval_wer": 0.3413070951435277, "step": 77100 }, { "epoch": 8.27, "eval_loss": 0.4433516561985016, "eval_runtime": 49.9376, "eval_samples_per_second": 40.591, "eval_steps_per_second": 5.086, "eval_wer": 0.33751579707528434, "step": 77200 }, { "epoch": 8.28, "eval_loss": 0.43969422578811646, "eval_runtime": 50.4883, "eval_samples_per_second": 40.148, "eval_steps_per_second": 5.031, "eval_wer": 0.3472648492507673, "step": 77300 }, { "epoch": 8.29, "eval_loss": 0.4378765821456909, "eval_runtime": 49.5816, "eval_samples_per_second": 40.882, "eval_steps_per_second": 5.123, "eval_wer": 0.34843834627189024, "step": 77400 }, { "epoch": 8.3, "learning_rate": 0.00013459598853868192, "loss": 0.1479, "step": 77500 }, { "epoch": 8.3, "eval_loss": 0.44405272603034973, "eval_runtime": 50.0477, "eval_samples_per_second": 40.501, "eval_steps_per_second": 5.075, "eval_wer": 0.3494313052897635, "step": 77500 }, { "epoch": 8.31, "eval_loss": 0.430147647857666, "eval_runtime": 49.5341, "eval_samples_per_second": 40.921, "eval_steps_per_second": 5.128, "eval_wer": 0.3466329662393934, "step": 77600 }, { "epoch": 8.32, "eval_loss": 0.44200408458709717, "eval_runtime": 49.7936, "eval_samples_per_second": 40.708, "eval_steps_per_second": 5.101, "eval_wer": 0.3473551182523921, "step": 77700 }, { "epoch": 8.33, "eval_loss": 0.4519636034965515, "eval_runtime": 49.663, "eval_samples_per_second": 40.815, "eval_steps_per_second": 5.114, "eval_wer": 0.35890955046037193, "step": 77800 }, { "epoch": 8.34, "eval_loss": 0.4283126890659332, "eval_runtime": 49.7811, "eval_samples_per_second": 40.718, "eval_steps_per_second": 5.102, "eval_wer": 0.3481675392670157, "step": 77900 }, { "epoch": 8.35, "learning_rate": 0.0001335214899713467, "loss": 0.1531, "step": 78000 }, { "epoch": 8.35, "eval_loss": 0.4324764311313629, "eval_runtime": 49.9512, "eval_samples_per_second": 40.58, "eval_steps_per_second": 5.085, "eval_wer": 0.34455677920202205, "step": 78000 }, { "epoch": 8.36, "eval_loss": 0.4379710555076599, "eval_runtime": 50.5917, "eval_samples_per_second": 40.066, "eval_steps_per_second": 5.021, "eval_wer": 0.3469037732442679, "step": 78100 }, { "epoch": 8.37, "eval_loss": 0.44632431864738464, "eval_runtime": 49.7303, "eval_samples_per_second": 40.76, "eval_steps_per_second": 5.108, "eval_wer": 0.3503339953060119, "step": 78200 }, { "epoch": 8.38, "eval_loss": 0.44785556197166443, "eval_runtime": 50.0294, "eval_samples_per_second": 40.516, "eval_steps_per_second": 5.077, "eval_wer": 0.34988265029788773, "step": 78300 }, { "epoch": 8.39, "eval_loss": 0.4477352499961853, "eval_runtime": 50.9014, "eval_samples_per_second": 39.822, "eval_steps_per_second": 4.99, "eval_wer": 0.3528615273515075, "step": 78400 }, { "epoch": 8.4, "learning_rate": 0.00013244699140401144, "loss": 0.1507, "step": 78500 }, { "epoch": 8.4, "eval_loss": 0.47092047333717346, "eval_runtime": 50.1089, "eval_samples_per_second": 40.452, "eval_steps_per_second": 5.069, "eval_wer": 0.3551182523921285, "step": 78500 }, { "epoch": 8.42, "eval_loss": 0.45331060886383057, "eval_runtime": 49.7737, "eval_samples_per_second": 40.724, "eval_steps_per_second": 5.103, "eval_wer": 0.353132334356382, "step": 78600 }, { "epoch": 8.43, "eval_loss": 0.450659841299057, "eval_runtime": 49.9373, "eval_samples_per_second": 40.591, "eval_steps_per_second": 5.086, "eval_wer": 0.3522296443401336, "step": 78700 }, { "epoch": 8.44, "eval_loss": 0.45615944266319275, "eval_runtime": 49.8778, "eval_samples_per_second": 40.639, "eval_steps_per_second": 5.092, "eval_wer": 0.358277667448998, "step": 78800 }, { "epoch": 8.45, "eval_loss": 0.442095547914505, "eval_runtime": 49.5311, "eval_samples_per_second": 40.924, "eval_steps_per_second": 5.128, "eval_wer": 0.35773605343924897, "step": 78900 }, { "epoch": 8.46, "learning_rate": 0.00013137249283667622, "loss": 0.1545, "step": 79000 }, { "epoch": 8.46, "eval_loss": 0.4484567642211914, "eval_runtime": 49.8883, "eval_samples_per_second": 40.631, "eval_steps_per_second": 5.091, "eval_wer": 0.35466690738400436, "step": 79000 }, { "epoch": 8.47, "eval_loss": 0.4389214813709259, "eval_runtime": 49.6752, "eval_samples_per_second": 40.805, "eval_steps_per_second": 5.113, "eval_wer": 0.34654269723776854, "step": 79100 }, { "epoch": 8.48, "eval_loss": 0.43973833322525024, "eval_runtime": 49.8321, "eval_samples_per_second": 40.677, "eval_steps_per_second": 5.097, "eval_wer": 0.3501534573027622, "step": 79200 }, { "epoch": 8.49, "eval_loss": 0.44029539823532104, "eval_runtime": 50.1573, "eval_samples_per_second": 40.413, "eval_steps_per_second": 5.064, "eval_wer": 0.3470843112475176, "step": 79300 }, { "epoch": 8.5, "eval_loss": 0.4393804967403412, "eval_runtime": 49.826, "eval_samples_per_second": 40.682, "eval_steps_per_second": 5.098, "eval_wer": 0.3481675392670157, "step": 79400 }, { "epoch": 8.51, "learning_rate": 0.00013029799426934096, "loss": 0.153, "step": 79500 }, { "epoch": 8.51, "eval_loss": 0.43932780623435974, "eval_runtime": 50.1463, "eval_samples_per_second": 40.422, "eval_steps_per_second": 5.065, "eval_wer": 0.3473551182523921, "step": 79500 }, { "epoch": 8.52, "eval_loss": 0.434330016374588, "eval_runtime": 49.9012, "eval_samples_per_second": 40.62, "eval_steps_per_second": 5.09, "eval_wer": 0.34952157429138836, "step": 79600 }, { "epoch": 8.53, "eval_loss": 0.4395470917224884, "eval_runtime": 49.8862, "eval_samples_per_second": 40.633, "eval_steps_per_second": 5.092, "eval_wer": 0.35385448636938077, "step": 79700 }, { "epoch": 8.54, "eval_loss": 0.44967034459114075, "eval_runtime": 49.7096, "eval_samples_per_second": 40.777, "eval_steps_per_second": 5.11, "eval_wer": 0.3534934103628814, "step": 79800 }, { "epoch": 8.55, "eval_loss": 0.44434839487075806, "eval_runtime": 49.5821, "eval_samples_per_second": 40.882, "eval_steps_per_second": 5.123, "eval_wer": 0.35403502437263046, "step": 79900 }, { "epoch": 8.57, "learning_rate": 0.00012922349570200573, "loss": 0.1558, "step": 80000 }, { "epoch": 8.57, "eval_loss": 0.4494616985321045, "eval_runtime": 49.8291, "eval_samples_per_second": 40.679, "eval_steps_per_second": 5.097, "eval_wer": 0.35538905939700305, "step": 80000 }, { "epoch": 8.58, "eval_loss": 0.4387182295322418, "eval_runtime": 50.0487, "eval_samples_per_second": 40.501, "eval_steps_per_second": 5.075, "eval_wer": 0.3460010832280195, "step": 80100 }, { "epoch": 8.59, "eval_loss": 0.4377879202365875, "eval_runtime": 49.7994, "eval_samples_per_second": 40.703, "eval_steps_per_second": 5.1, "eval_wer": 0.3520491063368839, "step": 80200 }, { "epoch": 8.6, "eval_loss": 0.44459307193756104, "eval_runtime": 50.011, "eval_samples_per_second": 40.531, "eval_steps_per_second": 5.079, "eval_wer": 0.3526809893482578, "step": 80300 }, { "epoch": 8.61, "eval_loss": 0.451284795999527, "eval_runtime": 49.4538, "eval_samples_per_second": 40.988, "eval_steps_per_second": 5.136, "eval_wer": 0.3507853403141361, "step": 80400 }, { "epoch": 8.62, "learning_rate": 0.00012814899713467048, "loss": 0.1527, "step": 80500 }, { "epoch": 8.62, "eval_loss": 0.43961384892463684, "eval_runtime": 49.3742, "eval_samples_per_second": 41.054, "eval_steps_per_second": 5.144, "eval_wer": 0.3536739483661311, "step": 80500 }, { "epoch": 8.63, "eval_loss": 0.4405277967453003, "eval_runtime": 49.7186, "eval_samples_per_second": 40.769, "eval_steps_per_second": 5.109, "eval_wer": 0.35069507131251126, "step": 80600 }, { "epoch": 8.64, "eval_loss": 0.4397623538970947, "eval_runtime": 49.7906, "eval_samples_per_second": 40.71, "eval_steps_per_second": 5.101, "eval_wer": 0.34500812421014626, "step": 80700 }, { "epoch": 8.65, "eval_loss": 0.44584351778030396, "eval_runtime": 49.9839, "eval_samples_per_second": 40.553, "eval_steps_per_second": 5.082, "eval_wer": 0.3507853403141361, "step": 80800 }, { "epoch": 8.66, "eval_loss": 0.43796154856681824, "eval_runtime": 50.8439, "eval_samples_per_second": 39.867, "eval_steps_per_second": 4.996, "eval_wer": 0.3464524282361437, "step": 80900 }, { "epoch": 8.67, "learning_rate": 0.00012707449856733523, "loss": 0.1522, "step": 81000 }, { "epoch": 8.67, "eval_loss": 0.4372806251049042, "eval_runtime": 49.486, "eval_samples_per_second": 40.961, "eval_steps_per_second": 5.133, "eval_wer": 0.3481675392670157, "step": 81000 }, { "epoch": 8.68, "eval_loss": 0.4363256096839905, "eval_runtime": 49.4566, "eval_samples_per_second": 40.985, "eval_steps_per_second": 5.136, "eval_wer": 0.34103628813865317, "step": 81100 }, { "epoch": 8.69, "eval_loss": 0.4289993941783905, "eval_runtime": 49.6427, "eval_samples_per_second": 40.832, "eval_steps_per_second": 5.117, "eval_wer": 0.34473731720527173, "step": 81200 }, { "epoch": 8.7, "eval_loss": 0.4408806264400482, "eval_runtime": 50.5803, "eval_samples_per_second": 40.075, "eval_steps_per_second": 5.022, "eval_wer": 0.35150749232713485, "step": 81300 }, { "epoch": 8.72, "eval_loss": 0.43628886342048645, "eval_runtime": 49.5854, "eval_samples_per_second": 40.879, "eval_steps_per_second": 5.122, "eval_wer": 0.34329301317927424, "step": 81400 }, { "epoch": 8.73, "learning_rate": 0.00012599999999999997, "loss": 0.1502, "step": 81500 }, { "epoch": 8.73, "eval_loss": 0.4313265383243561, "eval_runtime": 50.648, "eval_samples_per_second": 40.021, "eval_steps_per_second": 5.015, "eval_wer": 0.34293193717277487, "step": 81500 }, { "epoch": 8.74, "eval_loss": 0.4263302981853485, "eval_runtime": 49.6108, "eval_samples_per_second": 40.858, "eval_steps_per_second": 5.12, "eval_wer": 0.3450983932117711, "step": 81600 }, { "epoch": 8.75, "eval_loss": 0.42967385053634644, "eval_runtime": 49.8154, "eval_samples_per_second": 40.69, "eval_steps_per_second": 5.099, "eval_wer": 0.34518866221339595, "step": 81700 }, { "epoch": 8.76, "eval_loss": 0.4448642432689667, "eval_runtime": 49.7694, "eval_samples_per_second": 40.728, "eval_steps_per_second": 5.104, "eval_wer": 0.341126557140278, "step": 81800 }, { "epoch": 8.77, "eval_loss": 0.4465280771255493, "eval_runtime": 49.2797, "eval_samples_per_second": 41.133, "eval_steps_per_second": 5.154, "eval_wer": 0.34554973821989526, "step": 81900 }, { "epoch": 8.78, "learning_rate": 0.00012492550143266475, "loss": 0.151, "step": 82000 }, { "epoch": 8.78, "eval_loss": 0.42739376425743103, "eval_runtime": 49.4978, "eval_samples_per_second": 40.951, "eval_steps_per_second": 5.132, "eval_wer": 0.34248059216465065, "step": 82000 }, { "epoch": 8.79, "eval_loss": 0.45250403881073, "eval_runtime": 49.9239, "eval_samples_per_second": 40.602, "eval_steps_per_second": 5.088, "eval_wer": 0.35322260335800687, "step": 82100 }, { "epoch": 8.8, "eval_loss": 0.4282127618789673, "eval_runtime": 49.2, "eval_samples_per_second": 41.199, "eval_steps_per_second": 5.163, "eval_wer": 0.35024372630438705, "step": 82200 }, { "epoch": 8.81, "eval_loss": 0.418887734413147, "eval_runtime": 49.616, "eval_samples_per_second": 40.854, "eval_steps_per_second": 5.119, "eval_wer": 0.35069507131251126, "step": 82300 }, { "epoch": 8.82, "eval_loss": 0.4379144608974457, "eval_runtime": 49.3537, "eval_samples_per_second": 41.071, "eval_steps_per_second": 5.147, "eval_wer": 0.3450983932117711, "step": 82400 }, { "epoch": 8.83, "learning_rate": 0.00012385315186246417, "loss": 0.1529, "step": 82500 }, { "epoch": 8.83, "eval_loss": 0.43779709935188293, "eval_runtime": 49.8201, "eval_samples_per_second": 40.686, "eval_steps_per_second": 5.098, "eval_wer": 0.3419389781549016, "step": 82500 }, { "epoch": 8.84, "eval_loss": 0.42828336358070374, "eval_runtime": 49.4645, "eval_samples_per_second": 40.979, "eval_steps_per_second": 5.135, "eval_wer": 0.33923090810615636, "step": 82600 }, { "epoch": 8.85, "eval_loss": 0.4358876943588257, "eval_runtime": 49.5058, "eval_samples_per_second": 40.945, "eval_steps_per_second": 5.131, "eval_wer": 0.33986279111753026, "step": 82700 }, { "epoch": 8.87, "eval_loss": 0.4307969808578491, "eval_runtime": 49.606, "eval_samples_per_second": 40.862, "eval_steps_per_second": 5.12, "eval_wer": 0.3358006860444123, "step": 82800 }, { "epoch": 8.88, "eval_loss": 0.42962419986724854, "eval_runtime": 50.0738, "eval_samples_per_second": 40.48, "eval_steps_per_second": 5.073, "eval_wer": 0.33345369200216646, "step": 82900 }, { "epoch": 8.89, "learning_rate": 0.00012277865329512894, "loss": 0.151, "step": 83000 }, { "epoch": 8.89, "eval_loss": 0.4386581778526306, "eval_runtime": 49.6144, "eval_samples_per_second": 40.855, "eval_steps_per_second": 5.119, "eval_wer": 0.3372449900704098, "step": 83000 }, { "epoch": 8.9, "eval_loss": 0.4334877133369446, "eval_runtime": 49.5844, "eval_samples_per_second": 40.88, "eval_steps_per_second": 5.123, "eval_wer": 0.34202924715652644, "step": 83100 }, { "epoch": 8.91, "eval_loss": 0.4329209625720978, "eval_runtime": 49.5046, "eval_samples_per_second": 40.946, "eval_steps_per_second": 5.131, "eval_wer": 0.3374255280736595, "step": 83200 }, { "epoch": 8.92, "eval_loss": 0.43530502915382385, "eval_runtime": 49.6901, "eval_samples_per_second": 40.793, "eval_steps_per_second": 5.112, "eval_wer": 0.3404044051272793, "step": 83300 }, { "epoch": 8.93, "eval_loss": 0.43844395875930786, "eval_runtime": 49.5686, "eval_samples_per_second": 40.893, "eval_steps_per_second": 5.124, "eval_wer": 0.34473731720527173, "step": 83400 }, { "epoch": 8.94, "learning_rate": 0.00012170415472779367, "loss": 0.1522, "step": 83500 }, { "epoch": 8.94, "eval_loss": 0.4444495141506195, "eval_runtime": 49.7157, "eval_samples_per_second": 40.772, "eval_steps_per_second": 5.109, "eval_wer": 0.3352590720346633, "step": 83500 }, { "epoch": 8.95, "eval_loss": 0.4412956237792969, "eval_runtime": 49.7084, "eval_samples_per_second": 40.778, "eval_steps_per_second": 5.11, "eval_wer": 0.34807727026539087, "step": 83600 }, { "epoch": 8.96, "eval_loss": 0.42466339468955994, "eval_runtime": 49.4542, "eval_samples_per_second": 40.987, "eval_steps_per_second": 5.136, "eval_wer": 0.3473551182523921, "step": 83700 }, { "epoch": 8.97, "eval_loss": 0.41966524720191956, "eval_runtime": 49.9194, "eval_samples_per_second": 40.605, "eval_steps_per_second": 5.088, "eval_wer": 0.33859902509478246, "step": 83800 }, { "epoch": 8.98, "eval_loss": 0.42158830165863037, "eval_runtime": 49.7701, "eval_samples_per_second": 40.727, "eval_steps_per_second": 5.103, "eval_wer": 0.33841848709153277, "step": 83900 }, { "epoch": 8.99, "learning_rate": 0.00012062965616045843, "loss": 0.1511, "step": 84000 }, { "epoch": 8.99, "eval_loss": 0.41589921712875366, "eval_runtime": 50.0082, "eval_samples_per_second": 40.533, "eval_steps_per_second": 5.079, "eval_wer": 0.33959198411265573, "step": 84000 }, { "epoch": 9.0, "eval_loss": 0.4212520122528076, "eval_runtime": 49.9688, "eval_samples_per_second": 40.565, "eval_steps_per_second": 5.083, "eval_wer": 0.3415779021484022, "step": 84100 }, { "epoch": 9.01, "eval_loss": 0.43991902470588684, "eval_runtime": 50.2667, "eval_samples_per_second": 40.325, "eval_steps_per_second": 5.053, "eval_wer": 0.3378768730817837, "step": 84200 }, { "epoch": 9.03, "eval_loss": 0.43180111050605774, "eval_runtime": 50.1864, "eval_samples_per_second": 40.389, "eval_steps_per_second": 5.061, "eval_wer": 0.3436540891857736, "step": 84300 }, { "epoch": 9.04, "eval_loss": 0.43560150265693665, "eval_runtime": 50.6404, "eval_samples_per_second": 40.027, "eval_steps_per_second": 5.016, "eval_wer": 0.3370644520671601, "step": 84400 }, { "epoch": 9.05, "learning_rate": 0.00011955515759312319, "loss": 0.1336, "step": 84500 }, { "epoch": 9.05, "eval_loss": 0.44032755494117737, "eval_runtime": 49.9078, "eval_samples_per_second": 40.615, "eval_steps_per_second": 5.089, "eval_wer": 0.33733525907203465, "step": 84500 }, { "epoch": 9.06, "eval_loss": 0.4544905722141266, "eval_runtime": 48.9473, "eval_samples_per_second": 41.412, "eval_steps_per_second": 5.189, "eval_wer": 0.33814768008665824, "step": 84600 }, { "epoch": 9.07, "eval_loss": 0.4313288629055023, "eval_runtime": 49.8429, "eval_samples_per_second": 40.668, "eval_steps_per_second": 5.096, "eval_wer": 0.3330926159956671, "step": 84700 }, { "epoch": 9.08, "eval_loss": 0.425656259059906, "eval_runtime": 49.1736, "eval_samples_per_second": 41.221, "eval_steps_per_second": 5.165, "eval_wer": 0.335981224047662, "step": 84800 }, { "epoch": 9.09, "eval_loss": 0.4285389482975006, "eval_runtime": 49.1078, "eval_samples_per_second": 41.277, "eval_steps_per_second": 5.172, "eval_wer": 0.33715472106878497, "step": 84900 }, { "epoch": 9.1, "learning_rate": 0.00011848065902578795, "loss": 0.1315, "step": 85000 }, { "epoch": 9.1, "eval_loss": 0.43780598044395447, "eval_runtime": 49.1411, "eval_samples_per_second": 41.249, "eval_steps_per_second": 5.169, "eval_wer": 0.33318288499729193, "step": 85000 }, { "epoch": 9.11, "eval_loss": 0.4351807236671448, "eval_runtime": 48.8456, "eval_samples_per_second": 41.498, "eval_steps_per_second": 5.2, "eval_wer": 0.3282180899079256, "step": 85100 }, { "epoch": 9.12, "eval_loss": 0.4359615743160248, "eval_runtime": 50.6269, "eval_samples_per_second": 40.038, "eval_steps_per_second": 5.017, "eval_wer": 0.3339050370102907, "step": 85200 }, { "epoch": 9.13, "eval_loss": 0.4403829574584961, "eval_runtime": 48.958, "eval_samples_per_second": 41.403, "eval_steps_per_second": 5.188, "eval_wer": 0.33652283805741107, "step": 85300 }, { "epoch": 9.14, "eval_loss": 0.4345133602619171, "eval_runtime": 49.1877, "eval_samples_per_second": 41.21, "eval_steps_per_second": 5.164, "eval_wer": 0.3356201480411627, "step": 85400 }, { "epoch": 9.15, "learning_rate": 0.00011740616045845271, "loss": 0.1272, "step": 85500 }, { "epoch": 9.15, "eval_loss": 0.4467580020427704, "eval_runtime": 48.8216, "eval_samples_per_second": 41.519, "eval_steps_per_second": 5.203, "eval_wer": 0.33751579707528434, "step": 85500 }, { "epoch": 9.16, "eval_loss": 0.43308141827583313, "eval_runtime": 49.2077, "eval_samples_per_second": 41.193, "eval_steps_per_second": 5.162, "eval_wer": 0.3363423000541614, "step": 85600 }, { "epoch": 9.18, "eval_loss": 0.4329800605773926, "eval_runtime": 50.5519, "eval_samples_per_second": 40.097, "eval_steps_per_second": 5.025, "eval_wer": 0.3309261599566709, "step": 85700 }, { "epoch": 9.19, "eval_loss": 0.4423808753490448, "eval_runtime": 48.8833, "eval_samples_per_second": 41.466, "eval_steps_per_second": 5.196, "eval_wer": 0.3301137389420473, "step": 85800 }, { "epoch": 9.2, "eval_loss": 0.4520210027694702, "eval_runtime": 48.6979, "eval_samples_per_second": 41.624, "eval_steps_per_second": 5.216, "eval_wer": 0.33264127098754287, "step": 85900 }, { "epoch": 9.21, "learning_rate": 0.00011633166189111747, "loss": 0.1289, "step": 86000 }, { "epoch": 9.21, "eval_loss": 0.44208621978759766, "eval_runtime": 49.4655, "eval_samples_per_second": 40.978, "eval_steps_per_second": 5.135, "eval_wer": 0.332551001985918, "step": 86000 }, { "epoch": 9.22, "eval_loss": 0.44799816608428955, "eval_runtime": 49.0094, "eval_samples_per_second": 41.359, "eval_steps_per_second": 5.183, "eval_wer": 0.33345369200216646, "step": 86100 }, { "epoch": 9.23, "eval_loss": 0.4351326525211334, "eval_runtime": 49.1297, "eval_samples_per_second": 41.258, "eval_steps_per_second": 5.17, "eval_wer": 0.33796714208340856, "step": 86200 }, { "epoch": 9.24, "eval_loss": 0.43502259254455566, "eval_runtime": 49.1339, "eval_samples_per_second": 41.255, "eval_steps_per_second": 5.17, "eval_wer": 0.34266113016790034, "step": 86300 }, { "epoch": 9.25, "eval_loss": 0.43621236085891724, "eval_runtime": 49.6078, "eval_samples_per_second": 40.86, "eval_steps_per_second": 5.12, "eval_wer": 0.33200938797616897, "step": 86400 }, { "epoch": 9.26, "learning_rate": 0.00011525716332378223, "loss": 0.1333, "step": 86500 }, { "epoch": 9.26, "eval_loss": 0.42599332332611084, "eval_runtime": 49.1903, "eval_samples_per_second": 41.207, "eval_steps_per_second": 5.164, "eval_wer": 0.3341758440151652, "step": 86500 }, { "epoch": 9.27, "eval_loss": 0.4356515407562256, "eval_runtime": 48.8406, "eval_samples_per_second": 41.502, "eval_steps_per_second": 5.201, "eval_wer": 0.335981224047662, "step": 86600 }, { "epoch": 9.28, "eval_loss": 0.45051419734954834, "eval_runtime": 49.1958, "eval_samples_per_second": 41.203, "eval_steps_per_second": 5.163, "eval_wer": 0.3372449900704098, "step": 86700 }, { "epoch": 9.29, "eval_loss": 0.4341755509376526, "eval_runtime": 49.4875, "eval_samples_per_second": 40.96, "eval_steps_per_second": 5.133, "eval_wer": 0.33589095504603717, "step": 86800 }, { "epoch": 9.3, "eval_loss": 0.4295257329940796, "eval_runtime": 49.2323, "eval_samples_per_second": 41.172, "eval_steps_per_second": 5.159, "eval_wer": 0.33670337606066075, "step": 86900 }, { "epoch": 9.31, "learning_rate": 0.00011418266475644698, "loss": 0.1318, "step": 87000 }, { "epoch": 9.31, "eval_loss": 0.43195515871047974, "eval_runtime": 50.3285, "eval_samples_per_second": 40.275, "eval_steps_per_second": 5.047, "eval_wer": 0.3335439610037913, "step": 87000 }, { "epoch": 9.33, "eval_loss": 0.4331757128238678, "eval_runtime": 49.2032, "eval_samples_per_second": 41.197, "eval_steps_per_second": 5.162, "eval_wer": 0.33444665102003973, "step": 87100 }, { "epoch": 9.34, "eval_loss": 0.43729162216186523, "eval_runtime": 49.2547, "eval_samples_per_second": 41.153, "eval_steps_per_second": 5.157, "eval_wer": 0.33300234699404224, "step": 87200 }, { "epoch": 9.35, "eval_loss": 0.44904646277427673, "eval_runtime": 49.1768, "eval_samples_per_second": 41.219, "eval_steps_per_second": 5.165, "eval_wer": 0.33155804296804475, "step": 87300 }, { "epoch": 9.36, "eval_loss": 0.41877713799476624, "eval_runtime": 49.0605, "eval_samples_per_second": 41.316, "eval_steps_per_second": 5.177, "eval_wer": 0.34293193717277487, "step": 87400 }, { "epoch": 9.37, "learning_rate": 0.00011311031518624641, "loss": 0.1275, "step": 87500 }, { "epoch": 9.37, "eval_loss": 0.45020759105682373, "eval_runtime": 48.7704, "eval_samples_per_second": 41.562, "eval_steps_per_second": 5.208, "eval_wer": 0.33832821808990793, "step": 87500 }, { "epoch": 9.38, "eval_loss": 0.44634371995925903, "eval_runtime": 49.2783, "eval_samples_per_second": 41.134, "eval_steps_per_second": 5.154, "eval_wer": 0.3386892940964073, "step": 87600 }, { "epoch": 9.39, "eval_loss": 0.4385134279727936, "eval_runtime": 49.1376, "eval_samples_per_second": 41.251, "eval_steps_per_second": 5.169, "eval_wer": 0.33083589095504606, "step": 87700 }, { "epoch": 9.4, "eval_loss": 0.446433424949646, "eval_runtime": 48.9791, "eval_samples_per_second": 41.385, "eval_steps_per_second": 5.186, "eval_wer": 0.34139736414515254, "step": 87800 }, { "epoch": 9.41, "eval_loss": 0.4562661945819855, "eval_runtime": 49.0763, "eval_samples_per_second": 41.303, "eval_steps_per_second": 5.176, "eval_wer": 0.3404946741289041, "step": 87900 }, { "epoch": 9.42, "learning_rate": 0.00011203581661891117, "loss": 0.1331, "step": 88000 }, { "epoch": 9.42, "eval_loss": 0.4285636842250824, "eval_runtime": 49.0786, "eval_samples_per_second": 41.301, "eval_steps_per_second": 5.175, "eval_wer": 0.3374255280736595, "step": 88000 }, { "epoch": 9.43, "eval_loss": 0.4389163553714752, "eval_runtime": 49.1661, "eval_samples_per_second": 41.228, "eval_steps_per_second": 5.166, "eval_wer": 0.3351688030330385, "step": 88100 }, { "epoch": 9.44, "eval_loss": 0.43011942505836487, "eval_runtime": 49.0545, "eval_samples_per_second": 41.321, "eval_steps_per_second": 5.178, "eval_wer": 0.3339953060119155, "step": 88200 }, { "epoch": 9.45, "eval_loss": 0.4416744112968445, "eval_runtime": 49.0788, "eval_samples_per_second": 41.301, "eval_steps_per_second": 5.175, "eval_wer": 0.33733525907203465, "step": 88300 }, { "epoch": 9.46, "eval_loss": 0.44503673911094666, "eval_runtime": 49.266, "eval_samples_per_second": 41.144, "eval_steps_per_second": 5.156, "eval_wer": 0.34248059216465065, "step": 88400 }, { "epoch": 9.48, "learning_rate": 0.00011096346704871058, "loss": 0.1266, "step": 88500 }, { "epoch": 9.48, "eval_loss": 0.44555312395095825, "eval_runtime": 49.2181, "eval_samples_per_second": 41.184, "eval_steps_per_second": 5.161, "eval_wer": 0.3450983932117711, "step": 88500 }, { "epoch": 9.49, "eval_loss": 0.45165377855300903, "eval_runtime": 49.095, "eval_samples_per_second": 41.287, "eval_steps_per_second": 5.174, "eval_wer": 0.3403141361256545, "step": 88600 }, { "epoch": 9.5, "eval_loss": 0.44465458393096924, "eval_runtime": 48.9889, "eval_samples_per_second": 41.377, "eval_steps_per_second": 5.185, "eval_wer": 0.3419389781549016, "step": 88700 }, { "epoch": 9.51, "eval_loss": 0.4486336410045624, "eval_runtime": 49.0554, "eval_samples_per_second": 41.321, "eval_steps_per_second": 5.178, "eval_wer": 0.3427513991695252, "step": 88800 }, { "epoch": 9.52, "eval_loss": 0.4590870141983032, "eval_runtime": 48.9673, "eval_samples_per_second": 41.395, "eval_steps_per_second": 5.187, "eval_wer": 0.341126557140278, "step": 88900 }, { "epoch": 9.53, "learning_rate": 0.00010988896848137534, "loss": 0.1316, "step": 89000 }, { "epoch": 9.53, "eval_loss": 0.44813600182533264, "eval_runtime": 49.5192, "eval_samples_per_second": 40.934, "eval_steps_per_second": 5.129, "eval_wer": 0.3386892940964073, "step": 89000 }, { "epoch": 9.54, "eval_loss": 0.43075862526893616, "eval_runtime": 49.2146, "eval_samples_per_second": 41.187, "eval_steps_per_second": 5.161, "eval_wer": 0.33489799602816395, "step": 89100 }, { "epoch": 9.55, "eval_loss": 0.44113072752952576, "eval_runtime": 49.2342, "eval_samples_per_second": 41.171, "eval_steps_per_second": 5.159, "eval_wer": 0.3404946741289041, "step": 89200 }, { "epoch": 9.56, "eval_loss": 0.43779146671295166, "eval_runtime": 48.7095, "eval_samples_per_second": 41.614, "eval_steps_per_second": 5.215, "eval_wer": 0.33896010110128183, "step": 89300 }, { "epoch": 9.57, "eval_loss": 0.44476673007011414, "eval_runtime": 49.0767, "eval_samples_per_second": 41.303, "eval_steps_per_second": 5.176, "eval_wer": 0.33652283805741107, "step": 89400 }, { "epoch": 9.58, "learning_rate": 0.0001088144699140401, "loss": 0.1325, "step": 89500 }, { "epoch": 9.58, "eval_loss": 0.45753398537635803, "eval_runtime": 50.1245, "eval_samples_per_second": 40.439, "eval_steps_per_second": 5.067, "eval_wer": 0.3415779021484022, "step": 89500 }, { "epoch": 9.59, "eval_loss": 0.46084266901016235, "eval_runtime": 48.8264, "eval_samples_per_second": 41.514, "eval_steps_per_second": 5.202, "eval_wer": 0.3422097851597761, "step": 89600 }, { "epoch": 9.6, "eval_loss": 0.4396139681339264, "eval_runtime": 48.7221, "eval_samples_per_second": 41.603, "eval_steps_per_second": 5.213, "eval_wer": 0.3349882650297888, "step": 89700 }, { "epoch": 9.61, "eval_loss": 0.43795400857925415, "eval_runtime": 49.7416, "eval_samples_per_second": 40.751, "eval_steps_per_second": 5.106, "eval_wer": 0.3397725221159054, "step": 89800 }, { "epoch": 9.63, "eval_loss": 0.43372565507888794, "eval_runtime": 49.3047, "eval_samples_per_second": 41.112, "eval_steps_per_second": 5.152, "eval_wer": 0.33877956309803214, "step": 89900 }, { "epoch": 9.64, "learning_rate": 0.00010773997134670486, "loss": 0.1324, "step": 90000 }, { "epoch": 9.64, "eval_loss": 0.4376404285430908, "eval_runtime": 49.2265, "eval_samples_per_second": 41.177, "eval_steps_per_second": 5.16, "eval_wer": 0.33877956309803214, "step": 90000 }, { "epoch": 9.65, "eval_loss": 0.418549120426178, "eval_runtime": 49.0407, "eval_samples_per_second": 41.333, "eval_steps_per_second": 5.179, "eval_wer": 0.33796714208340856, "step": 90100 }, { "epoch": 9.66, "eval_loss": 0.43939289450645447, "eval_runtime": 49.1046, "eval_samples_per_second": 41.279, "eval_steps_per_second": 5.173, "eval_wer": 0.33841848709153277, "step": 90200 }, { "epoch": 9.67, "eval_loss": 0.4472477436065674, "eval_runtime": 48.6772, "eval_samples_per_second": 41.642, "eval_steps_per_second": 5.218, "eval_wer": 0.34004332912077995, "step": 90300 }, { "epoch": 9.68, "eval_loss": 0.45231983065605164, "eval_runtime": 49.342, "eval_samples_per_second": 41.081, "eval_steps_per_second": 5.148, "eval_wer": 0.33896010110128183, "step": 90400 }, { "epoch": 9.69, "learning_rate": 0.00010666762177650428, "loss": 0.1361, "step": 90500 }, { "epoch": 9.69, "eval_loss": 0.4465869069099426, "eval_runtime": 49.0952, "eval_samples_per_second": 41.287, "eval_steps_per_second": 5.174, "eval_wer": 0.338869832099657, "step": 90500 }, { "epoch": 9.7, "eval_loss": 0.44142165780067444, "eval_runtime": 48.9328, "eval_samples_per_second": 41.424, "eval_steps_per_second": 5.191, "eval_wer": 0.33832821808990793, "step": 90600 }, { "epoch": 9.71, "eval_loss": 0.42880019545555115, "eval_runtime": 49.1913, "eval_samples_per_second": 41.206, "eval_steps_per_second": 5.164, "eval_wer": 0.3348077270265391, "step": 90700 }, { "epoch": 9.72, "eval_loss": 0.4444648027420044, "eval_runtime": 49.0743, "eval_samples_per_second": 41.305, "eval_steps_per_second": 5.176, "eval_wer": 0.3374255280736595, "step": 90800 }, { "epoch": 9.73, "eval_loss": 0.4251817762851715, "eval_runtime": 49.2092, "eval_samples_per_second": 41.191, "eval_steps_per_second": 5.162, "eval_wer": 0.33218992597941865, "step": 90900 }, { "epoch": 9.74, "learning_rate": 0.00010559312320916904, "loss": 0.1353, "step": 91000 }, { "epoch": 9.74, "eval_loss": 0.4311528205871582, "eval_runtime": 49.3374, "eval_samples_per_second": 41.084, "eval_steps_per_second": 5.148, "eval_wer": 0.33381476800866583, "step": 91000 }, { "epoch": 9.75, "eval_loss": 0.4325965344905853, "eval_runtime": 49.4186, "eval_samples_per_second": 41.017, "eval_steps_per_second": 5.14, "eval_wer": 0.3319191189745441, "step": 91100 }, { "epoch": 9.76, "eval_loss": 0.42121651768684387, "eval_runtime": 50.098, "eval_samples_per_second": 40.461, "eval_steps_per_second": 5.07, "eval_wer": 0.3399530601191551, "step": 91200 }, { "epoch": 9.78, "eval_loss": 0.4190988838672638, "eval_runtime": 48.9423, "eval_samples_per_second": 41.416, "eval_steps_per_second": 5.19, "eval_wer": 0.3374255280736595, "step": 91300 }, { "epoch": 9.79, "eval_loss": 0.4398752450942993, "eval_runtime": 49.0663, "eval_samples_per_second": 41.311, "eval_steps_per_second": 5.177, "eval_wer": 0.33318288499729193, "step": 91400 }, { "epoch": 9.8, "learning_rate": 0.0001045186246418338, "loss": 0.1308, "step": 91500 }, { "epoch": 9.8, "eval_loss": 0.43398961424827576, "eval_runtime": 49.3702, "eval_samples_per_second": 41.057, "eval_steps_per_second": 5.145, "eval_wer": 0.33489799602816395, "step": 91500 }, { "epoch": 9.81, "eval_loss": 0.4279971718788147, "eval_runtime": 49.3652, "eval_samples_per_second": 41.061, "eval_steps_per_second": 5.145, "eval_wer": 0.3378768730817837, "step": 91600 }, { "epoch": 9.82, "eval_loss": 0.44193169474601746, "eval_runtime": 49.0009, "eval_samples_per_second": 41.367, "eval_steps_per_second": 5.184, "eval_wer": 0.3376060660769092, "step": 91700 }, { "epoch": 9.83, "eval_loss": 0.43088042736053467, "eval_runtime": 49.3626, "eval_samples_per_second": 41.063, "eval_steps_per_second": 5.146, "eval_wer": 0.33327315399891677, "step": 91800 }, { "epoch": 9.84, "eval_loss": 0.42743775248527527, "eval_runtime": 49.588, "eval_samples_per_second": 40.877, "eval_steps_per_second": 5.122, "eval_wer": 0.3351688030330385, "step": 91900 }, { "epoch": 9.85, "learning_rate": 0.00010344627507163324, "loss": 0.1321, "step": 92000 }, { "epoch": 9.85, "eval_loss": 0.41469934582710266, "eval_runtime": 49.1545, "eval_samples_per_second": 41.237, "eval_steps_per_second": 5.167, "eval_wer": 0.333724499007041, "step": 92000 }, { "epoch": 9.86, "eval_loss": 0.4252135455608368, "eval_runtime": 49.2985, "eval_samples_per_second": 41.117, "eval_steps_per_second": 5.152, "eval_wer": 0.3316483119696696, "step": 92100 }, { "epoch": 9.87, "eval_loss": 0.43777018785476685, "eval_runtime": 49.1225, "eval_samples_per_second": 41.264, "eval_steps_per_second": 5.171, "eval_wer": 0.33814768008665824, "step": 92200 }, { "epoch": 9.88, "eval_loss": 0.4264971911907196, "eval_runtime": 49.522, "eval_samples_per_second": 40.931, "eval_steps_per_second": 5.129, "eval_wer": 0.33552987903953785, "step": 92300 }, { "epoch": 9.89, "eval_loss": 0.4247148036956787, "eval_runtime": 49.2205, "eval_samples_per_second": 41.182, "eval_steps_per_second": 5.16, "eval_wer": 0.3330926159956671, "step": 92400 }, { "epoch": 9.9, "learning_rate": 0.000102371776504298, "loss": 0.1358, "step": 92500 }, { "epoch": 9.9, "eval_loss": 0.4099043309688568, "eval_runtime": 49.0334, "eval_samples_per_second": 41.339, "eval_steps_per_second": 5.18, "eval_wer": 0.3378768730817837, "step": 92500 }, { "epoch": 9.91, "eval_loss": 0.414156436920166, "eval_runtime": 49.0837, "eval_samples_per_second": 41.297, "eval_steps_per_second": 5.175, "eval_wer": 0.3356201480411627, "step": 92600 }, { "epoch": 9.93, "eval_loss": 0.4220016598701477, "eval_runtime": 49.194, "eval_samples_per_second": 41.204, "eval_steps_per_second": 5.163, "eval_wer": 0.33318288499729193, "step": 92700 }, { "epoch": 9.94, "eval_loss": 0.42191407084465027, "eval_runtime": 50.2805, "eval_samples_per_second": 40.314, "eval_steps_per_second": 5.052, "eval_wer": 0.33688391406391044, "step": 92800 }, { "epoch": 9.95, "eval_loss": 0.4178451597690582, "eval_runtime": 49.1736, "eval_samples_per_second": 41.221, "eval_steps_per_second": 5.165, "eval_wer": 0.33318288499729193, "step": 92900 }, { "epoch": 9.96, "learning_rate": 0.00010129727793696274, "loss": 0.1331, "step": 93000 }, { "epoch": 9.96, "eval_loss": 0.43051832914352417, "eval_runtime": 49.1956, "eval_samples_per_second": 41.203, "eval_steps_per_second": 5.163, "eval_wer": 0.3352590720346633, "step": 93000 }, { "epoch": 9.97, "eval_loss": 0.43244585394859314, "eval_runtime": 49.2837, "eval_samples_per_second": 41.129, "eval_steps_per_second": 5.154, "eval_wer": 0.3306553529517964, "step": 93100 }, { "epoch": 9.98, "eval_loss": 0.4315347671508789, "eval_runtime": 49.2581, "eval_samples_per_second": 41.151, "eval_steps_per_second": 5.157, "eval_wer": 0.33444665102003973, "step": 93200 }, { "epoch": 9.99, "eval_loss": 0.4212498664855957, "eval_runtime": 49.1731, "eval_samples_per_second": 41.222, "eval_steps_per_second": 5.165, "eval_wer": 0.33137750496479507, "step": 93300 }, { "epoch": 10.0, "eval_loss": 0.42032095789909363, "eval_runtime": 49.4382, "eval_samples_per_second": 41.001, "eval_steps_per_second": 5.138, "eval_wer": 0.33318288499729193, "step": 93400 }, { "epoch": 10.01, "learning_rate": 0.00010022277936962749, "loss": 0.1304, "step": 93500 }, { "epoch": 10.01, "eval_loss": 0.4423731863498688, "eval_runtime": 50.0952, "eval_samples_per_second": 40.463, "eval_steps_per_second": 5.07, "eval_wer": 0.33507853403141363, "step": 93500 }, { "epoch": 10.02, "eval_loss": 0.44737526774406433, "eval_runtime": 49.7473, "eval_samples_per_second": 40.746, "eval_steps_per_second": 5.106, "eval_wer": 0.33408557501354036, "step": 93600 }, { "epoch": 10.03, "eval_loss": 0.4465775191783905, "eval_runtime": 49.5611, "eval_samples_per_second": 40.899, "eval_steps_per_second": 5.125, "eval_wer": 0.33778660408015887, "step": 93700 }, { "epoch": 10.04, "eval_loss": 0.43884560465812683, "eval_runtime": 49.0695, "eval_samples_per_second": 41.309, "eval_steps_per_second": 5.176, "eval_wer": 0.3327315399891677, "step": 93800 }, { "epoch": 10.05, "eval_loss": 0.431158185005188, "eval_runtime": 49.6041, "eval_samples_per_second": 40.864, "eval_steps_per_second": 5.121, "eval_wer": 0.335981224047662, "step": 93900 }, { "epoch": 10.06, "learning_rate": 9.914828080229225e-05, "loss": 0.1152, "step": 94000 }, { "epoch": 10.06, "eval_loss": 0.44709327816963196, "eval_runtime": 49.482, "eval_samples_per_second": 40.964, "eval_steps_per_second": 5.133, "eval_wer": 0.3306553529517964, "step": 94000 }, { "epoch": 10.07, "eval_loss": 0.4472164809703827, "eval_runtime": 49.2263, "eval_samples_per_second": 41.177, "eval_steps_per_second": 5.16, "eval_wer": 0.33155804296804475, "step": 94100 }, { "epoch": 10.09, "eval_loss": 0.4462222158908844, "eval_runtime": 50.6279, "eval_samples_per_second": 40.037, "eval_steps_per_second": 5.017, "eval_wer": 0.33237046398266834, "step": 94200 }, { "epoch": 10.1, "eval_loss": 0.4382689297199249, "eval_runtime": 49.1505, "eval_samples_per_second": 41.241, "eval_steps_per_second": 5.168, "eval_wer": 0.3343563820184149, "step": 94300 }, { "epoch": 10.11, "eval_loss": 0.46711546182632446, "eval_runtime": 49.598, "eval_samples_per_second": 40.869, "eval_steps_per_second": 5.121, "eval_wer": 0.33652283805741107, "step": 94400 }, { "epoch": 10.12, "learning_rate": 9.8073782234957e-05, "loss": 0.1097, "step": 94500 }, { "epoch": 10.12, "eval_loss": 0.4596339464187622, "eval_runtime": 49.2966, "eval_samples_per_second": 41.118, "eval_steps_per_second": 5.152, "eval_wer": 0.3306553529517964, "step": 94500 }, { "epoch": 10.13, "eval_loss": 0.4517350196838379, "eval_runtime": 49.4575, "eval_samples_per_second": 40.985, "eval_steps_per_second": 5.136, "eval_wer": 0.3382379490882831, "step": 94600 }, { "epoch": 10.14, "eval_loss": 0.4285356402397156, "eval_runtime": 49.5466, "eval_samples_per_second": 40.911, "eval_steps_per_second": 5.126, "eval_wer": 0.33796714208340856, "step": 94700 }, { "epoch": 10.15, "eval_loss": 0.46282461285591125, "eval_runtime": 49.2102, "eval_samples_per_second": 41.191, "eval_steps_per_second": 5.162, "eval_wer": 0.3363423000541614, "step": 94800 }, { "epoch": 10.16, "eval_loss": 0.4478081464767456, "eval_runtime": 49.3065, "eval_samples_per_second": 41.11, "eval_steps_per_second": 5.151, "eval_wer": 0.33652283805741107, "step": 94900 }, { "epoch": 10.17, "learning_rate": 9.699928366762177e-05, "loss": 0.1153, "step": 95000 }, { "epoch": 10.17, "eval_loss": 0.44635722041130066, "eval_runtime": 49.4158, "eval_samples_per_second": 41.019, "eval_steps_per_second": 5.14, "eval_wer": 0.3346271890232894, "step": 95000 }, { "epoch": 10.18, "eval_loss": 0.44317421317100525, "eval_runtime": 49.2548, "eval_samples_per_second": 41.153, "eval_steps_per_second": 5.157, "eval_wer": 0.33923090810615636, "step": 95100 }, { "epoch": 10.19, "eval_loss": 0.4326357841491699, "eval_runtime": 49.4047, "eval_samples_per_second": 41.029, "eval_steps_per_second": 5.141, "eval_wer": 0.33300234699404224, "step": 95200 }, { "epoch": 10.2, "eval_loss": 0.4479786455631256, "eval_runtime": 49.1321, "eval_samples_per_second": 41.256, "eval_steps_per_second": 5.17, "eval_wer": 0.3327315399891677, "step": 95300 }, { "epoch": 10.21, "eval_loss": 0.44355833530426025, "eval_runtime": 50.8799, "eval_samples_per_second": 39.839, "eval_steps_per_second": 4.992, "eval_wer": 0.3259613648673046, "step": 95400 }, { "epoch": 10.22, "learning_rate": 9.592693409742119e-05, "loss": 0.1149, "step": 95500 }, { "epoch": 10.22, "eval_loss": 0.4549073874950409, "eval_runtime": 49.3035, "eval_samples_per_second": 41.113, "eval_steps_per_second": 5.152, "eval_wer": 0.33110669795992054, "step": 95500 }, { "epoch": 10.24, "eval_loss": 0.4572867751121521, "eval_runtime": 49.5772, "eval_samples_per_second": 40.886, "eval_steps_per_second": 5.123, "eval_wer": 0.33534934103628816, "step": 95600 }, { "epoch": 10.25, "eval_loss": 0.4373367428779602, "eval_runtime": 49.5738, "eval_samples_per_second": 40.889, "eval_steps_per_second": 5.124, "eval_wer": 0.33688391406391044, "step": 95700 }, { "epoch": 10.26, "eval_loss": 0.4459189176559448, "eval_runtime": 49.4912, "eval_samples_per_second": 40.957, "eval_steps_per_second": 5.132, "eval_wer": 0.3358006860444123, "step": 95800 }, { "epoch": 10.27, "eval_loss": 0.42883867025375366, "eval_runtime": 49.3495, "eval_samples_per_second": 41.074, "eval_steps_per_second": 5.147, "eval_wer": 0.32704459288680265, "step": 95900 }, { "epoch": 10.28, "learning_rate": 9.485243553008595e-05, "loss": 0.1169, "step": 96000 }, { "epoch": 10.28, "eval_loss": 0.44739025831222534, "eval_runtime": 49.7992, "eval_samples_per_second": 40.703, "eval_steps_per_second": 5.1, "eval_wer": 0.33300234699404224, "step": 96000 }, { "epoch": 10.29, "eval_loss": 0.4523959755897522, "eval_runtime": 49.381, "eval_samples_per_second": 41.048, "eval_steps_per_second": 5.144, "eval_wer": 0.3298429319371728, "step": 96100 }, { "epoch": 10.3, "eval_loss": 0.4517040550708771, "eval_runtime": 49.4501, "eval_samples_per_second": 40.991, "eval_steps_per_second": 5.136, "eval_wer": 0.3257808268640549, "step": 96200 }, { "epoch": 10.31, "eval_loss": 0.43664810061454773, "eval_runtime": 49.3021, "eval_samples_per_second": 41.114, "eval_steps_per_second": 5.152, "eval_wer": 0.3288499729192995, "step": 96300 }, { "epoch": 10.32, "eval_loss": 0.4574427008628845, "eval_runtime": 49.5018, "eval_samples_per_second": 40.948, "eval_steps_per_second": 5.131, "eval_wer": 0.33237046398266834, "step": 96400 }, { "epoch": 10.33, "learning_rate": 9.37779369627507e-05, "loss": 0.1137, "step": 96500 }, { "epoch": 10.33, "eval_loss": 0.4506693482398987, "eval_runtime": 49.6177, "eval_samples_per_second": 40.852, "eval_steps_per_second": 5.119, "eval_wer": 0.33426611301679005, "step": 96500 }, { "epoch": 10.34, "eval_loss": 0.44143351912498474, "eval_runtime": 49.2006, "eval_samples_per_second": 41.199, "eval_steps_per_second": 5.163, "eval_wer": 0.3301137389420473, "step": 96600 }, { "epoch": 10.35, "eval_loss": 0.45244306325912476, "eval_runtime": 49.2654, "eval_samples_per_second": 41.144, "eval_steps_per_second": 5.156, "eval_wer": 0.3366131070590359, "step": 96700 }, { "epoch": 10.36, "eval_loss": 0.45626798272132874, "eval_runtime": 50.7297, "eval_samples_per_second": 39.957, "eval_steps_per_second": 5.007, "eval_wer": 0.34347355118252393, "step": 96800 }, { "epoch": 10.37, "eval_loss": 0.4315440356731415, "eval_runtime": 49.4934, "eval_samples_per_second": 40.955, "eval_steps_per_second": 5.132, "eval_wer": 0.33751579707528434, "step": 96900 }, { "epoch": 10.39, "learning_rate": 9.270343839541547e-05, "loss": 0.1162, "step": 97000 }, { "epoch": 10.39, "eval_loss": 0.44286635518074036, "eval_runtime": 49.454, "eval_samples_per_second": 40.988, "eval_steps_per_second": 5.136, "eval_wer": 0.33652283805741107, "step": 97000 }, { "epoch": 10.4, "eval_loss": 0.4488806128501892, "eval_runtime": 49.716, "eval_samples_per_second": 40.772, "eval_steps_per_second": 5.109, "eval_wer": 0.33796714208340856, "step": 97100 }, { "epoch": 10.41, "eval_loss": 0.4351952075958252, "eval_runtime": 49.4834, "eval_samples_per_second": 40.963, "eval_steps_per_second": 5.133, "eval_wer": 0.33571041704278753, "step": 97200 }, { "epoch": 10.42, "eval_loss": 0.4390479624271393, "eval_runtime": 49.1335, "eval_samples_per_second": 41.255, "eval_steps_per_second": 5.17, "eval_wer": 0.3319191189745441, "step": 97300 }, { "epoch": 10.43, "eval_loss": 0.4569990336894989, "eval_runtime": 49.1672, "eval_samples_per_second": 41.227, "eval_steps_per_second": 5.166, "eval_wer": 0.330294276945297, "step": 97400 }, { "epoch": 10.44, "learning_rate": 9.162893982808023e-05, "loss": 0.1151, "step": 97500 }, { "epoch": 10.44, "eval_loss": 0.4691784083843231, "eval_runtime": 49.324, "eval_samples_per_second": 41.096, "eval_steps_per_second": 5.15, "eval_wer": 0.3343563820184149, "step": 97500 }, { "epoch": 10.45, "eval_loss": 0.46045053005218506, "eval_runtime": 49.3284, "eval_samples_per_second": 41.092, "eval_steps_per_second": 5.149, "eval_wer": 0.33318288499729193, "step": 97600 }, { "epoch": 10.46, "eval_loss": 0.4457150101661682, "eval_runtime": 48.9643, "eval_samples_per_second": 41.398, "eval_steps_per_second": 5.187, "eval_wer": 0.32379490882830836, "step": 97700 }, { "epoch": 10.47, "eval_loss": 0.4298110902309418, "eval_runtime": 49.1962, "eval_samples_per_second": 41.202, "eval_steps_per_second": 5.163, "eval_wer": 0.33038454594692185, "step": 97800 }, { "epoch": 10.48, "eval_loss": 0.4619194269180298, "eval_runtime": 49.4405, "eval_samples_per_second": 40.999, "eval_steps_per_second": 5.137, "eval_wer": 0.327405668893302, "step": 97900 }, { "epoch": 10.49, "learning_rate": 9.055444126074499e-05, "loss": 0.1105, "step": 98000 }, { "epoch": 10.49, "eval_loss": 0.4361836612224579, "eval_runtime": 49.0712, "eval_samples_per_second": 41.307, "eval_steps_per_second": 5.176, "eval_wer": 0.32442679183968226, "step": 98000 }, { "epoch": 10.5, "eval_loss": 0.45676031708717346, "eval_runtime": 49.0451, "eval_samples_per_second": 41.329, "eval_steps_per_second": 5.179, "eval_wer": 0.32894024192092436, "step": 98100 }, { "epoch": 10.51, "eval_loss": 0.4522392153739929, "eval_runtime": 49.3352, "eval_samples_per_second": 41.086, "eval_steps_per_second": 5.148, "eval_wer": 0.33363423000541614, "step": 98200 }, { "epoch": 10.52, "eval_loss": 0.43021589517593384, "eval_runtime": 49.3191, "eval_samples_per_second": 41.1, "eval_steps_per_second": 5.15, "eval_wer": 0.32569055786243006, "step": 98300 }, { "epoch": 10.54, "eval_loss": 0.4505043625831604, "eval_runtime": 49.4141, "eval_samples_per_second": 41.021, "eval_steps_per_second": 5.14, "eval_wer": 0.32379490882830836, "step": 98400 }, { "epoch": 10.55, "learning_rate": 8.947994269340974e-05, "loss": 0.1164, "step": 98500 }, { "epoch": 10.55, "eval_loss": 0.4430020749568939, "eval_runtime": 49.2412, "eval_samples_per_second": 41.165, "eval_steps_per_second": 5.158, "eval_wer": 0.3301137389420473, "step": 98500 }, { "epoch": 10.56, "eval_loss": 0.4575265944004059, "eval_runtime": 48.9818, "eval_samples_per_second": 41.383, "eval_steps_per_second": 5.186, "eval_wer": 0.32830835890955046, "step": 98600 }, { "epoch": 10.57, "eval_loss": 0.4447467029094696, "eval_runtime": 49.3508, "eval_samples_per_second": 41.073, "eval_steps_per_second": 5.147, "eval_wer": 0.32767647589817656, "step": 98700 }, { "epoch": 10.58, "eval_loss": 0.4400414824485779, "eval_runtime": 49.1998, "eval_samples_per_second": 41.199, "eval_steps_per_second": 5.163, "eval_wer": 0.3301137389420473, "step": 98800 }, { "epoch": 10.59, "eval_loss": 0.44269418716430664, "eval_runtime": 49.2271, "eval_samples_per_second": 41.176, "eval_steps_per_second": 5.16, "eval_wer": 0.3287597039176747, "step": 98900 }, { "epoch": 10.6, "learning_rate": 8.84054441260745e-05, "loss": 0.1113, "step": 99000 }, { "epoch": 10.6, "eval_loss": 0.4538458585739136, "eval_runtime": 49.0089, "eval_samples_per_second": 41.36, "eval_steps_per_second": 5.183, "eval_wer": 0.32478786784618163, "step": 99000 }, { "epoch": 10.61, "eval_loss": 0.4518674612045288, "eval_runtime": 49.3026, "eval_samples_per_second": 41.113, "eval_steps_per_second": 5.152, "eval_wer": 0.3298429319371728, "step": 99100 }, { "epoch": 10.62, "eval_loss": 0.4290253520011902, "eval_runtime": 49.1748, "eval_samples_per_second": 41.22, "eval_steps_per_second": 5.165, "eval_wer": 0.3248781368478065, "step": 99200 }, { "epoch": 10.63, "eval_loss": 0.45013627409935, "eval_runtime": 49.3453, "eval_samples_per_second": 41.078, "eval_steps_per_second": 5.147, "eval_wer": 0.3219895287958115, "step": 99300 }, { "epoch": 10.64, "eval_loss": 0.4410213530063629, "eval_runtime": 49.1693, "eval_samples_per_second": 41.225, "eval_steps_per_second": 5.166, "eval_wer": 0.3218089907925618, "step": 99400 }, { "epoch": 10.65, "learning_rate": 8.733309455587391e-05, "loss": 0.1159, "step": 99500 }, { "epoch": 10.65, "eval_loss": 0.447797566652298, "eval_runtime": 49.0342, "eval_samples_per_second": 41.338, "eval_steps_per_second": 5.18, "eval_wer": 0.3210868387795631, "step": 99500 }, { "epoch": 10.66, "eval_loss": 0.44618627429008484, "eval_runtime": 48.7054, "eval_samples_per_second": 41.618, "eval_steps_per_second": 5.215, "eval_wer": 0.3249684058494313, "step": 99600 }, { "epoch": 10.67, "eval_loss": 0.45431581139564514, "eval_runtime": 48.7336, "eval_samples_per_second": 41.594, "eval_steps_per_second": 5.212, "eval_wer": 0.33020400794367216, "step": 99700 }, { "epoch": 10.69, "eval_loss": 0.4462348520755768, "eval_runtime": 48.6987, "eval_samples_per_second": 41.623, "eval_steps_per_second": 5.216, "eval_wer": 0.3301137389420473, "step": 99800 }, { "epoch": 10.7, "eval_loss": 0.44683581590652466, "eval_runtime": 49.026, "eval_samples_per_second": 41.345, "eval_steps_per_second": 5.181, "eval_wer": 0.32289221881205993, "step": 99900 }, { "epoch": 10.71, "learning_rate": 8.625859598853867e-05, "loss": 0.1161, "step": 100000 }, { "epoch": 10.71, "eval_loss": 0.45149165391921997, "eval_runtime": 49.1288, "eval_samples_per_second": 41.259, "eval_steps_per_second": 5.17, "eval_wer": 0.3240657158331829, "step": 100000 }, { "epoch": 10.72, "eval_loss": 0.44036853313446045, "eval_runtime": 49.9413, "eval_samples_per_second": 40.588, "eval_steps_per_second": 5.086, "eval_wer": 0.3275862068965517, "step": 100100 }, { "epoch": 10.73, "eval_loss": 0.4439077079296112, "eval_runtime": 48.7005, "eval_samples_per_second": 41.622, "eval_steps_per_second": 5.216, "eval_wer": 0.3221700667990612, "step": 100200 }, { "epoch": 10.74, "eval_loss": 0.43919479846954346, "eval_runtime": 48.8991, "eval_samples_per_second": 41.453, "eval_steps_per_second": 5.194, "eval_wer": 0.32569055786243006, "step": 100300 }, { "epoch": 10.75, "eval_loss": 0.4475514590740204, "eval_runtime": 49.0257, "eval_samples_per_second": 41.346, "eval_steps_per_second": 5.181, "eval_wer": 0.33137750496479507, "step": 100400 }, { "epoch": 10.76, "learning_rate": 8.518409742120343e-05, "loss": 0.1199, "step": 100500 }, { "epoch": 10.76, "eval_loss": 0.44927603006362915, "eval_runtime": 49.1482, "eval_samples_per_second": 41.243, "eval_steps_per_second": 5.168, "eval_wer": 0.32704459288680265, "step": 100500 }, { "epoch": 10.77, "eval_loss": 0.44615232944488525, "eval_runtime": 48.9489, "eval_samples_per_second": 41.411, "eval_steps_per_second": 5.189, "eval_wer": 0.32235060480231087, "step": 100600 }, { "epoch": 10.78, "eval_loss": 0.44666746258735657, "eval_runtime": 48.7214, "eval_samples_per_second": 41.604, "eval_steps_per_second": 5.213, "eval_wer": 0.33110669795992054, "step": 100700 }, { "epoch": 10.79, "eval_loss": 0.4198402762413025, "eval_runtime": 49.5384, "eval_samples_per_second": 40.918, "eval_steps_per_second": 5.127, "eval_wer": 0.3228019498104351, "step": 100800 }, { "epoch": 10.8, "eval_loss": 0.4348670244216919, "eval_runtime": 48.746, "eval_samples_per_second": 41.583, "eval_steps_per_second": 5.211, "eval_wer": 0.32253114280556056, "step": 100900 }, { "epoch": 10.81, "learning_rate": 8.410959885386819e-05, "loss": 0.1146, "step": 101000 }, { "epoch": 10.81, "eval_loss": 0.4371398985385895, "eval_runtime": 49.8683, "eval_samples_per_second": 40.647, "eval_steps_per_second": 5.093, "eval_wer": 0.32722513089005234, "step": 101000 }, { "epoch": 10.82, "eval_loss": 0.4525171220302582, "eval_runtime": 49.2008, "eval_samples_per_second": 41.199, "eval_steps_per_second": 5.163, "eval_wer": 0.3209965697779383, "step": 101100 }, { "epoch": 10.84, "eval_loss": 0.4292885959148407, "eval_runtime": 48.606, "eval_samples_per_second": 41.703, "eval_steps_per_second": 5.226, "eval_wer": 0.32189925979418665, "step": 101200 }, { "epoch": 10.85, "eval_loss": 0.4238409698009491, "eval_runtime": 48.6683, "eval_samples_per_second": 41.649, "eval_steps_per_second": 5.219, "eval_wer": 0.3216284527893121, "step": 101300 }, { "epoch": 10.86, "eval_loss": 0.43767470121383667, "eval_runtime": 48.6531, "eval_samples_per_second": 41.662, "eval_steps_per_second": 5.221, "eval_wer": 0.32523921285430585, "step": 101400 }, { "epoch": 10.87, "learning_rate": 8.303510028653295e-05, "loss": 0.118, "step": 101500 }, { "epoch": 10.87, "eval_loss": 0.43711698055267334, "eval_runtime": 48.5847, "eval_samples_per_second": 41.721, "eval_steps_per_second": 5.228, "eval_wer": 0.3208160317746886, "step": 101500 }, { "epoch": 10.88, "eval_loss": 0.4216325879096985, "eval_runtime": 48.5704, "eval_samples_per_second": 41.733, "eval_steps_per_second": 5.23, "eval_wer": 0.31738580971294456, "step": 101600 }, { "epoch": 10.89, "eval_loss": 0.43119776248931885, "eval_runtime": 48.5795, "eval_samples_per_second": 41.725, "eval_steps_per_second": 5.229, "eval_wer": 0.3189203827405669, "step": 101700 }, { "epoch": 10.9, "eval_loss": 0.4317311942577362, "eval_runtime": 48.6163, "eval_samples_per_second": 41.694, "eval_steps_per_second": 5.225, "eval_wer": 0.3203646867665644, "step": 101800 }, { "epoch": 10.91, "eval_loss": 0.43034303188323975, "eval_runtime": 48.6584, "eval_samples_per_second": 41.658, "eval_steps_per_second": 5.22, "eval_wer": 0.32352410182343383, "step": 101900 }, { "epoch": 10.92, "learning_rate": 8.19606017191977e-05, "loss": 0.114, "step": 102000 }, { "epoch": 10.92, "eval_loss": 0.44159621000289917, "eval_runtime": 49.7514, "eval_samples_per_second": 40.743, "eval_steps_per_second": 5.105, "eval_wer": 0.31576096768369744, "step": 102000 }, { "epoch": 10.93, "eval_loss": 0.4239681363105774, "eval_runtime": 48.5431, "eval_samples_per_second": 41.757, "eval_steps_per_second": 5.232, "eval_wer": 0.31946199675031595, "step": 102100 }, { "epoch": 10.94, "eval_loss": 0.4340362548828125, "eval_runtime": 49.0823, "eval_samples_per_second": 41.298, "eval_steps_per_second": 5.175, "eval_wer": 0.31494854666907385, "step": 102200 }, { "epoch": 10.95, "eval_loss": 0.431062251329422, "eval_runtime": 48.4884, "eval_samples_per_second": 41.804, "eval_steps_per_second": 5.238, "eval_wer": 0.3215381837876873, "step": 102300 }, { "epoch": 10.96, "eval_loss": 0.4261479377746582, "eval_runtime": 49.008, "eval_samples_per_second": 41.361, "eval_steps_per_second": 5.183, "eval_wer": 0.32379490882830836, "step": 102400 }, { "epoch": 10.97, "learning_rate": 8.088610315186246e-05, "loss": 0.1152, "step": 102500 }, { "epoch": 10.97, "eval_loss": 0.42632901668548584, "eval_runtime": 49.1051, "eval_samples_per_second": 41.279, "eval_steps_per_second": 5.173, "eval_wer": 0.3206354937714389, "step": 102500 }, { "epoch": 10.98, "eval_loss": 0.4325226843357086, "eval_runtime": 49.3257, "eval_samples_per_second": 41.094, "eval_steps_per_second": 5.149, "eval_wer": 0.3293915869290486, "step": 102600 }, { "epoch": 11.0, "eval_loss": 0.4327019155025482, "eval_runtime": 49.2829, "eval_samples_per_second": 41.13, "eval_steps_per_second": 5.154, "eval_wer": 0.3187398447373172, "step": 102700 }, { "epoch": 11.01, "eval_loss": 0.44230592250823975, "eval_runtime": 49.246, "eval_samples_per_second": 41.161, "eval_steps_per_second": 5.158, "eval_wer": 0.31946199675031595, "step": 102800 }, { "epoch": 11.02, "eval_loss": 0.43406760692596436, "eval_runtime": 49.0206, "eval_samples_per_second": 41.35, "eval_steps_per_second": 5.181, "eval_wer": 0.32767647589817656, "step": 102900 }, { "epoch": 11.03, "learning_rate": 7.981160458452722e-05, "loss": 0.1084, "step": 103000 }, { "epoch": 11.03, "eval_loss": 0.42317888140678406, "eval_runtime": 49.1704, "eval_samples_per_second": 41.224, "eval_steps_per_second": 5.166, "eval_wer": 0.3243365228380574, "step": 103000 }, { "epoch": 11.04, "eval_loss": 0.4355052411556244, "eval_runtime": 49.0712, "eval_samples_per_second": 41.307, "eval_steps_per_second": 5.176, "eval_wer": 0.31837876873081783, "step": 103100 }, { "epoch": 11.05, "eval_loss": 0.43737396597862244, "eval_runtime": 49.4194, "eval_samples_per_second": 41.016, "eval_steps_per_second": 5.14, "eval_wer": 0.327405668893302, "step": 103200 }, { "epoch": 11.06, "eval_loss": 0.44839176535606384, "eval_runtime": 49.5435, "eval_samples_per_second": 40.914, "eval_steps_per_second": 5.127, "eval_wer": 0.3304748149485467, "step": 103300 }, { "epoch": 11.07, "eval_loss": 0.44234499335289, "eval_runtime": 48.8359, "eval_samples_per_second": 41.506, "eval_steps_per_second": 5.201, "eval_wer": 0.3226214118071854, "step": 103400 }, { "epoch": 11.08, "learning_rate": 7.873925501432665e-05, "loss": 0.1003, "step": 103500 }, { "epoch": 11.08, "eval_loss": 0.45182204246520996, "eval_runtime": 49.1484, "eval_samples_per_second": 41.242, "eval_steps_per_second": 5.168, "eval_wer": 0.3224408738039357, "step": 103500 }, { "epoch": 11.09, "eval_loss": 0.45178499817848206, "eval_runtime": 48.7083, "eval_samples_per_second": 41.615, "eval_steps_per_second": 5.215, "eval_wer": 0.3243365228380574, "step": 103600 }, { "epoch": 11.1, "eval_loss": 0.4281817376613617, "eval_runtime": 48.8171, "eval_samples_per_second": 41.522, "eval_steps_per_second": 5.203, "eval_wer": 0.32072576277306375, "step": 103700 }, { "epoch": 11.11, "eval_loss": 0.44184988737106323, "eval_runtime": 48.9326, "eval_samples_per_second": 41.424, "eval_steps_per_second": 5.191, "eval_wer": 0.3219895287958115, "step": 103800 }, { "epoch": 11.12, "eval_loss": 0.4411134123802185, "eval_runtime": 48.7339, "eval_samples_per_second": 41.593, "eval_steps_per_second": 5.212, "eval_wer": 0.3216284527893121, "step": 103900 }, { "epoch": 11.13, "learning_rate": 7.766475644699141e-05, "loss": 0.1009, "step": 104000 }, { "epoch": 11.13, "eval_loss": 0.44739264249801636, "eval_runtime": 49.071, "eval_samples_per_second": 41.307, "eval_steps_per_second": 5.176, "eval_wer": 0.32379490882830836, "step": 104000 }, { "epoch": 11.15, "eval_loss": 0.4405987858772278, "eval_runtime": 48.9357, "eval_samples_per_second": 41.422, "eval_steps_per_second": 5.19, "eval_wer": 0.3245170608413071, "step": 104100 }, { "epoch": 11.16, "eval_loss": 0.43838658928871155, "eval_runtime": 48.6654, "eval_samples_per_second": 41.652, "eval_steps_per_second": 5.219, "eval_wer": 0.32415598483480773, "step": 104200 }, { "epoch": 11.17, "eval_loss": 0.470173716545105, "eval_runtime": 48.9255, "eval_samples_per_second": 41.43, "eval_steps_per_second": 5.192, "eval_wer": 0.3265029788770536, "step": 104300 }, { "epoch": 11.18, "eval_loss": 0.4611179828643799, "eval_runtime": 48.9633, "eval_samples_per_second": 41.398, "eval_steps_per_second": 5.188, "eval_wer": 0.32659324787867844, "step": 104400 }, { "epoch": 11.19, "learning_rate": 7.659025787965614e-05, "loss": 0.0992, "step": 104500 }, { "epoch": 11.19, "eval_loss": 0.44245555996894836, "eval_runtime": 48.853, "eval_samples_per_second": 41.492, "eval_steps_per_second": 5.199, "eval_wer": 0.3210868387795631, "step": 104500 }, { "epoch": 11.2, "eval_loss": 0.45753201842308044, "eval_runtime": 48.7428, "eval_samples_per_second": 41.586, "eval_steps_per_second": 5.211, "eval_wer": 0.3221700667990612, "step": 104600 }, { "epoch": 11.21, "eval_loss": 0.4448811411857605, "eval_runtime": 48.4957, "eval_samples_per_second": 41.797, "eval_steps_per_second": 5.238, "eval_wer": 0.3208160317746886, "step": 104700 }, { "epoch": 11.22, "eval_loss": 0.47151175141334534, "eval_runtime": 48.9938, "eval_samples_per_second": 41.373, "eval_steps_per_second": 5.184, "eval_wer": 0.3208160317746886, "step": 104800 }, { "epoch": 11.23, "eval_loss": 0.4468552768230438, "eval_runtime": 48.8885, "eval_samples_per_second": 41.462, "eval_steps_per_second": 5.195, "eval_wer": 0.322260335800686, "step": 104900 }, { "epoch": 11.24, "learning_rate": 7.55157593123209e-05, "loss": 0.1021, "step": 105000 }, { "epoch": 11.24, "eval_loss": 0.4536341726779938, "eval_runtime": 48.4312, "eval_samples_per_second": 41.853, "eval_steps_per_second": 5.245, "eval_wer": 0.32253114280556056, "step": 105000 }, { "epoch": 11.25, "eval_loss": 0.4629049599170685, "eval_runtime": 48.4787, "eval_samples_per_second": 41.812, "eval_steps_per_second": 5.239, "eval_wer": 0.323433832821809, "step": 105100 }, { "epoch": 11.26, "eval_loss": 0.4549843966960907, "eval_runtime": 48.5414, "eval_samples_per_second": 41.758, "eval_steps_per_second": 5.233, "eval_wer": 0.32054522476981406, "step": 105200 }, { "epoch": 11.27, "eval_loss": 0.4598093032836914, "eval_runtime": 48.7765, "eval_samples_per_second": 41.557, "eval_steps_per_second": 5.207, "eval_wer": 0.3212673767828128, "step": 105300 }, { "epoch": 11.28, "eval_loss": 0.45224353671073914, "eval_runtime": 48.7101, "eval_samples_per_second": 41.614, "eval_steps_per_second": 5.215, "eval_wer": 0.3179274237226936, "step": 105400 }, { "epoch": 11.3, "learning_rate": 7.444126074498566e-05, "loss": 0.1021, "step": 105500 }, { "epoch": 11.3, "eval_loss": 0.4658335745334625, "eval_runtime": 48.593, "eval_samples_per_second": 41.714, "eval_steps_per_second": 5.227, "eval_wer": 0.3210868387795631, "step": 105500 }, { "epoch": 11.31, "eval_loss": 0.4664027690887451, "eval_runtime": 49.0611, "eval_samples_per_second": 41.316, "eval_steps_per_second": 5.177, "eval_wer": 0.3195522657519408, "step": 105600 }, { "epoch": 11.32, "eval_loss": 0.47357499599456787, "eval_runtime": 49.0629, "eval_samples_per_second": 41.314, "eval_steps_per_second": 5.177, "eval_wer": 0.31774688571944393, "step": 105700 }, { "epoch": 11.33, "eval_loss": 0.4587169885635376, "eval_runtime": 49.4541, "eval_samples_per_second": 40.987, "eval_steps_per_second": 5.136, "eval_wer": 0.31576096768369744, "step": 105800 }, { "epoch": 11.34, "eval_loss": 0.45886215567588806, "eval_runtime": 48.5172, "eval_samples_per_second": 41.779, "eval_steps_per_second": 5.235, "eval_wer": 0.3193717277486911, "step": 105900 }, { "epoch": 11.35, "learning_rate": 7.336676217765042e-05, "loss": 0.1025, "step": 106000 }, { "epoch": 11.35, "eval_loss": 0.4691576361656189, "eval_runtime": 48.5278, "eval_samples_per_second": 41.77, "eval_steps_per_second": 5.234, "eval_wer": 0.32135764578443765, "step": 106000 }, { "epoch": 11.36, "eval_loss": 0.43815869092941284, "eval_runtime": 48.5469, "eval_samples_per_second": 41.753, "eval_steps_per_second": 5.232, "eval_wer": 0.3181079617259433, "step": 106100 }, { "epoch": 11.37, "eval_loss": 0.4555544853210449, "eval_runtime": 48.8057, "eval_samples_per_second": 41.532, "eval_steps_per_second": 5.204, "eval_wer": 0.3184690377324427, "step": 106200 }, { "epoch": 11.38, "eval_loss": 0.4445129334926605, "eval_runtime": 49.8518, "eval_samples_per_second": 40.661, "eval_steps_per_second": 5.095, "eval_wer": 0.3191009207438166, "step": 106300 }, { "epoch": 11.39, "eval_loss": 0.4379484951496124, "eval_runtime": 48.9128, "eval_samples_per_second": 41.441, "eval_steps_per_second": 5.193, "eval_wer": 0.3163025816934465, "step": 106400 }, { "epoch": 11.4, "learning_rate": 7.229226361031518e-05, "loss": 0.104, "step": 106500 }, { "epoch": 11.4, "eval_loss": 0.44537481665611267, "eval_runtime": 48.5687, "eval_samples_per_second": 41.735, "eval_steps_per_second": 5.23, "eval_wer": 0.3219895287958115, "step": 106500 }, { "epoch": 11.41, "eval_loss": 0.44634634256362915, "eval_runtime": 48.8665, "eval_samples_per_second": 41.48, "eval_steps_per_second": 5.198, "eval_wer": 0.32009387976168985, "step": 106600 }, { "epoch": 11.42, "eval_loss": 0.4550469219684601, "eval_runtime": 48.5571, "eval_samples_per_second": 41.745, "eval_steps_per_second": 5.231, "eval_wer": 0.3172955407113197, "step": 106700 }, { "epoch": 11.43, "eval_loss": 0.44044601917266846, "eval_runtime": 48.518, "eval_samples_per_second": 41.778, "eval_steps_per_second": 5.235, "eval_wer": 0.31675392670157065, "step": 106800 }, { "epoch": 11.45, "eval_loss": 0.45691826939582825, "eval_runtime": 48.6409, "eval_samples_per_second": 41.673, "eval_steps_per_second": 5.222, "eval_wer": 0.3170247337064452, "step": 106900 }, { "epoch": 11.46, "learning_rate": 7.121776504297993e-05, "loss": 0.1016, "step": 107000 }, { "epoch": 11.46, "eval_loss": 0.45285138487815857, "eval_runtime": 48.4798, "eval_samples_per_second": 41.811, "eval_steps_per_second": 5.239, "eval_wer": 0.3168441957031955, "step": 107000 }, { "epoch": 11.47, "eval_loss": 0.45870763063430786, "eval_runtime": 49.1364, "eval_samples_per_second": 41.252, "eval_steps_per_second": 5.169, "eval_wer": 0.3172955407113197, "step": 107100 }, { "epoch": 11.48, "eval_loss": 0.4505434036254883, "eval_runtime": 48.8484, "eval_samples_per_second": 41.496, "eval_steps_per_second": 5.2, "eval_wer": 0.31720527170969487, "step": 107200 }, { "epoch": 11.49, "eval_loss": 0.44892099499702454, "eval_runtime": 48.8062, "eval_samples_per_second": 41.532, "eval_steps_per_second": 5.204, "eval_wer": 0.3158512366853223, "step": 107300 }, { "epoch": 11.5, "eval_loss": 0.4527936577796936, "eval_runtime": 48.8297, "eval_samples_per_second": 41.512, "eval_steps_per_second": 5.202, "eval_wer": 0.3129626286333273, "step": 107400 }, { "epoch": 11.51, "learning_rate": 7.014326647564469e-05, "loss": 0.1001, "step": 107500 }, { "epoch": 11.51, "eval_loss": 0.4472792446613312, "eval_runtime": 48.6292, "eval_samples_per_second": 41.683, "eval_steps_per_second": 5.223, "eval_wer": 0.3181079617259433, "step": 107500 }, { "epoch": 11.52, "eval_loss": 0.4434313476085663, "eval_runtime": 48.7732, "eval_samples_per_second": 41.56, "eval_steps_per_second": 5.208, "eval_wer": 0.31756634771619424, "step": 107600 }, { "epoch": 11.53, "eval_loss": 0.45973971486091614, "eval_runtime": 48.7123, "eval_samples_per_second": 41.612, "eval_steps_per_second": 5.214, "eval_wer": 0.3185593067340675, "step": 107700 }, { "epoch": 11.54, "eval_loss": 0.4351407289505005, "eval_runtime": 48.8735, "eval_samples_per_second": 41.474, "eval_steps_per_second": 5.197, "eval_wer": 0.3159415056869471, "step": 107800 }, { "epoch": 11.55, "eval_loss": 0.44710567593574524, "eval_runtime": 49.9625, "eval_samples_per_second": 40.57, "eval_steps_per_second": 5.084, "eval_wer": 0.3184690377324427, "step": 107900 }, { "epoch": 11.56, "learning_rate": 6.907091690544412e-05, "loss": 0.1005, "step": 108000 }, { "epoch": 11.56, "eval_loss": 0.44572997093200684, "eval_runtime": 48.7976, "eval_samples_per_second": 41.539, "eval_steps_per_second": 5.205, "eval_wer": 0.3191009207438166, "step": 108000 }, { "epoch": 11.57, "eval_loss": 0.45437440276145935, "eval_runtime": 48.6844, "eval_samples_per_second": 41.636, "eval_steps_per_second": 5.217, "eval_wer": 0.32930131792742373, "step": 108100 }, { "epoch": 11.58, "eval_loss": 0.4436147212982178, "eval_runtime": 49.2491, "eval_samples_per_second": 41.158, "eval_steps_per_second": 5.157, "eval_wer": 0.32207979779743634, "step": 108200 }, { "epoch": 11.6, "eval_loss": 0.4641793668270111, "eval_runtime": 48.7793, "eval_samples_per_second": 41.554, "eval_steps_per_second": 5.207, "eval_wer": 0.3269543238851778, "step": 108300 }, { "epoch": 11.61, "eval_loss": 0.44737499952316284, "eval_runtime": 48.6883, "eval_samples_per_second": 41.632, "eval_steps_per_second": 5.217, "eval_wer": 0.32704459288680265, "step": 108400 }, { "epoch": 11.62, "learning_rate": 6.799641833810888e-05, "loss": 0.1031, "step": 108500 }, { "epoch": 11.62, "eval_loss": 0.44577571749687195, "eval_runtime": 48.8043, "eval_samples_per_second": 41.533, "eval_steps_per_second": 5.204, "eval_wer": 0.31964253475356563, "step": 108500 }, { "epoch": 11.63, "eval_loss": 0.4723000228404999, "eval_runtime": 48.8424, "eval_samples_per_second": 41.501, "eval_steps_per_second": 5.2, "eval_wer": 0.3204549557681892, "step": 108600 }, { "epoch": 11.64, "eval_loss": 0.4507168233394623, "eval_runtime": 48.9897, "eval_samples_per_second": 41.376, "eval_steps_per_second": 5.185, "eval_wer": 0.3226214118071854, "step": 108700 }, { "epoch": 11.65, "eval_loss": 0.44235825538635254, "eval_runtime": 48.7448, "eval_samples_per_second": 41.584, "eval_steps_per_second": 5.211, "eval_wer": 0.3212673767828128, "step": 108800 }, { "epoch": 11.66, "eval_loss": 0.4511132836341858, "eval_runtime": 48.7014, "eval_samples_per_second": 41.621, "eval_steps_per_second": 5.215, "eval_wer": 0.3212673767828128, "step": 108900 }, { "epoch": 11.67, "learning_rate": 6.692191977077364e-05, "loss": 0.1014, "step": 109000 }, { "epoch": 11.67, "eval_loss": 0.4421851634979248, "eval_runtime": 48.8914, "eval_samples_per_second": 41.459, "eval_steps_per_second": 5.195, "eval_wer": 0.3204549557681892, "step": 109000 }, { "epoch": 11.68, "eval_loss": 0.44982463121414185, "eval_runtime": 48.4128, "eval_samples_per_second": 41.869, "eval_steps_per_second": 5.247, "eval_wer": 0.31801769272431846, "step": 109100 }, { "epoch": 11.69, "eval_loss": 0.43027353286743164, "eval_runtime": 48.7237, "eval_samples_per_second": 41.602, "eval_steps_per_second": 5.213, "eval_wer": 0.31666365769994587, "step": 109200 }, { "epoch": 11.7, "eval_loss": 0.4483342170715332, "eval_runtime": 48.6826, "eval_samples_per_second": 41.637, "eval_steps_per_second": 5.217, "eval_wer": 0.3107961725943311, "step": 109300 }, { "epoch": 11.71, "eval_loss": 0.4547644257545471, "eval_runtime": 49.6041, "eval_samples_per_second": 40.864, "eval_steps_per_second": 5.121, "eval_wer": 0.31693446470482034, "step": 109400 }, { "epoch": 11.72, "learning_rate": 6.584742120343839e-05, "loss": 0.0981, "step": 109500 }, { "epoch": 11.72, "eval_loss": 0.4406187832355499, "eval_runtime": 49.0859, "eval_samples_per_second": 41.295, "eval_steps_per_second": 5.175, "eval_wer": 0.3121502076187037, "step": 109500 }, { "epoch": 11.73, "eval_loss": 0.42933210730552673, "eval_runtime": 49.1781, "eval_samples_per_second": 41.218, "eval_steps_per_second": 5.165, "eval_wer": 0.311428055605705, "step": 109600 }, { "epoch": 11.75, "eval_loss": 0.4368530511856079, "eval_runtime": 48.9575, "eval_samples_per_second": 41.403, "eval_steps_per_second": 5.188, "eval_wer": 0.3158512366853223, "step": 109700 }, { "epoch": 11.76, "eval_loss": 0.43642425537109375, "eval_runtime": 48.9813, "eval_samples_per_second": 41.383, "eval_steps_per_second": 5.186, "eval_wer": 0.31639285069507134, "step": 109800 }, { "epoch": 11.77, "eval_loss": 0.4358440339565277, "eval_runtime": 48.7711, "eval_samples_per_second": 41.562, "eval_steps_per_second": 5.208, "eval_wer": 0.3189203827405669, "step": 109900 }, { "epoch": 11.78, "learning_rate": 6.477292263610315e-05, "loss": 0.1023, "step": 110000 }, { "epoch": 11.78, "eval_loss": 0.4281153976917267, "eval_runtime": 48.845, "eval_samples_per_second": 41.499, "eval_steps_per_second": 5.2, "eval_wer": 0.318288499729193, "step": 110000 }, { "epoch": 11.79, "eval_loss": 0.44035249948501587, "eval_runtime": 49.3957, "eval_samples_per_second": 41.036, "eval_steps_per_second": 5.142, "eval_wer": 0.3158512366853223, "step": 110100 }, { "epoch": 11.8, "eval_loss": 0.44708630442619324, "eval_runtime": 48.6464, "eval_samples_per_second": 41.668, "eval_steps_per_second": 5.221, "eval_wer": 0.31350424264307636, "step": 110200 }, { "epoch": 11.81, "eval_loss": 0.449814110994339, "eval_runtime": 48.8935, "eval_samples_per_second": 41.457, "eval_steps_per_second": 5.195, "eval_wer": 0.32009387976168985, "step": 110300 }, { "epoch": 11.82, "eval_loss": 0.45270591974258423, "eval_runtime": 48.7747, "eval_samples_per_second": 41.558, "eval_steps_per_second": 5.208, "eval_wer": 0.3161220436901968, "step": 110400 }, { "epoch": 11.83, "learning_rate": 6.370057306590257e-05, "loss": 0.0988, "step": 110500 }, { "epoch": 11.83, "eval_loss": 0.4439750909805298, "eval_runtime": 48.8822, "eval_samples_per_second": 41.467, "eval_steps_per_second": 5.196, "eval_wer": 0.3172955407113197, "step": 110500 }, { "epoch": 11.84, "eval_loss": 0.4356108605861664, "eval_runtime": 48.8938, "eval_samples_per_second": 41.457, "eval_steps_per_second": 5.195, "eval_wer": 0.3135945116447012, "step": 110600 }, { "epoch": 11.85, "eval_loss": 0.43082764744758606, "eval_runtime": 48.9279, "eval_samples_per_second": 41.428, "eval_steps_per_second": 5.191, "eval_wer": 0.31350424264307636, "step": 110700 }, { "epoch": 11.86, "eval_loss": 0.4294142723083496, "eval_runtime": 49.0537, "eval_samples_per_second": 41.322, "eval_steps_per_second": 5.178, "eval_wer": 0.3191911897454414, "step": 110800 }, { "epoch": 11.87, "eval_loss": 0.4240707755088806, "eval_runtime": 48.8428, "eval_samples_per_second": 41.501, "eval_steps_per_second": 5.2, "eval_wer": 0.3168441957031955, "step": 110900 }, { "epoch": 11.88, "learning_rate": 6.263037249283667e-05, "loss": 0.1022, "step": 111000 }, { "epoch": 11.88, "eval_loss": 0.44202566146850586, "eval_runtime": 49.1216, "eval_samples_per_second": 41.265, "eval_steps_per_second": 5.171, "eval_wer": 0.3156706986820726, "step": 111000 }, { "epoch": 11.9, "eval_loss": 0.43126294016838074, "eval_runtime": 49.1248, "eval_samples_per_second": 41.262, "eval_steps_per_second": 5.171, "eval_wer": 0.3125112836252031, "step": 111100 }, { "epoch": 11.91, "eval_loss": 0.42133891582489014, "eval_runtime": 48.989, "eval_samples_per_second": 41.377, "eval_steps_per_second": 5.185, "eval_wer": 0.31675392670157065, "step": 111200 }, { "epoch": 11.92, "eval_loss": 0.4351927936077118, "eval_runtime": 50.4732, "eval_samples_per_second": 40.16, "eval_steps_per_second": 5.032, "eval_wer": 0.31350424264307636, "step": 111300 }, { "epoch": 11.93, "eval_loss": 0.4296703040599823, "eval_runtime": 49.0792, "eval_samples_per_second": 41.301, "eval_steps_per_second": 5.175, "eval_wer": 0.3116085936089547, "step": 111400 }, { "epoch": 11.94, "learning_rate": 6.155587392550143e-05, "loss": 0.1032, "step": 111500 }, { "epoch": 11.94, "eval_loss": 0.42183753848075867, "eval_runtime": 49.0367, "eval_samples_per_second": 41.336, "eval_steps_per_second": 5.18, "eval_wer": 0.31368478064632604, "step": 111500 }, { "epoch": 11.95, "eval_loss": 0.43339774012565613, "eval_runtime": 48.4486, "eval_samples_per_second": 41.838, "eval_steps_per_second": 5.243, "eval_wer": 0.3123307456219534, "step": 111600 }, { "epoch": 11.96, "eval_loss": 0.4373456537723541, "eval_runtime": 48.7637, "eval_samples_per_second": 41.568, "eval_steps_per_second": 5.209, "eval_wer": 0.3174760787145694, "step": 111700 }, { "epoch": 11.97, "eval_loss": 0.4298686385154724, "eval_runtime": 49.5415, "eval_samples_per_second": 40.915, "eval_steps_per_second": 5.127, "eval_wer": 0.31603177468857196, "step": 111800 }, { "epoch": 11.98, "eval_loss": 0.432638943195343, "eval_runtime": 48.7304, "eval_samples_per_second": 41.596, "eval_steps_per_second": 5.212, "eval_wer": 0.3189203827405669, "step": 111900 }, { "epoch": 11.99, "learning_rate": 6.0481375358166186e-05, "loss": 0.0969, "step": 112000 }, { "epoch": 11.99, "eval_loss": 0.4207654595375061, "eval_runtime": 48.9546, "eval_samples_per_second": 41.406, "eval_steps_per_second": 5.188, "eval_wer": 0.31864957573569236, "step": 112000 }, { "epoch": 12.0, "eval_loss": 0.4385160207748413, "eval_runtime": 48.8057, "eval_samples_per_second": 41.532, "eval_steps_per_second": 5.204, "eval_wer": 0.31693446470482034, "step": 112100 }, { "epoch": 12.01, "eval_loss": 0.4453379809856415, "eval_runtime": 48.7148, "eval_samples_per_second": 41.609, "eval_steps_per_second": 5.214, "eval_wer": 0.31558042968044775, "step": 112200 }, { "epoch": 12.02, "eval_loss": 0.4596421718597412, "eval_runtime": 48.8968, "eval_samples_per_second": 41.455, "eval_steps_per_second": 5.195, "eval_wer": 0.3133237046398267, "step": 112300 }, { "epoch": 12.03, "eval_loss": 0.45092177391052246, "eval_runtime": 48.8687, "eval_samples_per_second": 41.478, "eval_steps_per_second": 5.198, "eval_wer": 0.3092615995667088, "step": 112400 }, { "epoch": 12.04, "learning_rate": 5.9406876790830945e-05, "loss": 0.0901, "step": 112500 }, { "epoch": 12.04, "eval_loss": 0.45350125432014465, "eval_runtime": 48.6941, "eval_samples_per_second": 41.627, "eval_steps_per_second": 5.216, "eval_wer": 0.3137750496479509, "step": 112500 }, { "epoch": 12.06, "eval_loss": 0.4370967447757721, "eval_runtime": 49.3215, "eval_samples_per_second": 41.098, "eval_steps_per_second": 5.15, "eval_wer": 0.3144069326593248, "step": 112600 }, { "epoch": 12.07, "eval_loss": 0.4498507082462311, "eval_runtime": 49.0717, "eval_samples_per_second": 41.307, "eval_steps_per_second": 5.176, "eval_wer": 0.31539989167719806, "step": 112700 }, { "epoch": 12.08, "eval_loss": 0.46147477626800537, "eval_runtime": 48.753, "eval_samples_per_second": 41.577, "eval_steps_per_second": 5.21, "eval_wer": 0.3198230727568153, "step": 112800 }, { "epoch": 12.09, "eval_loss": 0.45230022072792053, "eval_runtime": 48.945, "eval_samples_per_second": 41.414, "eval_steps_per_second": 5.19, "eval_wer": 0.3176566167178191, "step": 112900 }, { "epoch": 12.1, "learning_rate": 5.833237822349569e-05, "loss": 0.0889, "step": 113000 }, { "epoch": 12.1, "eval_loss": 0.44123727083206177, "eval_runtime": 49.3729, "eval_samples_per_second": 41.055, "eval_steps_per_second": 5.145, "eval_wer": 0.3129626286333273, "step": 113000 }, { "epoch": 12.11, "eval_loss": 0.4471343457698822, "eval_runtime": 49.1556, "eval_samples_per_second": 41.236, "eval_steps_per_second": 5.167, "eval_wer": 0.3181079617259433, "step": 113100 }, { "epoch": 12.12, "eval_loss": 0.45298895239830017, "eval_runtime": 49.0223, "eval_samples_per_second": 41.349, "eval_steps_per_second": 5.181, "eval_wer": 0.31693446470482034, "step": 113200 }, { "epoch": 12.13, "eval_loss": 0.467046320438385, "eval_runtime": 49.039, "eval_samples_per_second": 41.334, "eval_steps_per_second": 5.18, "eval_wer": 0.314858277667449, "step": 113300 }, { "epoch": 12.14, "eval_loss": 0.4594302475452423, "eval_runtime": 50.5981, "eval_samples_per_second": 40.061, "eval_steps_per_second": 5.02, "eval_wer": 0.31413612565445026, "step": 113400 }, { "epoch": 12.15, "learning_rate": 5.725787965616045e-05, "loss": 0.0917, "step": 113500 }, { "epoch": 12.15, "eval_loss": 0.4622795879840851, "eval_runtime": 50.5474, "eval_samples_per_second": 40.101, "eval_steps_per_second": 5.025, "eval_wer": 0.31269182162845277, "step": 113500 }, { "epoch": 12.16, "eval_loss": 0.4459761083126068, "eval_runtime": 50.9405, "eval_samples_per_second": 39.792, "eval_steps_per_second": 4.986, "eval_wer": 0.3133237046398267, "step": 113600 }, { "epoch": 12.17, "eval_loss": 0.45123758912086487, "eval_runtime": 50.7689, "eval_samples_per_second": 39.926, "eval_steps_per_second": 5.003, "eval_wer": 0.3191009207438166, "step": 113700 }, { "epoch": 12.18, "eval_loss": 0.46812236309051514, "eval_runtime": 50.5875, "eval_samples_per_second": 40.069, "eval_steps_per_second": 5.021, "eval_wer": 0.3135945116447012, "step": 113800 }, { "epoch": 12.19, "eval_loss": 0.45636752247810364, "eval_runtime": 50.7928, "eval_samples_per_second": 39.907, "eval_steps_per_second": 5.001, "eval_wer": 0.31287235963170246, "step": 113900 }, { "epoch": 12.21, "learning_rate": 5.618553008595988e-05, "loss": 0.0906, "step": 114000 }, { "epoch": 12.21, "eval_loss": 0.44822677969932556, "eval_runtime": 50.8831, "eval_samples_per_second": 39.836, "eval_steps_per_second": 4.992, "eval_wer": 0.3107059035927063, "step": 114000 }, { "epoch": 12.22, "eval_loss": 0.4594801664352417, "eval_runtime": 50.6192, "eval_samples_per_second": 40.044, "eval_steps_per_second": 5.018, "eval_wer": 0.3133237046398267, "step": 114100 }, { "epoch": 12.23, "eval_loss": 0.4509586989879608, "eval_runtime": 50.466, "eval_samples_per_second": 40.166, "eval_steps_per_second": 5.033, "eval_wer": 0.3117891316122044, "step": 114200 }, { "epoch": 12.24, "eval_loss": 0.44721925258636475, "eval_runtime": 50.6245, "eval_samples_per_second": 40.04, "eval_steps_per_second": 5.017, "eval_wer": 0.31305289763495214, "step": 114300 }, { "epoch": 12.25, "eval_loss": 0.44987425208091736, "eval_runtime": 51.5037, "eval_samples_per_second": 39.356, "eval_steps_per_second": 4.932, "eval_wer": 0.3129626286333273, "step": 114400 }, { "epoch": 12.26, "learning_rate": 5.511103151862464e-05, "loss": 0.0918, "step": 114500 }, { "epoch": 12.26, "eval_loss": 0.45026734471321106, "eval_runtime": 49.4953, "eval_samples_per_second": 40.953, "eval_steps_per_second": 5.132, "eval_wer": 0.3137750496479509, "step": 114500 }, { "epoch": 12.27, "eval_loss": 0.45180875062942505, "eval_runtime": 49.496, "eval_samples_per_second": 40.953, "eval_steps_per_second": 5.132, "eval_wer": 0.31350424264307636, "step": 114600 }, { "epoch": 12.28, "eval_loss": 0.44931671023368835, "eval_runtime": 49.0213, "eval_samples_per_second": 41.349, "eval_steps_per_second": 5.181, "eval_wer": 0.311428055605705, "step": 114700 }, { "epoch": 12.29, "eval_loss": 0.45739245414733887, "eval_runtime": 49.1885, "eval_samples_per_second": 41.209, "eval_steps_per_second": 5.164, "eval_wer": 0.3133237046398267, "step": 114800 }, { "epoch": 12.3, "eval_loss": 0.46827754378318787, "eval_runtime": 49.2072, "eval_samples_per_second": 41.193, "eval_steps_per_second": 5.162, "eval_wer": 0.320003610760065, "step": 114900 }, { "epoch": 12.31, "learning_rate": 5.40365329512894e-05, "loss": 0.0869, "step": 115000 }, { "epoch": 12.31, "eval_loss": 0.4608277678489685, "eval_runtime": 49.5789, "eval_samples_per_second": 40.884, "eval_steps_per_second": 5.123, "eval_wer": 0.3164831196966962, "step": 115000 }, { "epoch": 12.32, "eval_loss": 0.46175676584243774, "eval_runtime": 49.9224, "eval_samples_per_second": 40.603, "eval_steps_per_second": 5.088, "eval_wer": 0.318288499729193, "step": 115100 }, { "epoch": 12.33, "eval_loss": 0.46893182396888733, "eval_runtime": 49.2463, "eval_samples_per_second": 41.16, "eval_steps_per_second": 5.158, "eval_wer": 0.3172955407113197, "step": 115200 }, { "epoch": 12.34, "eval_loss": 0.4680798351764679, "eval_runtime": 48.8639, "eval_samples_per_second": 41.483, "eval_steps_per_second": 5.198, "eval_wer": 0.32235060480231087, "step": 115300 }, { "epoch": 12.36, "eval_loss": 0.4576069712638855, "eval_runtime": 49.1095, "eval_samples_per_second": 41.275, "eval_steps_per_second": 5.172, "eval_wer": 0.3230727568153096, "step": 115400 }, { "epoch": 12.37, "learning_rate": 5.2962034383954145e-05, "loss": 0.0885, "step": 115500 }, { "epoch": 12.37, "eval_loss": 0.48311322927474976, "eval_runtime": 48.7739, "eval_samples_per_second": 41.559, "eval_steps_per_second": 5.208, "eval_wer": 0.31756634771619424, "step": 115500 }, { "epoch": 12.38, "eval_loss": 0.4601800739765167, "eval_runtime": 49.0417, "eval_samples_per_second": 41.332, "eval_steps_per_second": 5.179, "eval_wer": 0.3181079617259433, "step": 115600 }, { "epoch": 12.39, "eval_loss": 0.4493272006511688, "eval_runtime": 49.2267, "eval_samples_per_second": 41.177, "eval_steps_per_second": 5.16, "eval_wer": 0.31675392670157065, "step": 115700 }, { "epoch": 12.4, "eval_loss": 0.45637446641921997, "eval_runtime": 48.8932, "eval_samples_per_second": 41.458, "eval_steps_per_second": 5.195, "eval_wer": 0.314858277667449, "step": 115800 }, { "epoch": 12.41, "eval_loss": 0.45846298336982727, "eval_runtime": 48.5992, "eval_samples_per_second": 41.708, "eval_steps_per_second": 5.226, "eval_wer": 0.31576096768369744, "step": 115900 }, { "epoch": 12.42, "learning_rate": 5.1887535816618904e-05, "loss": 0.091, "step": 116000 }, { "epoch": 12.42, "eval_loss": 0.4713011384010315, "eval_runtime": 48.7915, "eval_samples_per_second": 41.544, "eval_steps_per_second": 5.206, "eval_wer": 0.31928145874706626, "step": 116000 }, { "epoch": 12.43, "eval_loss": 0.45806244015693665, "eval_runtime": 48.5172, "eval_samples_per_second": 41.779, "eval_steps_per_second": 5.235, "eval_wer": 0.31386531864957573, "step": 116100 }, { "epoch": 12.44, "eval_loss": 0.4636545777320862, "eval_runtime": 48.7872, "eval_samples_per_second": 41.548, "eval_steps_per_second": 5.206, "eval_wer": 0.313143166636577, "step": 116200 }, { "epoch": 12.45, "eval_loss": 0.4571922719478607, "eval_runtime": 48.9824, "eval_samples_per_second": 41.382, "eval_steps_per_second": 5.186, "eval_wer": 0.31242101462357824, "step": 116300 }, { "epoch": 12.46, "eval_loss": 0.44893747568130493, "eval_runtime": 51.4376, "eval_samples_per_second": 39.407, "eval_steps_per_second": 4.938, "eval_wer": 0.3163025816934465, "step": 116400 }, { "epoch": 12.47, "learning_rate": 5.0813037249283664e-05, "loss": 0.0886, "step": 116500 }, { "epoch": 12.47, "eval_loss": 0.46794840693473816, "eval_runtime": 49.1991, "eval_samples_per_second": 41.2, "eval_steps_per_second": 5.163, "eval_wer": 0.3159415056869471, "step": 116500 }, { "epoch": 12.48, "eval_loss": 0.4712357819080353, "eval_runtime": 49.2178, "eval_samples_per_second": 41.184, "eval_steps_per_second": 5.161, "eval_wer": 0.31512908467232353, "step": 116600 }, { "epoch": 12.49, "eval_loss": 0.47498226165771484, "eval_runtime": 48.8815, "eval_samples_per_second": 41.468, "eval_steps_per_second": 5.196, "eval_wer": 0.31864957573569236, "step": 116700 }, { "epoch": 12.51, "eval_loss": 0.4672822654247284, "eval_runtime": 48.7696, "eval_samples_per_second": 41.563, "eval_steps_per_second": 5.208, "eval_wer": 0.31756634771619424, "step": 116800 }, { "epoch": 12.52, "eval_loss": 0.4601333439350128, "eval_runtime": 48.6974, "eval_samples_per_second": 41.624, "eval_steps_per_second": 5.216, "eval_wer": 0.3113377866040802, "step": 116900 }, { "epoch": 12.53, "learning_rate": 4.9738538681948424e-05, "loss": 0.0917, "step": 117000 }, { "epoch": 12.53, "eval_loss": 0.43411996960639954, "eval_runtime": 49.4938, "eval_samples_per_second": 40.955, "eval_steps_per_second": 5.132, "eval_wer": 0.3125112836252031, "step": 117000 }, { "epoch": 12.54, "eval_loss": 0.4462231397628784, "eval_runtime": 48.7809, "eval_samples_per_second": 41.553, "eval_steps_per_second": 5.207, "eval_wer": 0.30772702653908646, "step": 117100 }, { "epoch": 12.55, "eval_loss": 0.45020830631256104, "eval_runtime": 48.9828, "eval_samples_per_second": 41.382, "eval_steps_per_second": 5.185, "eval_wer": 0.3098934825780827, "step": 117200 }, { "epoch": 12.56, "eval_loss": 0.4482104480266571, "eval_runtime": 49.0098, "eval_samples_per_second": 41.359, "eval_steps_per_second": 5.183, "eval_wer": 0.3116085936089547, "step": 117300 }, { "epoch": 12.57, "eval_loss": 0.4459335505962372, "eval_runtime": 48.885, "eval_samples_per_second": 41.465, "eval_steps_per_second": 5.196, "eval_wer": 0.313143166636577, "step": 117400 }, { "epoch": 12.58, "learning_rate": 4.8664040114613176e-05, "loss": 0.0881, "step": 117500 }, { "epoch": 12.58, "eval_loss": 0.4464477598667145, "eval_runtime": 48.7534, "eval_samples_per_second": 41.577, "eval_steps_per_second": 5.21, "eval_wer": 0.3121502076187037, "step": 117500 }, { "epoch": 12.59, "eval_loss": 0.4471108019351959, "eval_runtime": 49.1827, "eval_samples_per_second": 41.214, "eval_steps_per_second": 5.164, "eval_wer": 0.3125112836252031, "step": 117600 }, { "epoch": 12.6, "eval_loss": 0.4318666458129883, "eval_runtime": 48.6999, "eval_samples_per_second": 41.622, "eval_steps_per_second": 5.216, "eval_wer": 0.31224047662032856, "step": 117700 }, { "epoch": 12.61, "eval_loss": 0.4420875310897827, "eval_runtime": 48.5883, "eval_samples_per_second": 41.718, "eval_steps_per_second": 5.228, "eval_wer": 0.31025455858458206, "step": 117800 }, { "epoch": 12.62, "eval_loss": 0.43261706829071045, "eval_runtime": 48.5361, "eval_samples_per_second": 41.763, "eval_steps_per_second": 5.233, "eval_wer": 0.3107961725943311, "step": 117900 }, { "epoch": 12.63, "learning_rate": 4.758954154727793e-05, "loss": 0.0913, "step": 118000 }, { "epoch": 12.63, "eval_loss": 0.44137805700302124, "eval_runtime": 49.0062, "eval_samples_per_second": 41.362, "eval_steps_per_second": 5.183, "eval_wer": 0.3068243365228381, "step": 118000 }, { "epoch": 12.64, "eval_loss": 0.4421420097351074, "eval_runtime": 48.7431, "eval_samples_per_second": 41.585, "eval_steps_per_second": 5.211, "eval_wer": 0.3082686405488355, "step": 118100 }, { "epoch": 12.66, "eval_loss": 0.44493910670280457, "eval_runtime": 48.7918, "eval_samples_per_second": 41.544, "eval_steps_per_second": 5.206, "eval_wer": 0.31025455858458206, "step": 118200 }, { "epoch": 12.67, "eval_loss": 0.43802663683891296, "eval_runtime": 48.9254, "eval_samples_per_second": 41.43, "eval_steps_per_second": 5.192, "eval_wer": 0.3127820906300776, "step": 118300 }, { "epoch": 12.68, "eval_loss": 0.43897026777267456, "eval_runtime": 48.7195, "eval_samples_per_second": 41.606, "eval_steps_per_second": 5.214, "eval_wer": 0.3135945116447012, "step": 118400 }, { "epoch": 12.69, "learning_rate": 4.651504297994269e-05, "loss": 0.0921, "step": 118500 }, { "epoch": 12.69, "eval_loss": 0.4452337324619293, "eval_runtime": 48.675, "eval_samples_per_second": 41.644, "eval_steps_per_second": 5.218, "eval_wer": 0.31043509658783175, "step": 118500 }, { "epoch": 12.7, "eval_loss": 0.437765896320343, "eval_runtime": 48.8617, "eval_samples_per_second": 41.484, "eval_steps_per_second": 5.198, "eval_wer": 0.3121502076187037, "step": 118600 }, { "epoch": 12.71, "eval_loss": 0.44589871168136597, "eval_runtime": 49.4576, "eval_samples_per_second": 40.985, "eval_steps_per_second": 5.136, "eval_wer": 0.307997833543961, "step": 118700 }, { "epoch": 12.72, "eval_loss": 0.43694981932640076, "eval_runtime": 48.5647, "eval_samples_per_second": 41.738, "eval_steps_per_second": 5.23, "eval_wer": 0.30510922549196606, "step": 118800 }, { "epoch": 12.73, "eval_loss": 0.4473933279514313, "eval_runtime": 48.8399, "eval_samples_per_second": 41.503, "eval_steps_per_second": 5.201, "eval_wer": 0.3076367575374616, "step": 118900 }, { "epoch": 12.74, "learning_rate": 4.544054441260745e-05, "loss": 0.0886, "step": 119000 }, { "epoch": 12.74, "eval_loss": 0.45080724358558655, "eval_runtime": 48.7926, "eval_samples_per_second": 41.543, "eval_steps_per_second": 5.206, "eval_wer": 0.3066437985195884, "step": 119000 }, { "epoch": 12.75, "eval_loss": 0.445557177066803, "eval_runtime": 49.0576, "eval_samples_per_second": 41.319, "eval_steps_per_second": 5.178, "eval_wer": 0.309712944574833, "step": 119100 }, { "epoch": 12.76, "eval_loss": 0.4503107964992523, "eval_runtime": 49.0549, "eval_samples_per_second": 41.321, "eval_steps_per_second": 5.178, "eval_wer": 0.3078172955407113, "step": 119200 }, { "epoch": 12.77, "eval_loss": 0.4459659457206726, "eval_runtime": 49.8084, "eval_samples_per_second": 40.696, "eval_steps_per_second": 5.1, "eval_wer": 0.30808810254558583, "step": 119300 }, { "epoch": 12.78, "eval_loss": 0.4403787851333618, "eval_runtime": 48.9807, "eval_samples_per_second": 41.384, "eval_steps_per_second": 5.186, "eval_wer": 0.307997833543961, "step": 119400 }, { "epoch": 12.79, "learning_rate": 4.43660458452722e-05, "loss": 0.0897, "step": 119500 }, { "epoch": 12.79, "eval_loss": 0.43507125973701477, "eval_runtime": 49.5648, "eval_samples_per_second": 40.896, "eval_steps_per_second": 5.125, "eval_wer": 0.30998375157970753, "step": 119500 }, { "epoch": 12.81, "eval_loss": 0.44462278485298157, "eval_runtime": 48.5763, "eval_samples_per_second": 41.728, "eval_steps_per_second": 5.229, "eval_wer": 0.311969669615454, "step": 119600 }, { "epoch": 12.82, "eval_loss": 0.44070571660995483, "eval_runtime": 49.2374, "eval_samples_per_second": 41.168, "eval_steps_per_second": 5.159, "eval_wer": 0.30980321357645785, "step": 119700 }, { "epoch": 12.83, "eval_loss": 0.4405609667301178, "eval_runtime": 48.5684, "eval_samples_per_second": 41.735, "eval_steps_per_second": 5.23, "eval_wer": 0.30835890955046036, "step": 119800 }, { "epoch": 12.84, "eval_loss": 0.4491572678089142, "eval_runtime": 49.0594, "eval_samples_per_second": 41.317, "eval_steps_per_second": 5.177, "eval_wer": 0.30673406752121324, "step": 119900 }, { "epoch": 12.85, "learning_rate": 4.329369627507163e-05, "loss": 0.09, "step": 120000 }, { "epoch": 12.85, "eval_loss": 0.45461514592170715, "eval_runtime": 49.0505, "eval_samples_per_second": 41.325, "eval_steps_per_second": 5.178, "eval_wer": 0.30980321357645785, "step": 120000 }, { "epoch": 12.86, "eval_loss": 0.45472848415374756, "eval_runtime": 49.0834, "eval_samples_per_second": 41.297, "eval_steps_per_second": 5.175, "eval_wer": 0.3073659505325871, "step": 120100 }, { "epoch": 12.87, "eval_loss": 0.45165643095970154, "eval_runtime": 49.1082, "eval_samples_per_second": 41.276, "eval_steps_per_second": 5.172, "eval_wer": 0.31106697959920565, "step": 120200 }, { "epoch": 12.88, "eval_loss": 0.43198153376579285, "eval_runtime": 49.0197, "eval_samples_per_second": 41.351, "eval_steps_per_second": 5.182, "eval_wer": 0.30637299151471387, "step": 120300 }, { "epoch": 12.89, "eval_loss": 0.4293752610683441, "eval_runtime": 49.0833, "eval_samples_per_second": 41.297, "eval_steps_per_second": 5.175, "eval_wer": 0.3071854125293374, "step": 120400 }, { "epoch": 12.9, "learning_rate": 4.221919770773638e-05, "loss": 0.0898, "step": 120500 }, { "epoch": 12.9, "eval_loss": 0.44117698073387146, "eval_runtime": 49.2326, "eval_samples_per_second": 41.172, "eval_steps_per_second": 5.159, "eval_wer": 0.3050189564903412, "step": 120500 }, { "epoch": 12.91, "eval_loss": 0.4254050552845001, "eval_runtime": 49.3023, "eval_samples_per_second": 41.114, "eval_steps_per_second": 5.152, "eval_wer": 0.3073659505325871, "step": 120600 }, { "epoch": 12.92, "eval_loss": 0.4409028887748718, "eval_runtime": 48.4446, "eval_samples_per_second": 41.842, "eval_steps_per_second": 5.243, "eval_wer": 0.3070951435277126, "step": 120700 }, { "epoch": 12.93, "eval_loss": 0.4362035095691681, "eval_runtime": 49.258, "eval_samples_per_second": 41.151, "eval_steps_per_second": 5.157, "eval_wer": 0.3070951435277126, "step": 120800 }, { "epoch": 12.94, "eval_loss": 0.45788970589637756, "eval_runtime": 49.1783, "eval_samples_per_second": 41.217, "eval_steps_per_second": 5.165, "eval_wer": 0.30899079256183426, "step": 120900 }, { "epoch": 12.95, "learning_rate": 4.114469914040114e-05, "loss": 0.0892, "step": 121000 }, { "epoch": 12.95, "eval_loss": 0.44916099309921265, "eval_runtime": 49.252, "eval_samples_per_second": 41.156, "eval_steps_per_second": 5.157, "eval_wer": 0.30592164650658965, "step": 121000 }, { "epoch": 12.97, "eval_loss": 0.44036194682121277, "eval_runtime": 48.5298, "eval_samples_per_second": 41.768, "eval_steps_per_second": 5.234, "eval_wer": 0.3105253655894566, "step": 121100 }, { "epoch": 12.98, "eval_loss": 0.43648219108581543, "eval_runtime": 48.6252, "eval_samples_per_second": 41.686, "eval_steps_per_second": 5.224, "eval_wer": 0.3066437985195884, "step": 121200 }, { "epoch": 12.99, "eval_loss": 0.43682196736335754, "eval_runtime": 49.1606, "eval_samples_per_second": 41.232, "eval_steps_per_second": 5.167, "eval_wer": 0.30483841848709153, "step": 121300 }, { "epoch": 13.0, "eval_loss": 0.44096165895462036, "eval_runtime": 49.9358, "eval_samples_per_second": 40.592, "eval_steps_per_second": 5.087, "eval_wer": 0.3033038454594692, "step": 121400 }, { "epoch": 13.01, "learning_rate": 4.00702005730659e-05, "loss": 0.085, "step": 121500 }, { "epoch": 13.01, "eval_loss": 0.44503235816955566, "eval_runtime": 48.8269, "eval_samples_per_second": 41.514, "eval_steps_per_second": 5.202, "eval_wer": 0.30465788048384185, "step": 121500 }, { "epoch": 13.02, "eval_loss": 0.4633066952228546, "eval_runtime": 49.1922, "eval_samples_per_second": 41.206, "eval_steps_per_second": 5.163, "eval_wer": 0.3013179274237227, "step": 121600 }, { "epoch": 13.03, "eval_loss": 0.46001821756362915, "eval_runtime": 49.1699, "eval_samples_per_second": 41.224, "eval_steps_per_second": 5.166, "eval_wer": 0.3053800324968406, "step": 121700 }, { "epoch": 13.04, "eval_loss": 0.4540691375732422, "eval_runtime": 49.0697, "eval_samples_per_second": 41.309, "eval_steps_per_second": 5.176, "eval_wer": 0.3047481494854667, "step": 121800 }, { "epoch": 13.05, "eval_loss": 0.45461952686309814, "eval_runtime": 49.096, "eval_samples_per_second": 41.286, "eval_steps_per_second": 5.174, "eval_wer": 0.3058313775049648, "step": 121900 }, { "epoch": 13.06, "learning_rate": 3.8995702005730654e-05, "loss": 0.0791, "step": 122000 }, { "epoch": 13.06, "eval_loss": 0.4536155164241791, "eval_runtime": 48.7723, "eval_samples_per_second": 41.56, "eval_steps_per_second": 5.208, "eval_wer": 0.30447734248059216, "step": 122000 }, { "epoch": 13.07, "eval_loss": 0.4589266777038574, "eval_runtime": 49.0728, "eval_samples_per_second": 41.306, "eval_steps_per_second": 5.176, "eval_wer": 0.30655352951796355, "step": 122100 }, { "epoch": 13.08, "eval_loss": 0.4580624997615814, "eval_runtime": 49.0335, "eval_samples_per_second": 41.339, "eval_steps_per_second": 5.18, "eval_wer": 0.30574110850333996, "step": 122200 }, { "epoch": 13.09, "eval_loss": 0.45460861921310425, "eval_runtime": 48.9092, "eval_samples_per_second": 41.444, "eval_steps_per_second": 5.193, "eval_wer": 0.30483841848709153, "step": 122300 }, { "epoch": 13.1, "eval_loss": 0.46732285618782043, "eval_runtime": 48.8035, "eval_samples_per_second": 41.534, "eval_steps_per_second": 5.205, "eval_wer": 0.30059577541072396, "step": 122400 }, { "epoch": 13.12, "learning_rate": 3.792335243553008e-05, "loss": 0.0789, "step": 122500 }, { "epoch": 13.12, "eval_loss": 0.45507410168647766, "eval_runtime": 48.977, "eval_samples_per_second": 41.387, "eval_steps_per_second": 5.186, "eval_wer": 0.30185954143347177, "step": 122500 }, { "epoch": 13.13, "eval_loss": 0.4466601014137268, "eval_runtime": 48.675, "eval_samples_per_second": 41.644, "eval_steps_per_second": 5.218, "eval_wer": 0.3024914244448456, "step": 122600 }, { "epoch": 13.14, "eval_loss": 0.4593279957771301, "eval_runtime": 49.0944, "eval_samples_per_second": 41.288, "eval_steps_per_second": 5.174, "eval_wer": 0.3014984654269724, "step": 122700 }, { "epoch": 13.15, "eval_loss": 0.4597959518432617, "eval_runtime": 48.7201, "eval_samples_per_second": 41.605, "eval_steps_per_second": 5.213, "eval_wer": 0.3036649214659686, "step": 122800 }, { "epoch": 13.16, "eval_loss": 0.4531610608100891, "eval_runtime": 49.6573, "eval_samples_per_second": 40.82, "eval_steps_per_second": 5.115, "eval_wer": 0.3037551904675934, "step": 122900 }, { "epoch": 13.17, "learning_rate": 3.685100286532951e-05, "loss": 0.077, "step": 123000 }, { "epoch": 13.17, "eval_loss": 0.46069207787513733, "eval_runtime": 49.0496, "eval_samples_per_second": 41.325, "eval_steps_per_second": 5.178, "eval_wer": 0.3014984654269724, "step": 123000 }, { "epoch": 13.18, "eval_loss": 0.43852800130844116, "eval_runtime": 49.9159, "eval_samples_per_second": 40.608, "eval_steps_per_second": 5.089, "eval_wer": 0.3005055064090991, "step": 123100 }, { "epoch": 13.19, "eval_loss": 0.4589592218399048, "eval_runtime": 49.0752, "eval_samples_per_second": 41.304, "eval_steps_per_second": 5.176, "eval_wer": 0.3041162664740928, "step": 123200 }, { "epoch": 13.2, "eval_loss": 0.4358598589897156, "eval_runtime": 48.8305, "eval_samples_per_second": 41.511, "eval_steps_per_second": 5.202, "eval_wer": 0.30465788048384185, "step": 123300 }, { "epoch": 13.21, "eval_loss": 0.4457867443561554, "eval_runtime": 48.6567, "eval_samples_per_second": 41.659, "eval_steps_per_second": 5.22, "eval_wer": 0.3039357284708431, "step": 123400 }, { "epoch": 13.22, "learning_rate": 3.5776504297994264e-05, "loss": 0.0771, "step": 123500 }, { "epoch": 13.22, "eval_loss": 0.4506053924560547, "eval_runtime": 48.6615, "eval_samples_per_second": 41.655, "eval_steps_per_second": 5.22, "eval_wer": 0.30754648853583677, "step": 123500 }, { "epoch": 13.23, "eval_loss": 0.4456702768802643, "eval_runtime": 48.5857, "eval_samples_per_second": 41.72, "eval_steps_per_second": 5.228, "eval_wer": 0.30790756454233614, "step": 123600 }, { "epoch": 13.24, "eval_loss": 0.4448252022266388, "eval_runtime": 48.8145, "eval_samples_per_second": 41.525, "eval_steps_per_second": 5.203, "eval_wer": 0.30483841848709153, "step": 123700 }, { "epoch": 13.25, "eval_loss": 0.4397769272327423, "eval_runtime": 48.444, "eval_samples_per_second": 41.842, "eval_steps_per_second": 5.243, "eval_wer": 0.30357465246434373, "step": 123800 }, { "epoch": 13.27, "eval_loss": 0.451018363237381, "eval_runtime": 48.6358, "eval_samples_per_second": 41.677, "eval_steps_per_second": 5.222, "eval_wer": 0.30547030149846544, "step": 123900 }, { "epoch": 13.28, "learning_rate": 3.4702005730659024e-05, "loss": 0.0804, "step": 124000 }, { "epoch": 13.28, "eval_loss": 0.4506898522377014, "eval_runtime": 48.6155, "eval_samples_per_second": 41.695, "eval_steps_per_second": 5.225, "eval_wer": 0.30592164650658965, "step": 124000 }, { "epoch": 13.29, "eval_loss": 0.4543741047382355, "eval_runtime": 49.2524, "eval_samples_per_second": 41.155, "eval_steps_per_second": 5.157, "eval_wer": 0.3076367575374616, "step": 124100 }, { "epoch": 13.3, "eval_loss": 0.45340901613235474, "eval_runtime": 48.7151, "eval_samples_per_second": 41.609, "eval_steps_per_second": 5.214, "eval_wer": 0.30727568153096224, "step": 124200 }, { "epoch": 13.31, "eval_loss": 0.4441240131855011, "eval_runtime": 48.5073, "eval_samples_per_second": 41.788, "eval_steps_per_second": 5.236, "eval_wer": 0.30610218450983934, "step": 124300 }, { "epoch": 13.32, "eval_loss": 0.43914496898651123, "eval_runtime": 48.7563, "eval_samples_per_second": 41.574, "eval_steps_per_second": 5.21, "eval_wer": 0.30754648853583677, "step": 124400 }, { "epoch": 13.33, "learning_rate": 3.362750716332378e-05, "loss": 0.0774, "step": 124500 }, { "epoch": 13.33, "eval_loss": 0.45265689492225647, "eval_runtime": 49.1972, "eval_samples_per_second": 41.202, "eval_steps_per_second": 5.163, "eval_wer": 0.306282722513089, "step": 124500 }, { "epoch": 13.34, "eval_loss": 0.46383553743362427, "eval_runtime": 48.6998, "eval_samples_per_second": 41.622, "eval_steps_per_second": 5.216, "eval_wer": 0.30574110850333996, "step": 124600 }, { "epoch": 13.35, "eval_loss": 0.45413774251937866, "eval_runtime": 48.7189, "eval_samples_per_second": 41.606, "eval_steps_per_second": 5.214, "eval_wer": 0.30637299151471387, "step": 124700 }, { "epoch": 13.36, "eval_loss": 0.46165329217910767, "eval_runtime": 48.6222, "eval_samples_per_second": 41.689, "eval_steps_per_second": 5.224, "eval_wer": 0.3078172955407113, "step": 124800 }, { "epoch": 13.37, "eval_loss": 0.4584297239780426, "eval_runtime": 48.9274, "eval_samples_per_second": 41.429, "eval_steps_per_second": 5.191, "eval_wer": 0.3041162664740928, "step": 124900 }, { "epoch": 13.38, "learning_rate": 3.2555157593123205e-05, "loss": 0.0795, "step": 125000 }, { "epoch": 13.38, "eval_loss": 0.4663410782814026, "eval_runtime": 48.6633, "eval_samples_per_second": 41.654, "eval_steps_per_second": 5.22, "eval_wer": 0.30321357645784436, "step": 125000 }, { "epoch": 13.39, "eval_loss": 0.4545777440071106, "eval_runtime": 49.7034, "eval_samples_per_second": 40.782, "eval_steps_per_second": 5.11, "eval_wer": 0.3024914244448456, "step": 125100 }, { "epoch": 13.4, "eval_loss": 0.4616332948207855, "eval_runtime": 48.8306, "eval_samples_per_second": 41.511, "eval_steps_per_second": 5.202, "eval_wer": 0.3021303484383463, "step": 125200 }, { "epoch": 13.42, "eval_loss": 0.4602724611759186, "eval_runtime": 48.7695, "eval_samples_per_second": 41.563, "eval_steps_per_second": 5.208, "eval_wer": 0.30158873442859724, "step": 125300 }, { "epoch": 13.43, "eval_loss": 0.4615834057331085, "eval_runtime": 48.6683, "eval_samples_per_second": 41.649, "eval_steps_per_second": 5.219, "eval_wer": 0.30402599747246795, "step": 125400 }, { "epoch": 13.44, "learning_rate": 3.1480659025787965e-05, "loss": 0.0791, "step": 125500 }, { "epoch": 13.44, "eval_loss": 0.45479077100753784, "eval_runtime": 48.3791, "eval_samples_per_second": 41.898, "eval_steps_per_second": 5.25, "eval_wer": 0.3021303484383463, "step": 125500 }, { "epoch": 13.45, "eval_loss": 0.4559873640537262, "eval_runtime": 48.8585, "eval_samples_per_second": 41.487, "eval_steps_per_second": 5.199, "eval_wer": 0.3024914244448456, "step": 125600 }, { "epoch": 13.46, "eval_loss": 0.45155441761016846, "eval_runtime": 48.7439, "eval_samples_per_second": 41.585, "eval_steps_per_second": 5.211, "eval_wer": 0.3036649214659686, "step": 125700 }, { "epoch": 13.47, "eval_loss": 0.45003730058670044, "eval_runtime": 48.8595, "eval_samples_per_second": 41.486, "eval_steps_per_second": 5.199, "eval_wer": 0.3013179274237227, "step": 125800 }, { "epoch": 13.48, "eval_loss": 0.4539685547351837, "eval_runtime": 49.61, "eval_samples_per_second": 40.859, "eval_steps_per_second": 5.12, "eval_wer": 0.3008665824155985, "step": 125900 }, { "epoch": 13.49, "learning_rate": 3.0406160458452718e-05, "loss": 0.0776, "step": 126000 }, { "epoch": 13.49, "eval_loss": 0.4581133723258972, "eval_runtime": 48.613, "eval_samples_per_second": 41.697, "eval_steps_per_second": 5.225, "eval_wer": 0.30258169344647046, "step": 126000 }, { "epoch": 13.5, "eval_loss": 0.45983752608299255, "eval_runtime": 48.7145, "eval_samples_per_second": 41.61, "eval_steps_per_second": 5.214, "eval_wer": 0.30276223144972014, "step": 126100 }, { "epoch": 13.51, "eval_loss": 0.45870548486709595, "eval_runtime": 48.7095, "eval_samples_per_second": 41.614, "eval_steps_per_second": 5.215, "eval_wer": 0.30384545946921826, "step": 126200 }, { "epoch": 13.52, "eval_loss": 0.45144903659820557, "eval_runtime": 48.8311, "eval_samples_per_second": 41.51, "eval_steps_per_second": 5.202, "eval_wer": 0.30240115544322077, "step": 126300 }, { "epoch": 13.53, "eval_loss": 0.4495235085487366, "eval_runtime": 48.8596, "eval_samples_per_second": 41.486, "eval_steps_per_second": 5.199, "eval_wer": 0.30357465246434373, "step": 126400 }, { "epoch": 13.54, "learning_rate": 2.9331661891117477e-05, "loss": 0.0793, "step": 126500 }, { "epoch": 13.54, "eval_loss": 0.45561927556991577, "eval_runtime": 49.1727, "eval_samples_per_second": 41.222, "eval_steps_per_second": 5.165, "eval_wer": 0.30158873442859724, "step": 126500 }, { "epoch": 13.55, "eval_loss": 0.46026507019996643, "eval_runtime": 48.7412, "eval_samples_per_second": 41.587, "eval_steps_per_second": 5.211, "eval_wer": 0.3024914244448456, "step": 126600 }, { "epoch": 13.57, "eval_loss": 0.4496086835861206, "eval_runtime": 48.782, "eval_samples_per_second": 41.552, "eval_steps_per_second": 5.207, "eval_wer": 0.29951254739122585, "step": 126700 }, { "epoch": 13.58, "eval_loss": 0.44833648204803467, "eval_runtime": 48.9526, "eval_samples_per_second": 41.407, "eval_steps_per_second": 5.189, "eval_wer": 0.29689474634410545, "step": 126800 }, { "epoch": 13.59, "eval_loss": 0.4462050795555115, "eval_runtime": 48.8347, "eval_samples_per_second": 41.507, "eval_steps_per_second": 5.201, "eval_wer": 0.2979779743636035, "step": 126900 }, { "epoch": 13.6, "learning_rate": 2.8257163323782234e-05, "loss": 0.0816, "step": 127000 }, { "epoch": 13.6, "eval_loss": 0.4521482586860657, "eval_runtime": 48.794, "eval_samples_per_second": 41.542, "eval_steps_per_second": 5.206, "eval_wer": 0.2981585123668532, "step": 127000 }, { "epoch": 13.61, "eval_loss": 0.4580208659172058, "eval_runtime": 48.7962, "eval_samples_per_second": 41.54, "eval_steps_per_second": 5.205, "eval_wer": 0.30185954143347177, "step": 127100 }, { "epoch": 13.62, "eval_loss": 0.46691346168518066, "eval_runtime": 48.9324, "eval_samples_per_second": 41.424, "eval_steps_per_second": 5.191, "eval_wer": 0.3008665824155985, "step": 127200 }, { "epoch": 13.63, "eval_loss": 0.4513174295425415, "eval_runtime": 48.9146, "eval_samples_per_second": 41.44, "eval_steps_per_second": 5.193, "eval_wer": 0.3016790034302221, "step": 127300 }, { "epoch": 13.64, "eval_loss": 0.46024101972579956, "eval_runtime": 48.6915, "eval_samples_per_second": 41.629, "eval_steps_per_second": 5.217, "eval_wer": 0.3014984654269724, "step": 127400 }, { "epoch": 13.65, "learning_rate": 2.718266475644699e-05, "loss": 0.0779, "step": 127500 }, { "epoch": 13.65, "eval_loss": 0.45917895436286926, "eval_runtime": 48.782, "eval_samples_per_second": 41.552, "eval_steps_per_second": 5.207, "eval_wer": 0.2997833543961004, "step": 127500 }, { "epoch": 13.66, "eval_loss": 0.47004109621047974, "eval_runtime": 48.902, "eval_samples_per_second": 41.45, "eval_steps_per_second": 5.194, "eval_wer": 0.29806824336522836, "step": 127600 }, { "epoch": 13.67, "eval_loss": 0.4726985692977905, "eval_runtime": 48.8717, "eval_samples_per_second": 41.476, "eval_steps_per_second": 5.197, "eval_wer": 0.29779743636035383, "step": 127700 }, { "epoch": 13.68, "eval_loss": 0.45995599031448364, "eval_runtime": 49.2728, "eval_samples_per_second": 41.138, "eval_steps_per_second": 5.155, "eval_wer": 0.2983390503701029, "step": 127800 }, { "epoch": 13.69, "eval_loss": 0.44724515080451965, "eval_runtime": 48.727, "eval_samples_per_second": 41.599, "eval_steps_per_second": 5.213, "eval_wer": 0.29779743636035383, "step": 127900 }, { "epoch": 13.7, "learning_rate": 2.6108166189111746e-05, "loss": 0.0779, "step": 128000 }, { "epoch": 13.7, "eval_loss": 0.4483438730239868, "eval_runtime": 48.7121, "eval_samples_per_second": 41.612, "eval_steps_per_second": 5.214, "eval_wer": 0.29842931937172773, "step": 128000 }, { "epoch": 13.72, "eval_loss": 0.45116451382637024, "eval_runtime": 48.9634, "eval_samples_per_second": 41.398, "eval_steps_per_second": 5.188, "eval_wer": 0.2968044773424806, "step": 128100 }, { "epoch": 13.73, "eval_loss": 0.4549117386341095, "eval_runtime": 48.796, "eval_samples_per_second": 41.54, "eval_steps_per_second": 5.205, "eval_wer": 0.2987903953782271, "step": 128200 }, { "epoch": 13.74, "eval_loss": 0.45755627751350403, "eval_runtime": 49.8079, "eval_samples_per_second": 40.696, "eval_steps_per_second": 5.1, "eval_wer": 0.2992417403863513, "step": 128300 }, { "epoch": 13.75, "eval_loss": 0.4400174915790558, "eval_runtime": 48.596, "eval_samples_per_second": 41.711, "eval_steps_per_second": 5.227, "eval_wer": 0.2974363603538545, "step": 128400 }, { "epoch": 13.76, "learning_rate": 2.50336676217765e-05, "loss": 0.0793, "step": 128500 }, { "epoch": 13.76, "eval_loss": 0.4433426260948181, "eval_runtime": 48.6648, "eval_samples_per_second": 41.652, "eval_steps_per_second": 5.219, "eval_wer": 0.3008665824155985, "step": 128500 }, { "epoch": 13.77, "eval_loss": 0.44558921456336975, "eval_runtime": 48.7178, "eval_samples_per_second": 41.607, "eval_steps_per_second": 5.214, "eval_wer": 0.29824878136847804, "step": 128600 }, { "epoch": 13.78, "eval_loss": 0.4559650719165802, "eval_runtime": 48.5852, "eval_samples_per_second": 41.72, "eval_steps_per_second": 5.228, "eval_wer": 0.3019498104350966, "step": 128700 }, { "epoch": 13.79, "eval_loss": 0.45514196157455444, "eval_runtime": 48.8865, "eval_samples_per_second": 41.463, "eval_steps_per_second": 5.196, "eval_wer": 0.30077631341397365, "step": 128800 }, { "epoch": 13.8, "eval_loss": 0.45125389099121094, "eval_runtime": 48.9777, "eval_samples_per_second": 41.386, "eval_steps_per_second": 5.186, "eval_wer": 0.3006860444123488, "step": 128900 }, { "epoch": 13.81, "learning_rate": 2.3959169054441258e-05, "loss": 0.0769, "step": 129000 }, { "epoch": 13.81, "eval_loss": 0.45180532336235046, "eval_runtime": 48.7049, "eval_samples_per_second": 41.618, "eval_steps_per_second": 5.215, "eval_wer": 0.30077631341397365, "step": 129000 }, { "epoch": 13.82, "eval_loss": 0.45669108629226685, "eval_runtime": 48.6617, "eval_samples_per_second": 41.655, "eval_steps_per_second": 5.22, "eval_wer": 0.29806824336522836, "step": 129100 }, { "epoch": 13.83, "eval_loss": 0.4437228739261627, "eval_runtime": 48.6473, "eval_samples_per_second": 41.667, "eval_steps_per_second": 5.221, "eval_wer": 0.2985195883733526, "step": 129200 }, { "epoch": 13.84, "eval_loss": 0.4423811733722687, "eval_runtime": 49.8087, "eval_samples_per_second": 40.696, "eval_steps_per_second": 5.1, "eval_wer": 0.2969850153457303, "step": 129300 }, { "epoch": 13.85, "eval_loss": 0.44225621223449707, "eval_runtime": 48.5133, "eval_samples_per_second": 41.782, "eval_steps_per_second": 5.236, "eval_wer": 0.30095685141722334, "step": 129400 }, { "epoch": 13.87, "learning_rate": 2.2884670487106014e-05, "loss": 0.0785, "step": 129500 }, { "epoch": 13.87, "eval_loss": 0.44948408007621765, "eval_runtime": 48.6646, "eval_samples_per_second": 41.652, "eval_steps_per_second": 5.219, "eval_wer": 0.2998736233977252, "step": 129500 }, { "epoch": 13.88, "eval_loss": 0.4482867419719696, "eval_runtime": 48.676, "eval_samples_per_second": 41.643, "eval_steps_per_second": 5.218, "eval_wer": 0.29752662935547936, "step": 129600 }, { "epoch": 13.89, "eval_loss": 0.44850584864616394, "eval_runtime": 48.5728, "eval_samples_per_second": 41.731, "eval_steps_per_second": 5.229, "eval_wer": 0.2981585123668532, "step": 129700 }, { "epoch": 13.9, "eval_loss": 0.4428721070289612, "eval_runtime": 48.6015, "eval_samples_per_second": 41.707, "eval_steps_per_second": 5.226, "eval_wer": 0.29716555334898, "step": 129800 }, { "epoch": 13.91, "eval_loss": 0.4429783523082733, "eval_runtime": 48.8683, "eval_samples_per_second": 41.479, "eval_steps_per_second": 5.198, "eval_wer": 0.29581151832460734, "step": 129900 }, { "epoch": 13.92, "learning_rate": 2.181017191977077e-05, "loss": 0.0792, "step": 130000 }, { "epoch": 13.92, "eval_loss": 0.44945263862609863, "eval_runtime": 48.6546, "eval_samples_per_second": 41.661, "eval_steps_per_second": 5.22, "eval_wer": 0.2953601733164831, "step": 130000 }, { "epoch": 13.93, "eval_loss": 0.4485260546207428, "eval_runtime": 48.9845, "eval_samples_per_second": 41.38, "eval_steps_per_second": 5.185, "eval_wer": 0.2947282903051092, "step": 130100 }, { "epoch": 13.94, "eval_loss": 0.4395206570625305, "eval_runtime": 49.0973, "eval_samples_per_second": 41.285, "eval_steps_per_second": 5.173, "eval_wer": 0.29716555334898, "step": 130200 }, { "epoch": 13.95, "eval_loss": 0.43786346912384033, "eval_runtime": 48.7456, "eval_samples_per_second": 41.583, "eval_steps_per_second": 5.211, "eval_wer": 0.29734609135222967, "step": 130300 }, { "epoch": 13.96, "eval_loss": 0.44279754161834717, "eval_runtime": 48.6537, "eval_samples_per_second": 41.662, "eval_steps_per_second": 5.221, "eval_wer": 0.29888066437985195, "step": 130400 }, { "epoch": 13.97, "learning_rate": 2.0735673352435527e-05, "loss": 0.0795, "step": 130500 }, { "epoch": 13.97, "eval_loss": 0.43852099776268005, "eval_runtime": 48.7541, "eval_samples_per_second": 41.576, "eval_steps_per_second": 5.21, "eval_wer": 0.29996389239935006, "step": 130500 }, { "epoch": 13.98, "eval_loss": 0.4489758014678955, "eval_runtime": 48.8778, "eval_samples_per_second": 41.471, "eval_steps_per_second": 5.197, "eval_wer": 0.2983390503701029, "step": 130600 }, { "epoch": 13.99, "eval_loss": 0.45682230591773987, "eval_runtime": 48.7069, "eval_samples_per_second": 41.616, "eval_steps_per_second": 5.215, "eval_wer": 0.2969850153457303, "step": 130700 }, { "epoch": 14.0, "eval_loss": 0.4481572210788727, "eval_runtime": 48.9961, "eval_samples_per_second": 41.371, "eval_steps_per_second": 5.184, "eval_wer": 0.29626286333273155, "step": 130800 }, { "epoch": 14.01, "eval_loss": 0.44789794087409973, "eval_runtime": 48.6027, "eval_samples_per_second": 41.705, "eval_steps_per_second": 5.226, "eval_wer": 0.2961725943311067, "step": 130900 }, { "epoch": 14.03, "learning_rate": 1.9663323782234952e-05, "loss": 0.075, "step": 131000 }, { "epoch": 14.03, "eval_loss": 0.4565275013446808, "eval_runtime": 48.781, "eval_samples_per_second": 41.553, "eval_steps_per_second": 5.207, "eval_wer": 0.2968044773424806, "step": 131000 }, { "epoch": 14.04, "eval_loss": 0.46226829290390015, "eval_runtime": 48.8274, "eval_samples_per_second": 41.514, "eval_steps_per_second": 5.202, "eval_wer": 0.2961725943311067, "step": 131100 }, { "epoch": 14.05, "eval_loss": 0.4617317020893097, "eval_runtime": 48.5503, "eval_samples_per_second": 41.751, "eval_steps_per_second": 5.232, "eval_wer": 0.2965336703376061, "step": 131200 }, { "epoch": 14.06, "eval_loss": 0.46868252754211426, "eval_runtime": 49.7035, "eval_samples_per_second": 40.782, "eval_steps_per_second": 5.11, "eval_wer": 0.2949088283083589, "step": 131300 }, { "epoch": 14.07, "eval_loss": 0.47178399562835693, "eval_runtime": 48.788, "eval_samples_per_second": 41.547, "eval_steps_per_second": 5.206, "eval_wer": 0.29292291027261236, "step": 131400 }, { "epoch": 14.08, "learning_rate": 1.8590974212034384e-05, "loss": 0.0709, "step": 131500 }, { "epoch": 14.08, "eval_loss": 0.4720158278942108, "eval_runtime": 48.3508, "eval_samples_per_second": 41.923, "eval_steps_per_second": 5.253, "eval_wer": 0.2944574833002347, "step": 131500 }, { "epoch": 14.09, "eval_loss": 0.46036496758461, "eval_runtime": 48.6823, "eval_samples_per_second": 41.637, "eval_steps_per_second": 5.218, "eval_wer": 0.2952699043148583, "step": 131600 }, { "epoch": 14.1, "eval_loss": 0.46548134088516235, "eval_runtime": 48.9917, "eval_samples_per_second": 41.374, "eval_steps_per_second": 5.185, "eval_wer": 0.29545044231810796, "step": 131700 }, { "epoch": 14.11, "eval_loss": 0.4694814682006836, "eval_runtime": 48.632, "eval_samples_per_second": 41.68, "eval_steps_per_second": 5.223, "eval_wer": 0.29581151832460734, "step": 131800 }, { "epoch": 14.12, "eval_loss": 0.4666370153427124, "eval_runtime": 48.4823, "eval_samples_per_second": 41.809, "eval_steps_per_second": 5.239, "eval_wer": 0.29454775230185953, "step": 131900 }, { "epoch": 14.13, "learning_rate": 1.751647564469914e-05, "loss": 0.0705, "step": 132000 }, { "epoch": 14.13, "eval_loss": 0.460516095161438, "eval_runtime": 48.7139, "eval_samples_per_second": 41.61, "eval_steps_per_second": 5.214, "eval_wer": 0.2959017873262322, "step": 132000 }, { "epoch": 14.14, "eval_loss": 0.4581490755081177, "eval_runtime": 48.7404, "eval_samples_per_second": 41.588, "eval_steps_per_second": 5.211, "eval_wer": 0.2947282903051092, "step": 132100 }, { "epoch": 14.15, "eval_loss": 0.4597261846065521, "eval_runtime": 48.813, "eval_samples_per_second": 41.526, "eval_steps_per_second": 5.204, "eval_wer": 0.29481855930673406, "step": 132200 }, { "epoch": 14.16, "eval_loss": 0.4612421691417694, "eval_runtime": 48.6056, "eval_samples_per_second": 41.703, "eval_steps_per_second": 5.226, "eval_wer": 0.294276945296985, "step": 132300 }, { "epoch": 14.18, "eval_loss": 0.46105560660362244, "eval_runtime": 48.4486, "eval_samples_per_second": 41.838, "eval_steps_per_second": 5.243, "eval_wer": 0.2959017873262322, "step": 132400 }, { "epoch": 14.19, "learning_rate": 1.6441977077363896e-05, "loss": 0.0727, "step": 132500 }, { "epoch": 14.19, "eval_loss": 0.4569126069545746, "eval_runtime": 48.7541, "eval_samples_per_second": 41.576, "eval_steps_per_second": 5.21, "eval_wer": 0.29581151832460734, "step": 132500 }, { "epoch": 14.2, "eval_loss": 0.4556213319301605, "eval_runtime": 48.9259, "eval_samples_per_second": 41.43, "eval_steps_per_second": 5.192, "eval_wer": 0.2950893663116086, "step": 132600 }, { "epoch": 14.21, "eval_loss": 0.4596796929836273, "eval_runtime": 48.837, "eval_samples_per_second": 41.505, "eval_steps_per_second": 5.201, "eval_wer": 0.2955407113197328, "step": 132700 }, { "epoch": 14.22, "eval_loss": 0.4472346305847168, "eval_runtime": 48.874, "eval_samples_per_second": 41.474, "eval_steps_per_second": 5.197, "eval_wer": 0.2934645242823614, "step": 132800 }, { "epoch": 14.23, "eval_loss": 0.4573153853416443, "eval_runtime": 48.9521, "eval_samples_per_second": 41.408, "eval_steps_per_second": 5.189, "eval_wer": 0.294276945296985, "step": 132900 }, { "epoch": 14.24, "learning_rate": 1.5367478510028653e-05, "loss": 0.0723, "step": 133000 }, { "epoch": 14.24, "eval_loss": 0.4571533501148224, "eval_runtime": 48.8128, "eval_samples_per_second": 41.526, "eval_steps_per_second": 5.204, "eval_wer": 0.294276945296985, "step": 133000 }, { "epoch": 14.25, "eval_loss": 0.45821666717529297, "eval_runtime": 48.7097, "eval_samples_per_second": 41.614, "eval_steps_per_second": 5.215, "eval_wer": 0.29563098032135765, "step": 133100 }, { "epoch": 14.26, "eval_loss": 0.4598552882671356, "eval_runtime": 48.9917, "eval_samples_per_second": 41.374, "eval_steps_per_second": 5.185, "eval_wer": 0.2968044773424806, "step": 133200 }, { "epoch": 14.27, "eval_loss": 0.46326953172683716, "eval_runtime": 48.9832, "eval_samples_per_second": 41.382, "eval_steps_per_second": 5.185, "eval_wer": 0.2961725943311067, "step": 133300 }, { "epoch": 14.28, "eval_loss": 0.46043142676353455, "eval_runtime": 48.7305, "eval_samples_per_second": 41.596, "eval_steps_per_second": 5.212, "eval_wer": 0.29716555334898, "step": 133400 }, { "epoch": 14.29, "learning_rate": 1.429512893982808e-05, "loss": 0.071, "step": 133500 }, { "epoch": 14.29, "eval_loss": 0.45868054032325745, "eval_runtime": 48.925, "eval_samples_per_second": 41.431, "eval_steps_per_second": 5.192, "eval_wer": 0.29707528434735514, "step": 133500 }, { "epoch": 14.3, "eval_loss": 0.4598270058631897, "eval_runtime": 48.8352, "eval_samples_per_second": 41.507, "eval_steps_per_second": 5.201, "eval_wer": 0.2972558223506048, "step": 133600 }, { "epoch": 14.31, "eval_loss": 0.4579356610774994, "eval_runtime": 48.7823, "eval_samples_per_second": 41.552, "eval_steps_per_second": 5.207, "eval_wer": 0.2976168983571042, "step": 133700 }, { "epoch": 14.33, "eval_loss": 0.4539426565170288, "eval_runtime": 49.092, "eval_samples_per_second": 41.29, "eval_steps_per_second": 5.174, "eval_wer": 0.29689474634410545, "step": 133800 }, { "epoch": 14.34, "eval_loss": 0.46281492710113525, "eval_runtime": 48.5974, "eval_samples_per_second": 41.71, "eval_steps_per_second": 5.227, "eval_wer": 0.29608232532948187, "step": 133900 }, { "epoch": 14.35, "learning_rate": 1.3220630372492836e-05, "loss": 0.0703, "step": 134000 }, { "epoch": 14.35, "eval_loss": 0.46268972754478455, "eval_runtime": 48.6114, "eval_samples_per_second": 41.698, "eval_steps_per_second": 5.225, "eval_wer": 0.2974363603538545, "step": 134000 }, { "epoch": 14.36, "eval_loss": 0.4611077606678009, "eval_runtime": 48.7363, "eval_samples_per_second": 41.591, "eval_steps_per_second": 5.212, "eval_wer": 0.2974363603538545, "step": 134100 }, { "epoch": 14.37, "eval_loss": 0.4607299268245697, "eval_runtime": 48.8318, "eval_samples_per_second": 41.51, "eval_steps_per_second": 5.202, "eval_wer": 0.297707167358729, "step": 134200 }, { "epoch": 14.38, "eval_loss": 0.46377691626548767, "eval_runtime": 48.5242, "eval_samples_per_second": 41.773, "eval_steps_per_second": 5.235, "eval_wer": 0.2983390503701029, "step": 134300 }, { "epoch": 14.39, "eval_loss": 0.46281489729881287, "eval_runtime": 48.4537, "eval_samples_per_second": 41.834, "eval_steps_per_second": 5.242, "eval_wer": 0.29689474634410545, "step": 134400 }, { "epoch": 14.4, "learning_rate": 1.2146131805157592e-05, "loss": 0.0736, "step": 134500 }, { "epoch": 14.4, "eval_loss": 0.45427754521369934, "eval_runtime": 49.0592, "eval_samples_per_second": 41.317, "eval_steps_per_second": 5.177, "eval_wer": 0.2965336703376061, "step": 134500 }, { "epoch": 14.41, "eval_loss": 0.4584720730781555, "eval_runtime": 48.8757, "eval_samples_per_second": 41.473, "eval_steps_per_second": 5.197, "eval_wer": 0.29626286333273155, "step": 134600 }, { "epoch": 14.42, "eval_loss": 0.4636397361755371, "eval_runtime": 48.5914, "eval_samples_per_second": 41.715, "eval_steps_per_second": 5.227, "eval_wer": 0.29499909730998375, "step": 134700 }, { "epoch": 14.43, "eval_loss": 0.463554710149765, "eval_runtime": 48.5443, "eval_samples_per_second": 41.756, "eval_steps_per_second": 5.232, "eval_wer": 0.2963531323343564, "step": 134800 }, { "epoch": 14.44, "eval_loss": 0.4630184769630432, "eval_runtime": 48.4957, "eval_samples_per_second": 41.798, "eval_steps_per_second": 5.238, "eval_wer": 0.29581151832460734, "step": 134900 }, { "epoch": 14.45, "learning_rate": 1.107163323782235e-05, "loss": 0.0715, "step": 135000 }, { "epoch": 14.45, "eval_loss": 0.46107855439186096, "eval_runtime": 48.3967, "eval_samples_per_second": 41.883, "eval_steps_per_second": 5.248, "eval_wer": 0.2968044773424806, "step": 135000 }, { "epoch": 14.46, "eval_loss": 0.4633425176143646, "eval_runtime": 48.7522, "eval_samples_per_second": 41.578, "eval_steps_per_second": 5.21, "eval_wer": 0.2966239393392309, "step": 135100 }, { "epoch": 14.48, "eval_loss": 0.46640947461128235, "eval_runtime": 48.7469, "eval_samples_per_second": 41.582, "eval_steps_per_second": 5.211, "eval_wer": 0.2953601733164831, "step": 135200 }, { "epoch": 14.49, "eval_loss": 0.46697285771369934, "eval_runtime": 48.3158, "eval_samples_per_second": 41.953, "eval_steps_per_second": 5.257, "eval_wer": 0.29454775230185953, "step": 135300 }, { "epoch": 14.5, "eval_loss": 0.4637785255908966, "eval_runtime": 48.5635, "eval_samples_per_second": 41.739, "eval_steps_per_second": 5.23, "eval_wer": 0.29608232532948187, "step": 135400 }, { "epoch": 14.51, "learning_rate": 9.997134670487106e-06, "loss": 0.073, "step": 135500 }, { "epoch": 14.51, "eval_loss": 0.46345365047454834, "eval_runtime": 48.4562, "eval_samples_per_second": 41.832, "eval_steps_per_second": 5.242, "eval_wer": 0.2965336703376061, "step": 135500 }, { "epoch": 14.52, "eval_loss": 0.4638654291629791, "eval_runtime": 48.5254, "eval_samples_per_second": 41.772, "eval_steps_per_second": 5.234, "eval_wer": 0.29563098032135765, "step": 135600 }, { "epoch": 14.53, "eval_loss": 0.461653470993042, "eval_runtime": 48.3998, "eval_samples_per_second": 41.88, "eval_steps_per_second": 5.248, "eval_wer": 0.29481855930673406, "step": 135700 }, { "epoch": 14.54, "eval_loss": 0.46086516976356506, "eval_runtime": 48.3403, "eval_samples_per_second": 41.932, "eval_steps_per_second": 5.254, "eval_wer": 0.29328398627911173, "step": 135800 }, { "epoch": 14.55, "eval_loss": 0.4613838493824005, "eval_runtime": 49.0954, "eval_samples_per_second": 41.287, "eval_steps_per_second": 5.174, "eval_wer": 0.2947282903051092, "step": 135900 }, { "epoch": 14.56, "learning_rate": 8.926934097421202e-06, "loss": 0.0717, "step": 136000 }, { "epoch": 14.56, "eval_loss": 0.4566675126552582, "eval_runtime": 48.7004, "eval_samples_per_second": 41.622, "eval_steps_per_second": 5.216, "eval_wer": 0.29581151832460734, "step": 136000 }, { "epoch": 14.57, "eval_loss": 0.4615228474140167, "eval_runtime": 48.4673, "eval_samples_per_second": 41.822, "eval_steps_per_second": 5.241, "eval_wer": 0.2933742552807366, "step": 136100 }, { "epoch": 14.58, "eval_loss": 0.4605715572834015, "eval_runtime": 48.7692, "eval_samples_per_second": 41.563, "eval_steps_per_second": 5.208, "eval_wer": 0.29292291027261236, "step": 136200 }, { "epoch": 14.59, "eval_loss": 0.4651778042316437, "eval_runtime": 48.3037, "eval_samples_per_second": 41.964, "eval_steps_per_second": 5.258, "eval_wer": 0.2933742552807366, "step": 136300 }, { "epoch": 14.6, "eval_loss": 0.466376394033432, "eval_runtime": 48.4015, "eval_samples_per_second": 41.879, "eval_steps_per_second": 5.248, "eval_wer": 0.2933742552807366, "step": 136400 }, { "epoch": 14.61, "learning_rate": 7.852435530085958e-06, "loss": 0.0717, "step": 136500 }, { "epoch": 14.61, "eval_loss": 0.4657481908798218, "eval_runtime": 49.5201, "eval_samples_per_second": 40.933, "eval_steps_per_second": 5.129, "eval_wer": 0.2922910272612385, "step": 136500 }, { "epoch": 14.63, "eval_loss": 0.46331438422203064, "eval_runtime": 48.1829, "eval_samples_per_second": 42.069, "eval_steps_per_second": 5.272, "eval_wer": 0.29310344827586204, "step": 136600 }, { "epoch": 14.64, "eval_loss": 0.4623650014400482, "eval_runtime": 48.4558, "eval_samples_per_second": 41.832, "eval_steps_per_second": 5.242, "eval_wer": 0.294276945296985, "step": 136700 }, { "epoch": 14.65, "eval_loss": 0.46153533458709717, "eval_runtime": 48.2857, "eval_samples_per_second": 41.979, "eval_steps_per_second": 5.26, "eval_wer": 0.2949088283083589, "step": 136800 }, { "epoch": 14.66, "eval_loss": 0.46194565296173096, "eval_runtime": 48.511, "eval_samples_per_second": 41.784, "eval_steps_per_second": 5.236, "eval_wer": 0.2930131792742372, "step": 136900 }, { "epoch": 14.67, "learning_rate": 6.777936962750715e-06, "loss": 0.0707, "step": 137000 }, { "epoch": 14.67, "eval_loss": 0.4607996642589569, "eval_runtime": 48.4004, "eval_samples_per_second": 41.88, "eval_steps_per_second": 5.248, "eval_wer": 0.29355479328398626, "step": 137000 }, { "epoch": 14.68, "eval_loss": 0.4615156948566437, "eval_runtime": 48.1236, "eval_samples_per_second": 42.121, "eval_steps_per_second": 5.278, "eval_wer": 0.2944574833002347, "step": 137100 }, { "epoch": 14.69, "eval_loss": 0.4605298340320587, "eval_runtime": 48.3679, "eval_samples_per_second": 41.908, "eval_steps_per_second": 5.251, "eval_wer": 0.2940964072937353, "step": 137200 }, { "epoch": 14.7, "eval_loss": 0.4598088562488556, "eval_runtime": 48.3883, "eval_samples_per_second": 41.89, "eval_steps_per_second": 5.249, "eval_wer": 0.29310344827586204, "step": 137300 }, { "epoch": 14.71, "eval_loss": 0.4595940113067627, "eval_runtime": 48.3856, "eval_samples_per_second": 41.893, "eval_steps_per_second": 5.249, "eval_wer": 0.294276945296985, "step": 137400 }, { "epoch": 14.72, "learning_rate": 5.703438395415472e-06, "loss": 0.0694, "step": 137500 }, { "epoch": 14.72, "eval_loss": 0.4623918831348419, "eval_runtime": 48.1674, "eval_samples_per_second": 42.082, "eval_steps_per_second": 5.273, "eval_wer": 0.2927423722693627, "step": 137500 }, { "epoch": 14.73, "eval_loss": 0.46141380071640015, "eval_runtime": 48.7535, "eval_samples_per_second": 41.576, "eval_steps_per_second": 5.21, "eval_wer": 0.29310344827586204, "step": 137600 }, { "epoch": 14.74, "eval_loss": 0.4621369540691376, "eval_runtime": 48.3733, "eval_samples_per_second": 41.903, "eval_steps_per_second": 5.251, "eval_wer": 0.29238129626286335, "step": 137700 }, { "epoch": 14.75, "eval_loss": 0.4588609039783478, "eval_runtime": 48.512, "eval_samples_per_second": 41.783, "eval_steps_per_second": 5.236, "eval_wer": 0.292020220256364, "step": 137800 }, { "epoch": 14.76, "eval_loss": 0.4590286314487457, "eval_runtime": 48.3051, "eval_samples_per_second": 41.962, "eval_steps_per_second": 5.258, "eval_wer": 0.29256183426611304, "step": 137900 }, { "epoch": 14.78, "learning_rate": 4.6310888252149e-06, "loss": 0.0706, "step": 138000 }, { "epoch": 14.78, "eval_loss": 0.4587528705596924, "eval_runtime": 48.6184, "eval_samples_per_second": 41.692, "eval_steps_per_second": 5.224, "eval_wer": 0.29310344827586204, "step": 138000 }, { "epoch": 14.79, "eval_loss": 0.4583205282688141, "eval_runtime": 48.382, "eval_samples_per_second": 41.896, "eval_steps_per_second": 5.25, "eval_wer": 0.29283264127098757, "step": 138100 }, { "epoch": 14.8, "eval_loss": 0.4552071690559387, "eval_runtime": 48.5176, "eval_samples_per_second": 41.779, "eval_steps_per_second": 5.235, "eval_wer": 0.2933742552807366, "step": 138200 }, { "epoch": 14.81, "eval_loss": 0.45508986711502075, "eval_runtime": 48.381, "eval_samples_per_second": 41.897, "eval_steps_per_second": 5.25, "eval_wer": 0.2922910272612385, "step": 138300 }, { "epoch": 14.82, "eval_loss": 0.4554976224899292, "eval_runtime": 48.4911, "eval_samples_per_second": 41.801, "eval_steps_per_second": 5.238, "eval_wer": 0.2927423722693627, "step": 138400 }, { "epoch": 14.83, "learning_rate": 3.5565902578796557e-06, "loss": 0.0717, "step": 138500 }, { "epoch": 14.83, "eval_loss": 0.45470017194747925, "eval_runtime": 48.872, "eval_samples_per_second": 41.476, "eval_steps_per_second": 5.197, "eval_wer": 0.2930131792742372, "step": 138500 }, { "epoch": 14.84, "eval_loss": 0.45462867617607117, "eval_runtime": 48.527, "eval_samples_per_second": 41.771, "eval_steps_per_second": 5.234, "eval_wer": 0.2930131792742372, "step": 138600 }, { "epoch": 14.85, "eval_loss": 0.45525601506233215, "eval_runtime": 48.4224, "eval_samples_per_second": 41.861, "eval_steps_per_second": 5.246, "eval_wer": 0.2933742552807366, "step": 138700 }, { "epoch": 14.86, "eval_loss": 0.4553750157356262, "eval_runtime": 49.4095, "eval_samples_per_second": 41.025, "eval_steps_per_second": 5.141, "eval_wer": 0.29238129626286335, "step": 138800 }, { "epoch": 14.87, "eval_loss": 0.4572896361351013, "eval_runtime": 48.7188, "eval_samples_per_second": 41.606, "eval_steps_per_second": 5.214, "eval_wer": 0.29238129626286335, "step": 138900 }, { "epoch": 14.88, "learning_rate": 2.4820916905444123e-06, "loss": 0.0722, "step": 139000 }, { "epoch": 14.88, "eval_loss": 0.4582221806049347, "eval_runtime": 48.6094, "eval_samples_per_second": 41.7, "eval_steps_per_second": 5.225, "eval_wer": 0.2927423722693627, "step": 139000 }, { "epoch": 14.89, "eval_loss": 0.45864611864089966, "eval_runtime": 48.4648, "eval_samples_per_second": 41.824, "eval_steps_per_second": 5.241, "eval_wer": 0.29256183426611304, "step": 139100 }, { "epoch": 14.9, "eval_loss": 0.4569910168647766, "eval_runtime": 48.3017, "eval_samples_per_second": 41.965, "eval_steps_per_second": 5.259, "eval_wer": 0.29256183426611304, "step": 139200 }, { "epoch": 14.91, "eval_loss": 0.45708757638931274, "eval_runtime": 49.3455, "eval_samples_per_second": 41.078, "eval_steps_per_second": 5.147, "eval_wer": 0.2922910272612385, "step": 139300 }, { "epoch": 14.93, "eval_loss": 0.45643165707588196, "eval_runtime": 48.5858, "eval_samples_per_second": 41.72, "eval_steps_per_second": 5.228, "eval_wer": 0.2924715652644882, "step": 139400 }, { "epoch": 14.94, "learning_rate": 1.4075931232091689e-06, "loss": 0.0698, "step": 139500 }, { "epoch": 14.94, "eval_loss": 0.45725566148757935, "eval_runtime": 48.4887, "eval_samples_per_second": 41.804, "eval_steps_per_second": 5.238, "eval_wer": 0.2927423722693627, "step": 139500 }, { "epoch": 14.95, "eval_loss": 0.457427054643631, "eval_runtime": 48.4081, "eval_samples_per_second": 41.873, "eval_steps_per_second": 5.247, "eval_wer": 0.2927423722693627, "step": 139600 }, { "epoch": 14.96, "eval_loss": 0.4572872817516327, "eval_runtime": 48.5718, "eval_samples_per_second": 41.732, "eval_steps_per_second": 5.229, "eval_wer": 0.2926521032677379, "step": 139700 }, { "epoch": 14.97, "eval_loss": 0.45759284496307373, "eval_runtime": 48.8708, "eval_samples_per_second": 41.477, "eval_steps_per_second": 5.197, "eval_wer": 0.2921104892579888, "step": 139800 }, { "epoch": 14.98, "eval_loss": 0.45777422189712524, "eval_runtime": 48.4515, "eval_samples_per_second": 41.836, "eval_steps_per_second": 5.242, "eval_wer": 0.2922910272612385, "step": 139900 }, { "epoch": 14.99, "learning_rate": 3.330945558739255e-07, "loss": 0.0705, "step": 140000 }, { "epoch": 14.99, "eval_loss": 0.45787951350212097, "eval_runtime": 48.5181, "eval_samples_per_second": 41.778, "eval_steps_per_second": 5.235, "eval_wer": 0.29283264127098757, "step": 140000 }, { "epoch": 15.0, "eval_loss": 0.4578445553779602, "eval_runtime": 48.7019, "eval_samples_per_second": 41.621, "eval_steps_per_second": 5.215, "eval_wer": 0.2926521032677379, "step": 140100 }, { "epoch": 15.0, "step": 140100, "total_flos": 7.232425156722584e+20, "train_loss": 0.23010640207313793, "train_runtime": 407183.7095, "train_samples_per_second": 11.011, "train_steps_per_second": 0.344 } ], "max_steps": 140100, "num_train_epochs": 15, "total_flos": 7.232425156722584e+20, "trial_name": null, "trial_params": null }