diff --git "a/trainer_state.json" "b/trainer_state.json" --- "a/trainer_state.json" +++ "b/trainer_state.json" @@ -1,8 +1,8 @@ { "best_metric": null, "best_model_checkpoint": null, - "epoch": 19.007506666666668, - "global_step": 20000, + "epoch": 56.002826666666664, + "global_step": 57500, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, @@ -12366,11 +12366,23186 @@ "eval_steps_per_second": 3.51, "eval_wer": 0.12542515025858453, "step": 20000 + }, + { + "epoch": 19.01, + "learning_rate": 7.432297297297298e-05, + "loss": 0.268, + "step": 20010 + }, + { + "epoch": 19.01, + "learning_rate": 7.430945945945946e-05, + "loss": 0.2439, + "step": 20020 + }, + { + "epoch": 19.01, + "learning_rate": 7.429594594594596e-05, + "loss": 0.2271, + "step": 20030 + }, + { + "epoch": 19.01, + "learning_rate": 7.428243243243244e-05, + "loss": 0.2142, + "step": 20040 + }, + { + "epoch": 19.01, + "learning_rate": 7.426891891891892e-05, + "loss": 0.2386, + "step": 20050 + }, + { + "epoch": 19.01, + "learning_rate": 7.425540540540541e-05, + "loss": 0.543, + "step": 20060 + }, + { + "epoch": 19.01, + "learning_rate": 7.42418918918919e-05, + "loss": 0.4487, + "step": 20070 + }, + { + "epoch": 19.01, + "learning_rate": 7.422837837837839e-05, + "loss": 0.369, + "step": 20080 + }, + { + "epoch": 19.01, + "learning_rate": 7.421486486486487e-05, + "loss": 0.3811, + "step": 20090 + }, + { + "epoch": 19.01, + "learning_rate": 7.420135135135135e-05, + "loss": 0.5954, + "step": 20100 + }, + { + "epoch": 19.01, + "learning_rate": 7.418783783783783e-05, + "loss": 0.3521, + "step": 20110 + }, + { + "epoch": 19.01, + "learning_rate": 7.417432432432433e-05, + "loss": 0.2702, + "step": 20120 + }, + { + "epoch": 19.01, + "learning_rate": 7.416081081081081e-05, + "loss": 0.3522, + "step": 20130 + }, + { + "epoch": 19.01, + "learning_rate": 7.41472972972973e-05, + "loss": 0.451, + "step": 20140 + }, + { + "epoch": 19.01, + "learning_rate": 7.413378378378378e-05, + "loss": 0.4276, + "step": 20150 + }, + { + "epoch": 19.01, + "learning_rate": 7.412027027027028e-05, + "loss": 0.4072, + "step": 20160 + }, + { + "epoch": 19.01, + "learning_rate": 7.410675675675676e-05, + "loss": 0.3231, + "step": 20170 + }, + { + "epoch": 19.01, + "learning_rate": 7.409324324324325e-05, + "loss": 0.3499, + "step": 20180 + }, + { + "epoch": 19.01, + "learning_rate": 7.407972972972973e-05, + "loss": 0.3187, + "step": 20190 + }, + { + "epoch": 19.01, + "learning_rate": 7.406621621621623e-05, + "loss": 0.2682, + "step": 20200 + }, + { + "epoch": 19.01, + "learning_rate": 7.405270270270271e-05, + "loss": 0.2492, + "step": 20210 + }, + { + "epoch": 19.01, + "learning_rate": 7.403918918918919e-05, + "loss": 0.2007, + "step": 20220 + }, + { + "epoch": 19.01, + "learning_rate": 7.402567567567567e-05, + "loss": 0.3584, + "step": 20230 + }, + { + "epoch": 19.01, + "learning_rate": 7.401216216216217e-05, + "loss": 0.7601, + "step": 20240 + }, + { + "epoch": 19.01, + "learning_rate": 7.399864864864865e-05, + "loss": 0.2866, + "step": 20250 + }, + { + "epoch": 19.01, + "learning_rate": 7.398513513513514e-05, + "loss": 0.2139, + "step": 20260 + }, + { + "epoch": 19.01, + "learning_rate": 7.397162162162162e-05, + "loss": 0.4415, + "step": 20270 + }, + { + "epoch": 19.01, + "learning_rate": 7.395810810810812e-05, + "loss": 0.3176, + "step": 20280 + }, + { + "epoch": 19.01, + "learning_rate": 7.39445945945946e-05, + "loss": 0.3646, + "step": 20290 + }, + { + "epoch": 19.01, + "learning_rate": 7.393108108108109e-05, + "loss": 0.4352, + "step": 20300 + }, + { + "epoch": 19.01, + "learning_rate": 7.391756756756757e-05, + "loss": 0.4188, + "step": 20310 + }, + { + "epoch": 19.01, + "learning_rate": 7.390405405405405e-05, + "loss": 0.2299, + "step": 20320 + }, + { + "epoch": 19.01, + "learning_rate": 7.389054054054054e-05, + "loss": 0.4064, + "step": 20330 + }, + { + "epoch": 19.01, + "learning_rate": 7.387702702702703e-05, + "loss": 0.3626, + "step": 20340 + }, + { + "epoch": 19.01, + "learning_rate": 7.386351351351351e-05, + "loss": 0.4859, + "step": 20350 + }, + { + "epoch": 19.01, + "learning_rate": 7.385e-05, + "loss": 0.5692, + "step": 20360 + }, + { + "epoch": 19.01, + "learning_rate": 7.383648648648649e-05, + "loss": 0.4183, + "step": 20370 + }, + { + "epoch": 19.01, + "learning_rate": 7.382297297297298e-05, + "loss": 0.665, + "step": 20380 + }, + { + "epoch": 19.01, + "learning_rate": 7.380945945945946e-05, + "loss": 0.5323, + "step": 20390 + }, + { + "epoch": 19.01, + "learning_rate": 7.379594594594596e-05, + "loss": 0.6536, + "step": 20400 + }, + { + "epoch": 19.01, + "learning_rate": 7.378243243243244e-05, + "loss": 0.6767, + "step": 20410 + }, + { + "epoch": 19.01, + "learning_rate": 7.376891891891893e-05, + "loss": 0.4806, + "step": 20420 + }, + { + "epoch": 19.01, + "learning_rate": 7.375540540540541e-05, + "loss": 0.5395, + "step": 20430 + }, + { + "epoch": 19.01, + "learning_rate": 7.37418918918919e-05, + "loss": 0.4833, + "step": 20440 + }, + { + "epoch": 19.01, + "learning_rate": 7.372837837837838e-05, + "loss": 0.4534, + "step": 20450 + }, + { + "epoch": 19.01, + "learning_rate": 7.371486486486486e-05, + "loss": 0.6846, + "step": 20460 + }, + { + "epoch": 20.0, + "learning_rate": 7.370135135135135e-05, + "loss": 0.4885, + "step": 20470 + }, + { + "epoch": 20.0, + "learning_rate": 7.368783783783783e-05, + "loss": 0.5059, + "step": 20480 + }, + { + "epoch": 20.0, + "learning_rate": 7.367432432432433e-05, + "loss": 0.5352, + "step": 20490 + }, + { + "epoch": 20.0, + "learning_rate": 7.366081081081081e-05, + "loss": 0.4575, + "step": 20500 + }, + { + "epoch": 20.0, + "eval_loss": 0.12828099727630615, + "eval_runtime": 129.9704, + "eval_samples_per_second": 27.76, + "eval_steps_per_second": 3.47, + "eval_wer": 0.13604808274705307, + "step": 20500 + }, + { + "epoch": 20.0, + "learning_rate": 7.36472972972973e-05, + "loss": 0.5025, + "step": 20510 + }, + { + "epoch": 20.0, + "learning_rate": 7.363378378378378e-05, + "loss": 0.5135, + "step": 20520 + }, + { + "epoch": 20.0, + "learning_rate": 7.362027027027028e-05, + "loss": 0.6385, + "step": 20530 + }, + { + "epoch": 20.0, + "learning_rate": 7.360675675675676e-05, + "loss": 0.4386, + "step": 20540 + }, + { + "epoch": 20.0, + "learning_rate": 7.359324324324325e-05, + "loss": 0.5307, + "step": 20550 + }, + { + "epoch": 20.0, + "learning_rate": 7.357972972972974e-05, + "loss": 0.5175, + "step": 20560 + }, + { + "epoch": 20.0, + "learning_rate": 7.356621621621622e-05, + "loss": 0.4435, + "step": 20570 + }, + { + "epoch": 20.0, + "learning_rate": 7.35527027027027e-05, + "loss": 0.4313, + "step": 20580 + }, + { + "epoch": 20.0, + "learning_rate": 7.353918918918919e-05, + "loss": 0.2996, + "step": 20590 + }, + { + "epoch": 20.0, + "learning_rate": 7.352567567567567e-05, + "loss": 0.2915, + "step": 20600 + }, + { + "epoch": 20.0, + "learning_rate": 7.351216216216217e-05, + "loss": 0.3092, + "step": 20610 + }, + { + "epoch": 20.0, + "learning_rate": 7.349864864864865e-05, + "loss": 0.5326, + "step": 20620 + }, + { + "epoch": 20.0, + "learning_rate": 7.348513513513514e-05, + "loss": 1.2507, + "step": 20630 + }, + { + "epoch": 20.0, + "learning_rate": 7.347162162162162e-05, + "loss": 1.9339, + "step": 20640 + }, + { + "epoch": 20.0, + "learning_rate": 7.345810810810812e-05, + "loss": 2.5969, + "step": 20650 + }, + { + "epoch": 20.0, + "learning_rate": 7.34445945945946e-05, + "loss": 2.4496, + "step": 20660 + }, + { + "epoch": 20.0, + "learning_rate": 7.34310810810811e-05, + "loss": 2.5993, + "step": 20670 + }, + { + "epoch": 20.0, + "learning_rate": 7.341756756756758e-05, + "loss": 2.159, + "step": 20680 + }, + { + "epoch": 20.0, + "learning_rate": 7.340405405405406e-05, + "loss": 1.732, + "step": 20690 + }, + { + "epoch": 20.0, + "learning_rate": 7.339054054054054e-05, + "loss": 1.22, + "step": 20700 + }, + { + "epoch": 20.0, + "learning_rate": 7.337702702702703e-05, + "loss": 0.6503, + "step": 20710 + }, + { + "epoch": 20.0, + "learning_rate": 7.336351351351351e-05, + "loss": 0.1789, + "step": 20720 + }, + { + "epoch": 20.0, + "learning_rate": 7.335000000000001e-05, + "loss": 0.3429, + "step": 20730 + }, + { + "epoch": 20.0, + "learning_rate": 7.333648648648649e-05, + "loss": 0.3081, + "step": 20740 + }, + { + "epoch": 20.0, + "learning_rate": 7.332297297297298e-05, + "loss": 0.3783, + "step": 20750 + }, + { + "epoch": 20.0, + "learning_rate": 7.330945945945946e-05, + "loss": 0.5532, + "step": 20760 + }, + { + "epoch": 20.0, + "learning_rate": 7.329594594594596e-05, + "loss": 0.371, + "step": 20770 + }, + { + "epoch": 20.0, + "learning_rate": 7.328243243243244e-05, + "loss": 0.1947, + "step": 20780 + }, + { + "epoch": 20.0, + "learning_rate": 7.326891891891892e-05, + "loss": 0.2947, + "step": 20790 + }, + { + "epoch": 20.0, + "learning_rate": 7.32554054054054e-05, + "loss": 0.3126, + "step": 20800 + }, + { + "epoch": 20.0, + "learning_rate": 7.32418918918919e-05, + "loss": 0.2972, + "step": 20810 + }, + { + "epoch": 20.0, + "learning_rate": 7.322837837837838e-05, + "loss": 0.3899, + "step": 20820 + }, + { + "epoch": 20.0, + "learning_rate": 7.321486486486487e-05, + "loss": 0.2347, + "step": 20830 + }, + { + "epoch": 20.01, + "learning_rate": 7.320135135135135e-05, + "loss": 0.2637, + "step": 20840 + }, + { + "epoch": 20.01, + "learning_rate": 7.318783783783783e-05, + "loss": 0.1634, + "step": 20850 + }, + { + "epoch": 20.01, + "learning_rate": 7.317432432432433e-05, + "loss": 0.2529, + "step": 20860 + }, + { + "epoch": 20.01, + "learning_rate": 7.316081081081081e-05, + "loss": 0.2868, + "step": 20870 + }, + { + "epoch": 20.01, + "learning_rate": 7.31472972972973e-05, + "loss": 0.1971, + "step": 20880 + }, + { + "epoch": 20.01, + "learning_rate": 7.313378378378379e-05, + "loss": 0.2657, + "step": 20890 + }, + { + "epoch": 20.01, + "learning_rate": 7.312027027027028e-05, + "loss": 0.4097, + "step": 20900 + }, + { + "epoch": 20.01, + "learning_rate": 7.310675675675676e-05, + "loss": 0.3372, + "step": 20910 + }, + { + "epoch": 20.01, + "learning_rate": 7.309324324324324e-05, + "loss": 0.3307, + "step": 20920 + }, + { + "epoch": 20.01, + "learning_rate": 7.307972972972972e-05, + "loss": 0.4294, + "step": 20930 + }, + { + "epoch": 20.01, + "learning_rate": 7.306621621621622e-05, + "loss": 0.38, + "step": 20940 + }, + { + "epoch": 20.01, + "learning_rate": 7.30527027027027e-05, + "loss": 0.4655, + "step": 20950 + }, + { + "epoch": 20.01, + "learning_rate": 7.303918918918919e-05, + "loss": 0.4414, + "step": 20960 + }, + { + "epoch": 20.01, + "learning_rate": 7.302567567567567e-05, + "loss": 0.2854, + "step": 20970 + }, + { + "epoch": 20.01, + "learning_rate": 7.301216216216217e-05, + "loss": 0.6525, + "step": 20980 + }, + { + "epoch": 20.01, + "learning_rate": 7.299864864864865e-05, + "loss": 0.6312, + "step": 20990 + }, + { + "epoch": 20.01, + "learning_rate": 7.298513513513514e-05, + "loss": 0.3321, + "step": 21000 + }, + { + "epoch": 20.01, + "eval_loss": 0.11452169716358185, + "eval_runtime": 133.5513, + "eval_samples_per_second": 27.016, + "eval_steps_per_second": 3.377, + "eval_wer": 0.12062619391510972, + "step": 21000 + }, + { + "epoch": 20.01, + "learning_rate": 7.297162162162163e-05, + "loss": 0.208, + "step": 21010 + }, + { + "epoch": 20.01, + "learning_rate": 7.295810810810812e-05, + "loss": 0.311, + "step": 21020 + }, + { + "epoch": 20.01, + "learning_rate": 7.29445945945946e-05, + "loss": 0.299, + "step": 21030 + }, + { + "epoch": 20.01, + "learning_rate": 7.293108108108108e-05, + "loss": 0.244, + "step": 21040 + }, + { + "epoch": 20.01, + "learning_rate": 7.291756756756756e-05, + "loss": 0.2301, + "step": 21050 + }, + { + "epoch": 20.01, + "learning_rate": 7.290405405405406e-05, + "loss": 0.2209, + "step": 21060 + }, + { + "epoch": 20.01, + "learning_rate": 7.289054054054054e-05, + "loss": 0.2409, + "step": 21070 + }, + { + "epoch": 20.01, + "learning_rate": 7.287702702702703e-05, + "loss": 0.442, + "step": 21080 + }, + { + "epoch": 20.01, + "learning_rate": 7.286351351351351e-05, + "loss": 0.4693, + "step": 21090 + }, + { + "epoch": 20.01, + "learning_rate": 7.285000000000001e-05, + "loss": 0.4175, + "step": 21100 + }, + { + "epoch": 20.01, + "learning_rate": 7.283648648648649e-05, + "loss": 0.3796, + "step": 21110 + }, + { + "epoch": 20.01, + "learning_rate": 7.282297297297298e-05, + "loss": 0.4882, + "step": 21120 + }, + { + "epoch": 20.01, + "learning_rate": 7.280945945945947e-05, + "loss": 0.4329, + "step": 21130 + }, + { + "epoch": 20.01, + "learning_rate": 7.279594594594596e-05, + "loss": 0.2736, + "step": 21140 + }, + { + "epoch": 20.01, + "learning_rate": 7.278243243243244e-05, + "loss": 0.3123, + "step": 21150 + }, + { + "epoch": 20.01, + "learning_rate": 7.276891891891892e-05, + "loss": 0.3431, + "step": 21160 + }, + { + "epoch": 20.01, + "learning_rate": 7.27554054054054e-05, + "loss": 0.523, + "step": 21170 + }, + { + "epoch": 20.01, + "learning_rate": 7.27418918918919e-05, + "loss": 0.4667, + "step": 21180 + }, + { + "epoch": 20.01, + "learning_rate": 7.272837837837838e-05, + "loss": 0.3351, + "step": 21190 + }, + { + "epoch": 20.01, + "learning_rate": 7.271486486486487e-05, + "loss": 0.3564, + "step": 21200 + }, + { + "epoch": 20.01, + "learning_rate": 7.270135135135135e-05, + "loss": 0.2961, + "step": 21210 + }, + { + "epoch": 20.01, + "learning_rate": 7.268783783783785e-05, + "loss": 0.2938, + "step": 21220 + }, + { + "epoch": 20.01, + "learning_rate": 7.267432432432433e-05, + "loss": 0.2852, + "step": 21230 + }, + { + "epoch": 20.01, + "learning_rate": 7.266081081081081e-05, + "loss": 0.1811, + "step": 21240 + }, + { + "epoch": 20.01, + "learning_rate": 7.26472972972973e-05, + "loss": 0.3424, + "step": 21250 + }, + { + "epoch": 20.01, + "learning_rate": 7.263378378378379e-05, + "loss": 0.5923, + "step": 21260 + }, + { + "epoch": 20.01, + "learning_rate": 7.262027027027027e-05, + "loss": 0.4097, + "step": 21270 + }, + { + "epoch": 20.01, + "learning_rate": 7.260675675675675e-05, + "loss": 0.2343, + "step": 21280 + }, + { + "epoch": 20.01, + "learning_rate": 7.259324324324324e-05, + "loss": 0.2994, + "step": 21290 + }, + { + "epoch": 20.01, + "learning_rate": 7.257972972972972e-05, + "loss": 0.3271, + "step": 21300 + }, + { + "epoch": 20.01, + "learning_rate": 7.256621621621622e-05, + "loss": 0.3081, + "step": 21310 + }, + { + "epoch": 20.01, + "learning_rate": 7.25527027027027e-05, + "loss": 0.4385, + "step": 21320 + }, + { + "epoch": 20.01, + "learning_rate": 7.25391891891892e-05, + "loss": 0.468, + "step": 21330 + }, + { + "epoch": 20.01, + "learning_rate": 7.252567567567568e-05, + "loss": 0.223, + "step": 21340 + }, + { + "epoch": 20.01, + "learning_rate": 7.251216216216217e-05, + "loss": 0.4362, + "step": 21350 + }, + { + "epoch": 20.01, + "learning_rate": 7.249864864864865e-05, + "loss": 0.2899, + "step": 21360 + }, + { + "epoch": 20.01, + "learning_rate": 7.248513513513515e-05, + "loss": 0.5365, + "step": 21370 + }, + { + "epoch": 20.01, + "learning_rate": 7.247162162162163e-05, + "loss": 0.5099, + "step": 21380 + }, + { + "epoch": 20.01, + "learning_rate": 7.245810810810811e-05, + "loss": 0.5344, + "step": 21390 + }, + { + "epoch": 20.01, + "learning_rate": 7.244459459459459e-05, + "loss": 0.5577, + "step": 21400 + }, + { + "epoch": 20.01, + "learning_rate": 7.243108108108108e-05, + "loss": 0.6483, + "step": 21410 + }, + { + "epoch": 20.01, + "learning_rate": 7.241756756756756e-05, + "loss": 0.6068, + "step": 21420 + }, + { + "epoch": 20.01, + "learning_rate": 7.240405405405406e-05, + "loss": 0.7308, + "step": 21430 + }, + { + "epoch": 20.01, + "learning_rate": 7.239054054054054e-05, + "loss": 0.5031, + "step": 21440 + }, + { + "epoch": 20.01, + "learning_rate": 7.237702702702703e-05, + "loss": 0.5497, + "step": 21450 + }, + { + "epoch": 20.01, + "learning_rate": 7.236351351351352e-05, + "loss": 0.4673, + "step": 21460 + }, + { + "epoch": 20.01, + "learning_rate": 7.235000000000001e-05, + "loss": 0.4433, + "step": 21470 + }, + { + "epoch": 20.01, + "learning_rate": 7.233648648648649e-05, + "loss": 0.6504, + "step": 21480 + }, + { + "epoch": 21.0, + "learning_rate": 7.232297297297299e-05, + "loss": 0.5637, + "step": 21490 + }, + { + "epoch": 21.0, + "learning_rate": 7.230945945945947e-05, + "loss": 0.4932, + "step": 21500 + }, + { + "epoch": 21.0, + "eval_loss": 0.12090499699115753, + "eval_runtime": 135.4468, + "eval_samples_per_second": 26.638, + "eval_steps_per_second": 3.33, + "eval_wer": 0.12700927177002283, + "step": 21500 + }, + { + "epoch": 21.0, + "learning_rate": 7.229594594594595e-05, + "loss": 0.5399, + "step": 21510 + }, + { + "epoch": 21.0, + "learning_rate": 7.228243243243243e-05, + "loss": 0.4564, + "step": 21520 + }, + { + "epoch": 21.0, + "learning_rate": 7.226891891891892e-05, + "loss": 0.4891, + "step": 21530 + }, + { + "epoch": 21.0, + "learning_rate": 7.22554054054054e-05, + "loss": 0.4748, + "step": 21540 + }, + { + "epoch": 21.0, + "learning_rate": 7.22418918918919e-05, + "loss": 0.6633, + "step": 21550 + }, + { + "epoch": 21.0, + "learning_rate": 7.222837837837838e-05, + "loss": 0.4485, + "step": 21560 + }, + { + "epoch": 21.0, + "learning_rate": 7.221486486486487e-05, + "loss": 0.4764, + "step": 21570 + }, + { + "epoch": 21.0, + "learning_rate": 7.220135135135136e-05, + "loss": 0.473, + "step": 21580 + }, + { + "epoch": 21.0, + "learning_rate": 7.218783783783785e-05, + "loss": 0.4901, + "step": 21590 + }, + { + "epoch": 21.0, + "learning_rate": 7.217432432432433e-05, + "loss": 0.4695, + "step": 21600 + }, + { + "epoch": 21.0, + "learning_rate": 7.216081081081083e-05, + "loss": 0.299, + "step": 21610 + }, + { + "epoch": 21.0, + "learning_rate": 7.214729729729731e-05, + "loss": 0.28, + "step": 21620 + }, + { + "epoch": 21.0, + "learning_rate": 7.213378378378379e-05, + "loss": 0.3015, + "step": 21630 + }, + { + "epoch": 21.0, + "learning_rate": 7.212027027027027e-05, + "loss": 0.3078, + "step": 21640 + }, + { + "epoch": 21.0, + "learning_rate": 7.210675675675675e-05, + "loss": 1.2595, + "step": 21650 + }, + { + "epoch": 21.0, + "learning_rate": 7.209324324324324e-05, + "loss": 1.4027, + "step": 21660 + }, + { + "epoch": 21.0, + "learning_rate": 7.207972972972973e-05, + "loss": 2.6305, + "step": 21670 + }, + { + "epoch": 21.0, + "learning_rate": 7.206621621621622e-05, + "loss": 2.451, + "step": 21680 + }, + { + "epoch": 21.0, + "learning_rate": 7.20527027027027e-05, + "loss": 2.6105, + "step": 21690 + }, + { + "epoch": 21.0, + "learning_rate": 7.20391891891892e-05, + "loss": 2.3709, + "step": 21700 + }, + { + "epoch": 21.0, + "learning_rate": 7.202567567567568e-05, + "loss": 1.5761, + "step": 21710 + }, + { + "epoch": 21.0, + "learning_rate": 7.201216216216217e-05, + "loss": 1.3888, + "step": 21720 + }, + { + "epoch": 21.0, + "learning_rate": 7.199864864864865e-05, + "loss": 0.791, + "step": 21730 + }, + { + "epoch": 21.0, + "learning_rate": 7.198513513513513e-05, + "loss": 0.2311, + "step": 21740 + }, + { + "epoch": 21.0, + "learning_rate": 7.197162162162161e-05, + "loss": 0.282, + "step": 21750 + }, + { + "epoch": 21.0, + "learning_rate": 7.195810810810811e-05, + "loss": 0.217, + "step": 21760 + }, + { + "epoch": 21.0, + "learning_rate": 7.194459459459459e-05, + "loss": 0.4329, + "step": 21770 + }, + { + "epoch": 21.0, + "learning_rate": 7.193108108108108e-05, + "loss": 0.4488, + "step": 21780 + }, + { + "epoch": 21.0, + "learning_rate": 7.191756756756757e-05, + "loss": 0.4633, + "step": 21790 + }, + { + "epoch": 21.0, + "learning_rate": 7.190405405405406e-05, + "loss": 0.2488, + "step": 21800 + }, + { + "epoch": 21.0, + "learning_rate": 7.189054054054054e-05, + "loss": 0.225, + "step": 21810 + }, + { + "epoch": 21.0, + "learning_rate": 7.187702702702704e-05, + "loss": 0.3065, + "step": 21820 + }, + { + "epoch": 21.0, + "learning_rate": 7.186351351351352e-05, + "loss": 0.3062, + "step": 21830 + }, + { + "epoch": 21.0, + "learning_rate": 7.185000000000001e-05, + "loss": 0.3519, + "step": 21840 + }, + { + "epoch": 21.0, + "learning_rate": 7.183648648648649e-05, + "loss": 0.3002, + "step": 21850 + }, + { + "epoch": 21.01, + "learning_rate": 7.182297297297297e-05, + "loss": 0.2477, + "step": 21860 + }, + { + "epoch": 21.01, + "learning_rate": 7.180945945945945e-05, + "loss": 0.1779, + "step": 21870 + }, + { + "epoch": 21.01, + "learning_rate": 7.179594594594595e-05, + "loss": 0.1709, + "step": 21880 + }, + { + "epoch": 21.01, + "learning_rate": 7.178243243243243e-05, + "loss": 0.2549, + "step": 21890 + }, + { + "epoch": 21.01, + "learning_rate": 7.176891891891893e-05, + "loss": 0.2134, + "step": 21900 + }, + { + "epoch": 21.01, + "learning_rate": 7.17554054054054e-05, + "loss": 0.2758, + "step": 21910 + }, + { + "epoch": 21.01, + "learning_rate": 7.17418918918919e-05, + "loss": 0.3599, + "step": 21920 + }, + { + "epoch": 21.01, + "learning_rate": 7.172837837837838e-05, + "loss": 0.3769, + "step": 21930 + }, + { + "epoch": 21.01, + "learning_rate": 7.171486486486488e-05, + "loss": 0.3003, + "step": 21940 + }, + { + "epoch": 21.01, + "learning_rate": 7.170135135135136e-05, + "loss": 0.4111, + "step": 21950 + }, + { + "epoch": 21.01, + "learning_rate": 7.168783783783785e-05, + "loss": 0.4773, + "step": 21960 + }, + { + "epoch": 21.01, + "learning_rate": 7.167432432432433e-05, + "loss": 0.4675, + "step": 21970 + }, + { + "epoch": 21.01, + "learning_rate": 7.166081081081081e-05, + "loss": 0.5319, + "step": 21980 + }, + { + "epoch": 21.01, + "learning_rate": 7.16472972972973e-05, + "loss": 0.2779, + "step": 21990 + }, + { + "epoch": 21.01, + "learning_rate": 7.163378378378379e-05, + "loss": 0.5322, + "step": 22000 + }, + { + "epoch": 21.01, + "eval_loss": 0.12237009406089783, + "eval_runtime": 128.2638, + "eval_samples_per_second": 28.13, + "eval_steps_per_second": 3.516, + "eval_wer": 0.12882635232726086, + "step": 22000 + }, + { + "epoch": 21.01, + "learning_rate": 7.162027027027027e-05, + "loss": 0.6163, + "step": 22010 + }, + { + "epoch": 21.01, + "learning_rate": 7.160675675675677e-05, + "loss": 0.5263, + "step": 22020 + }, + { + "epoch": 21.01, + "learning_rate": 7.159324324324325e-05, + "loss": 0.1945, + "step": 22030 + }, + { + "epoch": 21.01, + "learning_rate": 7.157972972972974e-05, + "loss": 0.2868, + "step": 22040 + }, + { + "epoch": 21.01, + "learning_rate": 7.156621621621622e-05, + "loss": 0.2241, + "step": 22050 + }, + { + "epoch": 21.01, + "learning_rate": 7.15527027027027e-05, + "loss": 0.2246, + "step": 22060 + }, + { + "epoch": 21.01, + "learning_rate": 7.15391891891892e-05, + "loss": 0.2388, + "step": 22070 + }, + { + "epoch": 21.01, + "learning_rate": 7.152567567567568e-05, + "loss": 0.2025, + "step": 22080 + }, + { + "epoch": 21.01, + "learning_rate": 7.151216216216217e-05, + "loss": 0.2062, + "step": 22090 + }, + { + "epoch": 21.01, + "learning_rate": 7.149864864864865e-05, + "loss": 0.39, + "step": 22100 + }, + { + "epoch": 21.01, + "learning_rate": 7.148513513513514e-05, + "loss": 0.4665, + "step": 22110 + }, + { + "epoch": 21.01, + "learning_rate": 7.147162162162162e-05, + "loss": 0.433, + "step": 22120 + }, + { + "epoch": 21.01, + "learning_rate": 7.145810810810811e-05, + "loss": 0.3409, + "step": 22130 + }, + { + "epoch": 21.01, + "learning_rate": 7.144459459459459e-05, + "loss": 0.4624, + "step": 22140 + }, + { + "epoch": 21.01, + "learning_rate": 7.143108108108109e-05, + "loss": 0.5375, + "step": 22150 + }, + { + "epoch": 21.01, + "learning_rate": 7.141756756756757e-05, + "loss": 0.2812, + "step": 22160 + }, + { + "epoch": 21.01, + "learning_rate": 7.140405405405406e-05, + "loss": 0.2558, + "step": 22170 + }, + { + "epoch": 21.01, + "learning_rate": 7.139054054054054e-05, + "loss": 0.3307, + "step": 22180 + }, + { + "epoch": 21.01, + "learning_rate": 7.137702702702704e-05, + "loss": 0.4197, + "step": 22190 + }, + { + "epoch": 21.01, + "learning_rate": 7.136351351351352e-05, + "loss": 0.473, + "step": 22200 + }, + { + "epoch": 21.01, + "learning_rate": 7.135e-05, + "loss": 0.3666, + "step": 22210 + }, + { + "epoch": 21.01, + "learning_rate": 7.133783783783784e-05, + "loss": 0.309, + "step": 22220 + }, + { + "epoch": 21.01, + "learning_rate": 7.132432432432434e-05, + "loss": 0.2942, + "step": 22230 + }, + { + "epoch": 21.01, + "learning_rate": 7.131081081081082e-05, + "loss": 0.261, + "step": 22240 + }, + { + "epoch": 21.01, + "learning_rate": 7.12972972972973e-05, + "loss": 0.3467, + "step": 22250 + }, + { + "epoch": 21.01, + "learning_rate": 7.128378378378378e-05, + "loss": 0.1699, + "step": 22260 + }, + { + "epoch": 21.01, + "learning_rate": 7.127027027027028e-05, + "loss": 0.3052, + "step": 22270 + }, + { + "epoch": 21.01, + "learning_rate": 7.125675675675676e-05, + "loss": 0.406, + "step": 22280 + }, + { + "epoch": 21.01, + "learning_rate": 7.124324324324325e-05, + "loss": 0.6173, + "step": 22290 + }, + { + "epoch": 21.01, + "learning_rate": 7.122972972972973e-05, + "loss": 0.2186, + "step": 22300 + }, + { + "epoch": 21.01, + "learning_rate": 7.121621621621623e-05, + "loss": 0.2323, + "step": 22310 + }, + { + "epoch": 21.01, + "learning_rate": 7.120270270270271e-05, + "loss": 0.3353, + "step": 22320 + }, + { + "epoch": 21.01, + "learning_rate": 7.118918918918919e-05, + "loss": 0.354, + "step": 22330 + }, + { + "epoch": 21.01, + "learning_rate": 7.117567567567568e-05, + "loss": 0.3348, + "step": 22340 + }, + { + "epoch": 21.01, + "learning_rate": 7.116216216216216e-05, + "loss": 0.415, + "step": 22350 + }, + { + "epoch": 21.01, + "learning_rate": 7.114864864864866e-05, + "loss": 0.2806, + "step": 22360 + }, + { + "epoch": 21.01, + "learning_rate": 7.113513513513514e-05, + "loss": 0.318, + "step": 22370 + }, + { + "epoch": 21.01, + "learning_rate": 7.112162162162162e-05, + "loss": 0.3353, + "step": 22380 + }, + { + "epoch": 21.01, + "learning_rate": 7.11081081081081e-05, + "loss": 0.494, + "step": 22390 + }, + { + "epoch": 21.01, + "learning_rate": 7.10945945945946e-05, + "loss": 0.423, + "step": 22400 + }, + { + "epoch": 21.01, + "learning_rate": 7.108108108108108e-05, + "loss": 0.5261, + "step": 22410 + }, + { + "epoch": 21.01, + "learning_rate": 7.106756756756757e-05, + "loss": 0.4433, + "step": 22420 + }, + { + "epoch": 21.01, + "learning_rate": 7.105405405405405e-05, + "loss": 0.6798, + "step": 22430 + }, + { + "epoch": 21.01, + "learning_rate": 7.104054054054055e-05, + "loss": 0.4904, + "step": 22440 + }, + { + "epoch": 21.01, + "learning_rate": 7.102702702702703e-05, + "loss": 0.7175, + "step": 22450 + }, + { + "epoch": 21.01, + "learning_rate": 7.101351351351352e-05, + "loss": 0.5399, + "step": 22460 + }, + { + "epoch": 21.01, + "learning_rate": 7.1e-05, + "loss": 0.4867, + "step": 22470 + }, + { + "epoch": 21.01, + "learning_rate": 7.098648648648649e-05, + "loss": 0.4741, + "step": 22480 + }, + { + "epoch": 21.01, + "learning_rate": 7.097297297297297e-05, + "loss": 0.5038, + "step": 22490 + }, + { + "epoch": 21.01, + "learning_rate": 7.095945945945946e-05, + "loss": 0.5693, + "step": 22500 + }, + { + "epoch": 21.01, + "eval_loss": 0.1170545294880867, + "eval_runtime": 128.1458, + "eval_samples_per_second": 28.155, + "eval_steps_per_second": 3.519, + "eval_wer": 0.13255369706005685, + "step": 22500 + }, + { + "epoch": 22.0, + "learning_rate": 7.094594594594594e-05, + "loss": 0.6163, + "step": 22510 + }, + { + "epoch": 22.0, + "learning_rate": 7.093243243243244e-05, + "loss": 0.492, + "step": 22520 + }, + { + "epoch": 22.0, + "learning_rate": 7.091891891891892e-05, + "loss": 0.5218, + "step": 22530 + }, + { + "epoch": 22.0, + "learning_rate": 7.090540540540541e-05, + "loss": 0.4696, + "step": 22540 + }, + { + "epoch": 22.0, + "learning_rate": 7.08918918918919e-05, + "loss": 0.4263, + "step": 22550 + }, + { + "epoch": 22.0, + "learning_rate": 7.087837837837839e-05, + "loss": 0.4988, + "step": 22560 + }, + { + "epoch": 22.0, + "learning_rate": 7.086486486486487e-05, + "loss": 0.6063, + "step": 22570 + }, + { + "epoch": 22.0, + "learning_rate": 7.085135135135136e-05, + "loss": 0.5198, + "step": 22580 + }, + { + "epoch": 22.0, + "learning_rate": 7.083783783783784e-05, + "loss": 0.418, + "step": 22590 + }, + { + "epoch": 22.0, + "learning_rate": 7.082432432432433e-05, + "loss": 0.453, + "step": 22600 + }, + { + "epoch": 22.0, + "learning_rate": 7.081081081081081e-05, + "loss": 0.4833, + "step": 22610 + }, + { + "epoch": 22.0, + "learning_rate": 7.07972972972973e-05, + "loss": 0.5119, + "step": 22620 + }, + { + "epoch": 22.0, + "learning_rate": 7.078378378378378e-05, + "loss": 0.3357, + "step": 22630 + }, + { + "epoch": 22.0, + "learning_rate": 7.077027027027028e-05, + "loss": 0.2913, + "step": 22640 + }, + { + "epoch": 22.0, + "learning_rate": 7.075675675675676e-05, + "loss": 0.2836, + "step": 22650 + }, + { + "epoch": 22.0, + "learning_rate": 7.074324324324325e-05, + "loss": 0.3014, + "step": 22660 + }, + { + "epoch": 22.0, + "learning_rate": 7.072972972972973e-05, + "loss": 1.0133, + "step": 22670 + }, + { + "epoch": 22.0, + "learning_rate": 7.071621621621623e-05, + "loss": 0.8979, + "step": 22680 + }, + { + "epoch": 22.0, + "learning_rate": 7.070270270270271e-05, + "loss": 2.6523, + "step": 22690 + }, + { + "epoch": 22.0, + "learning_rate": 7.06891891891892e-05, + "loss": 2.5464, + "step": 22700 + }, + { + "epoch": 22.0, + "learning_rate": 7.067567567567568e-05, + "loss": 2.4752, + "step": 22710 + }, + { + "epoch": 22.0, + "learning_rate": 7.066216216216217e-05, + "loss": 2.5816, + "step": 22720 + }, + { + "epoch": 22.0, + "learning_rate": 7.064864864864865e-05, + "loss": 1.5899, + "step": 22730 + }, + { + "epoch": 22.0, + "learning_rate": 7.063513513513513e-05, + "loss": 1.4958, + "step": 22740 + }, + { + "epoch": 22.0, + "learning_rate": 7.062162162162162e-05, + "loss": 0.9694, + "step": 22750 + }, + { + "epoch": 22.0, + "learning_rate": 7.06081081081081e-05, + "loss": 0.3387, + "step": 22760 + }, + { + "epoch": 22.0, + "learning_rate": 7.05945945945946e-05, + "loss": 0.1924, + "step": 22770 + }, + { + "epoch": 22.0, + "learning_rate": 7.058108108108108e-05, + "loss": 0.3269, + "step": 22780 + }, + { + "epoch": 22.0, + "learning_rate": 7.056891891891892e-05, + "loss": 0.3489, + "step": 22790 + }, + { + "epoch": 22.0, + "learning_rate": 7.05554054054054e-05, + "loss": 0.4595, + "step": 22800 + }, + { + "epoch": 22.0, + "learning_rate": 7.05418918918919e-05, + "loss": 0.5365, + "step": 22810 + }, + { + "epoch": 22.0, + "learning_rate": 7.052837837837838e-05, + "loss": 0.2811, + "step": 22820 + }, + { + "epoch": 22.0, + "learning_rate": 7.051486486486487e-05, + "loss": 0.1976, + "step": 22830 + }, + { + "epoch": 22.0, + "learning_rate": 7.050135135135136e-05, + "loss": 0.3073, + "step": 22840 + }, + { + "epoch": 22.0, + "learning_rate": 7.048783783783785e-05, + "loss": 0.2467, + "step": 22850 + }, + { + "epoch": 22.0, + "learning_rate": 7.047432432432433e-05, + "loss": 0.2946, + "step": 22860 + }, + { + "epoch": 22.0, + "learning_rate": 7.046081081081081e-05, + "loss": 0.3138, + "step": 22870 + }, + { + "epoch": 22.0, + "learning_rate": 7.044729729729729e-05, + "loss": 0.2364, + "step": 22880 + }, + { + "epoch": 22.01, + "learning_rate": 7.043378378378379e-05, + "loss": 0.1955, + "step": 22890 + }, + { + "epoch": 22.01, + "learning_rate": 7.042027027027027e-05, + "loss": 0.1562, + "step": 22900 + }, + { + "epoch": 22.01, + "learning_rate": 7.040675675675676e-05, + "loss": 0.2541, + "step": 22910 + }, + { + "epoch": 22.01, + "learning_rate": 7.039324324324324e-05, + "loss": 0.242, + "step": 22920 + }, + { + "epoch": 22.01, + "learning_rate": 7.037972972972974e-05, + "loss": 0.2034, + "step": 22930 + }, + { + "epoch": 22.01, + "learning_rate": 7.036621621621622e-05, + "loss": 0.2504, + "step": 22940 + }, + { + "epoch": 22.01, + "learning_rate": 7.035270270270271e-05, + "loss": 0.4409, + "step": 22950 + }, + { + "epoch": 22.01, + "learning_rate": 7.03391891891892e-05, + "loss": 0.281, + "step": 22960 + }, + { + "epoch": 22.01, + "learning_rate": 7.032567567567569e-05, + "loss": 0.3679, + "step": 22970 + }, + { + "epoch": 22.01, + "learning_rate": 7.031216216216217e-05, + "loss": 0.3796, + "step": 22980 + }, + { + "epoch": 22.01, + "learning_rate": 7.029864864864865e-05, + "loss": 0.3897, + "step": 22990 + }, + { + "epoch": 22.01, + "learning_rate": 7.028513513513513e-05, + "loss": 0.4322, + "step": 23000 + }, + { + "epoch": 22.01, + "eval_loss": 0.11891253292560577, + "eval_runtime": 137.7082, + "eval_samples_per_second": 26.2, + "eval_steps_per_second": 3.275, + "eval_wer": 0.11643293109071426, + "step": 23000 + }, + { + "epoch": 22.01, + "learning_rate": 7.027162162162161e-05, + "loss": 0.3027, + "step": 23010 + }, + { + "epoch": 22.01, + "learning_rate": 7.025810810810811e-05, + "loss": 0.403, + "step": 23020 + }, + { + "epoch": 22.01, + "learning_rate": 7.024459459459459e-05, + "loss": 0.6595, + "step": 23030 + }, + { + "epoch": 22.01, + "learning_rate": 7.023108108108108e-05, + "loss": 0.5767, + "step": 23040 + }, + { + "epoch": 22.01, + "learning_rate": 7.021756756756757e-05, + "loss": 0.2145, + "step": 23050 + }, + { + "epoch": 22.01, + "learning_rate": 7.020405405405406e-05, + "loss": 0.2637, + "step": 23060 + }, + { + "epoch": 22.01, + "learning_rate": 7.019054054054054e-05, + "loss": 0.2887, + "step": 23070 + }, + { + "epoch": 22.01, + "learning_rate": 7.017702702702704e-05, + "loss": 0.2267, + "step": 23080 + }, + { + "epoch": 22.01, + "learning_rate": 7.016351351351352e-05, + "loss": 0.2313, + "step": 23090 + }, + { + "epoch": 22.01, + "learning_rate": 7.015000000000001e-05, + "loss": 0.1875, + "step": 23100 + }, + { + "epoch": 22.01, + "learning_rate": 7.013648648648649e-05, + "loss": 0.1961, + "step": 23110 + }, + { + "epoch": 22.01, + "learning_rate": 7.012297297297297e-05, + "loss": 0.2499, + "step": 23120 + }, + { + "epoch": 22.01, + "learning_rate": 7.010945945945945e-05, + "loss": 0.5526, + "step": 23130 + }, + { + "epoch": 22.01, + "learning_rate": 7.009594594594595e-05, + "loss": 0.4675, + "step": 23140 + }, + { + "epoch": 22.01, + "learning_rate": 7.008243243243243e-05, + "loss": 0.3895, + "step": 23150 + }, + { + "epoch": 22.01, + "learning_rate": 7.006891891891892e-05, + "loss": 0.4104, + "step": 23160 + }, + { + "epoch": 22.01, + "learning_rate": 7.00554054054054e-05, + "loss": 0.6808, + "step": 23170 + }, + { + "epoch": 22.01, + "learning_rate": 7.00418918918919e-05, + "loss": 0.3173, + "step": 23180 + }, + { + "epoch": 22.01, + "learning_rate": 7.002837837837838e-05, + "loss": 0.2584, + "step": 23190 + }, + { + "epoch": 22.01, + "learning_rate": 7.001486486486488e-05, + "loss": 0.2674, + "step": 23200 + }, + { + "epoch": 22.01, + "learning_rate": 7.000135135135136e-05, + "loss": 0.4371, + "step": 23210 + }, + { + "epoch": 22.01, + "learning_rate": 6.998783783783784e-05, + "loss": 0.4077, + "step": 23220 + }, + { + "epoch": 22.01, + "learning_rate": 6.997432432432432e-05, + "loss": 0.3451, + "step": 23230 + }, + { + "epoch": 22.01, + "learning_rate": 6.996081081081081e-05, + "loss": 0.3243, + "step": 23240 + }, + { + "epoch": 22.01, + "learning_rate": 6.99472972972973e-05, + "loss": 0.3741, + "step": 23250 + }, + { + "epoch": 22.01, + "learning_rate": 6.993378378378379e-05, + "loss": 0.2877, + "step": 23260 + }, + { + "epoch": 22.01, + "learning_rate": 6.992027027027027e-05, + "loss": 0.3038, + "step": 23270 + }, + { + "epoch": 22.01, + "learning_rate": 6.990675675675676e-05, + "loss": 0.1921, + "step": 23280 + }, + { + "epoch": 22.01, + "learning_rate": 6.989324324324325e-05, + "loss": 0.1948, + "step": 23290 + }, + { + "epoch": 22.01, + "learning_rate": 6.987972972972974e-05, + "loss": 0.3242, + "step": 23300 + }, + { + "epoch": 22.01, + "learning_rate": 6.986621621621622e-05, + "loss": 0.728, + "step": 23310 + }, + { + "epoch": 22.01, + "learning_rate": 6.985270270270272e-05, + "loss": 0.1856, + "step": 23320 + }, + { + "epoch": 22.01, + "learning_rate": 6.98391891891892e-05, + "loss": 0.219, + "step": 23330 + }, + { + "epoch": 22.01, + "learning_rate": 6.982567567567568e-05, + "loss": 0.3381, + "step": 23340 + }, + { + "epoch": 22.01, + "learning_rate": 6.981216216216216e-05, + "loss": 0.3031, + "step": 23350 + }, + { + "epoch": 22.01, + "learning_rate": 6.979864864864865e-05, + "loss": 0.3626, + "step": 23360 + }, + { + "epoch": 22.01, + "learning_rate": 6.978513513513513e-05, + "loss": 0.4441, + "step": 23370 + }, + { + "epoch": 22.01, + "learning_rate": 6.977162162162163e-05, + "loss": 0.3858, + "step": 23380 + }, + { + "epoch": 22.01, + "learning_rate": 6.975810810810811e-05, + "loss": 0.2601, + "step": 23390 + }, + { + "epoch": 22.01, + "learning_rate": 6.97445945945946e-05, + "loss": 0.3871, + "step": 23400 + }, + { + "epoch": 22.01, + "learning_rate": 6.973108108108109e-05, + "loss": 0.3953, + "step": 23410 + }, + { + "epoch": 22.01, + "learning_rate": 6.971756756756757e-05, + "loss": 0.4409, + "step": 23420 + }, + { + "epoch": 22.01, + "learning_rate": 6.970405405405406e-05, + "loss": 0.5266, + "step": 23430 + }, + { + "epoch": 22.01, + "learning_rate": 6.969054054054054e-05, + "loss": 0.4432, + "step": 23440 + }, + { + "epoch": 22.01, + "learning_rate": 6.967702702702704e-05, + "loss": 0.659, + "step": 23450 + }, + { + "epoch": 22.01, + "learning_rate": 6.966351351351352e-05, + "loss": 0.5053, + "step": 23460 + }, + { + "epoch": 22.01, + "learning_rate": 6.965e-05, + "loss": 0.6145, + "step": 23470 + }, + { + "epoch": 22.01, + "learning_rate": 6.963648648648648e-05, + "loss": 0.5613, + "step": 23480 + }, + { + "epoch": 22.01, + "learning_rate": 6.962297297297297e-05, + "loss": 0.4291, + "step": 23490 + }, + { + "epoch": 22.01, + "learning_rate": 6.960945945945946e-05, + "loss": 0.4603, + "step": 23500 + }, + { + "epoch": 22.01, + "eval_loss": 0.11944066733121872, + "eval_runtime": 133.6515, + "eval_samples_per_second": 26.996, + "eval_steps_per_second": 3.374, + "eval_wer": 0.13283324791501655, + "step": 23500 + }, + { + "epoch": 22.01, + "learning_rate": 6.959594594594595e-05, + "loss": 0.433, + "step": 23510 + }, + { + "epoch": 22.01, + "learning_rate": 6.958243243243243e-05, + "loss": 0.4252, + "step": 23520 + }, + { + "epoch": 23.0, + "learning_rate": 6.956891891891893e-05, + "loss": 0.6308, + "step": 23530 + }, + { + "epoch": 23.0, + "learning_rate": 6.955540540540541e-05, + "loss": 0.4707, + "step": 23540 + }, + { + "epoch": 23.0, + "learning_rate": 6.95418918918919e-05, + "loss": 0.5031, + "step": 23550 + }, + { + "epoch": 23.0, + "learning_rate": 6.952837837837838e-05, + "loss": 0.5163, + "step": 23560 + }, + { + "epoch": 23.0, + "learning_rate": 6.951486486486488e-05, + "loss": 0.4116, + "step": 23570 + }, + { + "epoch": 23.0, + "learning_rate": 6.950135135135136e-05, + "loss": 0.4687, + "step": 23580 + }, + { + "epoch": 23.0, + "learning_rate": 6.948783783783784e-05, + "loss": 0.5094, + "step": 23590 + }, + { + "epoch": 23.0, + "learning_rate": 6.947432432432432e-05, + "loss": 0.632, + "step": 23600 + }, + { + "epoch": 23.0, + "learning_rate": 6.946081081081081e-05, + "loss": 0.4125, + "step": 23610 + }, + { + "epoch": 23.0, + "learning_rate": 6.94472972972973e-05, + "loss": 0.5182, + "step": 23620 + }, + { + "epoch": 23.0, + "learning_rate": 6.943378378378379e-05, + "loss": 0.51, + "step": 23630 + }, + { + "epoch": 23.0, + "learning_rate": 6.942027027027027e-05, + "loss": 0.4503, + "step": 23640 + }, + { + "epoch": 23.0, + "learning_rate": 6.940675675675677e-05, + "loss": 0.4427, + "step": 23650 + }, + { + "epoch": 23.0, + "learning_rate": 6.939324324324325e-05, + "loss": 0.2879, + "step": 23660 + }, + { + "epoch": 23.0, + "learning_rate": 6.937972972972974e-05, + "loss": 0.2903, + "step": 23670 + }, + { + "epoch": 23.0, + "learning_rate": 6.936621621621622e-05, + "loss": 0.2809, + "step": 23680 + }, + { + "epoch": 23.0, + "learning_rate": 6.93527027027027e-05, + "loss": 0.6774, + "step": 23690 + }, + { + "epoch": 23.0, + "learning_rate": 6.933918918918918e-05, + "loss": 1.1525, + "step": 23700 + }, + { + "epoch": 23.0, + "learning_rate": 6.932567567567568e-05, + "loss": 2.1822, + "step": 23710 + }, + { + "epoch": 23.0, + "learning_rate": 6.931216216216216e-05, + "loss": 2.5999, + "step": 23720 + }, + { + "epoch": 23.0, + "learning_rate": 6.929864864864865e-05, + "loss": 2.4792, + "step": 23730 + }, + { + "epoch": 23.0, + "learning_rate": 6.928513513513514e-05, + "loss": 2.5794, + "step": 23740 + }, + { + "epoch": 23.0, + "learning_rate": 6.927162162162163e-05, + "loss": 1.9319, + "step": 23750 + }, + { + "epoch": 23.0, + "learning_rate": 6.925810810810811e-05, + "loss": 1.6625, + "step": 23760 + }, + { + "epoch": 23.0, + "learning_rate": 6.92445945945946e-05, + "loss": 1.0574, + "step": 23770 + }, + { + "epoch": 23.0, + "learning_rate": 6.923108108108109e-05, + "loss": 0.5089, + "step": 23780 + }, + { + "epoch": 23.0, + "learning_rate": 6.921756756756758e-05, + "loss": 0.193, + "step": 23790 + }, + { + "epoch": 23.0, + "learning_rate": 6.920405405405406e-05, + "loss": 0.2848, + "step": 23800 + }, + { + "epoch": 23.0, + "learning_rate": 6.919054054054054e-05, + "loss": 0.2523, + "step": 23810 + }, + { + "epoch": 23.0, + "learning_rate": 6.917702702702702e-05, + "loss": 0.3646, + "step": 23820 + }, + { + "epoch": 23.0, + "learning_rate": 6.91635135135135e-05, + "loss": 0.5389, + "step": 23830 + }, + { + "epoch": 23.0, + "learning_rate": 6.915e-05, + "loss": 0.3028, + "step": 23840 + }, + { + "epoch": 23.0, + "learning_rate": 6.913648648648648e-05, + "loss": 0.1789, + "step": 23850 + }, + { + "epoch": 23.0, + "learning_rate": 6.912297297297298e-05, + "loss": 0.3189, + "step": 23860 + }, + { + "epoch": 23.0, + "learning_rate": 6.910945945945946e-05, + "loss": 0.2565, + "step": 23870 + }, + { + "epoch": 23.0, + "learning_rate": 6.909594594594595e-05, + "loss": 0.3095, + "step": 23880 + }, + { + "epoch": 23.0, + "learning_rate": 6.908243243243243e-05, + "loss": 0.2851, + "step": 23890 + }, + { + "epoch": 23.0, + "learning_rate": 6.906891891891893e-05, + "loss": 0.2173, + "step": 23900 + }, + { + "epoch": 23.01, + "learning_rate": 6.905540540540541e-05, + "loss": 0.2611, + "step": 23910 + }, + { + "epoch": 23.01, + "learning_rate": 6.90418918918919e-05, + "loss": 0.1513, + "step": 23920 + }, + { + "epoch": 23.01, + "learning_rate": 6.902837837837838e-05, + "loss": 0.2155, + "step": 23930 + }, + { + "epoch": 23.01, + "learning_rate": 6.901486486486486e-05, + "loss": 0.2703, + "step": 23940 + }, + { + "epoch": 23.01, + "learning_rate": 6.900135135135135e-05, + "loss": 0.1763, + "step": 23950 + }, + { + "epoch": 23.01, + "learning_rate": 6.898783783783784e-05, + "loss": 0.2805, + "step": 23960 + }, + { + "epoch": 23.01, + "learning_rate": 6.897432432432432e-05, + "loss": 0.4076, + "step": 23970 + }, + { + "epoch": 23.01, + "learning_rate": 6.896081081081082e-05, + "loss": 0.2675, + "step": 23980 + }, + { + "epoch": 23.01, + "learning_rate": 6.89472972972973e-05, + "loss": 0.3137, + "step": 23990 + }, + { + "epoch": 23.01, + "learning_rate": 6.893378378378379e-05, + "loss": 0.4311, + "step": 24000 + }, + { + "epoch": 23.01, + "eval_loss": 0.1236981675028801, + "eval_runtime": 129.1838, + "eval_samples_per_second": 27.929, + "eval_steps_per_second": 3.491, + "eval_wer": 0.12076596934258957, + "step": 24000 + }, + { + "epoch": 23.01, + "learning_rate": 6.892027027027027e-05, + "loss": 0.3502, + "step": 24010 + }, + { + "epoch": 23.01, + "learning_rate": 6.890675675675677e-05, + "loss": 0.4809, + "step": 24020 + }, + { + "epoch": 23.01, + "learning_rate": 6.889324324324325e-05, + "loss": 0.3823, + "step": 24030 + }, + { + "epoch": 23.01, + "learning_rate": 6.887972972972974e-05, + "loss": 0.296, + "step": 24040 + }, + { + "epoch": 23.01, + "learning_rate": 6.886621621621622e-05, + "loss": 0.6311, + "step": 24050 + }, + { + "epoch": 23.01, + "learning_rate": 6.88527027027027e-05, + "loss": 0.5891, + "step": 24060 + }, + { + "epoch": 23.01, + "learning_rate": 6.883918918918919e-05, + "loss": 0.2723, + "step": 24070 + }, + { + "epoch": 23.01, + "learning_rate": 6.882567567567568e-05, + "loss": 0.208, + "step": 24080 + }, + { + "epoch": 23.01, + "learning_rate": 6.881216216216216e-05, + "loss": 0.2836, + "step": 24090 + }, + { + "epoch": 23.01, + "learning_rate": 6.879864864864866e-05, + "loss": 0.2334, + "step": 24100 + }, + { + "epoch": 23.01, + "learning_rate": 6.878513513513514e-05, + "loss": 0.2696, + "step": 24110 + }, + { + "epoch": 23.01, + "learning_rate": 6.877162162162163e-05, + "loss": 0.1928, + "step": 24120 + }, + { + "epoch": 23.01, + "learning_rate": 6.875810810810811e-05, + "loss": 0.2033, + "step": 24130 + }, + { + "epoch": 23.01, + "learning_rate": 6.874459459459461e-05, + "loss": 0.2233, + "step": 24140 + }, + { + "epoch": 23.01, + "learning_rate": 6.873108108108109e-05, + "loss": 0.5213, + "step": 24150 + }, + { + "epoch": 23.01, + "learning_rate": 6.871756756756757e-05, + "loss": 0.4445, + "step": 24160 + }, + { + "epoch": 23.01, + "learning_rate": 6.870405405405405e-05, + "loss": 0.388, + "step": 24170 + }, + { + "epoch": 23.01, + "learning_rate": 6.869054054054055e-05, + "loss": 0.3658, + "step": 24180 + }, + { + "epoch": 23.01, + "learning_rate": 6.867702702702703e-05, + "loss": 0.4936, + "step": 24190 + }, + { + "epoch": 23.01, + "learning_rate": 6.866351351351352e-05, + "loss": 0.4415, + "step": 24200 + }, + { + "epoch": 23.01, + "learning_rate": 6.865e-05, + "loss": 0.2683, + "step": 24210 + }, + { + "epoch": 23.01, + "learning_rate": 6.863648648648648e-05, + "loss": 0.2804, + "step": 24220 + }, + { + "epoch": 23.01, + "learning_rate": 6.862297297297298e-05, + "loss": 0.39, + "step": 24230 + }, + { + "epoch": 23.01, + "learning_rate": 6.860945945945946e-05, + "loss": 0.4435, + "step": 24240 + }, + { + "epoch": 23.01, + "learning_rate": 6.859594594594595e-05, + "loss": 0.3233, + "step": 24250 + }, + { + "epoch": 23.01, + "learning_rate": 6.858243243243243e-05, + "loss": 0.3113, + "step": 24260 + }, + { + "epoch": 23.01, + "learning_rate": 6.856891891891893e-05, + "loss": 0.3671, + "step": 24270 + }, + { + "epoch": 23.01, + "learning_rate": 6.855540540540541e-05, + "loss": 0.3038, + "step": 24280 + }, + { + "epoch": 23.01, + "learning_rate": 6.854189189189189e-05, + "loss": 0.2487, + "step": 24290 + }, + { + "epoch": 23.01, + "learning_rate": 6.852837837837837e-05, + "loss": 0.2575, + "step": 24300 + }, + { + "epoch": 23.01, + "learning_rate": 6.851486486486487e-05, + "loss": 0.1885, + "step": 24310 + }, + { + "epoch": 23.01, + "learning_rate": 6.850135135135135e-05, + "loss": 0.3126, + "step": 24320 + }, + { + "epoch": 23.01, + "learning_rate": 6.848783783783784e-05, + "loss": 0.6653, + "step": 24330 + }, + { + "epoch": 23.01, + "learning_rate": 6.847432432432432e-05, + "loss": 0.3414, + "step": 24340 + }, + { + "epoch": 23.01, + "learning_rate": 6.846081081081082e-05, + "loss": 0.2471, + "step": 24350 + }, + { + "epoch": 23.01, + "learning_rate": 6.84472972972973e-05, + "loss": 0.3358, + "step": 24360 + }, + { + "epoch": 23.01, + "learning_rate": 6.843378378378379e-05, + "loss": 0.3219, + "step": 24370 + }, + { + "epoch": 23.01, + "learning_rate": 6.842027027027027e-05, + "loss": 0.2688, + "step": 24380 + }, + { + "epoch": 23.01, + "learning_rate": 6.840675675675677e-05, + "loss": 0.3898, + "step": 24390 + }, + { + "epoch": 23.01, + "learning_rate": 6.839324324324325e-05, + "loss": 0.4302, + "step": 24400 + }, + { + "epoch": 23.01, + "learning_rate": 6.837972972972973e-05, + "loss": 0.2815, + "step": 24410 + }, + { + "epoch": 23.01, + "learning_rate": 6.836621621621621e-05, + "loss": 0.3345, + "step": 24420 + }, + { + "epoch": 23.01, + "learning_rate": 6.83527027027027e-05, + "loss": 0.268, + "step": 24430 + }, + { + "epoch": 23.01, + "learning_rate": 6.833918918918919e-05, + "loss": 0.4632, + "step": 24440 + }, + { + "epoch": 23.01, + "learning_rate": 6.832567567567568e-05, + "loss": 0.5049, + "step": 24450 + }, + { + "epoch": 23.01, + "learning_rate": 6.831216216216216e-05, + "loss": 0.4324, + "step": 24460 + }, + { + "epoch": 23.01, + "learning_rate": 6.829864864864866e-05, + "loss": 0.4638, + "step": 24470 + }, + { + "epoch": 23.01, + "learning_rate": 6.828513513513514e-05, + "loss": 0.5446, + "step": 24480 + }, + { + "epoch": 23.01, + "learning_rate": 6.827162162162163e-05, + "loss": 0.5173, + "step": 24490 + }, + { + "epoch": 23.01, + "learning_rate": 6.825810810810811e-05, + "loss": 0.6475, + "step": 24500 + }, + { + "epoch": 23.01, + "eval_loss": 0.1159677729010582, + "eval_runtime": 129.4773, + "eval_samples_per_second": 27.866, + "eval_steps_per_second": 3.483, + "eval_wer": 0.12309555980058706, + "step": 24500 + }, + { + "epoch": 23.01, + "learning_rate": 6.82445945945946e-05, + "loss": 0.5098, + "step": 24510 + }, + { + "epoch": 23.01, + "learning_rate": 6.823108108108108e-05, + "loss": 0.4869, + "step": 24520 + }, + { + "epoch": 23.01, + "learning_rate": 6.821756756756757e-05, + "loss": 0.5014, + "step": 24530 + }, + { + "epoch": 23.01, + "learning_rate": 6.820405405405405e-05, + "loss": 0.4153, + "step": 24540 + }, + { + "epoch": 23.01, + "learning_rate": 6.819054054054055e-05, + "loss": 0.5658, + "step": 24550 + }, + { + "epoch": 24.0, + "learning_rate": 6.817702702702703e-05, + "loss": 0.5418, + "step": 24560 + }, + { + "epoch": 24.0, + "learning_rate": 6.816351351351352e-05, + "loss": 0.497, + "step": 24570 + }, + { + "epoch": 24.0, + "learning_rate": 6.815e-05, + "loss": 0.5352, + "step": 24580 + }, + { + "epoch": 24.0, + "learning_rate": 6.81364864864865e-05, + "loss": 0.4335, + "step": 24590 + }, + { + "epoch": 24.0, + "learning_rate": 6.812297297297298e-05, + "loss": 0.4603, + "step": 24600 + }, + { + "epoch": 24.0, + "learning_rate": 6.810945945945947e-05, + "loss": 0.4417, + "step": 24610 + }, + { + "epoch": 24.0, + "learning_rate": 6.809594594594595e-05, + "loss": 0.6753, + "step": 24620 + }, + { + "epoch": 24.0, + "learning_rate": 6.808243243243244e-05, + "loss": 0.4617, + "step": 24630 + }, + { + "epoch": 24.0, + "learning_rate": 6.806891891891892e-05, + "loss": 0.4919, + "step": 24640 + }, + { + "epoch": 24.0, + "learning_rate": 6.80554054054054e-05, + "loss": 0.5021, + "step": 24650 + }, + { + "epoch": 24.0, + "learning_rate": 6.804189189189189e-05, + "loss": 0.4452, + "step": 24660 + }, + { + "epoch": 24.0, + "learning_rate": 6.802837837837837e-05, + "loss": 0.4514, + "step": 24670 + }, + { + "epoch": 24.0, + "learning_rate": 6.801486486486487e-05, + "loss": 0.3179, + "step": 24680 + }, + { + "epoch": 24.0, + "learning_rate": 6.800135135135135e-05, + "loss": 0.2729, + "step": 24690 + }, + { + "epoch": 24.0, + "learning_rate": 6.798783783783784e-05, + "loss": 0.2912, + "step": 24700 + }, + { + "epoch": 24.0, + "learning_rate": 6.797432432432432e-05, + "loss": 0.3173, + "step": 24710 + }, + { + "epoch": 24.0, + "learning_rate": 6.796081081081082e-05, + "loss": 1.3187, + "step": 24720 + }, + { + "epoch": 24.0, + "learning_rate": 6.79472972972973e-05, + "loss": 1.5515, + "step": 24730 + }, + { + "epoch": 24.0, + "learning_rate": 6.79337837837838e-05, + "loss": 2.6183, + "step": 24740 + }, + { + "epoch": 24.0, + "learning_rate": 6.792027027027028e-05, + "loss": 2.451, + "step": 24750 + }, + { + "epoch": 24.0, + "learning_rate": 6.790675675675676e-05, + "loss": 2.5918, + "step": 24760 + }, + { + "epoch": 24.0, + "learning_rate": 6.789324324324324e-05, + "loss": 2.1879, + "step": 24770 + }, + { + "epoch": 24.0, + "learning_rate": 6.787972972972973e-05, + "loss": 1.5524, + "step": 24780 + }, + { + "epoch": 24.0, + "learning_rate": 6.786621621621621e-05, + "loss": 1.3473, + "step": 24790 + }, + { + "epoch": 24.0, + "learning_rate": 6.785270270270271e-05, + "loss": 0.5402, + "step": 24800 + }, + { + "epoch": 24.0, + "learning_rate": 6.783918918918919e-05, + "loss": 0.1954, + "step": 24810 + }, + { + "epoch": 24.0, + "learning_rate": 6.782567567567568e-05, + "loss": 0.2996, + "step": 24820 + }, + { + "epoch": 24.0, + "learning_rate": 6.781216216216216e-05, + "loss": 0.2224, + "step": 24830 + }, + { + "epoch": 24.0, + "learning_rate": 6.779864864864866e-05, + "loss": 0.4021, + "step": 24840 + }, + { + "epoch": 24.0, + "learning_rate": 6.778513513513514e-05, + "loss": 0.4529, + "step": 24850 + }, + { + "epoch": 24.0, + "learning_rate": 6.777162162162163e-05, + "loss": 0.4229, + "step": 24860 + }, + { + "epoch": 24.0, + "learning_rate": 6.775810810810812e-05, + "loss": 0.195, + "step": 24870 + }, + { + "epoch": 24.0, + "learning_rate": 6.77445945945946e-05, + "loss": 0.229, + "step": 24880 + }, + { + "epoch": 24.0, + "learning_rate": 6.773108108108108e-05, + "loss": 0.2792, + "step": 24890 + }, + { + "epoch": 24.0, + "learning_rate": 6.771756756756757e-05, + "loss": 0.2455, + "step": 24900 + }, + { + "epoch": 24.0, + "learning_rate": 6.770405405405405e-05, + "loss": 0.3148, + "step": 24910 + }, + { + "epoch": 24.0, + "learning_rate": 6.769054054054055e-05, + "loss": 0.2775, + "step": 24920 + }, + { + "epoch": 24.01, + "learning_rate": 6.767702702702703e-05, + "loss": 0.2299, + "step": 24930 + }, + { + "epoch": 24.01, + "learning_rate": 6.766351351351352e-05, + "loss": 0.1628, + "step": 24940 + }, + { + "epoch": 24.01, + "learning_rate": 6.765e-05, + "loss": 0.1693, + "step": 24950 + }, + { + "epoch": 24.01, + "learning_rate": 6.76364864864865e-05, + "loss": 0.2771, + "step": 24960 + }, + { + "epoch": 24.01, + "learning_rate": 6.762297297297298e-05, + "loss": 0.2097, + "step": 24970 + }, + { + "epoch": 24.01, + "learning_rate": 6.760945945945946e-05, + "loss": 0.2635, + "step": 24980 + }, + { + "epoch": 24.01, + "learning_rate": 6.759594594594594e-05, + "loss": 0.3242, + "step": 24990 + }, + { + "epoch": 24.01, + "learning_rate": 6.758243243243244e-05, + "loss": 0.3135, + "step": 25000 + }, + { + "epoch": 24.01, + "eval_loss": 0.11508933454751968, + "eval_runtime": 133.7262, + "eval_samples_per_second": 26.981, + "eval_steps_per_second": 3.373, + "eval_wer": 0.11671248194567395, + "step": 25000 + }, + { + "epoch": 24.01, + "learning_rate": 6.757027027027028e-05, + "loss": 0.299, + "step": 25010 + }, + { + "epoch": 24.01, + "learning_rate": 6.755675675675676e-05, + "loss": 0.379, + "step": 25020 + }, + { + "epoch": 24.01, + "learning_rate": 6.754324324324324e-05, + "loss": 0.3725, + "step": 25030 + }, + { + "epoch": 24.01, + "learning_rate": 6.752972972972972e-05, + "loss": 0.4602, + "step": 25040 + }, + { + "epoch": 24.01, + "learning_rate": 6.751621621621622e-05, + "loss": 0.4828, + "step": 25050 + }, + { + "epoch": 24.01, + "learning_rate": 6.75027027027027e-05, + "loss": 0.243, + "step": 25060 + }, + { + "epoch": 24.01, + "learning_rate": 6.74891891891892e-05, + "loss": 0.5806, + "step": 25070 + }, + { + "epoch": 24.01, + "learning_rate": 6.747567567567567e-05, + "loss": 0.6303, + "step": 25080 + }, + { + "epoch": 24.01, + "learning_rate": 6.746216216216217e-05, + "loss": 0.4278, + "step": 25090 + }, + { + "epoch": 24.01, + "learning_rate": 6.744864864864865e-05, + "loss": 0.1677, + "step": 25100 + }, + { + "epoch": 24.01, + "learning_rate": 6.743513513513515e-05, + "loss": 0.2909, + "step": 25110 + }, + { + "epoch": 24.01, + "learning_rate": 6.742162162162163e-05, + "loss": 0.2256, + "step": 25120 + }, + { + "epoch": 24.01, + "learning_rate": 6.740810810810812e-05, + "loss": 0.2394, + "step": 25130 + }, + { + "epoch": 24.01, + "learning_rate": 6.73945945945946e-05, + "loss": 0.2005, + "step": 25140 + }, + { + "epoch": 24.01, + "learning_rate": 6.738108108108108e-05, + "loss": 0.2, + "step": 25150 + }, + { + "epoch": 24.01, + "learning_rate": 6.736756756756756e-05, + "loss": 0.1714, + "step": 25160 + }, + { + "epoch": 24.01, + "learning_rate": 6.735405405405406e-05, + "loss": 0.3573, + "step": 25170 + }, + { + "epoch": 24.01, + "learning_rate": 6.734054054054054e-05, + "loss": 0.5306, + "step": 25180 + }, + { + "epoch": 24.01, + "learning_rate": 6.732702702702703e-05, + "loss": 0.4544, + "step": 25190 + }, + { + "epoch": 24.01, + "learning_rate": 6.731351351351351e-05, + "loss": 0.2923, + "step": 25200 + }, + { + "epoch": 24.01, + "learning_rate": 6.730000000000001e-05, + "loss": 0.4682, + "step": 25210 + }, + { + "epoch": 24.01, + "learning_rate": 6.728648648648649e-05, + "loss": 0.4943, + "step": 25220 + }, + { + "epoch": 24.01, + "learning_rate": 6.727297297297299e-05, + "loss": 0.2568, + "step": 25230 + }, + { + "epoch": 24.01, + "learning_rate": 6.725945945945947e-05, + "loss": 0.2222, + "step": 25240 + }, + { + "epoch": 24.01, + "learning_rate": 6.724594594594595e-05, + "loss": 0.3297, + "step": 25250 + }, + { + "epoch": 24.01, + "learning_rate": 6.723243243243244e-05, + "loss": 0.3813, + "step": 25260 + }, + { + "epoch": 24.01, + "learning_rate": 6.721891891891892e-05, + "loss": 0.4679, + "step": 25270 + }, + { + "epoch": 24.01, + "learning_rate": 6.72054054054054e-05, + "loss": 0.3092, + "step": 25280 + }, + { + "epoch": 24.01, + "learning_rate": 6.71918918918919e-05, + "loss": 0.3069, + "step": 25290 + }, + { + "epoch": 24.01, + "learning_rate": 6.717837837837838e-05, + "loss": 0.2571, + "step": 25300 + }, + { + "epoch": 24.01, + "learning_rate": 6.716486486486486e-05, + "loss": 0.2762, + "step": 25310 + }, + { + "epoch": 24.01, + "learning_rate": 6.715135135135136e-05, + "loss": 0.3283, + "step": 25320 + }, + { + "epoch": 24.01, + "learning_rate": 6.713783783783784e-05, + "loss": 0.1604, + "step": 25330 + }, + { + "epoch": 24.01, + "learning_rate": 6.712432432432433e-05, + "loss": 0.2811, + "step": 25340 + }, + { + "epoch": 24.01, + "learning_rate": 6.711081081081081e-05, + "loss": 0.471, + "step": 25350 + }, + { + "epoch": 24.01, + "learning_rate": 6.70972972972973e-05, + "loss": 0.453, + "step": 25360 + }, + { + "epoch": 24.01, + "learning_rate": 6.708378378378379e-05, + "loss": 0.208, + "step": 25370 + }, + { + "epoch": 24.01, + "learning_rate": 6.707027027027027e-05, + "loss": 0.2719, + "step": 25380 + }, + { + "epoch": 24.01, + "learning_rate": 6.705675675675675e-05, + "loss": 0.2994, + "step": 25390 + }, + { + "epoch": 24.01, + "learning_rate": 6.704324324324324e-05, + "loss": 0.3038, + "step": 25400 + }, + { + "epoch": 24.01, + "learning_rate": 6.702972972972973e-05, + "loss": 0.3527, + "step": 25410 + }, + { + "epoch": 24.01, + "learning_rate": 6.701621621621622e-05, + "loss": 0.4291, + "step": 25420 + }, + { + "epoch": 24.01, + "learning_rate": 6.70027027027027e-05, + "loss": 0.2909, + "step": 25430 + }, + { + "epoch": 24.01, + "learning_rate": 6.69891891891892e-05, + "loss": 0.3028, + "step": 25440 + }, + { + "epoch": 24.01, + "learning_rate": 6.697567567567568e-05, + "loss": 0.299, + "step": 25450 + }, + { + "epoch": 24.01, + "learning_rate": 6.696216216216217e-05, + "loss": 0.4272, + "step": 25460 + }, + { + "epoch": 24.01, + "learning_rate": 6.694864864864865e-05, + "loss": 0.3889, + "step": 25470 + }, + { + "epoch": 24.01, + "learning_rate": 6.693513513513515e-05, + "loss": 0.5198, + "step": 25480 + }, + { + "epoch": 24.01, + "learning_rate": 6.692162162162163e-05, + "loss": 0.4122, + "step": 25490 + }, + { + "epoch": 24.01, + "learning_rate": 6.690810810810811e-05, + "loss": 0.6479, + "step": 25500 + }, + { + "epoch": 24.01, + "eval_loss": 0.10787811130285263, + "eval_runtime": 133.7479, + "eval_samples_per_second": 26.976, + "eval_steps_per_second": 3.372, + "eval_wer": 0.11354423892279737, + "step": 25500 + }, + { + "epoch": 24.01, + "learning_rate": 6.689459459459459e-05, + "loss": 0.5095, + "step": 25510 + }, + { + "epoch": 24.01, + "learning_rate": 6.688108108108108e-05, + "loss": 0.6117, + "step": 25520 + }, + { + "epoch": 24.01, + "learning_rate": 6.686756756756757e-05, + "loss": 0.5088, + "step": 25530 + }, + { + "epoch": 24.01, + "learning_rate": 6.685405405405406e-05, + "loss": 0.4522, + "step": 25540 + }, + { + "epoch": 24.01, + "learning_rate": 6.684054054054054e-05, + "loss": 0.4954, + "step": 25550 + }, + { + "epoch": 24.01, + "learning_rate": 6.682702702702704e-05, + "loss": 0.4786, + "step": 25560 + }, + { + "epoch": 24.01, + "learning_rate": 6.681351351351352e-05, + "loss": 0.5247, + "step": 25570 + }, + { + "epoch": 25.0, + "learning_rate": 6.680000000000001e-05, + "loss": 0.5121, + "step": 25580 + }, + { + "epoch": 25.0, + "learning_rate": 6.678648648648649e-05, + "loss": 0.4795, + "step": 25590 + }, + { + "epoch": 25.0, + "learning_rate": 6.677297297297299e-05, + "loss": 0.543, + "step": 25600 + }, + { + "epoch": 25.0, + "learning_rate": 6.675945945945947e-05, + "loss": 0.4424, + "step": 25610 + }, + { + "epoch": 25.0, + "learning_rate": 6.674594594594595e-05, + "loss": 0.4372, + "step": 25620 + }, + { + "epoch": 25.0, + "learning_rate": 6.673243243243243e-05, + "loss": 0.4757, + "step": 25630 + }, + { + "epoch": 25.0, + "learning_rate": 6.671891891891892e-05, + "loss": 0.686, + "step": 25640 + }, + { + "epoch": 25.0, + "learning_rate": 6.67054054054054e-05, + "loss": 0.4259, + "step": 25650 + }, + { + "epoch": 25.0, + "learning_rate": 6.66918918918919e-05, + "loss": 0.425, + "step": 25660 + }, + { + "epoch": 25.0, + "learning_rate": 6.667837837837838e-05, + "loss": 0.4644, + "step": 25670 + }, + { + "epoch": 25.0, + "learning_rate": 6.666486486486488e-05, + "loss": 0.4735, + "step": 25680 + }, + { + "epoch": 25.0, + "learning_rate": 6.665135135135136e-05, + "loss": 0.4552, + "step": 25690 + }, + { + "epoch": 25.0, + "learning_rate": 6.663783783783785e-05, + "loss": 0.304, + "step": 25700 + }, + { + "epoch": 25.0, + "learning_rate": 6.662432432432433e-05, + "loss": 0.2749, + "step": 25710 + }, + { + "epoch": 25.0, + "learning_rate": 6.661081081081081e-05, + "loss": 0.2761, + "step": 25720 + }, + { + "epoch": 25.0, + "learning_rate": 6.65972972972973e-05, + "loss": 0.2698, + "step": 25730 + }, + { + "epoch": 25.0, + "learning_rate": 6.658378378378378e-05, + "loss": 1.0491, + "step": 25740 + }, + { + "epoch": 25.0, + "learning_rate": 6.657027027027027e-05, + "loss": 1.0601, + "step": 25750 + }, + { + "epoch": 25.0, + "learning_rate": 6.655675675675675e-05, + "loss": 2.6915, + "step": 25760 + }, + { + "epoch": 25.0, + "learning_rate": 6.654324324324325e-05, + "loss": 2.4412, + "step": 25770 + }, + { + "epoch": 25.0, + "learning_rate": 6.652972972972973e-05, + "loss": 2.5773, + "step": 25780 + }, + { + "epoch": 25.0, + "learning_rate": 6.651621621621622e-05, + "loss": 2.6003, + "step": 25790 + }, + { + "epoch": 25.0, + "learning_rate": 6.65027027027027e-05, + "loss": 1.3939, + "step": 25800 + }, + { + "epoch": 25.0, + "learning_rate": 6.64891891891892e-05, + "loss": 1.5407, + "step": 25810 + }, + { + "epoch": 25.0, + "learning_rate": 6.647567567567568e-05, + "loss": 0.7416, + "step": 25820 + }, + { + "epoch": 25.0, + "learning_rate": 6.646216216216217e-05, + "loss": 0.2765, + "step": 25830 + }, + { + "epoch": 25.0, + "learning_rate": 6.644864864864865e-05, + "loss": 0.2079, + "step": 25840 + }, + { + "epoch": 25.0, + "learning_rate": 6.643513513513513e-05, + "loss": 0.2551, + "step": 25850 + }, + { + "epoch": 25.0, + "learning_rate": 6.642162162162162e-05, + "loss": 0.3592, + "step": 25860 + }, + { + "epoch": 25.0, + "learning_rate": 6.640810810810811e-05, + "loss": 0.4471, + "step": 25870 + }, + { + "epoch": 25.0, + "learning_rate": 6.639459459459459e-05, + "loss": 0.404, + "step": 25880 + }, + { + "epoch": 25.0, + "learning_rate": 6.638108108108109e-05, + "loss": 0.2541, + "step": 25890 + }, + { + "epoch": 25.0, + "learning_rate": 6.636756756756757e-05, + "loss": 0.1549, + "step": 25900 + }, + { + "epoch": 25.0, + "learning_rate": 6.635405405405406e-05, + "loss": 0.3025, + "step": 25910 + }, + { + "epoch": 25.0, + "learning_rate": 6.634054054054054e-05, + "loss": 0.2617, + "step": 25920 + }, + { + "epoch": 25.0, + "learning_rate": 6.632702702702704e-05, + "loss": 0.281, + "step": 25930 + }, + { + "epoch": 25.0, + "learning_rate": 6.631351351351352e-05, + "loss": 0.282, + "step": 25940 + }, + { + "epoch": 25.0, + "learning_rate": 6.630000000000001e-05, + "loss": 0.2368, + "step": 25950 + }, + { + "epoch": 25.01, + "learning_rate": 6.62864864864865e-05, + "loss": 0.1784, + "step": 25960 + }, + { + "epoch": 25.01, + "learning_rate": 6.627297297297297e-05, + "loss": 0.1247, + "step": 25970 + }, + { + "epoch": 25.01, + "learning_rate": 6.625945945945946e-05, + "loss": 0.2875, + "step": 25980 + }, + { + "epoch": 25.01, + "learning_rate": 6.624594594594595e-05, + "loss": 0.2065, + "step": 25990 + }, + { + "epoch": 25.01, + "learning_rate": 6.623243243243243e-05, + "loss": 0.2319, + "step": 26000 + }, + { + "epoch": 25.01, + "eval_loss": 0.11887121200561523, + "eval_runtime": 128.3334, + "eval_samples_per_second": 28.114, + "eval_steps_per_second": 3.514, + "eval_wer": 0.1151749522433956, + "step": 26000 + }, + { + "epoch": 25.01, + "learning_rate": 6.621891891891893e-05, + "loss": 0.2635, + "step": 26010 + }, + { + "epoch": 25.01, + "learning_rate": 6.62054054054054e-05, + "loss": 0.3368, + "step": 26020 + }, + { + "epoch": 25.01, + "learning_rate": 6.61918918918919e-05, + "loss": 0.246, + "step": 26030 + }, + { + "epoch": 25.01, + "learning_rate": 6.617837837837838e-05, + "loss": 0.3683, + "step": 26040 + }, + { + "epoch": 25.01, + "learning_rate": 6.616486486486488e-05, + "loss": 0.4312, + "step": 26050 + }, + { + "epoch": 25.01, + "learning_rate": 6.615135135135136e-05, + "loss": 0.4236, + "step": 26060 + }, + { + "epoch": 25.01, + "learning_rate": 6.613783783783785e-05, + "loss": 0.4573, + "step": 26070 + }, + { + "epoch": 25.01, + "learning_rate": 6.612432432432433e-05, + "loss": 0.3358, + "step": 26080 + }, + { + "epoch": 25.01, + "learning_rate": 6.611081081081081e-05, + "loss": 0.4104, + "step": 26090 + }, + { + "epoch": 25.01, + "learning_rate": 6.60972972972973e-05, + "loss": 0.6111, + "step": 26100 + }, + { + "epoch": 25.01, + "learning_rate": 6.608378378378378e-05, + "loss": 0.5127, + "step": 26110 + }, + { + "epoch": 25.01, + "learning_rate": 6.607027027027027e-05, + "loss": 0.1661, + "step": 26120 + }, + { + "epoch": 25.01, + "learning_rate": 6.605675675675675e-05, + "loss": 0.2635, + "step": 26130 + }, + { + "epoch": 25.01, + "learning_rate": 6.604324324324325e-05, + "loss": 0.2609, + "step": 26140 + }, + { + "epoch": 25.01, + "learning_rate": 6.602972972972973e-05, + "loss": 0.23, + "step": 26150 + }, + { + "epoch": 25.01, + "learning_rate": 6.601621621621622e-05, + "loss": 0.2208, + "step": 26160 + }, + { + "epoch": 25.01, + "learning_rate": 6.60027027027027e-05, + "loss": 0.1831, + "step": 26170 + }, + { + "epoch": 25.01, + "learning_rate": 6.59891891891892e-05, + "loss": 0.2004, + "step": 26180 + }, + { + "epoch": 25.01, + "learning_rate": 6.597567567567568e-05, + "loss": 0.2372, + "step": 26190 + }, + { + "epoch": 25.01, + "learning_rate": 6.596216216216216e-05, + "loss": 0.4932, + "step": 26200 + }, + { + "epoch": 25.01, + "learning_rate": 6.594864864864864e-05, + "loss": 0.4111, + "step": 26210 + }, + { + "epoch": 25.01, + "learning_rate": 6.593513513513514e-05, + "loss": 0.3578, + "step": 26220 + }, + { + "epoch": 25.01, + "learning_rate": 6.592162162162162e-05, + "loss": 0.3535, + "step": 26230 + }, + { + "epoch": 25.01, + "learning_rate": 6.590810810810811e-05, + "loss": 0.5951, + "step": 26240 + }, + { + "epoch": 25.01, + "learning_rate": 6.589459459459459e-05, + "loss": 0.2822, + "step": 26250 + }, + { + "epoch": 25.01, + "learning_rate": 6.588108108108109e-05, + "loss": 0.235, + "step": 26260 + }, + { + "epoch": 25.01, + "learning_rate": 6.586756756756757e-05, + "loss": 0.3347, + "step": 26270 + }, + { + "epoch": 25.01, + "learning_rate": 6.585405405405406e-05, + "loss": 0.4581, + "step": 26280 + }, + { + "epoch": 25.01, + "learning_rate": 6.584054054054054e-05, + "loss": 0.3922, + "step": 26290 + }, + { + "epoch": 25.01, + "learning_rate": 6.582702702702704e-05, + "loss": 0.3722, + "step": 26300 + }, + { + "epoch": 25.01, + "learning_rate": 6.581351351351352e-05, + "loss": 0.319, + "step": 26310 + }, + { + "epoch": 25.01, + "learning_rate": 6.58e-05, + "loss": 0.3239, + "step": 26320 + }, + { + "epoch": 25.01, + "learning_rate": 6.578648648648648e-05, + "loss": 0.2082, + "step": 26330 + }, + { + "epoch": 25.01, + "learning_rate": 6.577297297297298e-05, + "loss": 0.3064, + "step": 26340 + }, + { + "epoch": 25.01, + "learning_rate": 6.575945945945946e-05, + "loss": 0.1563, + "step": 26350 + }, + { + "epoch": 25.01, + "learning_rate": 6.574594594594595e-05, + "loss": 0.1977, + "step": 26360 + }, + { + "epoch": 25.01, + "learning_rate": 6.573243243243243e-05, + "loss": 0.382, + "step": 26370 + }, + { + "epoch": 25.01, + "learning_rate": 6.571891891891893e-05, + "loss": 0.6592, + "step": 26380 + }, + { + "epoch": 25.01, + "learning_rate": 6.570540540540541e-05, + "loss": 0.201, + "step": 26390 + }, + { + "epoch": 25.01, + "learning_rate": 6.56918918918919e-05, + "loss": 0.2314, + "step": 26400 + }, + { + "epoch": 25.01, + "learning_rate": 6.567837837837838e-05, + "loss": 0.3317, + "step": 26410 + }, + { + "epoch": 25.01, + "learning_rate": 6.566486486486488e-05, + "loss": 0.3089, + "step": 26420 + }, + { + "epoch": 25.01, + "learning_rate": 6.565135135135136e-05, + "loss": 0.3038, + "step": 26430 + }, + { + "epoch": 25.01, + "learning_rate": 6.563783783783784e-05, + "loss": 0.4369, + "step": 26440 + }, + { + "epoch": 25.01, + "learning_rate": 6.562432432432432e-05, + "loss": 0.3454, + "step": 26450 + }, + { + "epoch": 25.01, + "learning_rate": 6.561081081081082e-05, + "loss": 0.2374, + "step": 26460 + }, + { + "epoch": 25.01, + "learning_rate": 6.55972972972973e-05, + "loss": 0.3895, + "step": 26470 + }, + { + "epoch": 25.01, + "learning_rate": 6.558378378378379e-05, + "loss": 0.3773, + "step": 26480 + }, + { + "epoch": 25.01, + "learning_rate": 6.557027027027027e-05, + "loss": 0.409, + "step": 26490 + }, + { + "epoch": 25.01, + "learning_rate": 6.555675675675677e-05, + "loss": 0.4571, + "step": 26500 + }, + { + "epoch": 25.01, + "eval_loss": 0.10201442986726761, + "eval_runtime": 143.0008, + "eval_samples_per_second": 25.231, + "eval_steps_per_second": 3.154, + "eval_wer": 0.10809299725108326, + "step": 26500 + }, + { + "epoch": 25.01, + "learning_rate": 6.554324324324325e-05, + "loss": 0.4082, + "step": 26510 + }, + { + "epoch": 25.01, + "learning_rate": 6.552972972972973e-05, + "loss": 0.6082, + "step": 26520 + }, + { + "epoch": 25.01, + "learning_rate": 6.551621621621622e-05, + "loss": 0.4122, + "step": 26530 + }, + { + "epoch": 25.01, + "learning_rate": 6.55027027027027e-05, + "loss": 0.5685, + "step": 26540 + }, + { + "epoch": 25.01, + "learning_rate": 6.54891891891892e-05, + "loss": 0.5386, + "step": 26550 + }, + { + "epoch": 25.01, + "learning_rate": 6.547567567567568e-05, + "loss": 0.4089, + "step": 26560 + }, + { + "epoch": 25.01, + "learning_rate": 6.546216216216216e-05, + "loss": 0.455, + "step": 26570 + }, + { + "epoch": 25.01, + "learning_rate": 6.544864864864864e-05, + "loss": 0.5013, + "step": 26580 + }, + { + "epoch": 25.01, + "learning_rate": 6.543513513513514e-05, + "loss": 0.4749, + "step": 26590 + }, + { + "epoch": 26.0, + "learning_rate": 6.542162162162162e-05, + "loss": 0.6608, + "step": 26600 + }, + { + "epoch": 26.0, + "learning_rate": 6.540810810810811e-05, + "loss": 0.4651, + "step": 26610 + }, + { + "epoch": 26.0, + "learning_rate": 6.53945945945946e-05, + "loss": 0.4847, + "step": 26620 + }, + { + "epoch": 26.0, + "learning_rate": 6.538108108108109e-05, + "loss": 0.4908, + "step": 26630 + }, + { + "epoch": 26.0, + "learning_rate": 6.536756756756757e-05, + "loss": 0.4085, + "step": 26640 + }, + { + "epoch": 26.0, + "learning_rate": 6.535405405405406e-05, + "loss": 0.4714, + "step": 26650 + }, + { + "epoch": 26.0, + "learning_rate": 6.534054054054054e-05, + "loss": 0.5146, + "step": 26660 + }, + { + "epoch": 26.0, + "learning_rate": 6.532702702702703e-05, + "loss": 0.5939, + "step": 26670 + }, + { + "epoch": 26.0, + "learning_rate": 6.531351351351351e-05, + "loss": 0.434, + "step": 26680 + }, + { + "epoch": 26.0, + "learning_rate": 6.53e-05, + "loss": 0.4717, + "step": 26690 + }, + { + "epoch": 26.0, + "learning_rate": 6.528648648648648e-05, + "loss": 0.4338, + "step": 26700 + }, + { + "epoch": 26.0, + "learning_rate": 6.527297297297298e-05, + "loss": 0.448, + "step": 26710 + }, + { + "epoch": 26.0, + "learning_rate": 6.525945945945946e-05, + "loss": 0.3657, + "step": 26720 + }, + { + "epoch": 26.0, + "learning_rate": 6.524594594594595e-05, + "loss": 0.2764, + "step": 26730 + }, + { + "epoch": 26.0, + "learning_rate": 6.523243243243243e-05, + "loss": 0.2752, + "step": 26740 + }, + { + "epoch": 26.0, + "learning_rate": 6.521891891891893e-05, + "loss": 0.316, + "step": 26750 + }, + { + "epoch": 26.0, + "learning_rate": 6.520540540540541e-05, + "loss": 0.7303, + "step": 26760 + }, + { + "epoch": 26.0, + "learning_rate": 6.51918918918919e-05, + "loss": 0.9961, + "step": 26770 + }, + { + "epoch": 26.0, + "learning_rate": 6.517837837837839e-05, + "loss": 2.2981, + "step": 26780 + }, + { + "epoch": 26.0, + "learning_rate": 6.516486486486487e-05, + "loss": 2.558, + "step": 26790 + }, + { + "epoch": 26.0, + "learning_rate": 6.515135135135135e-05, + "loss": 2.4918, + "step": 26800 + }, + { + "epoch": 26.0, + "learning_rate": 6.513783783783784e-05, + "loss": 2.5737, + "step": 26810 + }, + { + "epoch": 26.0, + "learning_rate": 6.512432432432432e-05, + "loss": 1.7573, + "step": 26820 + }, + { + "epoch": 26.0, + "learning_rate": 6.511081081081082e-05, + "loss": 1.5662, + "step": 26830 + }, + { + "epoch": 26.0, + "learning_rate": 6.50972972972973e-05, + "loss": 0.932, + "step": 26840 + }, + { + "epoch": 26.0, + "learning_rate": 6.508378378378379e-05, + "loss": 0.4356, + "step": 26850 + }, + { + "epoch": 26.0, + "learning_rate": 6.507027027027027e-05, + "loss": 0.139, + "step": 26860 + }, + { + "epoch": 26.0, + "learning_rate": 6.505675675675677e-05, + "loss": 0.297, + "step": 26870 + }, + { + "epoch": 26.0, + "learning_rate": 6.504324324324325e-05, + "loss": 0.2592, + "step": 26880 + }, + { + "epoch": 26.0, + "learning_rate": 6.502972972972974e-05, + "loss": 0.294, + "step": 26890 + }, + { + "epoch": 26.0, + "learning_rate": 6.501621621621623e-05, + "loss": 0.4733, + "step": 26900 + }, + { + "epoch": 26.0, + "learning_rate": 6.50027027027027e-05, + "loss": 0.2726, + "step": 26910 + }, + { + "epoch": 26.0, + "learning_rate": 6.498918918918919e-05, + "loss": 0.1882, + "step": 26920 + }, + { + "epoch": 26.0, + "learning_rate": 6.497567567567567e-05, + "loss": 0.297, + "step": 26930 + }, + { + "epoch": 26.0, + "learning_rate": 6.496216216216216e-05, + "loss": 0.2417, + "step": 26940 + }, + { + "epoch": 26.0, + "learning_rate": 6.494864864864864e-05, + "loss": 0.3114, + "step": 26950 + }, + { + "epoch": 26.0, + "learning_rate": 6.493513513513514e-05, + "loss": 0.31, + "step": 26960 + }, + { + "epoch": 26.0, + "learning_rate": 6.492162162162162e-05, + "loss": 0.2601, + "step": 26970 + }, + { + "epoch": 26.01, + "learning_rate": 6.490810810810811e-05, + "loss": 0.1956, + "step": 26980 + }, + { + "epoch": 26.01, + "learning_rate": 6.48945945945946e-05, + "loss": 0.152, + "step": 26990 + }, + { + "epoch": 26.01, + "learning_rate": 6.488108108108109e-05, + "loss": 0.2397, + "step": 27000 + }, + { + "epoch": 26.01, + "eval_loss": 0.11449452489614487, + "eval_runtime": 129.7322, + "eval_samples_per_second": 27.811, + "eval_steps_per_second": 3.476, + "eval_wer": 0.11289195359455807, + "step": 27000 + }, + { + "epoch": 26.01, + "learning_rate": 6.486756756756757e-05, + "loss": 0.2281, + "step": 27010 + }, + { + "epoch": 26.01, + "learning_rate": 6.485405405405407e-05, + "loss": 0.1428, + "step": 27020 + }, + { + "epoch": 26.01, + "learning_rate": 6.484054054054055e-05, + "loss": 0.2407, + "step": 27030 + }, + { + "epoch": 26.01, + "learning_rate": 6.482702702702703e-05, + "loss": 0.3904, + "step": 27040 + }, + { + "epoch": 26.01, + "learning_rate": 6.481351351351351e-05, + "loss": 0.2565, + "step": 27050 + }, + { + "epoch": 26.01, + "learning_rate": 6.48e-05, + "loss": 0.3409, + "step": 27060 + }, + { + "epoch": 26.01, + "learning_rate": 6.478648648648648e-05, + "loss": 0.3777, + "step": 27070 + }, + { + "epoch": 26.01, + "learning_rate": 6.477297297297298e-05, + "loss": 0.3204, + "step": 27080 + }, + { + "epoch": 26.01, + "learning_rate": 6.475945945945946e-05, + "loss": 0.4675, + "step": 27090 + }, + { + "epoch": 26.01, + "learning_rate": 6.474594594594595e-05, + "loss": 0.3226, + "step": 27100 + }, + { + "epoch": 26.01, + "learning_rate": 6.473243243243244e-05, + "loss": 0.3444, + "step": 27110 + }, + { + "epoch": 26.01, + "learning_rate": 6.471891891891893e-05, + "loss": 0.7034, + "step": 27120 + }, + { + "epoch": 26.01, + "learning_rate": 6.470540540540541e-05, + "loss": 0.5647, + "step": 27130 + }, + { + "epoch": 26.01, + "learning_rate": 6.469189189189189e-05, + "loss": 0.2329, + "step": 27140 + }, + { + "epoch": 26.01, + "learning_rate": 6.467837837837837e-05, + "loss": 0.1768, + "step": 27150 + }, + { + "epoch": 26.01, + "learning_rate": 6.466486486486487e-05, + "loss": 0.2971, + "step": 27160 + }, + { + "epoch": 26.01, + "learning_rate": 6.465135135135135e-05, + "loss": 0.1993, + "step": 27170 + }, + { + "epoch": 26.01, + "learning_rate": 6.463783783783784e-05, + "loss": 0.2255, + "step": 27180 + }, + { + "epoch": 26.01, + "learning_rate": 6.462432432432432e-05, + "loss": 0.2244, + "step": 27190 + }, + { + "epoch": 26.01, + "learning_rate": 6.461081081081082e-05, + "loss": 0.1772, + "step": 27200 + }, + { + "epoch": 26.01, + "learning_rate": 6.45972972972973e-05, + "loss": 0.1977, + "step": 27210 + }, + { + "epoch": 26.01, + "learning_rate": 6.45837837837838e-05, + "loss": 0.439, + "step": 27220 + }, + { + "epoch": 26.01, + "learning_rate": 6.457027027027028e-05, + "loss": 0.4024, + "step": 27230 + }, + { + "epoch": 26.01, + "learning_rate": 6.455675675675677e-05, + "loss": 0.3872, + "step": 27240 + }, + { + "epoch": 26.01, + "learning_rate": 6.454324324324325e-05, + "loss": 0.3882, + "step": 27250 + }, + { + "epoch": 26.01, + "learning_rate": 6.452972972972973e-05, + "loss": 0.5401, + "step": 27260 + }, + { + "epoch": 26.01, + "learning_rate": 6.451621621621621e-05, + "loss": 0.3393, + "step": 27270 + }, + { + "epoch": 26.01, + "learning_rate": 6.450270270270271e-05, + "loss": 0.2566, + "step": 27280 + }, + { + "epoch": 26.01, + "learning_rate": 6.448918918918919e-05, + "loss": 0.2679, + "step": 27290 + }, + { + "epoch": 26.01, + "learning_rate": 6.447567567567568e-05, + "loss": 0.3746, + "step": 27300 + }, + { + "epoch": 26.01, + "learning_rate": 6.446216216216216e-05, + "loss": 0.4116, + "step": 27310 + }, + { + "epoch": 26.01, + "learning_rate": 6.444864864864865e-05, + "loss": 0.3575, + "step": 27320 + }, + { + "epoch": 26.01, + "learning_rate": 6.443513513513514e-05, + "loss": 0.3237, + "step": 27330 + }, + { + "epoch": 26.01, + "learning_rate": 6.442162162162162e-05, + "loss": 0.3988, + "step": 27340 + }, + { + "epoch": 26.01, + "learning_rate": 6.440810810810812e-05, + "loss": 0.2846, + "step": 27350 + }, + { + "epoch": 26.01, + "learning_rate": 6.43945945945946e-05, + "loss": 0.2565, + "step": 27360 + }, + { + "epoch": 26.01, + "learning_rate": 6.438108108108109e-05, + "loss": 0.1881, + "step": 27370 + }, + { + "epoch": 26.01, + "learning_rate": 6.436756756756757e-05, + "loss": 0.1531, + "step": 27380 + }, + { + "epoch": 26.01, + "learning_rate": 6.435405405405405e-05, + "loss": 0.2613, + "step": 27390 + }, + { + "epoch": 26.01, + "learning_rate": 6.434054054054053e-05, + "loss": 0.6908, + "step": 27400 + }, + { + "epoch": 26.01, + "learning_rate": 6.432702702702703e-05, + "loss": 0.2543, + "step": 27410 + }, + { + "epoch": 26.01, + "learning_rate": 6.431351351351351e-05, + "loss": 0.2082, + "step": 27420 + }, + { + "epoch": 26.01, + "learning_rate": 6.43e-05, + "loss": 0.33, + "step": 27430 + }, + { + "epoch": 26.01, + "learning_rate": 6.428648648648649e-05, + "loss": 0.2553, + "step": 27440 + }, + { + "epoch": 26.01, + "learning_rate": 6.427297297297298e-05, + "loss": 0.2999, + "step": 27450 + }, + { + "epoch": 26.01, + "learning_rate": 6.425945945945946e-05, + "loss": 0.4085, + "step": 27460 + }, + { + "epoch": 26.01, + "learning_rate": 6.424594594594596e-05, + "loss": 0.3914, + "step": 27470 + }, + { + "epoch": 26.01, + "learning_rate": 6.423243243243244e-05, + "loss": 0.2441, + "step": 27480 + }, + { + "epoch": 26.01, + "learning_rate": 6.421891891891892e-05, + "loss": 0.3549, + "step": 27490 + }, + { + "epoch": 26.01, + "learning_rate": 6.420540540540541e-05, + "loss": 0.2694, + "step": 27500 + }, + { + "epoch": 26.01, + "eval_loss": 0.10637255758047104, + "eval_runtime": 128.9083, + "eval_samples_per_second": 27.989, + "eval_steps_per_second": 3.499, + "eval_wer": 0.10497134603736663, + "step": 27500 + }, + { + "epoch": 26.01, + "learning_rate": 6.41918918918919e-05, + "loss": 0.5209, + "step": 27510 + }, + { + "epoch": 26.01, + "learning_rate": 6.417837837837837e-05, + "loss": 0.4668, + "step": 27520 + }, + { + "epoch": 26.01, + "learning_rate": 6.416486486486487e-05, + "loss": 0.3629, + "step": 27530 + }, + { + "epoch": 26.01, + "learning_rate": 6.415135135135135e-05, + "loss": 0.5479, + "step": 27540 + }, + { + "epoch": 26.01, + "learning_rate": 6.413783783783784e-05, + "loss": 0.493, + "step": 27550 + }, + { + "epoch": 26.01, + "learning_rate": 6.412432432432433e-05, + "loss": 0.5472, + "step": 27560 + }, + { + "epoch": 26.01, + "learning_rate": 6.411081081081082e-05, + "loss": 0.5803, + "step": 27570 + }, + { + "epoch": 26.01, + "learning_rate": 6.40972972972973e-05, + "loss": 0.4331, + "step": 27580 + }, + { + "epoch": 26.01, + "learning_rate": 6.40837837837838e-05, + "loss": 0.4689, + "step": 27590 + }, + { + "epoch": 26.01, + "learning_rate": 6.407027027027028e-05, + "loss": 0.4274, + "step": 27600 + }, + { + "epoch": 26.01, + "learning_rate": 6.405675675675676e-05, + "loss": 0.4069, + "step": 27610 + }, + { + "epoch": 26.01, + "learning_rate": 6.40445945945946e-05, + "loss": 0.6467, + "step": 27620 + }, + { + "epoch": 27.0, + "learning_rate": 6.403108108108108e-05, + "loss": 0.4593, + "step": 27630 + }, + { + "epoch": 27.0, + "learning_rate": 6.401756756756758e-05, + "loss": 0.4659, + "step": 27640 + }, + { + "epoch": 27.0, + "learning_rate": 6.400405405405406e-05, + "loss": 0.5027, + "step": 27650 + }, + { + "epoch": 27.0, + "learning_rate": 6.399054054054054e-05, + "loss": 0.3915, + "step": 27660 + }, + { + "epoch": 27.0, + "learning_rate": 6.397702702702702e-05, + "loss": 0.4261, + "step": 27670 + }, + { + "epoch": 27.0, + "learning_rate": 6.396351351351351e-05, + "loss": 0.4431, + "step": 27680 + }, + { + "epoch": 27.0, + "learning_rate": 6.395e-05, + "loss": 0.6415, + "step": 27690 + }, + { + "epoch": 27.0, + "learning_rate": 6.393648648648649e-05, + "loss": 0.4363, + "step": 27700 + }, + { + "epoch": 27.0, + "learning_rate": 6.392297297297297e-05, + "loss": 0.4611, + "step": 27710 + }, + { + "epoch": 27.0, + "learning_rate": 6.390945945945947e-05, + "loss": 0.509, + "step": 27720 + }, + { + "epoch": 27.0, + "learning_rate": 6.389594594594595e-05, + "loss": 0.4291, + "step": 27730 + }, + { + "epoch": 27.0, + "learning_rate": 6.388243243243244e-05, + "loss": 0.384, + "step": 27740 + }, + { + "epoch": 27.0, + "learning_rate": 6.386891891891892e-05, + "loss": 0.3118, + "step": 27750 + }, + { + "epoch": 27.0, + "learning_rate": 6.385540540540542e-05, + "loss": 0.2786, + "step": 27760 + }, + { + "epoch": 27.0, + "learning_rate": 6.38418918918919e-05, + "loss": 0.2865, + "step": 27770 + }, + { + "epoch": 27.0, + "learning_rate": 6.382837837837838e-05, + "loss": 0.3352, + "step": 27780 + }, + { + "epoch": 27.0, + "learning_rate": 6.381486486486486e-05, + "loss": 1.246, + "step": 27790 + }, + { + "epoch": 27.0, + "learning_rate": 6.380135135135135e-05, + "loss": 1.6831, + "step": 27800 + }, + { + "epoch": 27.0, + "learning_rate": 6.378783783783784e-05, + "loss": 2.6091, + "step": 27810 + }, + { + "epoch": 27.0, + "learning_rate": 6.377432432432433e-05, + "loss": 2.4371, + "step": 27820 + }, + { + "epoch": 27.0, + "learning_rate": 6.376081081081081e-05, + "loss": 2.5782, + "step": 27830 + }, + { + "epoch": 27.0, + "learning_rate": 6.37472972972973e-05, + "loss": 2.1281, + "step": 27840 + }, + { + "epoch": 27.0, + "learning_rate": 6.373378378378379e-05, + "loss": 1.5139, + "step": 27850 + }, + { + "epoch": 27.0, + "learning_rate": 6.372027027027028e-05, + "loss": 1.2191, + "step": 27860 + }, + { + "epoch": 27.0, + "learning_rate": 6.370675675675676e-05, + "loss": 0.5481, + "step": 27870 + }, + { + "epoch": 27.0, + "learning_rate": 6.369324324324324e-05, + "loss": 0.1666, + "step": 27880 + }, + { + "epoch": 27.0, + "learning_rate": 6.367972972972972e-05, + "loss": 0.2833, + "step": 27890 + }, + { + "epoch": 27.0, + "learning_rate": 6.366621621621622e-05, + "loss": 0.2291, + "step": 27900 + }, + { + "epoch": 27.0, + "learning_rate": 6.36527027027027e-05, + "loss": 0.3398, + "step": 27910 + }, + { + "epoch": 27.0, + "learning_rate": 6.36391891891892e-05, + "loss": 0.4497, + "step": 27920 + }, + { + "epoch": 27.0, + "learning_rate": 6.362567567567568e-05, + "loss": 0.3535, + "step": 27930 + }, + { + "epoch": 27.0, + "learning_rate": 6.361216216216217e-05, + "loss": 0.1776, + "step": 27940 + }, + { + "epoch": 27.0, + "learning_rate": 6.359864864864865e-05, + "loss": 0.2457, + "step": 27950 + }, + { + "epoch": 27.0, + "learning_rate": 6.358513513513515e-05, + "loss": 0.2335, + "step": 27960 + }, + { + "epoch": 27.0, + "learning_rate": 6.357162162162163e-05, + "loss": 0.2547, + "step": 27970 + }, + { + "epoch": 27.0, + "learning_rate": 6.355810810810812e-05, + "loss": 0.2877, + "step": 27980 + }, + { + "epoch": 27.0, + "learning_rate": 6.35445945945946e-05, + "loss": 0.2373, + "step": 27990 + }, + { + "epoch": 27.01, + "learning_rate": 6.353108108108108e-05, + "loss": 0.2274, + "step": 28000 + }, + { + "epoch": 27.01, + "eval_loss": 0.11035533994436264, + "eval_runtime": 131.9625, + "eval_samples_per_second": 27.341, + "eval_steps_per_second": 3.418, + "eval_wer": 0.10720775287704422, + "step": 28000 + }, + { + "epoch": 27.01, + "learning_rate": 6.351756756756757e-05, + "loss": 0.1297, + "step": 28010 + }, + { + "epoch": 27.01, + "learning_rate": 6.350405405405405e-05, + "loss": 0.1524, + "step": 28020 + }, + { + "epoch": 27.01, + "learning_rate": 6.349054054054054e-05, + "loss": 0.2742, + "step": 28030 + }, + { + "epoch": 27.01, + "learning_rate": 6.347702702702702e-05, + "loss": 0.1543, + "step": 28040 + }, + { + "epoch": 27.01, + "learning_rate": 6.346351351351352e-05, + "loss": 0.2272, + "step": 28050 + }, + { + "epoch": 27.01, + "learning_rate": 6.345e-05, + "loss": 0.3361, + "step": 28060 + }, + { + "epoch": 27.01, + "learning_rate": 6.343648648648649e-05, + "loss": 0.313, + "step": 28070 + }, + { + "epoch": 27.01, + "learning_rate": 6.342297297297297e-05, + "loss": 0.2662, + "step": 28080 + }, + { + "epoch": 27.01, + "learning_rate": 6.340945945945947e-05, + "loss": 0.4196, + "step": 28090 + }, + { + "epoch": 27.01, + "learning_rate": 6.339594594594595e-05, + "loss": 0.3632, + "step": 28100 + }, + { + "epoch": 27.01, + "learning_rate": 6.338243243243244e-05, + "loss": 0.4099, + "step": 28110 + }, + { + "epoch": 27.01, + "learning_rate": 6.336891891891892e-05, + "loss": 0.4414, + "step": 28120 + }, + { + "epoch": 27.01, + "learning_rate": 6.33554054054054e-05, + "loss": 0.2717, + "step": 28130 + }, + { + "epoch": 27.01, + "learning_rate": 6.334189189189189e-05, + "loss": 0.4952, + "step": 28140 + }, + { + "epoch": 27.01, + "learning_rate": 6.332837837837838e-05, + "loss": 0.6076, + "step": 28150 + }, + { + "epoch": 27.01, + "learning_rate": 6.331486486486486e-05, + "loss": 0.3146, + "step": 28160 + }, + { + "epoch": 27.01, + "learning_rate": 6.330135135135136e-05, + "loss": 0.1568, + "step": 28170 + }, + { + "epoch": 27.01, + "learning_rate": 6.328783783783784e-05, + "loss": 0.2925, + "step": 28180 + }, + { + "epoch": 27.01, + "learning_rate": 6.327432432432433e-05, + "loss": 0.2037, + "step": 28190 + }, + { + "epoch": 27.01, + "learning_rate": 6.326081081081081e-05, + "loss": 0.2446, + "step": 28200 + }, + { + "epoch": 27.01, + "learning_rate": 6.324729729729731e-05, + "loss": 0.1969, + "step": 28210 + }, + { + "epoch": 27.01, + "learning_rate": 6.323378378378379e-05, + "loss": 0.1704, + "step": 28220 + }, + { + "epoch": 27.01, + "learning_rate": 6.322027027027028e-05, + "loss": 0.1673, + "step": 28230 + }, + { + "epoch": 27.01, + "learning_rate": 6.320675675675676e-05, + "loss": 0.3861, + "step": 28240 + }, + { + "epoch": 27.01, + "learning_rate": 6.319324324324325e-05, + "loss": 0.4354, + "step": 28250 + }, + { + "epoch": 27.01, + "learning_rate": 6.317972972972973e-05, + "loss": 0.345, + "step": 28260 + }, + { + "epoch": 27.01, + "learning_rate": 6.316621621621622e-05, + "loss": 0.3035, + "step": 28270 + }, + { + "epoch": 27.01, + "learning_rate": 6.31527027027027e-05, + "loss": 0.4296, + "step": 28280 + }, + { + "epoch": 27.01, + "learning_rate": 6.31391891891892e-05, + "loss": 0.4021, + "step": 28290 + }, + { + "epoch": 27.01, + "learning_rate": 6.312567567567568e-05, + "loss": 0.2103, + "step": 28300 + }, + { + "epoch": 27.01, + "learning_rate": 6.311216216216217e-05, + "loss": 0.2332, + "step": 28310 + }, + { + "epoch": 27.01, + "learning_rate": 6.309864864864865e-05, + "loss": 0.2813, + "step": 28320 + }, + { + "epoch": 27.01, + "learning_rate": 6.308513513513515e-05, + "loss": 0.3966, + "step": 28330 + }, + { + "epoch": 27.01, + "learning_rate": 6.307162162162163e-05, + "loss": 0.4454, + "step": 28340 + }, + { + "epoch": 27.01, + "learning_rate": 6.305810810810811e-05, + "loss": 0.257, + "step": 28350 + }, + { + "epoch": 27.01, + "learning_rate": 6.304459459459459e-05, + "loss": 0.2786, + "step": 28360 + }, + { + "epoch": 27.01, + "learning_rate": 6.303108108108109e-05, + "loss": 0.2467, + "step": 28370 + }, + { + "epoch": 27.01, + "learning_rate": 6.301756756756757e-05, + "loss": 0.2773, + "step": 28380 + }, + { + "epoch": 27.01, + "learning_rate": 6.300405405405406e-05, + "loss": 0.2775, + "step": 28390 + }, + { + "epoch": 27.01, + "learning_rate": 6.299054054054054e-05, + "loss": 0.143, + "step": 28400 + }, + { + "epoch": 27.01, + "learning_rate": 6.297702702702702e-05, + "loss": 0.2952, + "step": 28410 + }, + { + "epoch": 27.01, + "learning_rate": 6.296351351351352e-05, + "loss": 0.4869, + "step": 28420 + }, + { + "epoch": 27.01, + "learning_rate": 6.295e-05, + "loss": 0.453, + "step": 28430 + }, + { + "epoch": 27.01, + "learning_rate": 6.29364864864865e-05, + "loss": 0.1887, + "step": 28440 + }, + { + "epoch": 27.01, + "learning_rate": 6.292297297297297e-05, + "loss": 0.2707, + "step": 28450 + }, + { + "epoch": 27.01, + "learning_rate": 6.290945945945947e-05, + "loss": 0.3032, + "step": 28460 + }, + { + "epoch": 27.01, + "learning_rate": 6.289594594594595e-05, + "loss": 0.28, + "step": 28470 + }, + { + "epoch": 27.01, + "learning_rate": 6.288243243243243e-05, + "loss": 0.3168, + "step": 28480 + }, + { + "epoch": 27.01, + "learning_rate": 6.286891891891891e-05, + "loss": 0.412, + "step": 28490 + }, + { + "epoch": 27.01, + "learning_rate": 6.28554054054054e-05, + "loss": 0.2474, + "step": 28500 + }, + { + "epoch": 27.01, + "eval_loss": 0.09908636659383774, + "eval_runtime": 129.9354, + "eval_samples_per_second": 27.768, + "eval_steps_per_second": 3.471, + "eval_wer": 0.10292130643432884, + "step": 28500 + }, + { + "epoch": 27.01, + "learning_rate": 6.284189189189189e-05, + "loss": 0.3053, + "step": 28510 + }, + { + "epoch": 27.01, + "learning_rate": 6.282837837837838e-05, + "loss": 0.3105, + "step": 28520 + }, + { + "epoch": 27.01, + "learning_rate": 6.281486486486486e-05, + "loss": 0.4599, + "step": 28530 + }, + { + "epoch": 27.01, + "learning_rate": 6.280135135135136e-05, + "loss": 0.3789, + "step": 28540 + }, + { + "epoch": 27.01, + "learning_rate": 6.278783783783784e-05, + "loss": 0.4459, + "step": 28550 + }, + { + "epoch": 27.01, + "learning_rate": 6.277432432432433e-05, + "loss": 0.3739, + "step": 28560 + }, + { + "epoch": 27.01, + "learning_rate": 6.276081081081081e-05, + "loss": 0.5088, + "step": 28570 + }, + { + "epoch": 27.01, + "learning_rate": 6.274729729729731e-05, + "loss": 0.4492, + "step": 28580 + }, + { + "epoch": 27.01, + "learning_rate": 6.273378378378379e-05, + "loss": 0.5886, + "step": 28590 + }, + { + "epoch": 27.01, + "learning_rate": 6.272027027027027e-05, + "loss": 0.4498, + "step": 28600 + }, + { + "epoch": 27.01, + "learning_rate": 6.270675675675675e-05, + "loss": 0.4667, + "step": 28610 + }, + { + "epoch": 27.01, + "learning_rate": 6.269324324324325e-05, + "loss": 0.3937, + "step": 28620 + }, + { + "epoch": 27.01, + "learning_rate": 6.267972972972973e-05, + "loss": 0.4058, + "step": 28630 + }, + { + "epoch": 27.01, + "learning_rate": 6.266621621621622e-05, + "loss": 0.504, + "step": 28640 + }, + { + "epoch": 28.0, + "learning_rate": 6.26527027027027e-05, + "loss": 0.538, + "step": 28650 + }, + { + "epoch": 28.0, + "learning_rate": 6.26391891891892e-05, + "loss": 0.4586, + "step": 28660 + }, + { + "epoch": 28.0, + "learning_rate": 6.262567567567568e-05, + "loss": 0.48, + "step": 28670 + }, + { + "epoch": 28.0, + "learning_rate": 6.261216216216217e-05, + "loss": 0.4229, + "step": 28680 + }, + { + "epoch": 28.0, + "learning_rate": 6.259864864864865e-05, + "loss": 0.4251, + "step": 28690 + }, + { + "epoch": 28.0, + "learning_rate": 6.258513513513514e-05, + "loss": 0.4264, + "step": 28700 + }, + { + "epoch": 28.0, + "learning_rate": 6.257162162162162e-05, + "loss": 0.6254, + "step": 28710 + }, + { + "epoch": 28.0, + "learning_rate": 6.255810810810811e-05, + "loss": 0.4382, + "step": 28720 + }, + { + "epoch": 28.0, + "learning_rate": 6.254459459459459e-05, + "loss": 0.3957, + "step": 28730 + }, + { + "epoch": 28.0, + "learning_rate": 6.253108108108109e-05, + "loss": 0.4558, + "step": 28740 + }, + { + "epoch": 28.0, + "learning_rate": 6.251756756756757e-05, + "loss": 0.413, + "step": 28750 + }, + { + "epoch": 28.0, + "learning_rate": 6.250405405405406e-05, + "loss": 0.4479, + "step": 28760 + }, + { + "epoch": 28.0, + "learning_rate": 6.249054054054054e-05, + "loss": 0.3068, + "step": 28770 + }, + { + "epoch": 28.0, + "learning_rate": 6.247702702702704e-05, + "loss": 0.2582, + "step": 28780 + }, + { + "epoch": 28.0, + "learning_rate": 6.246351351351352e-05, + "loss": 0.2507, + "step": 28790 + }, + { + "epoch": 28.0, + "learning_rate": 6.245000000000001e-05, + "loss": 0.2775, + "step": 28800 + }, + { + "epoch": 28.0, + "learning_rate": 6.24364864864865e-05, + "loss": 1.1265, + "step": 28810 + }, + { + "epoch": 28.0, + "learning_rate": 6.242297297297298e-05, + "loss": 1.1831, + "step": 28820 + }, + { + "epoch": 28.0, + "learning_rate": 6.240945945945946e-05, + "loss": 2.5897, + "step": 28830 + }, + { + "epoch": 28.0, + "learning_rate": 6.239594594594594e-05, + "loss": 2.4395, + "step": 28840 + }, + { + "epoch": 28.0, + "learning_rate": 6.238243243243243e-05, + "loss": 2.5735, + "step": 28850 + }, + { + "epoch": 28.0, + "learning_rate": 6.236891891891891e-05, + "loss": 2.4496, + "step": 28860 + }, + { + "epoch": 28.0, + "learning_rate": 6.235540540540541e-05, + "loss": 1.3853, + "step": 28870 + }, + { + "epoch": 28.0, + "learning_rate": 6.234189189189189e-05, + "loss": 1.4816, + "step": 28880 + }, + { + "epoch": 28.0, + "learning_rate": 6.232837837837838e-05, + "loss": 0.6655, + "step": 28890 + }, + { + "epoch": 28.0, + "learning_rate": 6.231486486486486e-05, + "loss": 0.2246, + "step": 28900 + }, + { + "epoch": 28.0, + "learning_rate": 6.230135135135136e-05, + "loss": 0.2228, + "step": 28910 + }, + { + "epoch": 28.0, + "learning_rate": 6.228783783783784e-05, + "loss": 0.2247, + "step": 28920 + }, + { + "epoch": 28.0, + "learning_rate": 6.227432432432433e-05, + "loss": 0.3481, + "step": 28930 + }, + { + "epoch": 28.0, + "learning_rate": 6.226081081081082e-05, + "loss": 0.3752, + "step": 28940 + }, + { + "epoch": 28.0, + "learning_rate": 6.22472972972973e-05, + "loss": 0.3932, + "step": 28950 + }, + { + "epoch": 28.0, + "learning_rate": 6.223378378378378e-05, + "loss": 0.2111, + "step": 28960 + }, + { + "epoch": 28.0, + "learning_rate": 6.222027027027027e-05, + "loss": 0.186, + "step": 28970 + }, + { + "epoch": 28.0, + "learning_rate": 6.220675675675675e-05, + "loss": 0.2458, + "step": 28980 + }, + { + "epoch": 28.0, + "learning_rate": 6.219324324324325e-05, + "loss": 0.1946, + "step": 28990 + }, + { + "epoch": 28.0, + "learning_rate": 6.217972972972973e-05, + "loss": 0.31, + "step": 29000 + }, + { + "epoch": 28.0, + "eval_loss": 0.11357536166906357, + "eval_runtime": 131.7798, + "eval_samples_per_second": 27.379, + "eval_steps_per_second": 3.422, + "eval_wer": 0.10702138564040442, + "step": 29000 + }, + { + "epoch": 28.0, + "learning_rate": 6.216621621621622e-05, + "loss": 0.2557, + "step": 29010 + }, + { + "epoch": 28.01, + "learning_rate": 6.21527027027027e-05, + "loss": 0.2359, + "step": 29020 + }, + { + "epoch": 28.01, + "learning_rate": 6.21391891891892e-05, + "loss": 0.1537, + "step": 29030 + }, + { + "epoch": 28.01, + "learning_rate": 6.212567567567568e-05, + "loss": 0.1369, + "step": 29040 + }, + { + "epoch": 28.01, + "learning_rate": 6.211216216216217e-05, + "loss": 0.2206, + "step": 29050 + }, + { + "epoch": 28.01, + "learning_rate": 6.209864864864866e-05, + "loss": 0.2053, + "step": 29060 + }, + { + "epoch": 28.01, + "learning_rate": 6.208513513513514e-05, + "loss": 0.1911, + "step": 29070 + }, + { + "epoch": 28.01, + "learning_rate": 6.207162162162162e-05, + "loss": 0.303, + "step": 29080 + }, + { + "epoch": 28.01, + "learning_rate": 6.205810810810811e-05, + "loss": 0.3322, + "step": 29090 + }, + { + "epoch": 28.01, + "learning_rate": 6.20445945945946e-05, + "loss": 0.2421, + "step": 29100 + }, + { + "epoch": 28.01, + "learning_rate": 6.203108108108109e-05, + "loss": 0.2992, + "step": 29110 + }, + { + "epoch": 28.01, + "learning_rate": 6.201756756756757e-05, + "loss": 0.3347, + "step": 29120 + }, + { + "epoch": 28.01, + "learning_rate": 6.200405405405406e-05, + "loss": 0.3481, + "step": 29130 + }, + { + "epoch": 28.01, + "learning_rate": 6.199054054054054e-05, + "loss": 0.3711, + "step": 29140 + }, + { + "epoch": 28.01, + "learning_rate": 6.197702702702704e-05, + "loss": 0.2789, + "step": 29150 + }, + { + "epoch": 28.01, + "learning_rate": 6.196351351351352e-05, + "loss": 0.416, + "step": 29160 + }, + { + "epoch": 28.01, + "learning_rate": 6.195e-05, + "loss": 0.5692, + "step": 29170 + }, + { + "epoch": 28.01, + "learning_rate": 6.193648648648648e-05, + "loss": 0.4765, + "step": 29180 + }, + { + "epoch": 28.01, + "learning_rate": 6.192297297297298e-05, + "loss": 0.154, + "step": 29190 + }, + { + "epoch": 28.01, + "learning_rate": 6.190945945945946e-05, + "loss": 0.2561, + "step": 29200 + }, + { + "epoch": 28.01, + "learning_rate": 6.189594594594594e-05, + "loss": 0.2292, + "step": 29210 + }, + { + "epoch": 28.01, + "learning_rate": 6.188243243243243e-05, + "loss": 0.2504, + "step": 29220 + }, + { + "epoch": 28.01, + "learning_rate": 6.186891891891891e-05, + "loss": 0.2038, + "step": 29230 + }, + { + "epoch": 28.01, + "learning_rate": 6.185540540540541e-05, + "loss": 0.1837, + "step": 29240 + }, + { + "epoch": 28.01, + "learning_rate": 6.184189189189189e-05, + "loss": 0.1798, + "step": 29250 + }, + { + "epoch": 28.01, + "learning_rate": 6.182837837837838e-05, + "loss": 0.2705, + "step": 29260 + }, + { + "epoch": 28.01, + "learning_rate": 6.181486486486487e-05, + "loss": 0.4467, + "step": 29270 + }, + { + "epoch": 28.01, + "learning_rate": 6.180135135135136e-05, + "loss": 0.3838, + "step": 29280 + }, + { + "epoch": 28.01, + "learning_rate": 6.178783783783784e-05, + "loss": 0.3202, + "step": 29290 + }, + { + "epoch": 28.01, + "learning_rate": 6.177432432432432e-05, + "loss": 0.4068, + "step": 29300 + }, + { + "epoch": 28.01, + "learning_rate": 6.17608108108108e-05, + "loss": 0.4908, + "step": 29310 + }, + { + "epoch": 28.01, + "learning_rate": 6.17472972972973e-05, + "loss": 0.239, + "step": 29320 + }, + { + "epoch": 28.01, + "learning_rate": 6.173378378378378e-05, + "loss": 0.1663, + "step": 29330 + }, + { + "epoch": 28.01, + "learning_rate": 6.172027027027027e-05, + "loss": 0.272, + "step": 29340 + }, + { + "epoch": 28.01, + "learning_rate": 6.170675675675675e-05, + "loss": 0.3715, + "step": 29350 + }, + { + "epoch": 28.01, + "learning_rate": 6.169324324324325e-05, + "loss": 0.3877, + "step": 29360 + }, + { + "epoch": 28.01, + "learning_rate": 6.167972972972973e-05, + "loss": 0.3982, + "step": 29370 + }, + { + "epoch": 28.01, + "learning_rate": 6.166621621621623e-05, + "loss": 0.2737, + "step": 29380 + }, + { + "epoch": 28.01, + "learning_rate": 6.16527027027027e-05, + "loss": 0.2563, + "step": 29390 + }, + { + "epoch": 28.01, + "learning_rate": 6.16391891891892e-05, + "loss": 0.2899, + "step": 29400 + }, + { + "epoch": 28.01, + "learning_rate": 6.162567567567568e-05, + "loss": 0.2551, + "step": 29410 + }, + { + "epoch": 28.01, + "learning_rate": 6.161216216216216e-05, + "loss": 0.1609, + "step": 29420 + }, + { + "epoch": 28.01, + "learning_rate": 6.159864864864864e-05, + "loss": 0.2489, + "step": 29430 + }, + { + "epoch": 28.01, + "learning_rate": 6.158513513513514e-05, + "loss": 0.3219, + "step": 29440 + }, + { + "epoch": 28.01, + "learning_rate": 6.157162162162162e-05, + "loss": 0.5805, + "step": 29450 + }, + { + "epoch": 28.01, + "learning_rate": 6.155810810810811e-05, + "loss": 0.1808, + "step": 29460 + }, + { + "epoch": 28.01, + "learning_rate": 6.15445945945946e-05, + "loss": 0.2675, + "step": 29470 + }, + { + "epoch": 28.01, + "learning_rate": 6.153108108108109e-05, + "loss": 0.2879, + "step": 29480 + }, + { + "epoch": 28.01, + "learning_rate": 6.151756756756757e-05, + "loss": 0.2804, + "step": 29490 + }, + { + "epoch": 28.01, + "learning_rate": 6.150405405405407e-05, + "loss": 0.3041, + "step": 29500 + }, + { + "epoch": 28.01, + "eval_loss": 0.1057649701833725, + "eval_runtime": 128.7009, + "eval_samples_per_second": 28.034, + "eval_steps_per_second": 3.504, + "eval_wer": 0.10282812281600895, + "step": 29500 + }, + { + "epoch": 28.01, + "learning_rate": 6.149054054054055e-05, + "loss": 0.4358, + "step": 29510 + }, + { + "epoch": 28.01, + "learning_rate": 6.147702702702704e-05, + "loss": 0.2782, + "step": 29520 + }, + { + "epoch": 28.01, + "learning_rate": 6.146351351351352e-05, + "loss": 0.2883, + "step": 29530 + }, + { + "epoch": 28.01, + "learning_rate": 6.145e-05, + "loss": 0.2898, + "step": 29540 + }, + { + "epoch": 28.01, + "learning_rate": 6.143648648648648e-05, + "loss": 0.4179, + "step": 29550 + }, + { + "epoch": 28.01, + "learning_rate": 6.142297297297298e-05, + "loss": 0.4026, + "step": 29560 + }, + { + "epoch": 28.01, + "learning_rate": 6.140945945945946e-05, + "loss": 0.4682, + "step": 29570 + }, + { + "epoch": 28.01, + "learning_rate": 6.139594594594595e-05, + "loss": 0.3255, + "step": 29580 + }, + { + "epoch": 28.01, + "learning_rate": 6.138243243243244e-05, + "loss": 0.5896, + "step": 29590 + }, + { + "epoch": 28.01, + "learning_rate": 6.136891891891893e-05, + "loss": 0.4049, + "step": 29600 + }, + { + "epoch": 28.01, + "learning_rate": 6.135540540540541e-05, + "loss": 0.6356, + "step": 29610 + }, + { + "epoch": 28.01, + "learning_rate": 6.134189189189189e-05, + "loss": 0.4903, + "step": 29620 + }, + { + "epoch": 28.01, + "learning_rate": 6.132837837837839e-05, + "loss": 0.4214, + "step": 29630 + }, + { + "epoch": 28.01, + "learning_rate": 6.131486486486487e-05, + "loss": 0.3959, + "step": 29640 + }, + { + "epoch": 28.01, + "learning_rate": 6.130135135135135e-05, + "loss": 0.4026, + "step": 29650 + }, + { + "epoch": 28.01, + "learning_rate": 6.128783783783783e-05, + "loss": 0.4695, + "step": 29660 + }, + { + "epoch": 29.0, + "learning_rate": 6.127432432432432e-05, + "loss": 0.5551, + "step": 29670 + }, + { + "epoch": 29.0, + "learning_rate": 6.12608108108108e-05, + "loss": 0.4537, + "step": 29680 + }, + { + "epoch": 29.0, + "learning_rate": 6.12472972972973e-05, + "loss": 0.4551, + "step": 29690 + }, + { + "epoch": 29.0, + "learning_rate": 6.123378378378378e-05, + "loss": 0.4491, + "step": 29700 + }, + { + "epoch": 29.0, + "learning_rate": 6.122027027027028e-05, + "loss": 0.3701, + "step": 29710 + }, + { + "epoch": 29.0, + "learning_rate": 6.120675675675676e-05, + "loss": 0.4158, + "step": 29720 + }, + { + "epoch": 29.0, + "learning_rate": 6.119324324324325e-05, + "loss": 0.508, + "step": 29730 + }, + { + "epoch": 29.0, + "learning_rate": 6.117972972972973e-05, + "loss": 0.5463, + "step": 29740 + }, + { + "epoch": 29.0, + "learning_rate": 6.116621621621623e-05, + "loss": 0.4084, + "step": 29750 + }, + { + "epoch": 29.0, + "learning_rate": 6.115270270270271e-05, + "loss": 0.4594, + "step": 29760 + }, + { + "epoch": 29.0, + "learning_rate": 6.113918918918919e-05, + "loss": 0.4419, + "step": 29770 + }, + { + "epoch": 29.0, + "learning_rate": 6.112567567567567e-05, + "loss": 0.4165, + "step": 29780 + }, + { + "epoch": 29.0, + "learning_rate": 6.111216216216216e-05, + "loss": 0.3601, + "step": 29790 + }, + { + "epoch": 29.0, + "learning_rate": 6.109864864864865e-05, + "loss": 0.2424, + "step": 29800 + }, + { + "epoch": 29.0, + "learning_rate": 6.108513513513514e-05, + "loss": 0.2828, + "step": 29810 + }, + { + "epoch": 29.0, + "learning_rate": 6.107162162162162e-05, + "loss": 0.2857, + "step": 29820 + }, + { + "epoch": 29.0, + "learning_rate": 6.105810810810812e-05, + "loss": 0.8875, + "step": 29830 + }, + { + "epoch": 29.0, + "learning_rate": 6.10445945945946e-05, + "loss": 0.9101, + "step": 29840 + }, + { + "epoch": 29.0, + "learning_rate": 6.1031081081081084e-05, + "loss": 2.4894, + "step": 29850 + }, + { + "epoch": 29.0, + "learning_rate": 6.1017567567567565e-05, + "loss": 2.5408, + "step": 29860 + }, + { + "epoch": 29.0, + "learning_rate": 6.100405405405406e-05, + "loss": 2.447, + "step": 29870 + }, + { + "epoch": 29.0, + "learning_rate": 6.099054054054054e-05, + "loss": 2.5475, + "step": 29880 + }, + { + "epoch": 29.0, + "learning_rate": 6.0977027027027035e-05, + "loss": 1.6521, + "step": 29890 + }, + { + "epoch": 29.0, + "learning_rate": 6.0963513513513516e-05, + "loss": 1.511, + "step": 29900 + }, + { + "epoch": 29.0, + "learning_rate": 6.0950000000000004e-05, + "loss": 0.8657, + "step": 29910 + }, + { + "epoch": 29.0, + "learning_rate": 6.0936486486486485e-05, + "loss": 0.3303, + "step": 29920 + }, + { + "epoch": 29.0, + "learning_rate": 6.092432432432432e-05, + "loss": 0.1607, + "step": 29930 + }, + { + "epoch": 29.0, + "learning_rate": 6.091081081081082e-05, + "loss": 0.2617, + "step": 29940 + }, + { + "epoch": 29.0, + "learning_rate": 6.08972972972973e-05, + "loss": 0.2986, + "step": 29950 + }, + { + "epoch": 29.0, + "learning_rate": 6.0883783783783786e-05, + "loss": 0.3349, + "step": 29960 + }, + { + "epoch": 29.0, + "learning_rate": 6.087027027027027e-05, + "loss": 0.4289, + "step": 29970 + }, + { + "epoch": 29.0, + "learning_rate": 6.085675675675676e-05, + "loss": 0.2795, + "step": 29980 + }, + { + "epoch": 29.0, + "learning_rate": 6.084324324324324e-05, + "loss": 0.1552, + "step": 29990 + }, + { + "epoch": 29.0, + "learning_rate": 6.082972972972974e-05, + "loss": 0.3472, + "step": 30000 + }, + { + "epoch": 29.0, + "eval_loss": 0.11379099637269974, + "eval_runtime": 130.7805, + "eval_samples_per_second": 27.588, + "eval_steps_per_second": 3.449, + "eval_wer": 0.10744071192284396, + "step": 30000 + }, + { + "epoch": 29.0, + "learning_rate": 6.081621621621622e-05, + "loss": 0.1842, + "step": 30010 + }, + { + "epoch": 29.0, + "learning_rate": 6.0802702702702706e-05, + "loss": 0.3017, + "step": 30020 + }, + { + "epoch": 29.0, + "learning_rate": 6.078918918918919e-05, + "loss": 0.2801, + "step": 30030 + }, + { + "epoch": 29.0, + "learning_rate": 6.077567567567568e-05, + "loss": 0.1931, + "step": 30040 + }, + { + "epoch": 29.01, + "learning_rate": 6.076216216216216e-05, + "loss": 0.1981, + "step": 30050 + }, + { + "epoch": 29.01, + "learning_rate": 6.074864864864866e-05, + "loss": 0.1401, + "step": 30060 + }, + { + "epoch": 29.01, + "learning_rate": 6.073513513513514e-05, + "loss": 0.2277, + "step": 30070 + }, + { + "epoch": 29.01, + "learning_rate": 6.0721621621621626e-05, + "loss": 0.2073, + "step": 30080 + }, + { + "epoch": 29.01, + "learning_rate": 6.070810810810811e-05, + "loss": 0.1816, + "step": 30090 + }, + { + "epoch": 29.01, + "learning_rate": 6.06945945945946e-05, + "loss": 0.232, + "step": 30100 + }, + { + "epoch": 29.01, + "learning_rate": 6.068108108108108e-05, + "loss": 0.3445, + "step": 30110 + }, + { + "epoch": 29.01, + "learning_rate": 6.066756756756757e-05, + "loss": 0.24, + "step": 30120 + }, + { + "epoch": 29.01, + "learning_rate": 6.065405405405406e-05, + "loss": 0.3485, + "step": 30130 + }, + { + "epoch": 29.01, + "learning_rate": 6.0640540540540546e-05, + "loss": 0.3955, + "step": 30140 + }, + { + "epoch": 29.01, + "learning_rate": 6.062702702702703e-05, + "loss": 0.3143, + "step": 30150 + }, + { + "epoch": 29.01, + "learning_rate": 6.061351351351352e-05, + "loss": 0.4199, + "step": 30160 + }, + { + "epoch": 29.01, + "learning_rate": 6.06e-05, + "loss": 0.3618, + "step": 30170 + }, + { + "epoch": 29.01, + "learning_rate": 6.058648648648649e-05, + "loss": 0.3169, + "step": 30180 + }, + { + "epoch": 29.01, + "learning_rate": 6.057297297297297e-05, + "loss": 0.6606, + "step": 30190 + }, + { + "epoch": 29.01, + "learning_rate": 6.0559459459459466e-05, + "loss": 0.5481, + "step": 30200 + }, + { + "epoch": 29.01, + "learning_rate": 6.054594594594595e-05, + "loss": 0.2424, + "step": 30210 + }, + { + "epoch": 29.01, + "learning_rate": 6.053243243243244e-05, + "loss": 0.2029, + "step": 30220 + }, + { + "epoch": 29.01, + "learning_rate": 6.051891891891892e-05, + "loss": 0.2558, + "step": 30230 + }, + { + "epoch": 29.01, + "learning_rate": 6.050540540540541e-05, + "loss": 0.2005, + "step": 30240 + }, + { + "epoch": 29.01, + "learning_rate": 6.049189189189189e-05, + "loss": 0.2054, + "step": 30250 + }, + { + "epoch": 29.01, + "learning_rate": 6.0478378378378386e-05, + "loss": 0.1769, + "step": 30260 + }, + { + "epoch": 29.01, + "learning_rate": 6.046486486486487e-05, + "loss": 0.1678, + "step": 30270 + }, + { + "epoch": 29.01, + "learning_rate": 6.045135135135136e-05, + "loss": 0.1853, + "step": 30280 + }, + { + "epoch": 29.01, + "learning_rate": 6.043783783783784e-05, + "loss": 0.5143, + "step": 30290 + }, + { + "epoch": 29.01, + "learning_rate": 6.0424324324324324e-05, + "loss": 0.3789, + "step": 30300 + }, + { + "epoch": 29.01, + "learning_rate": 6.041081081081081e-05, + "loss": 0.3225, + "step": 30310 + }, + { + "epoch": 29.01, + "learning_rate": 6.039729729729729e-05, + "loss": 0.3204, + "step": 30320 + }, + { + "epoch": 29.01, + "learning_rate": 6.038378378378379e-05, + "loss": 0.4983, + "step": 30330 + }, + { + "epoch": 29.01, + "learning_rate": 6.037027027027027e-05, + "loss": 0.2941, + "step": 30340 + }, + { + "epoch": 29.01, + "learning_rate": 6.035675675675676e-05, + "loss": 0.2155, + "step": 30350 + }, + { + "epoch": 29.01, + "learning_rate": 6.0343243243243244e-05, + "loss": 0.2737, + "step": 30360 + }, + { + "epoch": 29.01, + "learning_rate": 6.032972972972973e-05, + "loss": 0.3921, + "step": 30370 + }, + { + "epoch": 29.01, + "learning_rate": 6.031621621621621e-05, + "loss": 0.3585, + "step": 30380 + }, + { + "epoch": 29.01, + "learning_rate": 6.030270270270271e-05, + "loss": 0.3201, + "step": 30390 + }, + { + "epoch": 29.01, + "learning_rate": 6.028918918918919e-05, + "loss": 0.2721, + "step": 30400 + }, + { + "epoch": 29.01, + "learning_rate": 6.027567567567568e-05, + "loss": 0.3273, + "step": 30410 + }, + { + "epoch": 29.01, + "learning_rate": 6.0262162162162164e-05, + "loss": 0.2663, + "step": 30420 + }, + { + "epoch": 29.01, + "learning_rate": 6.024864864864865e-05, + "loss": 0.28, + "step": 30430 + }, + { + "epoch": 29.01, + "learning_rate": 6.023513513513513e-05, + "loss": 0.1879, + "step": 30440 + }, + { + "epoch": 29.01, + "learning_rate": 6.022162162162163e-05, + "loss": 0.1509, + "step": 30450 + }, + { + "epoch": 29.01, + "learning_rate": 6.020810810810811e-05, + "loss": 0.3049, + "step": 30460 + }, + { + "epoch": 29.01, + "learning_rate": 6.01945945945946e-05, + "loss": 0.621, + "step": 30470 + }, + { + "epoch": 29.01, + "learning_rate": 6.0181081081081084e-05, + "loss": 0.2413, + "step": 30480 + }, + { + "epoch": 29.01, + "learning_rate": 6.016756756756757e-05, + "loss": 0.2195, + "step": 30490 + }, + { + "epoch": 29.01, + "learning_rate": 6.015405405405405e-05, + "loss": 0.2935, + "step": 30500 + }, + { + "epoch": 29.01, + "eval_loss": 0.1046026349067688, + "eval_runtime": 134.8299, + "eval_samples_per_second": 26.76, + "eval_steps_per_second": 3.345, + "eval_wer": 0.10105763406793086, + "step": 30500 + }, + { + "epoch": 29.01, + "learning_rate": 6.014054054054055e-05, + "loss": 0.2612, + "step": 30510 + }, + { + "epoch": 29.01, + "learning_rate": 6.012702702702703e-05, + "loss": 0.2696, + "step": 30520 + }, + { + "epoch": 29.01, + "learning_rate": 6.011351351351352e-05, + "loss": 0.3682, + "step": 30530 + }, + { + "epoch": 29.01, + "learning_rate": 6.0100000000000004e-05, + "loss": 0.412, + "step": 30540 + }, + { + "epoch": 29.01, + "learning_rate": 6.008648648648649e-05, + "loss": 0.1813, + "step": 30550 + }, + { + "epoch": 29.01, + "learning_rate": 6.007297297297297e-05, + "loss": 0.2998, + "step": 30560 + }, + { + "epoch": 29.01, + "learning_rate": 6.005945945945947e-05, + "loss": 0.2955, + "step": 30570 + }, + { + "epoch": 29.01, + "learning_rate": 6.004594594594595e-05, + "loss": 0.4669, + "step": 30580 + }, + { + "epoch": 29.01, + "learning_rate": 6.0032432432432436e-05, + "loss": 0.4793, + "step": 30590 + }, + { + "epoch": 29.01, + "learning_rate": 6.001891891891892e-05, + "loss": 0.4101, + "step": 30600 + }, + { + "epoch": 29.01, + "learning_rate": 6.000540540540541e-05, + "loss": 0.507, + "step": 30610 + }, + { + "epoch": 29.01, + "learning_rate": 5.999189189189189e-05, + "loss": 0.4628, + "step": 30620 + }, + { + "epoch": 29.01, + "learning_rate": 5.997837837837839e-05, + "loss": 0.4809, + "step": 30630 + }, + { + "epoch": 29.01, + "learning_rate": 5.996486486486487e-05, + "loss": 0.527, + "step": 30640 + }, + { + "epoch": 29.01, + "learning_rate": 5.9951351351351356e-05, + "loss": 0.4257, + "step": 30650 + }, + { + "epoch": 29.01, + "learning_rate": 5.993783783783784e-05, + "loss": 0.3978, + "step": 30660 + }, + { + "epoch": 29.01, + "learning_rate": 5.992432432432433e-05, + "loss": 0.3858, + "step": 30670 + }, + { + "epoch": 29.01, + "learning_rate": 5.991081081081081e-05, + "loss": 0.3634, + "step": 30680 + }, + { + "epoch": 29.01, + "learning_rate": 5.989729729729731e-05, + "loss": 0.5449, + "step": 30690 + }, + { + "epoch": 30.0, + "learning_rate": 5.988378378378379e-05, + "loss": 0.4474, + "step": 30700 + }, + { + "epoch": 30.0, + "learning_rate": 5.987027027027027e-05, + "loss": 0.4635, + "step": 30710 + }, + { + "epoch": 30.0, + "learning_rate": 5.985675675675676e-05, + "loss": 0.4653, + "step": 30720 + }, + { + "epoch": 30.0, + "learning_rate": 5.984324324324324e-05, + "loss": 0.3869, + "step": 30730 + }, + { + "epoch": 30.0, + "learning_rate": 5.982972972972973e-05, + "loss": 0.4348, + "step": 30740 + }, + { + "epoch": 30.0, + "learning_rate": 5.9816216216216214e-05, + "loss": 0.4357, + "step": 30750 + }, + { + "epoch": 30.0, + "learning_rate": 5.980270270270271e-05, + "loss": 0.6055, + "step": 30760 + }, + { + "epoch": 30.0, + "learning_rate": 5.978918918918919e-05, + "loss": 0.4155, + "step": 30770 + }, + { + "epoch": 30.0, + "learning_rate": 5.977567567567568e-05, + "loss": 0.4743, + "step": 30780 + }, + { + "epoch": 30.0, + "learning_rate": 5.976216216216216e-05, + "loss": 0.4375, + "step": 30790 + }, + { + "epoch": 30.0, + "learning_rate": 5.974864864864865e-05, + "loss": 0.3997, + "step": 30800 + }, + { + "epoch": 30.0, + "learning_rate": 5.9735135135135134e-05, + "loss": 0.3968, + "step": 30810 + }, + { + "epoch": 30.0, + "learning_rate": 5.972162162162163e-05, + "loss": 0.282, + "step": 30820 + }, + { + "epoch": 30.0, + "learning_rate": 5.970810810810811e-05, + "loss": 0.2531, + "step": 30830 + }, + { + "epoch": 30.0, + "learning_rate": 5.96945945945946e-05, + "loss": 0.2808, + "step": 30840 + }, + { + "epoch": 30.0, + "learning_rate": 5.968108108108108e-05, + "loss": 0.4826, + "step": 30850 + }, + { + "epoch": 30.0, + "learning_rate": 5.966756756756757e-05, + "loss": 1.1615, + "step": 30860 + }, + { + "epoch": 30.0, + "learning_rate": 5.9654054054054054e-05, + "loss": 1.8961, + "step": 30870 + }, + { + "epoch": 30.0, + "learning_rate": 5.964054054054055e-05, + "loss": 2.56, + "step": 30880 + }, + { + "epoch": 30.0, + "learning_rate": 5.962702702702703e-05, + "loss": 2.4123, + "step": 30890 + }, + { + "epoch": 30.0, + "learning_rate": 5.961351351351352e-05, + "loss": 2.5608, + "step": 30900 + }, + { + "epoch": 30.0, + "learning_rate": 5.96e-05, + "loss": 1.8938, + "step": 30910 + }, + { + "epoch": 30.0, + "learning_rate": 5.958648648648649e-05, + "loss": 1.5521, + "step": 30920 + }, + { + "epoch": 30.0, + "learning_rate": 5.9572972972972974e-05, + "loss": 1.0675, + "step": 30930 + }, + { + "epoch": 30.0, + "learning_rate": 5.955945945945947e-05, + "loss": 0.4783, + "step": 30940 + }, + { + "epoch": 30.0, + "learning_rate": 5.954594594594595e-05, + "loss": 0.1518, + "step": 30950 + }, + { + "epoch": 30.0, + "learning_rate": 5.953243243243244e-05, + "loss": 0.2548, + "step": 30960 + }, + { + "epoch": 30.0, + "learning_rate": 5.951891891891892e-05, + "loss": 0.2467, + "step": 30970 + }, + { + "epoch": 30.0, + "learning_rate": 5.950540540540541e-05, + "loss": 0.2916, + "step": 30980 + }, + { + "epoch": 30.0, + "learning_rate": 5.9491891891891894e-05, + "loss": 0.4717, + "step": 30990 + }, + { + "epoch": 30.0, + "learning_rate": 5.947837837837839e-05, + "loss": 0.2798, + "step": 31000 + }, + { + "epoch": 30.0, + "eval_loss": 0.10163089632987976, + "eval_runtime": 139.421, + "eval_samples_per_second": 25.878, + "eval_steps_per_second": 3.235, + "eval_wer": 0.10236220472440945, + "step": 31000 + }, + { + "epoch": 30.0, + "learning_rate": 5.946486486486487e-05, + "loss": 0.1356, + "step": 31010 + }, + { + "epoch": 30.0, + "learning_rate": 5.945135135135136e-05, + "loss": 0.2131, + "step": 31020 + }, + { + "epoch": 30.0, + "learning_rate": 5.943783783783784e-05, + "loss": 0.219, + "step": 31030 + }, + { + "epoch": 30.0, + "learning_rate": 5.942432432432433e-05, + "loss": 0.2498, + "step": 31040 + }, + { + "epoch": 30.0, + "learning_rate": 5.9410810810810814e-05, + "loss": 0.294, + "step": 31050 + }, + { + "epoch": 30.0, + "learning_rate": 5.93972972972973e-05, + "loss": 0.2198, + "step": 31060 + }, + { + "epoch": 30.01, + "learning_rate": 5.938378378378378e-05, + "loss": 0.2311, + "step": 31070 + }, + { + "epoch": 30.01, + "learning_rate": 5.937027027027028e-05, + "loss": 0.1211, + "step": 31080 + }, + { + "epoch": 30.01, + "learning_rate": 5.935675675675676e-05, + "loss": 0.1654, + "step": 31090 + }, + { + "epoch": 30.01, + "learning_rate": 5.934324324324324e-05, + "loss": 0.2476, + "step": 31100 + }, + { + "epoch": 30.01, + "learning_rate": 5.9331081081081084e-05, + "loss": 0.14, + "step": 31110 + }, + { + "epoch": 30.01, + "learning_rate": 5.9317567567567565e-05, + "loss": 0.2581, + "step": 31120 + }, + { + "epoch": 30.01, + "learning_rate": 5.930405405405406e-05, + "loss": 0.3134, + "step": 31130 + }, + { + "epoch": 30.01, + "learning_rate": 5.929054054054054e-05, + "loss": 0.2448, + "step": 31140 + }, + { + "epoch": 30.01, + "learning_rate": 5.9277027027027035e-05, + "loss": 0.2776, + "step": 31150 + }, + { + "epoch": 30.01, + "learning_rate": 5.9263513513513516e-05, + "loss": 0.3274, + "step": 31160 + }, + { + "epoch": 30.01, + "learning_rate": 5.9250000000000004e-05, + "loss": 0.3113, + "step": 31170 + }, + { + "epoch": 30.01, + "learning_rate": 5.9236486486486485e-05, + "loss": 0.3852, + "step": 31180 + }, + { + "epoch": 30.01, + "learning_rate": 5.922297297297298e-05, + "loss": 0.3555, + "step": 31190 + }, + { + "epoch": 30.01, + "learning_rate": 5.920945945945946e-05, + "loss": 0.2459, + "step": 31200 + }, + { + "epoch": 30.01, + "learning_rate": 5.9195945945945955e-05, + "loss": 0.6058, + "step": 31210 + }, + { + "epoch": 30.01, + "learning_rate": 5.9182432432432436e-05, + "loss": 0.5595, + "step": 31220 + }, + { + "epoch": 30.01, + "learning_rate": 5.9168918918918924e-05, + "loss": 0.2966, + "step": 31230 + }, + { + "epoch": 30.01, + "learning_rate": 5.9155405405405405e-05, + "loss": 0.1326, + "step": 31240 + }, + { + "epoch": 30.01, + "learning_rate": 5.91418918918919e-05, + "loss": 0.243, + "step": 31250 + }, + { + "epoch": 30.01, + "learning_rate": 5.912837837837838e-05, + "loss": 0.2223, + "step": 31260 + }, + { + "epoch": 30.01, + "learning_rate": 5.9114864864864875e-05, + "loss": 0.1994, + "step": 31270 + }, + { + "epoch": 30.01, + "learning_rate": 5.9101351351351356e-05, + "loss": 0.2102, + "step": 31280 + }, + { + "epoch": 30.01, + "learning_rate": 5.9087837837837844e-05, + "loss": 0.2074, + "step": 31290 + }, + { + "epoch": 30.01, + "learning_rate": 5.9074324324324325e-05, + "loss": 0.1779, + "step": 31300 + }, + { + "epoch": 30.01, + "learning_rate": 5.906081081081082e-05, + "loss": 0.3865, + "step": 31310 + }, + { + "epoch": 30.01, + "learning_rate": 5.90472972972973e-05, + "loss": 0.3923, + "step": 31320 + }, + { + "epoch": 30.01, + "learning_rate": 5.903378378378379e-05, + "loss": 0.3358, + "step": 31330 + }, + { + "epoch": 30.01, + "learning_rate": 5.902027027027027e-05, + "loss": 0.3066, + "step": 31340 + }, + { + "epoch": 30.01, + "learning_rate": 5.9006756756756764e-05, + "loss": 0.4113, + "step": 31350 + }, + { + "epoch": 30.01, + "learning_rate": 5.8993243243243245e-05, + "loss": 0.4369, + "step": 31360 + }, + { + "epoch": 30.01, + "learning_rate": 5.897972972972974e-05, + "loss": 0.2029, + "step": 31370 + }, + { + "epoch": 30.01, + "learning_rate": 5.896621621621622e-05, + "loss": 0.231, + "step": 31380 + }, + { + "epoch": 30.01, + "learning_rate": 5.89527027027027e-05, + "loss": 0.307, + "step": 31390 + }, + { + "epoch": 30.01, + "learning_rate": 5.893918918918919e-05, + "loss": 0.4039, + "step": 31400 + }, + { + "epoch": 30.01, + "learning_rate": 5.892567567567567e-05, + "loss": 0.3203, + "step": 31410 + }, + { + "epoch": 30.01, + "learning_rate": 5.8912162162162165e-05, + "loss": 0.2474, + "step": 31420 + }, + { + "epoch": 30.01, + "learning_rate": 5.8898648648648646e-05, + "loss": 0.3041, + "step": 31430 + }, + { + "epoch": 30.01, + "learning_rate": 5.888513513513514e-05, + "loss": 0.2453, + "step": 31440 + }, + { + "epoch": 30.01, + "learning_rate": 5.887162162162162e-05, + "loss": 0.2178, + "step": 31450 + }, + { + "epoch": 30.01, + "learning_rate": 5.885810810810811e-05, + "loss": 0.2738, + "step": 31460 + }, + { + "epoch": 30.01, + "learning_rate": 5.884459459459459e-05, + "loss": 0.1127, + "step": 31470 + }, + { + "epoch": 30.01, + "learning_rate": 5.8831081081081085e-05, + "loss": 0.2866, + "step": 31480 + }, + { + "epoch": 30.01, + "learning_rate": 5.8817567567567566e-05, + "loss": 0.4786, + "step": 31490 + }, + { + "epoch": 30.01, + "learning_rate": 5.880405405405406e-05, + "loss": 0.3927, + "step": 31500 + }, + { + "epoch": 30.01, + "eval_loss": 0.09929303079843521, + "eval_runtime": 127.7477, + "eval_samples_per_second": 28.243, + "eval_steps_per_second": 3.53, + "eval_wer": 0.10077808321297116, + "step": 31500 + }, + { + "epoch": 30.01, + "learning_rate": 5.879054054054054e-05, + "loss": 0.1954, + "step": 31510 + }, + { + "epoch": 30.01, + "learning_rate": 5.877702702702703e-05, + "loss": 0.2751, + "step": 31520 + }, + { + "epoch": 30.01, + "learning_rate": 5.876351351351351e-05, + "loss": 0.2964, + "step": 31530 + }, + { + "epoch": 30.01, + "learning_rate": 5.8750000000000005e-05, + "loss": 0.2723, + "step": 31540 + }, + { + "epoch": 30.01, + "learning_rate": 5.8736486486486486e-05, + "loss": 0.3518, + "step": 31550 + }, + { + "epoch": 30.01, + "learning_rate": 5.872297297297298e-05, + "loss": 0.382, + "step": 31560 + }, + { + "epoch": 30.01, + "learning_rate": 5.870945945945946e-05, + "loss": 0.1928, + "step": 31570 + }, + { + "epoch": 30.01, + "learning_rate": 5.869594594594595e-05, + "loss": 0.317, + "step": 31580 + }, + { + "epoch": 30.01, + "learning_rate": 5.868243243243243e-05, + "loss": 0.2676, + "step": 31590 + }, + { + "epoch": 30.01, + "learning_rate": 5.8668918918918925e-05, + "loss": 0.4138, + "step": 31600 + }, + { + "epoch": 30.01, + "learning_rate": 5.8655405405405406e-05, + "loss": 0.4187, + "step": 31610 + }, + { + "epoch": 30.01, + "learning_rate": 5.86418918918919e-05, + "loss": 0.3994, + "step": 31620 + }, + { + "epoch": 30.01, + "learning_rate": 5.862837837837838e-05, + "loss": 0.4176, + "step": 31630 + }, + { + "epoch": 30.01, + "learning_rate": 5.861486486486487e-05, + "loss": 0.5378, + "step": 31640 + }, + { + "epoch": 30.01, + "learning_rate": 5.860135135135135e-05, + "loss": 0.4536, + "step": 31650 + }, + { + "epoch": 30.01, + "learning_rate": 5.8587837837837845e-05, + "loss": 0.5825, + "step": 31660 + }, + { + "epoch": 30.01, + "learning_rate": 5.8574324324324326e-05, + "loss": 0.4281, + "step": 31670 + }, + { + "epoch": 30.01, + "learning_rate": 5.856081081081082e-05, + "loss": 0.445, + "step": 31680 + }, + { + "epoch": 30.01, + "learning_rate": 5.85472972972973e-05, + "loss": 0.372, + "step": 31690 + }, + { + "epoch": 30.01, + "learning_rate": 5.853378378378379e-05, + "loss": 0.3777, + "step": 31700 + }, + { + "epoch": 30.01, + "learning_rate": 5.852027027027027e-05, + "loss": 0.5408, + "step": 31710 + }, + { + "epoch": 31.0, + "learning_rate": 5.8506756756756765e-05, + "loss": 0.4885, + "step": 31720 + }, + { + "epoch": 31.0, + "learning_rate": 5.8493243243243246e-05, + "loss": 0.4328, + "step": 31730 + }, + { + "epoch": 31.0, + "learning_rate": 5.847972972972974e-05, + "loss": 0.4665, + "step": 31740 + }, + { + "epoch": 31.0, + "learning_rate": 5.846621621621622e-05, + "loss": 0.39, + "step": 31750 + }, + { + "epoch": 31.0, + "learning_rate": 5.845270270270271e-05, + "loss": 0.4104, + "step": 31760 + }, + { + "epoch": 31.0, + "learning_rate": 5.843918918918919e-05, + "loss": 0.4238, + "step": 31770 + }, + { + "epoch": 31.0, + "learning_rate": 5.8425675675675685e-05, + "loss": 0.6808, + "step": 31780 + }, + { + "epoch": 31.0, + "learning_rate": 5.8412162162162166e-05, + "loss": 0.4057, + "step": 31790 + }, + { + "epoch": 31.0, + "learning_rate": 5.839864864864865e-05, + "loss": 0.4116, + "step": 31800 + }, + { + "epoch": 31.0, + "learning_rate": 5.8385135135135135e-05, + "loss": 0.4601, + "step": 31810 + }, + { + "epoch": 31.0, + "learning_rate": 5.8371621621621616e-05, + "loss": 0.4571, + "step": 31820 + }, + { + "epoch": 31.0, + "learning_rate": 5.835810810810811e-05, + "loss": 0.4391, + "step": 31830 + }, + { + "epoch": 31.0, + "learning_rate": 5.834459459459459e-05, + "loss": 0.3082, + "step": 31840 + }, + { + "epoch": 31.0, + "learning_rate": 5.8331081081081086e-05, + "loss": 0.2414, + "step": 31850 + }, + { + "epoch": 31.0, + "learning_rate": 5.831756756756757e-05, + "loss": 0.2636, + "step": 31860 + }, + { + "epoch": 31.0, + "learning_rate": 5.8304054054054055e-05, + "loss": 0.2835, + "step": 31870 + }, + { + "epoch": 31.0, + "learning_rate": 5.8290540540540536e-05, + "loss": 1.1597, + "step": 31880 + }, + { + "epoch": 31.0, + "learning_rate": 5.827702702702703e-05, + "loss": 1.4014, + "step": 31890 + }, + { + "epoch": 31.0, + "learning_rate": 5.826351351351351e-05, + "loss": 2.5831, + "step": 31900 + }, + { + "epoch": 31.0, + "learning_rate": 5.8250000000000006e-05, + "loss": 2.3903, + "step": 31910 + }, + { + "epoch": 31.0, + "learning_rate": 5.823648648648649e-05, + "loss": 2.5671, + "step": 31920 + }, + { + "epoch": 31.0, + "learning_rate": 5.8222972972972975e-05, + "loss": 2.2941, + "step": 31930 + }, + { + "epoch": 31.0, + "learning_rate": 5.8209459459459456e-05, + "loss": 1.4906, + "step": 31940 + }, + { + "epoch": 31.0, + "learning_rate": 5.819594594594595e-05, + "loss": 1.3073, + "step": 31950 + }, + { + "epoch": 31.0, + "learning_rate": 5.818243243243243e-05, + "loss": 0.7396, + "step": 31960 + }, + { + "epoch": 31.0, + "learning_rate": 5.8168918918918926e-05, + "loss": 0.1965, + "step": 31970 + }, + { + "epoch": 31.0, + "learning_rate": 5.815540540540541e-05, + "loss": 0.2501, + "step": 31980 + }, + { + "epoch": 31.0, + "learning_rate": 5.8141891891891895e-05, + "loss": 0.1598, + "step": 31990 + }, + { + "epoch": 31.0, + "learning_rate": 5.8128378378378376e-05, + "loss": 0.3206, + "step": 32000 + }, + { + "epoch": 31.0, + "eval_loss": 0.09585515409708023, + "eval_runtime": 129.9298, + "eval_samples_per_second": 27.769, + "eval_steps_per_second": 3.471, + "eval_wer": 0.09635186134277594, + "step": 32000 + }, + { + "epoch": 31.0, + "learning_rate": 5.811486486486487e-05, + "loss": 0.4013, + "step": 32010 + }, + { + "epoch": 31.0, + "learning_rate": 5.810135135135135e-05, + "loss": 0.372, + "step": 32020 + }, + { + "epoch": 31.0, + "learning_rate": 5.8087837837837847e-05, + "loss": 0.1988, + "step": 32030 + }, + { + "epoch": 31.0, + "learning_rate": 5.807432432432433e-05, + "loss": 0.1979, + "step": 32040 + }, + { + "epoch": 31.0, + "learning_rate": 5.8060810810810815e-05, + "loss": 0.2715, + "step": 32050 + }, + { + "epoch": 31.0, + "learning_rate": 5.8047297297297296e-05, + "loss": 0.2401, + "step": 32060 + }, + { + "epoch": 31.0, + "learning_rate": 5.803378378378379e-05, + "loss": 0.2648, + "step": 32070 + }, + { + "epoch": 31.0, + "learning_rate": 5.802027027027027e-05, + "loss": 0.2395, + "step": 32080 + }, + { + "epoch": 31.01, + "learning_rate": 5.8006756756756767e-05, + "loss": 0.2142, + "step": 32090 + }, + { + "epoch": 31.01, + "learning_rate": 5.799324324324325e-05, + "loss": 0.1572, + "step": 32100 + }, + { + "epoch": 31.01, + "learning_rate": 5.7979729729729735e-05, + "loss": 0.1372, + "step": 32110 + }, + { + "epoch": 31.01, + "learning_rate": 5.7966216216216216e-05, + "loss": 0.2205, + "step": 32120 + }, + { + "epoch": 31.01, + "learning_rate": 5.795270270270271e-05, + "loss": 0.194, + "step": 32130 + }, + { + "epoch": 31.01, + "learning_rate": 5.793918918918919e-05, + "loss": 0.2013, + "step": 32140 + }, + { + "epoch": 31.01, + "learning_rate": 5.792567567567569e-05, + "loss": 0.3058, + "step": 32150 + }, + { + "epoch": 31.01, + "learning_rate": 5.791216216216217e-05, + "loss": 0.2889, + "step": 32160 + }, + { + "epoch": 31.01, + "learning_rate": 5.7898648648648655e-05, + "loss": 0.2278, + "step": 32170 + }, + { + "epoch": 31.01, + "learning_rate": 5.7885135135135137e-05, + "loss": 0.3381, + "step": 32180 + }, + { + "epoch": 31.01, + "learning_rate": 5.787162162162162e-05, + "loss": 0.323, + "step": 32190 + }, + { + "epoch": 31.01, + "learning_rate": 5.785810810810811e-05, + "loss": 0.3623, + "step": 32200 + }, + { + "epoch": 31.01, + "learning_rate": 5.784459459459459e-05, + "loss": 0.3613, + "step": 32210 + }, + { + "epoch": 31.01, + "learning_rate": 5.783108108108108e-05, + "loss": 0.2601, + "step": 32220 + }, + { + "epoch": 31.01, + "learning_rate": 5.781756756756757e-05, + "loss": 0.4916, + "step": 32230 + }, + { + "epoch": 31.01, + "learning_rate": 5.7804054054054057e-05, + "loss": 0.5367, + "step": 32240 + }, + { + "epoch": 31.01, + "learning_rate": 5.779054054054054e-05, + "loss": 0.4102, + "step": 32250 + }, + { + "epoch": 31.01, + "learning_rate": 5.777702702702703e-05, + "loss": 0.1664, + "step": 32260 + }, + { + "epoch": 31.01, + "learning_rate": 5.776351351351351e-05, + "loss": 0.2362, + "step": 32270 + }, + { + "epoch": 31.01, + "learning_rate": 5.775e-05, + "loss": 0.2093, + "step": 32280 + }, + { + "epoch": 31.01, + "learning_rate": 5.773648648648648e-05, + "loss": 0.1903, + "step": 32290 + }, + { + "epoch": 31.01, + "learning_rate": 5.772297297297298e-05, + "loss": 0.1834, + "step": 32300 + }, + { + "epoch": 31.01, + "learning_rate": 5.770945945945946e-05, + "loss": 0.1744, + "step": 32310 + }, + { + "epoch": 31.01, + "learning_rate": 5.769594594594595e-05, + "loss": 0.1716, + "step": 32320 + }, + { + "epoch": 31.01, + "learning_rate": 5.768243243243243e-05, + "loss": 0.3099, + "step": 32330 + }, + { + "epoch": 31.01, + "learning_rate": 5.766891891891892e-05, + "loss": 0.4334, + "step": 32340 + }, + { + "epoch": 31.01, + "learning_rate": 5.76554054054054e-05, + "loss": 0.3701, + "step": 32350 + }, + { + "epoch": 31.01, + "learning_rate": 5.76418918918919e-05, + "loss": 0.286, + "step": 32360 + }, + { + "epoch": 31.01, + "learning_rate": 5.762837837837838e-05, + "loss": 0.4339, + "step": 32370 + }, + { + "epoch": 31.01, + "learning_rate": 5.761486486486487e-05, + "loss": 0.3987, + "step": 32380 + }, + { + "epoch": 31.01, + "learning_rate": 5.760135135135135e-05, + "loss": 0.2272, + "step": 32390 + }, + { + "epoch": 31.01, + "learning_rate": 5.758783783783784e-05, + "loss": 0.185, + "step": 32400 + }, + { + "epoch": 31.01, + "learning_rate": 5.757432432432432e-05, + "loss": 0.2601, + "step": 32410 + }, + { + "epoch": 31.01, + "learning_rate": 5.756081081081082e-05, + "loss": 0.3321, + "step": 32420 + }, + { + "epoch": 31.01, + "learning_rate": 5.75472972972973e-05, + "loss": 0.3679, + "step": 32430 + }, + { + "epoch": 31.01, + "learning_rate": 5.753378378378379e-05, + "loss": 0.3297, + "step": 32440 + }, + { + "epoch": 31.01, + "learning_rate": 5.7520270270270273e-05, + "loss": 0.2289, + "step": 32450 + }, + { + "epoch": 31.01, + "learning_rate": 5.750675675675676e-05, + "loss": 0.2306, + "step": 32460 + }, + { + "epoch": 31.01, + "learning_rate": 5.749324324324324e-05, + "loss": 0.2331, + "step": 32470 + }, + { + "epoch": 31.01, + "learning_rate": 5.747972972972974e-05, + "loss": 0.2923, + "step": 32480 + }, + { + "epoch": 31.01, + "learning_rate": 5.746621621621622e-05, + "loss": 0.1413, + "step": 32490 + }, + { + "epoch": 31.01, + "learning_rate": 5.745270270270271e-05, + "loss": 0.2587, + "step": 32500 + }, + { + "epoch": 31.01, + "eval_loss": 0.10016533732414246, + "eval_runtime": 128.1598, + "eval_samples_per_second": 28.152, + "eval_steps_per_second": 3.519, + "eval_wer": 0.09965987979313237, + "step": 32500 + }, + { + "epoch": 31.01, + "learning_rate": 5.7439189189189193e-05, + "loss": 0.3457, + "step": 32510 + }, + { + "epoch": 31.01, + "learning_rate": 5.742567567567568e-05, + "loss": 0.5665, + "step": 32520 + }, + { + "epoch": 31.01, + "learning_rate": 5.741216216216216e-05, + "loss": 0.1758, + "step": 32530 + }, + { + "epoch": 31.01, + "learning_rate": 5.739864864864866e-05, + "loss": 0.2397, + "step": 32540 + }, + { + "epoch": 31.01, + "learning_rate": 5.738513513513514e-05, + "loss": 0.2542, + "step": 32550 + }, + { + "epoch": 31.01, + "learning_rate": 5.737162162162163e-05, + "loss": 0.2782, + "step": 32560 + }, + { + "epoch": 31.01, + "learning_rate": 5.7358108108108114e-05, + "loss": 0.3122, + "step": 32570 + }, + { + "epoch": 31.01, + "learning_rate": 5.73445945945946e-05, + "loss": 0.4181, + "step": 32580 + }, + { + "epoch": 31.01, + "learning_rate": 5.733108108108108e-05, + "loss": 0.2375, + "step": 32590 + }, + { + "epoch": 31.01, + "learning_rate": 5.7317567567567563e-05, + "loss": 0.2426, + "step": 32600 + }, + { + "epoch": 31.01, + "learning_rate": 5.730405405405406e-05, + "loss": 0.2776, + "step": 32610 + }, + { + "epoch": 31.01, + "learning_rate": 5.729054054054054e-05, + "loss": 0.4075, + "step": 32620 + }, + { + "epoch": 31.01, + "learning_rate": 5.7277027027027034e-05, + "loss": 0.3773, + "step": 32630 + }, + { + "epoch": 31.01, + "learning_rate": 5.7263513513513515e-05, + "loss": 0.4395, + "step": 32640 + }, + { + "epoch": 31.01, + "learning_rate": 5.725e-05, + "loss": 0.3886, + "step": 32650 + }, + { + "epoch": 31.01, + "learning_rate": 5.7236486486486483e-05, + "loss": 0.4467, + "step": 32660 + }, + { + "epoch": 31.01, + "learning_rate": 5.722297297297298e-05, + "loss": 0.3612, + "step": 32670 + }, + { + "epoch": 31.01, + "learning_rate": 5.720945945945946e-05, + "loss": 0.5826, + "step": 32680 + }, + { + "epoch": 31.01, + "learning_rate": 5.719594594594595e-05, + "loss": 0.4786, + "step": 32690 + }, + { + "epoch": 31.01, + "learning_rate": 5.718243243243243e-05, + "loss": 0.4461, + "step": 32700 + }, + { + "epoch": 31.01, + "learning_rate": 5.716891891891892e-05, + "loss": 0.416, + "step": 32710 + }, + { + "epoch": 31.01, + "learning_rate": 5.7155405405405404e-05, + "loss": 0.4389, + "step": 32720 + }, + { + "epoch": 31.01, + "learning_rate": 5.71418918918919e-05, + "loss": 0.4871, + "step": 32730 + }, + { + "epoch": 32.0, + "learning_rate": 5.712837837837838e-05, + "loss": 0.5455, + "step": 32740 + }, + { + "epoch": 32.0, + "learning_rate": 5.711486486486487e-05, + "loss": 0.453, + "step": 32750 + }, + { + "epoch": 32.0, + "learning_rate": 5.710135135135135e-05, + "loss": 0.463, + "step": 32760 + }, + { + "epoch": 32.0, + "learning_rate": 5.708783783783784e-05, + "loss": 0.4362, + "step": 32770 + }, + { + "epoch": 32.0, + "learning_rate": 5.7074324324324324e-05, + "loss": 0.3613, + "step": 32780 + }, + { + "epoch": 32.0, + "learning_rate": 5.706081081081082e-05, + "loss": 0.4411, + "step": 32790 + }, + { + "epoch": 32.0, + "learning_rate": 5.70472972972973e-05, + "loss": 0.5387, + "step": 32800 + }, + { + "epoch": 32.0, + "learning_rate": 5.703378378378379e-05, + "loss": 0.4446, + "step": 32810 + }, + { + "epoch": 32.0, + "learning_rate": 5.702027027027027e-05, + "loss": 0.3783, + "step": 32820 + }, + { + "epoch": 32.0, + "learning_rate": 5.700675675675676e-05, + "loss": 0.4207, + "step": 32830 + }, + { + "epoch": 32.0, + "learning_rate": 5.6993243243243244e-05, + "loss": 0.4283, + "step": 32840 + }, + { + "epoch": 32.0, + "learning_rate": 5.697972972972974e-05, + "loss": 0.4662, + "step": 32850 + }, + { + "epoch": 32.0, + "learning_rate": 5.696621621621622e-05, + "loss": 0.2862, + "step": 32860 + }, + { + "epoch": 32.0, + "learning_rate": 5.695270270270271e-05, + "loss": 0.2463, + "step": 32870 + }, + { + "epoch": 32.0, + "learning_rate": 5.693918918918919e-05, + "loss": 0.2599, + "step": 32880 + }, + { + "epoch": 32.0, + "learning_rate": 5.692567567567568e-05, + "loss": 0.3079, + "step": 32890 + }, + { + "epoch": 32.0, + "learning_rate": 5.6912162162162164e-05, + "loss": 0.929, + "step": 32900 + }, + { + "epoch": 32.0, + "learning_rate": 5.689864864864866e-05, + "loss": 0.8002, + "step": 32910 + }, + { + "epoch": 32.0, + "learning_rate": 5.688513513513514e-05, + "loss": 2.6201, + "step": 32920 + }, + { + "epoch": 32.0, + "learning_rate": 5.687162162162163e-05, + "loss": 2.5196, + "step": 32930 + }, + { + "epoch": 32.0, + "learning_rate": 5.685810810810811e-05, + "loss": 2.4522, + "step": 32940 + }, + { + "epoch": 32.0, + "learning_rate": 5.68445945945946e-05, + "loss": 2.5532, + "step": 32950 + }, + { + "epoch": 32.0, + "learning_rate": 5.6831081081081084e-05, + "loss": 1.4129, + "step": 32960 + }, + { + "epoch": 32.0, + "learning_rate": 5.681756756756758e-05, + "loss": 1.4609, + "step": 32970 + }, + { + "epoch": 32.0, + "learning_rate": 5.680405405405406e-05, + "loss": 0.8438, + "step": 32980 + }, + { + "epoch": 32.0, + "learning_rate": 5.679054054054054e-05, + "loss": 0.269, + "step": 32990 + }, + { + "epoch": 32.0, + "learning_rate": 5.677702702702703e-05, + "loss": 0.1436, + "step": 33000 + }, + { + "epoch": 32.0, + "eval_loss": 0.10825485736131668, + "eval_runtime": 128.8275, + "eval_samples_per_second": 28.006, + "eval_steps_per_second": 3.501, + "eval_wer": 0.09830871732749383, + "step": 33000 + }, + { + "epoch": 32.0, + "learning_rate": 5.676351351351351e-05, + "loss": 0.2845, + "step": 33010 + }, + { + "epoch": 32.0, + "learning_rate": 5.6750000000000004e-05, + "loss": 0.279, + "step": 33020 + }, + { + "epoch": 32.0, + "learning_rate": 5.6736486486486485e-05, + "loss": 0.3486, + "step": 33030 + }, + { + "epoch": 32.0, + "learning_rate": 5.672297297297298e-05, + "loss": 0.3856, + "step": 33040 + }, + { + "epoch": 32.0, + "learning_rate": 5.670945945945946e-05, + "loss": 0.2522, + "step": 33050 + }, + { + "epoch": 32.0, + "learning_rate": 5.669594594594595e-05, + "loss": 0.1495, + "step": 33060 + }, + { + "epoch": 32.0, + "learning_rate": 5.668243243243243e-05, + "loss": 0.2825, + "step": 33070 + }, + { + "epoch": 32.0, + "learning_rate": 5.6668918918918924e-05, + "loss": 0.2392, + "step": 33080 + }, + { + "epoch": 32.0, + "learning_rate": 5.6655405405405405e-05, + "loss": 0.2715, + "step": 33090 + }, + { + "epoch": 32.0, + "learning_rate": 5.66418918918919e-05, + "loss": 0.2454, + "step": 33100 + }, + { + "epoch": 32.0, + "learning_rate": 5.662837837837838e-05, + "loss": 0.1845, + "step": 33110 + }, + { + "epoch": 32.01, + "learning_rate": 5.661486486486487e-05, + "loss": 0.1548, + "step": 33120 + }, + { + "epoch": 32.01, + "learning_rate": 5.660135135135135e-05, + "loss": 0.1192, + "step": 33130 + }, + { + "epoch": 32.01, + "learning_rate": 5.6587837837837844e-05, + "loss": 0.1677, + "step": 33140 + }, + { + "epoch": 32.01, + "learning_rate": 5.6574324324324325e-05, + "loss": 0.1858, + "step": 33150 + }, + { + "epoch": 32.01, + "learning_rate": 5.656081081081081e-05, + "loss": 0.1996, + "step": 33160 + }, + { + "epoch": 32.01, + "learning_rate": 5.6547297297297294e-05, + "loss": 0.248, + "step": 33170 + }, + { + "epoch": 32.01, + "learning_rate": 5.653378378378379e-05, + "loss": 0.3296, + "step": 33180 + }, + { + "epoch": 32.01, + "learning_rate": 5.6521621621621625e-05, + "loss": 0.222, + "step": 33190 + }, + { + "epoch": 32.01, + "learning_rate": 5.650810810810811e-05, + "loss": 0.3005, + "step": 33200 + }, + { + "epoch": 32.01, + "learning_rate": 5.6494594594594594e-05, + "loss": 0.3004, + "step": 33210 + }, + { + "epoch": 32.01, + "learning_rate": 5.648108108108109e-05, + "loss": 0.3089, + "step": 33220 + }, + { + "epoch": 32.01, + "learning_rate": 5.646756756756757e-05, + "loss": 0.3961, + "step": 33230 + }, + { + "epoch": 32.01, + "learning_rate": 5.6454054054054064e-05, + "loss": 0.2866, + "step": 33240 + }, + { + "epoch": 32.01, + "learning_rate": 5.6440540540540545e-05, + "loss": 0.3494, + "step": 33250 + }, + { + "epoch": 32.01, + "learning_rate": 5.642702702702703e-05, + "loss": 0.5371, + "step": 33260 + }, + { + "epoch": 32.01, + "learning_rate": 5.6413513513513514e-05, + "loss": 0.503, + "step": 33270 + }, + { + "epoch": 32.01, + "learning_rate": 5.6399999999999995e-05, + "loss": 0.1692, + "step": 33280 + }, + { + "epoch": 32.01, + "learning_rate": 5.638648648648649e-05, + "loss": 0.1918, + "step": 33290 + }, + { + "epoch": 32.01, + "learning_rate": 5.637297297297297e-05, + "loss": 0.2388, + "step": 33300 + }, + { + "epoch": 32.01, + "learning_rate": 5.6359459459459466e-05, + "loss": 0.2034, + "step": 33310 + }, + { + "epoch": 32.01, + "learning_rate": 5.6345945945945947e-05, + "loss": 0.1979, + "step": 33320 + }, + { + "epoch": 32.01, + "learning_rate": 5.6332432432432434e-05, + "loss": 0.1572, + "step": 33330 + }, + { + "epoch": 32.01, + "learning_rate": 5.6318918918918915e-05, + "loss": 0.1555, + "step": 33340 + }, + { + "epoch": 32.01, + "learning_rate": 5.630540540540541e-05, + "loss": 0.2197, + "step": 33350 + }, + { + "epoch": 32.01, + "learning_rate": 5.629189189189189e-05, + "loss": 0.4269, + "step": 33360 + }, + { + "epoch": 32.01, + "learning_rate": 5.6278378378378386e-05, + "loss": 0.3671, + "step": 33370 + }, + { + "epoch": 32.01, + "learning_rate": 5.626486486486487e-05, + "loss": 0.2821, + "step": 33380 + }, + { + "epoch": 32.01, + "learning_rate": 5.6251351351351354e-05, + "loss": 0.3283, + "step": 33390 + }, + { + "epoch": 32.01, + "learning_rate": 5.6237837837837835e-05, + "loss": 0.499, + "step": 33400 + }, + { + "epoch": 32.01, + "learning_rate": 5.622432432432433e-05, + "loss": 0.2965, + "step": 33410 + }, + { + "epoch": 32.01, + "learning_rate": 5.621081081081081e-05, + "loss": 0.2015, + "step": 33420 + }, + { + "epoch": 32.01, + "learning_rate": 5.61972972972973e-05, + "loss": 0.2609, + "step": 33430 + }, + { + "epoch": 32.01, + "learning_rate": 5.618378378378378e-05, + "loss": 0.3717, + "step": 33440 + }, + { + "epoch": 32.01, + "learning_rate": 5.6170270270270274e-05, + "loss": 0.3534, + "step": 33450 + }, + { + "epoch": 32.01, + "learning_rate": 5.6156756756756756e-05, + "loss": 0.3068, + "step": 33460 + }, + { + "epoch": 32.01, + "learning_rate": 5.614324324324325e-05, + "loss": 0.2649, + "step": 33470 + }, + { + "epoch": 32.01, + "learning_rate": 5.612972972972973e-05, + "loss": 0.2627, + "step": 33480 + }, + { + "epoch": 32.01, + "learning_rate": 5.611621621621622e-05, + "loss": 0.256, + "step": 33490 + }, + { + "epoch": 32.01, + "learning_rate": 5.61027027027027e-05, + "loss": 0.2469, + "step": 33500 + }, + { + "epoch": 32.01, + "eval_loss": 0.10492494702339172, + "eval_runtime": 128.3558, + "eval_samples_per_second": 28.109, + "eval_steps_per_second": 3.514, + "eval_wer": 0.09886781903741322, + "step": 33500 + }, + { + "epoch": 32.01, + "learning_rate": 5.6089189189189195e-05, + "loss": 0.1797, + "step": 33510 + }, + { + "epoch": 32.01, + "learning_rate": 5.6075675675675676e-05, + "loss": 0.1441, + "step": 33520 + }, + { + "epoch": 32.01, + "learning_rate": 5.606216216216217e-05, + "loss": 0.2693, + "step": 33530 + }, + { + "epoch": 32.01, + "learning_rate": 5.604864864864865e-05, + "loss": 0.5858, + "step": 33540 + }, + { + "epoch": 32.01, + "learning_rate": 5.603513513513514e-05, + "loss": 0.2154, + "step": 33550 + }, + { + "epoch": 32.01, + "learning_rate": 5.602162162162162e-05, + "loss": 0.1975, + "step": 33560 + }, + { + "epoch": 32.01, + "learning_rate": 5.6008108108108115e-05, + "loss": 0.2669, + "step": 33570 + }, + { + "epoch": 32.01, + "learning_rate": 5.5994594594594596e-05, + "loss": 0.2926, + "step": 33580 + }, + { + "epoch": 32.01, + "learning_rate": 5.598108108108109e-05, + "loss": 0.2999, + "step": 33590 + }, + { + "epoch": 32.01, + "learning_rate": 5.596756756756757e-05, + "loss": 0.3664, + "step": 33600 + }, + { + "epoch": 32.01, + "learning_rate": 5.595405405405406e-05, + "loss": 0.3339, + "step": 33610 + }, + { + "epoch": 32.01, + "learning_rate": 5.594054054054054e-05, + "loss": 0.1986, + "step": 33620 + }, + { + "epoch": 32.01, + "learning_rate": 5.5927027027027035e-05, + "loss": 0.362, + "step": 33630 + }, + { + "epoch": 32.01, + "learning_rate": 5.5913513513513516e-05, + "loss": 0.3197, + "step": 33640 + }, + { + "epoch": 32.01, + "learning_rate": 5.590000000000001e-05, + "loss": 0.3852, + "step": 33650 + }, + { + "epoch": 32.01, + "learning_rate": 5.588648648648649e-05, + "loss": 0.4336, + "step": 33660 + }, + { + "epoch": 32.01, + "learning_rate": 5.587297297297298e-05, + "loss": 0.3583, + "step": 33670 + }, + { + "epoch": 32.01, + "learning_rate": 5.585945945945946e-05, + "loss": 0.5409, + "step": 33680 + }, + { + "epoch": 32.01, + "learning_rate": 5.584594594594594e-05, + "loss": 0.403, + "step": 33690 + }, + { + "epoch": 32.01, + "learning_rate": 5.5832432432432436e-05, + "loss": 0.4978, + "step": 33700 + }, + { + "epoch": 32.01, + "learning_rate": 5.581891891891892e-05, + "loss": 0.5341, + "step": 33710 + }, + { + "epoch": 32.01, + "learning_rate": 5.580540540540541e-05, + "loss": 0.3625, + "step": 33720 + }, + { + "epoch": 32.01, + "learning_rate": 5.579189189189189e-05, + "loss": 0.3558, + "step": 33730 + }, + { + "epoch": 32.01, + "learning_rate": 5.577837837837838e-05, + "loss": 0.373, + "step": 33740 + }, + { + "epoch": 32.01, + "learning_rate": 5.576486486486486e-05, + "loss": 0.3599, + "step": 33750 + }, + { + "epoch": 33.0, + "learning_rate": 5.5751351351351356e-05, + "loss": 0.5671, + "step": 33760 + }, + { + "epoch": 33.0, + "learning_rate": 5.573783783783784e-05, + "loss": 0.4014, + "step": 33770 + }, + { + "epoch": 33.0, + "learning_rate": 5.572432432432433e-05, + "loss": 0.4485, + "step": 33780 + }, + { + "epoch": 33.0, + "learning_rate": 5.571081081081081e-05, + "loss": 0.4687, + "step": 33790 + }, + { + "epoch": 33.0, + "learning_rate": 5.56972972972973e-05, + "loss": 0.3756, + "step": 33800 + }, + { + "epoch": 33.0, + "learning_rate": 5.568378378378378e-05, + "loss": 0.4475, + "step": 33810 + }, + { + "epoch": 33.0, + "learning_rate": 5.5670270270270276e-05, + "loss": 0.4705, + "step": 33820 + }, + { + "epoch": 33.0, + "learning_rate": 5.565675675675676e-05, + "loss": 0.5455, + "step": 33830 + }, + { + "epoch": 33.0, + "learning_rate": 5.564324324324325e-05, + "loss": 0.4207, + "step": 33840 + }, + { + "epoch": 33.0, + "learning_rate": 5.562972972972973e-05, + "loss": 0.4428, + "step": 33850 + }, + { + "epoch": 33.0, + "learning_rate": 5.561621621621622e-05, + "loss": 0.424, + "step": 33860 + }, + { + "epoch": 33.0, + "learning_rate": 5.56027027027027e-05, + "loss": 0.3773, + "step": 33870 + }, + { + "epoch": 33.0, + "learning_rate": 5.5589189189189196e-05, + "loss": 0.3938, + "step": 33880 + }, + { + "epoch": 33.0, + "learning_rate": 5.557567567567568e-05, + "loss": 0.2388, + "step": 33890 + }, + { + "epoch": 33.0, + "learning_rate": 5.5562162162162165e-05, + "loss": 0.2318, + "step": 33900 + }, + { + "epoch": 33.0, + "learning_rate": 5.5548648648648646e-05, + "loss": 0.2632, + "step": 33910 + }, + { + "epoch": 33.0, + "learning_rate": 5.553513513513514e-05, + "loss": 0.5697, + "step": 33920 + }, + { + "epoch": 33.0, + "learning_rate": 5.552162162162162e-05, + "loss": 1.0229, + "step": 33930 + }, + { + "epoch": 33.0, + "learning_rate": 5.5508108108108116e-05, + "loss": 2.0729, + "step": 33940 + }, + { + "epoch": 33.0, + "learning_rate": 5.54945945945946e-05, + "loss": 2.5481, + "step": 33950 + }, + { + "epoch": 33.0, + "learning_rate": 5.5481081081081085e-05, + "loss": 2.4527, + "step": 33960 + }, + { + "epoch": 33.0, + "learning_rate": 5.5467567567567566e-05, + "loss": 2.5497, + "step": 33970 + }, + { + "epoch": 33.0, + "learning_rate": 5.545405405405406e-05, + "loss": 1.7732, + "step": 33980 + }, + { + "epoch": 33.0, + "learning_rate": 5.544054054054054e-05, + "loss": 1.5224, + "step": 33990 + }, + { + "epoch": 33.0, + "learning_rate": 5.5427027027027036e-05, + "loss": 1.0054, + "step": 34000 + }, + { + "epoch": 33.0, + "eval_loss": 0.13148286938667297, + "eval_runtime": 132.7862, + "eval_samples_per_second": 27.171, + "eval_steps_per_second": 3.396, + "eval_wer": 0.10459861156408704, + "step": 34000 + }, + { + "epoch": 33.0, + "learning_rate": 5.541351351351352e-05, + "loss": 0.429, + "step": 34010 + }, + { + "epoch": 33.0, + "learning_rate": 5.5400000000000005e-05, + "loss": 0.1319, + "step": 34020 + }, + { + "epoch": 33.0, + "learning_rate": 5.5386486486486486e-05, + "loss": 0.2709, + "step": 34030 + }, + { + "epoch": 33.0, + "learning_rate": 5.537297297297298e-05, + "loss": 0.2444, + "step": 34040 + }, + { + "epoch": 33.0, + "learning_rate": 5.535945945945946e-05, + "loss": 0.2985, + "step": 34050 + }, + { + "epoch": 33.0, + "learning_rate": 5.5345945945945956e-05, + "loss": 0.4718, + "step": 34060 + }, + { + "epoch": 33.0, + "learning_rate": 5.533243243243244e-05, + "loss": 0.3191, + "step": 34070 + }, + { + "epoch": 33.0, + "learning_rate": 5.531891891891892e-05, + "loss": 0.1402, + "step": 34080 + }, + { + "epoch": 33.0, + "learning_rate": 5.5305405405405406e-05, + "loss": 0.2439, + "step": 34090 + }, + { + "epoch": 33.0, + "learning_rate": 5.529189189189189e-05, + "loss": 0.1958, + "step": 34100 + }, + { + "epoch": 33.0, + "learning_rate": 5.527837837837838e-05, + "loss": 0.2825, + "step": 34110 + }, + { + "epoch": 33.0, + "learning_rate": 5.526486486486486e-05, + "loss": 0.2559, + "step": 34120 + }, + { + "epoch": 33.0, + "learning_rate": 5.525135135135136e-05, + "loss": 0.1964, + "step": 34130 + }, + { + "epoch": 33.01, + "learning_rate": 5.523783783783784e-05, + "loss": 0.2356, + "step": 34140 + }, + { + "epoch": 33.01, + "learning_rate": 5.5224324324324326e-05, + "loss": 0.1267, + "step": 34150 + }, + { + "epoch": 33.01, + "learning_rate": 5.521081081081081e-05, + "loss": 0.2048, + "step": 34160 + }, + { + "epoch": 33.01, + "learning_rate": 5.51972972972973e-05, + "loss": 0.2222, + "step": 34170 + }, + { + "epoch": 33.01, + "learning_rate": 5.518378378378378e-05, + "loss": 0.1459, + "step": 34180 + }, + { + "epoch": 33.01, + "learning_rate": 5.517027027027028e-05, + "loss": 0.2137, + "step": 34190 + }, + { + "epoch": 33.01, + "learning_rate": 5.515675675675676e-05, + "loss": 0.3391, + "step": 34200 + }, + { + "epoch": 33.01, + "learning_rate": 5.5143243243243246e-05, + "loss": 0.2706, + "step": 34210 + }, + { + "epoch": 33.01, + "learning_rate": 5.512972972972973e-05, + "loss": 0.2422, + "step": 34220 + }, + { + "epoch": 33.01, + "learning_rate": 5.511621621621622e-05, + "loss": 0.357, + "step": 34230 + }, + { + "epoch": 33.01, + "learning_rate": 5.51027027027027e-05, + "loss": 0.2618, + "step": 34240 + }, + { + "epoch": 33.01, + "learning_rate": 5.50891891891892e-05, + "loss": 0.426, + "step": 34250 + }, + { + "epoch": 33.01, + "learning_rate": 5.507567567567568e-05, + "loss": 0.3309, + "step": 34260 + }, + { + "epoch": 33.01, + "learning_rate": 5.5062162162162166e-05, + "loss": 0.2607, + "step": 34270 + }, + { + "epoch": 33.01, + "learning_rate": 5.504864864864865e-05, + "loss": 0.5649, + "step": 34280 + }, + { + "epoch": 33.01, + "learning_rate": 5.503513513513514e-05, + "loss": 0.4989, + "step": 34290 + }, + { + "epoch": 33.01, + "learning_rate": 5.502162162162162e-05, + "loss": 0.2445, + "step": 34300 + }, + { + "epoch": 33.01, + "learning_rate": 5.500810810810811e-05, + "loss": 0.159, + "step": 34310 + }, + { + "epoch": 33.01, + "learning_rate": 5.49945945945946e-05, + "loss": 0.252, + "step": 34320 + }, + { + "epoch": 33.01, + "learning_rate": 5.4981081081081086e-05, + "loss": 0.1851, + "step": 34330 + }, + { + "epoch": 33.01, + "learning_rate": 5.496756756756757e-05, + "loss": 0.1994, + "step": 34340 + }, + { + "epoch": 33.01, + "learning_rate": 5.495405405405406e-05, + "loss": 0.1587, + "step": 34350 + }, + { + "epoch": 33.01, + "learning_rate": 5.494054054054054e-05, + "loss": 0.1551, + "step": 34360 + }, + { + "epoch": 33.01, + "learning_rate": 5.492702702702703e-05, + "loss": 0.1773, + "step": 34370 + }, + { + "epoch": 33.01, + "learning_rate": 5.491351351351351e-05, + "loss": 0.4266, + "step": 34380 + }, + { + "epoch": 33.01, + "learning_rate": 5.4900000000000006e-05, + "loss": 0.3815, + "step": 34390 + }, + { + "epoch": 33.01, + "learning_rate": 5.488648648648649e-05, + "loss": 0.2857, + "step": 34400 + }, + { + "epoch": 33.01, + "learning_rate": 5.487297297297298e-05, + "loss": 0.2776, + "step": 34410 + }, + { + "epoch": 33.01, + "learning_rate": 5.485945945945946e-05, + "loss": 0.4199, + "step": 34420 + }, + { + "epoch": 33.01, + "learning_rate": 5.484594594594595e-05, + "loss": 0.3559, + "step": 34430 + }, + { + "epoch": 33.01, + "learning_rate": 5.483243243243243e-05, + "loss": 0.1847, + "step": 34440 + }, + { + "epoch": 33.01, + "learning_rate": 5.4818918918918926e-05, + "loss": 0.2357, + "step": 34450 + }, + { + "epoch": 33.01, + "learning_rate": 5.480540540540541e-05, + "loss": 0.3068, + "step": 34460 + }, + { + "epoch": 33.01, + "learning_rate": 5.47918918918919e-05, + "loss": 0.3773, + "step": 34470 + }, + { + "epoch": 33.01, + "learning_rate": 5.477837837837838e-05, + "loss": 0.2689, + "step": 34480 + }, + { + "epoch": 33.01, + "learning_rate": 5.4764864864864864e-05, + "loss": 0.2863, + "step": 34490 + }, + { + "epoch": 33.01, + "learning_rate": 5.475135135135135e-05, + "loss": 0.2875, + "step": 34500 + }, + { + "epoch": 33.01, + "eval_loss": 0.09858305752277374, + "eval_runtime": 128.8449, + "eval_samples_per_second": 28.003, + "eval_steps_per_second": 3.5, + "eval_wer": 0.0933233937473792, + "step": 34500 + }, + { + "epoch": 33.01, + "learning_rate": 5.473783783783783e-05, + "loss": 0.2568, + "step": 34510 + }, + { + "epoch": 33.01, + "learning_rate": 5.472432432432433e-05, + "loss": 0.1914, + "step": 34520 + }, + { + "epoch": 33.01, + "learning_rate": 5.471081081081081e-05, + "loss": 0.2125, + "step": 34530 + }, + { + "epoch": 33.01, + "learning_rate": 5.46972972972973e-05, + "loss": 0.1309, + "step": 34540 + }, + { + "epoch": 33.01, + "learning_rate": 5.4683783783783784e-05, + "loss": 0.2791, + "step": 34550 + }, + { + "epoch": 33.01, + "learning_rate": 5.467027027027027e-05, + "loss": 0.5577, + "step": 34560 + }, + { + "epoch": 33.01, + "learning_rate": 5.465675675675675e-05, + "loss": 0.3256, + "step": 34570 + }, + { + "epoch": 33.01, + "learning_rate": 5.464324324324325e-05, + "loss": 0.1818, + "step": 34580 + }, + { + "epoch": 33.01, + "learning_rate": 5.462972972972973e-05, + "loss": 0.2448, + "step": 34590 + }, + { + "epoch": 33.01, + "learning_rate": 5.461621621621622e-05, + "loss": 0.2323, + "step": 34600 + }, + { + "epoch": 33.01, + "learning_rate": 5.4602702702702704e-05, + "loss": 0.2443, + "step": 34610 + }, + { + "epoch": 33.01, + "learning_rate": 5.458918918918919e-05, + "loss": 0.353, + "step": 34620 + }, + { + "epoch": 33.01, + "learning_rate": 5.457567567567567e-05, + "loss": 0.38, + "step": 34630 + }, + { + "epoch": 33.01, + "learning_rate": 5.456216216216217e-05, + "loss": 0.2115, + "step": 34640 + }, + { + "epoch": 33.01, + "learning_rate": 5.454864864864865e-05, + "loss": 0.2954, + "step": 34650 + }, + { + "epoch": 33.01, + "learning_rate": 5.453513513513514e-05, + "loss": 0.2216, + "step": 34660 + }, + { + "epoch": 33.01, + "learning_rate": 5.4521621621621624e-05, + "loss": 0.3928, + "step": 34670 + }, + { + "epoch": 33.01, + "learning_rate": 5.450810810810811e-05, + "loss": 0.4421, + "step": 34680 + }, + { + "epoch": 33.01, + "learning_rate": 5.449459459459459e-05, + "loss": 0.3282, + "step": 34690 + }, + { + "epoch": 33.01, + "learning_rate": 5.448108108108109e-05, + "loss": 0.4504, + "step": 34700 + }, + { + "epoch": 33.01, + "learning_rate": 5.446756756756757e-05, + "loss": 0.4771, + "step": 34710 + }, + { + "epoch": 33.01, + "learning_rate": 5.445405405405406e-05, + "loss": 0.44, + "step": 34720 + }, + { + "epoch": 33.01, + "learning_rate": 5.4440540540540544e-05, + "loss": 0.4954, + "step": 34730 + }, + { + "epoch": 33.01, + "learning_rate": 5.442702702702703e-05, + "loss": 0.3932, + "step": 34740 + }, + { + "epoch": 33.01, + "learning_rate": 5.441351351351351e-05, + "loss": 0.3839, + "step": 34750 + }, + { + "epoch": 33.01, + "learning_rate": 5.440000000000001e-05, + "loss": 0.3747, + "step": 34760 + }, + { + "epoch": 33.01, + "learning_rate": 5.438648648648649e-05, + "loss": 0.3922, + "step": 34770 + }, + { + "epoch": 33.01, + "learning_rate": 5.4372972972972977e-05, + "loss": 0.4774, + "step": 34780 + }, + { + "epoch": 34.0, + "learning_rate": 5.435945945945946e-05, + "loss": 0.5334, + "step": 34790 + }, + { + "epoch": 34.0, + "learning_rate": 5.434594594594595e-05, + "loss": 0.4126, + "step": 34800 + }, + { + "epoch": 34.0, + "learning_rate": 5.433243243243243e-05, + "loss": 0.4703, + "step": 34810 + }, + { + "epoch": 34.0, + "learning_rate": 5.431891891891893e-05, + "loss": 0.3939, + "step": 34820 + }, + { + "epoch": 34.0, + "learning_rate": 5.430540540540541e-05, + "loss": 0.4087, + "step": 34830 + }, + { + "epoch": 34.0, + "learning_rate": 5.4291891891891897e-05, + "loss": 0.3857, + "step": 34840 + }, + { + "epoch": 34.0, + "learning_rate": 5.427837837837838e-05, + "loss": 0.5829, + "step": 34850 + }, + { + "epoch": 34.0, + "learning_rate": 5.426486486486487e-05, + "loss": 0.4025, + "step": 34860 + }, + { + "epoch": 34.0, + "learning_rate": 5.425135135135135e-05, + "loss": 0.4082, + "step": 34870 + }, + { + "epoch": 34.0, + "learning_rate": 5.4237837837837834e-05, + "loss": 0.4271, + "step": 34880 + }, + { + "epoch": 34.0, + "learning_rate": 5.422432432432433e-05, + "loss": 0.393, + "step": 34890 + }, + { + "epoch": 34.0, + "learning_rate": 5.421081081081081e-05, + "loss": 0.3971, + "step": 34900 + }, + { + "epoch": 34.0, + "learning_rate": 5.41972972972973e-05, + "loss": 0.297, + "step": 34910 + }, + { + "epoch": 34.0, + "learning_rate": 5.418378378378378e-05, + "loss": 0.2565, + "step": 34920 + }, + { + "epoch": 34.0, + "learning_rate": 5.417027027027027e-05, + "loss": 0.2553, + "step": 34930 + }, + { + "epoch": 34.0, + "learning_rate": 5.4156756756756754e-05, + "loss": 0.3115, + "step": 34940 + }, + { + "epoch": 34.0, + "learning_rate": 5.414324324324325e-05, + "loss": 1.1867, + "step": 34950 + }, + { + "epoch": 34.0, + "learning_rate": 5.412972972972973e-05, + "loss": 1.498, + "step": 34960 + }, + { + "epoch": 34.0, + "learning_rate": 5.411621621621622e-05, + "loss": 2.5748, + "step": 34970 + }, + { + "epoch": 34.0, + "learning_rate": 5.41027027027027e-05, + "loss": 2.4109, + "step": 34980 + }, + { + "epoch": 34.0, + "learning_rate": 5.408918918918919e-05, + "loss": 2.5666, + "step": 34990 + }, + { + "epoch": 34.0, + "learning_rate": 5.4075675675675674e-05, + "loss": 2.1473, + "step": 35000 + }, + { + "epoch": 34.0, + "eval_loss": 0.11062583327293396, + "eval_runtime": 129.0373, + "eval_samples_per_second": 27.961, + "eval_steps_per_second": 3.495, + "eval_wer": 0.10855891534268276, + "step": 35000 + }, + { + "epoch": 34.0, + "learning_rate": 5.406216216216217e-05, + "loss": 1.431, + "step": 35010 + }, + { + "epoch": 34.0, + "learning_rate": 5.404864864864865e-05, + "loss": 1.3126, + "step": 35020 + }, + { + "epoch": 34.0, + "learning_rate": 5.403513513513514e-05, + "loss": 0.4752, + "step": 35030 + }, + { + "epoch": 34.0, + "learning_rate": 5.402162162162162e-05, + "loss": 0.164, + "step": 35040 + }, + { + "epoch": 34.0, + "learning_rate": 5.4008108108108113e-05, + "loss": 0.2793, + "step": 35050 + }, + { + "epoch": 34.0, + "learning_rate": 5.3994594594594594e-05, + "loss": 0.1955, + "step": 35060 + }, + { + "epoch": 34.0, + "learning_rate": 5.398108108108109e-05, + "loss": 0.325, + "step": 35070 + }, + { + "epoch": 34.0, + "learning_rate": 5.396756756756757e-05, + "loss": 0.4249, + "step": 35080 + }, + { + "epoch": 34.0, + "learning_rate": 5.395405405405406e-05, + "loss": 0.3362, + "step": 35090 + }, + { + "epoch": 34.0, + "learning_rate": 5.394054054054054e-05, + "loss": 0.171, + "step": 35100 + }, + { + "epoch": 34.0, + "learning_rate": 5.3927027027027033e-05, + "loss": 0.2247, + "step": 35110 + }, + { + "epoch": 34.0, + "learning_rate": 5.3913513513513515e-05, + "loss": 0.2329, + "step": 35120 + }, + { + "epoch": 34.0, + "learning_rate": 5.390000000000001e-05, + "loss": 0.2252, + "step": 35130 + }, + { + "epoch": 34.0, + "learning_rate": 5.388648648648649e-05, + "loss": 0.2442, + "step": 35140 + }, + { + "epoch": 34.0, + "learning_rate": 5.387297297297298e-05, + "loss": 0.2092, + "step": 35150 + }, + { + "epoch": 34.01, + "learning_rate": 5.385945945945946e-05, + "loss": 0.1736, + "step": 35160 + }, + { + "epoch": 34.01, + "learning_rate": 5.3845945945945954e-05, + "loss": 0.1355, + "step": 35170 + }, + { + "epoch": 34.01, + "learning_rate": 5.3832432432432435e-05, + "loss": 0.1227, + "step": 35180 + }, + { + "epoch": 34.01, + "learning_rate": 5.381891891891893e-05, + "loss": 0.2241, + "step": 35190 + }, + { + "epoch": 34.01, + "learning_rate": 5.380540540540541e-05, + "loss": 0.1571, + "step": 35200 + }, + { + "epoch": 34.01, + "learning_rate": 5.37918918918919e-05, + "loss": 0.2342, + "step": 35210 + }, + { + "epoch": 34.01, + "learning_rate": 5.377837837837838e-05, + "loss": 0.2705, + "step": 35220 + }, + { + "epoch": 34.01, + "learning_rate": 5.3764864864864874e-05, + "loss": 0.2875, + "step": 35230 + }, + { + "epoch": 34.01, + "learning_rate": 5.3751351351351355e-05, + "loss": 0.2183, + "step": 35240 + }, + { + "epoch": 34.01, + "learning_rate": 5.373783783783784e-05, + "loss": 0.3226, + "step": 35250 + }, + { + "epoch": 34.01, + "learning_rate": 5.3724324324324323e-05, + "loss": 0.2509, + "step": 35260 + }, + { + "epoch": 34.01, + "learning_rate": 5.371081081081082e-05, + "loss": 0.3353, + "step": 35270 + }, + { + "epoch": 34.01, + "learning_rate": 5.36972972972973e-05, + "loss": 0.3642, + "step": 35280 + }, + { + "epoch": 34.01, + "learning_rate": 5.368378378378378e-05, + "loss": 0.2281, + "step": 35290 + }, + { + "epoch": 34.01, + "learning_rate": 5.3670270270270275e-05, + "loss": 0.4985, + "step": 35300 + }, + { + "epoch": 34.01, + "learning_rate": 5.3656756756756756e-05, + "loss": 0.5439, + "step": 35310 + }, + { + "epoch": 34.01, + "learning_rate": 5.3643243243243244e-05, + "loss": 0.3953, + "step": 35320 + }, + { + "epoch": 34.01, + "learning_rate": 5.3629729729729725e-05, + "loss": 0.1224, + "step": 35330 + }, + { + "epoch": 34.01, + "learning_rate": 5.361621621621622e-05, + "loss": 0.214, + "step": 35340 + }, + { + "epoch": 34.01, + "learning_rate": 5.36027027027027e-05, + "loss": 0.1789, + "step": 35350 + }, + { + "epoch": 34.01, + "learning_rate": 5.3589189189189195e-05, + "loss": 0.1667, + "step": 35360 + }, + { + "epoch": 34.01, + "learning_rate": 5.3575675675675676e-05, + "loss": 0.1718, + "step": 35370 + }, + { + "epoch": 34.01, + "learning_rate": 5.3562162162162164e-05, + "loss": 0.1696, + "step": 35380 + }, + { + "epoch": 34.01, + "learning_rate": 5.3548648648648645e-05, + "loss": 0.1672, + "step": 35390 + }, + { + "epoch": 34.01, + "learning_rate": 5.353513513513514e-05, + "loss": 0.3363, + "step": 35400 + }, + { + "epoch": 34.01, + "learning_rate": 5.352162162162162e-05, + "loss": 0.4151, + "step": 35410 + }, + { + "epoch": 34.01, + "learning_rate": 5.3508108108108115e-05, + "loss": 0.3609, + "step": 35420 + }, + { + "epoch": 34.01, + "learning_rate": 5.3494594594594596e-05, + "loss": 0.2872, + "step": 35430 + }, + { + "epoch": 34.01, + "learning_rate": 5.3481081081081084e-05, + "loss": 0.4355, + "step": 35440 + }, + { + "epoch": 34.01, + "learning_rate": 5.3467567567567565e-05, + "loss": 0.3583, + "step": 35450 + }, + { + "epoch": 34.01, + "learning_rate": 5.345405405405406e-05, + "loss": 0.2471, + "step": 35460 + }, + { + "epoch": 34.01, + "learning_rate": 5.344054054054054e-05, + "loss": 0.196, + "step": 35470 + }, + { + "epoch": 34.01, + "learning_rate": 5.3427027027027035e-05, + "loss": 0.2579, + "step": 35480 + }, + { + "epoch": 34.01, + "learning_rate": 5.3413513513513516e-05, + "loss": 0.3492, + "step": 35490 + }, + { + "epoch": 34.01, + "learning_rate": 5.3400000000000004e-05, + "loss": 0.3689, + "step": 35500 + }, + { + "epoch": 34.01, + "eval_loss": 0.0991378128528595, + "eval_runtime": 128.3789, + "eval_samples_per_second": 28.104, + "eval_steps_per_second": 3.513, + "eval_wer": 0.09826212551833388, + "step": 35500 + }, + { + "epoch": 34.01, + "learning_rate": 5.3386486486486485e-05, + "loss": 0.2504, + "step": 35510 + }, + { + "epoch": 34.01, + "learning_rate": 5.337297297297298e-05, + "loss": 0.254, + "step": 35520 + }, + { + "epoch": 34.01, + "learning_rate": 5.335945945945946e-05, + "loss": 0.2149, + "step": 35530 + }, + { + "epoch": 34.01, + "learning_rate": 5.3345945945945955e-05, + "loss": 0.2316, + "step": 35540 + }, + { + "epoch": 34.01, + "learning_rate": 5.3332432432432436e-05, + "loss": 0.2349, + "step": 35550 + }, + { + "epoch": 34.01, + "learning_rate": 5.3318918918918924e-05, + "loss": 0.1313, + "step": 35560 + }, + { + "epoch": 34.01, + "learning_rate": 5.3305405405405405e-05, + "loss": 0.2625, + "step": 35570 + }, + { + "epoch": 34.01, + "learning_rate": 5.32918918918919e-05, + "loss": 0.3863, + "step": 35580 + }, + { + "epoch": 34.01, + "learning_rate": 5.327837837837838e-05, + "loss": 0.4046, + "step": 35590 + }, + { + "epoch": 34.01, + "learning_rate": 5.3264864864864875e-05, + "loss": 0.1622, + "step": 35600 + }, + { + "epoch": 34.01, + "learning_rate": 5.3251351351351356e-05, + "loss": 0.2308, + "step": 35610 + }, + { + "epoch": 34.01, + "learning_rate": 5.3237837837837844e-05, + "loss": 0.2887, + "step": 35620 + }, + { + "epoch": 34.01, + "learning_rate": 5.3224324324324325e-05, + "loss": 0.2853, + "step": 35630 + }, + { + "epoch": 34.01, + "learning_rate": 5.321081081081082e-05, + "loss": 0.2879, + "step": 35640 + }, + { + "epoch": 34.01, + "learning_rate": 5.31972972972973e-05, + "loss": 0.3681, + "step": 35650 + }, + { + "epoch": 34.01, + "learning_rate": 5.318378378378379e-05, + "loss": 0.2128, + "step": 35660 + }, + { + "epoch": 34.01, + "learning_rate": 5.317027027027027e-05, + "loss": 0.2541, + "step": 35670 + }, + { + "epoch": 34.01, + "learning_rate": 5.3156756756756764e-05, + "loss": 0.275, + "step": 35680 + }, + { + "epoch": 34.01, + "learning_rate": 5.3143243243243245e-05, + "loss": 0.4269, + "step": 35690 + }, + { + "epoch": 34.01, + "learning_rate": 5.3129729729729726e-05, + "loss": 0.385, + "step": 35700 + }, + { + "epoch": 34.01, + "learning_rate": 5.311621621621622e-05, + "loss": 0.4339, + "step": 35710 + }, + { + "epoch": 34.01, + "learning_rate": 5.31027027027027e-05, + "loss": 0.3535, + "step": 35720 + }, + { + "epoch": 34.01, + "learning_rate": 5.308918918918919e-05, + "loss": 0.4884, + "step": 35730 + }, + { + "epoch": 34.01, + "learning_rate": 5.307567567567567e-05, + "loss": 0.3521, + "step": 35740 + }, + { + "epoch": 34.01, + "learning_rate": 5.3062162162162165e-05, + "loss": 0.5905, + "step": 35750 + }, + { + "epoch": 34.01, + "learning_rate": 5.3048648648648646e-05, + "loss": 0.4409, + "step": 35760 + }, + { + "epoch": 34.01, + "learning_rate": 5.303513513513514e-05, + "loss": 0.3694, + "step": 35770 + }, + { + "epoch": 34.01, + "learning_rate": 5.302162162162162e-05, + "loss": 0.4235, + "step": 35780 + }, + { + "epoch": 34.01, + "learning_rate": 5.300810810810811e-05, + "loss": 0.3802, + "step": 35790 + }, + { + "epoch": 34.01, + "learning_rate": 5.299459459459459e-05, + "loss": 0.4163, + "step": 35800 + }, + { + "epoch": 35.0, + "learning_rate": 5.2981081081081085e-05, + "loss": 0.5194, + "step": 35810 + }, + { + "epoch": 35.0, + "learning_rate": 5.2967567567567566e-05, + "loss": 0.4481, + "step": 35820 + }, + { + "epoch": 35.0, + "learning_rate": 5.295405405405406e-05, + "loss": 0.461, + "step": 35830 + }, + { + "epoch": 35.0, + "learning_rate": 5.294054054054054e-05, + "loss": 0.4555, + "step": 35840 + }, + { + "epoch": 35.0, + "learning_rate": 5.292702702702703e-05, + "loss": 0.3701, + "step": 35850 + }, + { + "epoch": 35.0, + "learning_rate": 5.291351351351351e-05, + "loss": 0.4298, + "step": 35860 + }, + { + "epoch": 35.0, + "learning_rate": 5.2900000000000005e-05, + "loss": 0.6055, + "step": 35870 + }, + { + "epoch": 35.0, + "learning_rate": 5.2886486486486486e-05, + "loss": 0.4036, + "step": 35880 + }, + { + "epoch": 35.0, + "learning_rate": 5.287297297297298e-05, + "loss": 0.4097, + "step": 35890 + }, + { + "epoch": 35.0, + "learning_rate": 5.285945945945946e-05, + "loss": 0.4361, + "step": 35900 + }, + { + "epoch": 35.0, + "learning_rate": 5.284594594594595e-05, + "loss": 0.4108, + "step": 35910 + }, + { + "epoch": 35.0, + "learning_rate": 5.283243243243243e-05, + "loss": 0.4403, + "step": 35920 + }, + { + "epoch": 35.0, + "learning_rate": 5.2818918918918925e-05, + "loss": 0.2793, + "step": 35930 + }, + { + "epoch": 35.0, + "learning_rate": 5.2805405405405406e-05, + "loss": 0.2661, + "step": 35940 + }, + { + "epoch": 35.0, + "learning_rate": 5.27918918918919e-05, + "loss": 0.2726, + "step": 35950 + }, + { + "epoch": 35.0, + "learning_rate": 5.277837837837838e-05, + "loss": 0.2698, + "step": 35960 + }, + { + "epoch": 35.0, + "learning_rate": 5.276486486486487e-05, + "loss": 1.0085, + "step": 35970 + }, + { + "epoch": 35.0, + "learning_rate": 5.275135135135135e-05, + "loss": 0.9839, + "step": 35980 + }, + { + "epoch": 35.0, + "learning_rate": 5.2737837837837845e-05, + "loss": 2.5858, + "step": 35990 + }, + { + "epoch": 35.0, + "learning_rate": 5.2724324324324326e-05, + "loss": 2.4004, + "step": 36000 + }, + { + "epoch": 35.0, + "eval_loss": 0.13400040566921234, + "eval_runtime": 138.7368, + "eval_samples_per_second": 26.006, + "eval_steps_per_second": 3.251, + "eval_wer": 0.13469692028141453, + "step": 36000 + }, + { + "epoch": 35.0, + "learning_rate": 5.271081081081082e-05, + "loss": 2.5416, + "step": 36010 + }, + { + "epoch": 35.0, + "learning_rate": 5.26972972972973e-05, + "loss": 2.5734, + "step": 36020 + }, + { + "epoch": 35.0, + "learning_rate": 5.268378378378379e-05, + "loss": 1.2357, + "step": 36030 + }, + { + "epoch": 35.0, + "learning_rate": 5.267027027027027e-05, + "loss": 1.4962, + "step": 36040 + }, + { + "epoch": 35.0, + "learning_rate": 5.2656756756756765e-05, + "loss": 0.6954, + "step": 36050 + }, + { + "epoch": 35.0, + "learning_rate": 5.2643243243243246e-05, + "loss": 0.2503, + "step": 36060 + }, + { + "epoch": 35.0, + "learning_rate": 5.262972972972974e-05, + "loss": 0.1681, + "step": 36070 + }, + { + "epoch": 35.0, + "learning_rate": 5.261621621621622e-05, + "loss": 0.2456, + "step": 36080 + }, + { + "epoch": 35.0, + "learning_rate": 5.26027027027027e-05, + "loss": 0.2892, + "step": 36090 + }, + { + "epoch": 35.0, + "learning_rate": 5.258918918918919e-05, + "loss": 0.3605, + "step": 36100 + }, + { + "epoch": 35.0, + "learning_rate": 5.257567567567567e-05, + "loss": 0.3607, + "step": 36110 + }, + { + "epoch": 35.0, + "learning_rate": 5.2562162162162166e-05, + "loss": 0.1781, + "step": 36120 + }, + { + "epoch": 35.0, + "learning_rate": 5.254864864864865e-05, + "loss": 0.1555, + "step": 36130 + }, + { + "epoch": 35.0, + "learning_rate": 5.2535135135135135e-05, + "loss": 0.2688, + "step": 36140 + }, + { + "epoch": 35.0, + "learning_rate": 5.2521621621621616e-05, + "loss": 0.1977, + "step": 36150 + }, + { + "epoch": 35.0, + "learning_rate": 5.250810810810811e-05, + "loss": 0.2401, + "step": 36160 + }, + { + "epoch": 35.0, + "learning_rate": 5.249459459459459e-05, + "loss": 0.2436, + "step": 36170 + }, + { + "epoch": 35.01, + "learning_rate": 5.2481081081081086e-05, + "loss": 0.2198, + "step": 36180 + }, + { + "epoch": 35.01, + "learning_rate": 5.246756756756757e-05, + "loss": 0.1716, + "step": 36190 + }, + { + "epoch": 35.01, + "learning_rate": 5.2454054054054055e-05, + "loss": 0.128, + "step": 36200 + }, + { + "epoch": 35.01, + "learning_rate": 5.2440540540540536e-05, + "loss": 0.2177, + "step": 36210 + }, + { + "epoch": 35.01, + "learning_rate": 5.242702702702703e-05, + "loss": 0.2013, + "step": 36220 + }, + { + "epoch": 35.01, + "learning_rate": 5.241351351351351e-05, + "loss": 0.1867, + "step": 36230 + }, + { + "epoch": 35.01, + "learning_rate": 5.2400000000000007e-05, + "loss": 0.2809, + "step": 36240 + }, + { + "epoch": 35.01, + "learning_rate": 5.238648648648649e-05, + "loss": 0.3115, + "step": 36250 + }, + { + "epoch": 35.01, + "learning_rate": 5.2372972972972975e-05, + "loss": 0.216, + "step": 36260 + }, + { + "epoch": 35.01, + "learning_rate": 5.2359459459459456e-05, + "loss": 0.2969, + "step": 36270 + }, + { + "epoch": 35.01, + "learning_rate": 5.234594594594595e-05, + "loss": 0.3257, + "step": 36280 + }, + { + "epoch": 35.01, + "learning_rate": 5.233243243243243e-05, + "loss": 0.3134, + "step": 36290 + }, + { + "epoch": 35.01, + "learning_rate": 5.2318918918918927e-05, + "loss": 0.3358, + "step": 36300 + }, + { + "epoch": 35.01, + "learning_rate": 5.230540540540541e-05, + "loss": 0.2328, + "step": 36310 + }, + { + "epoch": 35.01, + "learning_rate": 5.2291891891891895e-05, + "loss": 0.3851, + "step": 36320 + }, + { + "epoch": 35.01, + "learning_rate": 5.2278378378378376e-05, + "loss": 0.5276, + "step": 36330 + }, + { + "epoch": 35.01, + "learning_rate": 5.226486486486487e-05, + "loss": 0.4321, + "step": 36340 + }, + { + "epoch": 35.01, + "learning_rate": 5.225135135135135e-05, + "loss": 0.1546, + "step": 36350 + }, + { + "epoch": 35.01, + "learning_rate": 5.223783783783785e-05, + "loss": 0.2116, + "step": 36360 + }, + { + "epoch": 35.01, + "learning_rate": 5.222432432432433e-05, + "loss": 0.2, + "step": 36370 + }, + { + "epoch": 35.01, + "learning_rate": 5.2210810810810815e-05, + "loss": 0.1682, + "step": 36380 + }, + { + "epoch": 35.01, + "learning_rate": 5.2197297297297297e-05, + "loss": 0.157, + "step": 36390 + }, + { + "epoch": 35.01, + "learning_rate": 5.218378378378379e-05, + "loss": 0.1691, + "step": 36400 + }, + { + "epoch": 35.01, + "learning_rate": 5.217027027027027e-05, + "loss": 0.1657, + "step": 36410 + }, + { + "epoch": 35.01, + "learning_rate": 5.215675675675677e-05, + "loss": 0.1913, + "step": 36420 + }, + { + "epoch": 35.01, + "learning_rate": 5.214324324324325e-05, + "loss": 0.412, + "step": 36430 + }, + { + "epoch": 35.01, + "learning_rate": 5.2129729729729736e-05, + "loss": 0.3166, + "step": 36440 + }, + { + "epoch": 35.01, + "learning_rate": 5.2116216216216217e-05, + "loss": 0.243, + "step": 36450 + }, + { + "epoch": 35.01, + "learning_rate": 5.210270270270271e-05, + "loss": 0.3017, + "step": 36460 + }, + { + "epoch": 35.01, + "learning_rate": 5.208918918918919e-05, + "loss": 0.4474, + "step": 36470 + }, + { + "epoch": 35.01, + "learning_rate": 5.207567567567569e-05, + "loss": 0.2137, + "step": 36480 + }, + { + "epoch": 35.01, + "learning_rate": 5.206216216216217e-05, + "loss": 0.1976, + "step": 36490 + }, + { + "epoch": 35.01, + "learning_rate": 5.204864864864865e-05, + "loss": 0.2321, + "step": 36500 + }, + { + "epoch": 35.01, + "eval_loss": 0.0982365608215332, + "eval_runtime": 129.0355, + "eval_samples_per_second": 27.961, + "eval_steps_per_second": 3.495, + "eval_wer": 0.0941620463122583, + "step": 36500 + }, + { + "epoch": 35.01, + "learning_rate": 5.203513513513514e-05, + "loss": 0.3294, + "step": 36510 + }, + { + "epoch": 35.01, + "learning_rate": 5.202162162162162e-05, + "loss": 0.3388, + "step": 36520 + }, + { + "epoch": 35.01, + "learning_rate": 5.200810810810811e-05, + "loss": 0.2719, + "step": 36530 + }, + { + "epoch": 35.01, + "learning_rate": 5.199459459459459e-05, + "loss": 0.2861, + "step": 36540 + }, + { + "epoch": 35.01, + "learning_rate": 5.198108108108108e-05, + "loss": 0.2705, + "step": 36550 + }, + { + "epoch": 35.01, + "learning_rate": 5.196756756756757e-05, + "loss": 0.2112, + "step": 36560 + }, + { + "epoch": 35.01, + "learning_rate": 5.195405405405406e-05, + "loss": 0.269, + "step": 36570 + }, + { + "epoch": 35.01, + "learning_rate": 5.194054054054054e-05, + "loss": 0.1362, + "step": 36580 + }, + { + "epoch": 35.01, + "learning_rate": 5.192702702702703e-05, + "loss": 0.1649, + "step": 36590 + }, + { + "epoch": 35.01, + "learning_rate": 5.191351351351351e-05, + "loss": 0.2885, + "step": 36600 + }, + { + "epoch": 35.01, + "learning_rate": 5.19e-05, + "loss": 0.5846, + "step": 36610 + }, + { + "epoch": 35.01, + "learning_rate": 5.188648648648648e-05, + "loss": 0.1882, + "step": 36620 + }, + { + "epoch": 35.01, + "learning_rate": 5.187297297297298e-05, + "loss": 0.1753, + "step": 36630 + }, + { + "epoch": 35.01, + "learning_rate": 5.185945945945946e-05, + "loss": 0.2601, + "step": 36640 + }, + { + "epoch": 35.01, + "learning_rate": 5.184594594594595e-05, + "loss": 0.2482, + "step": 36650 + }, + { + "epoch": 35.01, + "learning_rate": 5.1832432432432433e-05, + "loss": 0.2557, + "step": 36660 + }, + { + "epoch": 35.01, + "learning_rate": 5.181891891891892e-05, + "loss": 0.3316, + "step": 36670 + }, + { + "epoch": 35.01, + "learning_rate": 5.18054054054054e-05, + "loss": 0.3161, + "step": 36680 + }, + { + "epoch": 35.01, + "learning_rate": 5.17918918918919e-05, + "loss": 0.2205, + "step": 36690 + }, + { + "epoch": 35.01, + "learning_rate": 5.177837837837838e-05, + "loss": 0.2943, + "step": 36700 + }, + { + "epoch": 35.01, + "learning_rate": 5.176486486486487e-05, + "loss": 0.3305, + "step": 36710 + }, + { + "epoch": 35.01, + "learning_rate": 5.1751351351351353e-05, + "loss": 0.3147, + "step": 36720 + }, + { + "epoch": 35.01, + "learning_rate": 5.173783783783784e-05, + "loss": 0.4516, + "step": 36730 + }, + { + "epoch": 35.01, + "learning_rate": 5.172432432432432e-05, + "loss": 0.3801, + "step": 36740 + }, + { + "epoch": 35.01, + "learning_rate": 5.171081081081082e-05, + "loss": 0.478, + "step": 36750 + }, + { + "epoch": 35.01, + "learning_rate": 5.16972972972973e-05, + "loss": 0.3795, + "step": 36760 + }, + { + "epoch": 35.01, + "learning_rate": 5.168378378378379e-05, + "loss": 0.4509, + "step": 36770 + }, + { + "epoch": 35.01, + "learning_rate": 5.1670270270270274e-05, + "loss": 0.4797, + "step": 36780 + }, + { + "epoch": 35.01, + "learning_rate": 5.165675675675676e-05, + "loss": 0.3752, + "step": 36790 + }, + { + "epoch": 35.01, + "learning_rate": 5.164324324324324e-05, + "loss": 0.3543, + "step": 36800 + }, + { + "epoch": 35.01, + "learning_rate": 5.162972972972974e-05, + "loss": 0.3732, + "step": 36810 + }, + { + "epoch": 35.01, + "learning_rate": 5.161621621621622e-05, + "loss": 0.3627, + "step": 36820 + }, + { + "epoch": 36.0, + "learning_rate": 5.160270270270271e-05, + "loss": 0.5099, + "step": 36830 + }, + { + "epoch": 36.0, + "learning_rate": 5.1589189189189194e-05, + "loss": 0.3934, + "step": 36840 + }, + { + "epoch": 36.0, + "learning_rate": 5.157567567567568e-05, + "loss": 0.4335, + "step": 36850 + }, + { + "epoch": 36.0, + "learning_rate": 5.156216216216216e-05, + "loss": 0.461, + "step": 36860 + }, + { + "epoch": 36.0, + "learning_rate": 5.154864864864866e-05, + "loss": 0.3367, + "step": 36870 + }, + { + "epoch": 36.0, + "learning_rate": 5.153513513513514e-05, + "loss": 0.3919, + "step": 36880 + }, + { + "epoch": 36.0, + "learning_rate": 5.152162162162162e-05, + "loss": 0.4666, + "step": 36890 + }, + { + "epoch": 36.0, + "learning_rate": 5.1508108108108114e-05, + "loss": 0.5004, + "step": 36900 + }, + { + "epoch": 36.0, + "learning_rate": 5.1494594594594595e-05, + "loss": 0.3642, + "step": 36910 + }, + { + "epoch": 36.0, + "learning_rate": 5.148108108108108e-05, + "loss": 0.4182, + "step": 36920 + }, + { + "epoch": 36.0, + "learning_rate": 5.1467567567567564e-05, + "loss": 0.4374, + "step": 36930 + }, + { + "epoch": 36.0, + "learning_rate": 5.145405405405406e-05, + "loss": 0.3666, + "step": 36940 + }, + { + "epoch": 36.0, + "learning_rate": 5.144054054054054e-05, + "loss": 0.3474, + "step": 36950 + }, + { + "epoch": 36.0, + "learning_rate": 5.1427027027027034e-05, + "loss": 0.2493, + "step": 36960 + }, + { + "epoch": 36.0, + "learning_rate": 5.1413513513513515e-05, + "loss": 0.2666, + "step": 36970 + }, + { + "epoch": 36.0, + "learning_rate": 5.14e-05, + "loss": 0.2226, + "step": 36980 + }, + { + "epoch": 36.0, + "learning_rate": 5.1386486486486484e-05, + "loss": 0.6622, + "step": 36990 + }, + { + "epoch": 36.0, + "learning_rate": 5.137297297297298e-05, + "loss": 0.8946, + "step": 37000 + }, + { + "epoch": 36.0, + "eval_loss": 0.10528739541769028, + "eval_runtime": 127.996, + "eval_samples_per_second": 28.188, + "eval_steps_per_second": 3.524, + "eval_wer": 0.10977030238084144, + "step": 37000 + }, + { + "epoch": 36.0, + "learning_rate": 5.135945945945946e-05, + "loss": 2.2419, + "step": 37010 + }, + { + "epoch": 36.0, + "learning_rate": 5.134594594594595e-05, + "loss": 2.5334, + "step": 37020 + }, + { + "epoch": 36.0, + "learning_rate": 5.133243243243243e-05, + "loss": 2.4673, + "step": 37030 + }, + { + "epoch": 36.0, + "learning_rate": 5.131891891891892e-05, + "loss": 2.5279, + "step": 37040 + }, + { + "epoch": 36.0, + "learning_rate": 5.1305405405405404e-05, + "loss": 1.6497, + "step": 37050 + }, + { + "epoch": 36.0, + "learning_rate": 5.12918918918919e-05, + "loss": 1.4723, + "step": 37060 + }, + { + "epoch": 36.0, + "learning_rate": 5.127837837837838e-05, + "loss": 0.9009, + "step": 37070 + }, + { + "epoch": 36.0, + "learning_rate": 5.126486486486487e-05, + "loss": 0.3583, + "step": 37080 + }, + { + "epoch": 36.0, + "learning_rate": 5.125135135135135e-05, + "loss": 0.1319, + "step": 37090 + }, + { + "epoch": 36.0, + "learning_rate": 5.123783783783784e-05, + "loss": 0.1965, + "step": 37100 + }, + { + "epoch": 36.0, + "learning_rate": 5.1224324324324324e-05, + "loss": 0.2604, + "step": 37110 + }, + { + "epoch": 36.0, + "learning_rate": 5.121081081081082e-05, + "loss": 0.2477, + "step": 37120 + }, + { + "epoch": 36.0, + "learning_rate": 5.11972972972973e-05, + "loss": 0.4269, + "step": 37130 + }, + { + "epoch": 36.0, + "learning_rate": 5.118378378378379e-05, + "loss": 0.2501, + "step": 37140 + }, + { + "epoch": 36.0, + "learning_rate": 5.117027027027027e-05, + "loss": 0.1481, + "step": 37150 + }, + { + "epoch": 36.0, + "learning_rate": 5.115675675675676e-05, + "loss": 0.2648, + "step": 37160 + }, + { + "epoch": 36.0, + "learning_rate": 5.1143243243243244e-05, + "loss": 0.1699, + "step": 37170 + }, + { + "epoch": 36.0, + "learning_rate": 5.112972972972974e-05, + "loss": 0.233, + "step": 37180 + }, + { + "epoch": 36.0, + "learning_rate": 5.111621621621622e-05, + "loss": 0.2724, + "step": 37190 + }, + { + "epoch": 36.0, + "learning_rate": 5.110270270270271e-05, + "loss": 0.1958, + "step": 37200 + }, + { + "epoch": 36.01, + "learning_rate": 5.108918918918919e-05, + "loss": 0.1733, + "step": 37210 + }, + { + "epoch": 36.01, + "learning_rate": 5.107567567567568e-05, + "loss": 0.1119, + "step": 37220 + }, + { + "epoch": 36.01, + "learning_rate": 5.1062162162162164e-05, + "loss": 0.1878, + "step": 37230 + }, + { + "epoch": 36.01, + "learning_rate": 5.104864864864866e-05, + "loss": 0.1906, + "step": 37240 + }, + { + "epoch": 36.01, + "learning_rate": 5.103513513513514e-05, + "loss": 0.1544, + "step": 37250 + }, + { + "epoch": 36.01, + "learning_rate": 5.102162162162163e-05, + "loss": 0.182, + "step": 37260 + }, + { + "epoch": 36.01, + "learning_rate": 5.100810810810811e-05, + "loss": 0.347, + "step": 37270 + }, + { + "epoch": 36.01, + "learning_rate": 5.09945945945946e-05, + "loss": 0.2496, + "step": 37280 + }, + { + "epoch": 36.01, + "learning_rate": 5.0981081081081084e-05, + "loss": 0.26, + "step": 37290 + }, + { + "epoch": 36.01, + "learning_rate": 5.0967567567567565e-05, + "loss": 0.3292, + "step": 37300 + }, + { + "epoch": 36.01, + "learning_rate": 5.095405405405406e-05, + "loss": 0.2629, + "step": 37310 + }, + { + "epoch": 36.01, + "learning_rate": 5.094054054054054e-05, + "loss": 0.3464, + "step": 37320 + }, + { + "epoch": 36.01, + "learning_rate": 5.092702702702703e-05, + "loss": 0.2929, + "step": 37330 + }, + { + "epoch": 36.01, + "learning_rate": 5.091351351351351e-05, + "loss": 0.2881, + "step": 37340 + }, + { + "epoch": 36.01, + "learning_rate": 5.0900000000000004e-05, + "loss": 0.5632, + "step": 37350 + }, + { + "epoch": 36.01, + "learning_rate": 5.0886486486486485e-05, + "loss": 0.5002, + "step": 37360 + }, + { + "epoch": 36.01, + "learning_rate": 5.087297297297298e-05, + "loss": 0.1807, + "step": 37370 + }, + { + "epoch": 36.01, + "learning_rate": 5.085945945945946e-05, + "loss": 0.1426, + "step": 37380 + }, + { + "epoch": 36.01, + "learning_rate": 5.084594594594595e-05, + "loss": 0.2392, + "step": 37390 + }, + { + "epoch": 36.01, + "learning_rate": 5.083243243243243e-05, + "loss": 0.1961, + "step": 37400 + }, + { + "epoch": 36.01, + "learning_rate": 5.0818918918918924e-05, + "loss": 0.1851, + "step": 37410 + }, + { + "epoch": 36.01, + "learning_rate": 5.0805405405405405e-05, + "loss": 0.1704, + "step": 37420 + }, + { + "epoch": 36.01, + "learning_rate": 5.07918918918919e-05, + "loss": 0.1515, + "step": 37430 + }, + { + "epoch": 36.01, + "learning_rate": 5.077837837837838e-05, + "loss": 0.1919, + "step": 37440 + }, + { + "epoch": 36.01, + "learning_rate": 5.076486486486487e-05, + "loss": 0.4289, + "step": 37450 + }, + { + "epoch": 36.01, + "learning_rate": 5.075135135135135e-05, + "loss": 0.3668, + "step": 37460 + }, + { + "epoch": 36.01, + "learning_rate": 5.0737837837837844e-05, + "loss": 0.3112, + "step": 37470 + }, + { + "epoch": 36.01, + "learning_rate": 5.0724324324324325e-05, + "loss": 0.3035, + "step": 37480 + }, + { + "epoch": 36.01, + "learning_rate": 5.071216216216217e-05, + "loss": 0.4011, + "step": 37490 + }, + { + "epoch": 36.01, + "learning_rate": 5.069864864864865e-05, + "loss": 0.323, + "step": 37500 + }, + { + "epoch": 36.01, + "eval_loss": 0.1064189076423645, + "eval_runtime": 129.2808, + "eval_samples_per_second": 27.908, + "eval_steps_per_second": 3.489, + "eval_wer": 0.10105763406793086, + "step": 37500 + }, + { + "epoch": 36.01, + "learning_rate": 5.0685135135135144e-05, + "loss": 0.1801, + "step": 37510 + }, + { + "epoch": 36.01, + "learning_rate": 5.0671621621621626e-05, + "loss": 0.2266, + "step": 37520 + }, + { + "epoch": 36.01, + "learning_rate": 5.065810810810811e-05, + "loss": 0.3148, + "step": 37530 + }, + { + "epoch": 36.01, + "learning_rate": 5.0644594594594594e-05, + "loss": 0.361, + "step": 37540 + }, + { + "epoch": 36.01, + "learning_rate": 5.063108108108109e-05, + "loss": 0.2817, + "step": 37550 + }, + { + "epoch": 36.01, + "learning_rate": 5.061756756756757e-05, + "loss": 0.2362, + "step": 37560 + }, + { + "epoch": 36.01, + "learning_rate": 5.0604054054054065e-05, + "loss": 0.2451, + "step": 37570 + }, + { + "epoch": 36.01, + "learning_rate": 5.0590540540540546e-05, + "loss": 0.2224, + "step": 37580 + }, + { + "epoch": 36.01, + "learning_rate": 5.0577027027027027e-05, + "loss": 0.2119, + "step": 37590 + }, + { + "epoch": 36.01, + "learning_rate": 5.0563513513513514e-05, + "loss": 0.2, + "step": 37600 + }, + { + "epoch": 36.01, + "learning_rate": 5.0549999999999995e-05, + "loss": 0.1441, + "step": 37610 + }, + { + "epoch": 36.01, + "learning_rate": 5.053648648648649e-05, + "loss": 0.2612, + "step": 37620 + }, + { + "epoch": 36.01, + "learning_rate": 5.052297297297297e-05, + "loss": 0.5694, + "step": 37630 + }, + { + "epoch": 36.01, + "learning_rate": 5.0509459459459466e-05, + "loss": 0.2295, + "step": 37640 + }, + { + "epoch": 36.01, + "learning_rate": 5.049594594594595e-05, + "loss": 0.1824, + "step": 37650 + }, + { + "epoch": 36.01, + "learning_rate": 5.0482432432432434e-05, + "loss": 0.2365, + "step": 37660 + }, + { + "epoch": 36.01, + "learning_rate": 5.0468918918918915e-05, + "loss": 0.203, + "step": 37670 + }, + { + "epoch": 36.01, + "learning_rate": 5.045540540540541e-05, + "loss": 0.2194, + "step": 37680 + }, + { + "epoch": 36.01, + "learning_rate": 5.044189189189189e-05, + "loss": 0.3419, + "step": 37690 + }, + { + "epoch": 36.01, + "learning_rate": 5.0428378378378386e-05, + "loss": 0.3471, + "step": 37700 + }, + { + "epoch": 36.01, + "learning_rate": 5.041486486486487e-05, + "loss": 0.1814, + "step": 37710 + }, + { + "epoch": 36.01, + "learning_rate": 5.0401351351351355e-05, + "loss": 0.3222, + "step": 37720 + }, + { + "epoch": 36.01, + "learning_rate": 5.0387837837837836e-05, + "loss": 0.2532, + "step": 37730 + }, + { + "epoch": 36.01, + "learning_rate": 5.037432432432433e-05, + "loss": 0.437, + "step": 37740 + }, + { + "epoch": 36.01, + "learning_rate": 5.036081081081081e-05, + "loss": 0.4059, + "step": 37750 + }, + { + "epoch": 36.01, + "learning_rate": 5.03472972972973e-05, + "loss": 0.2988, + "step": 37760 + }, + { + "epoch": 36.01, + "learning_rate": 5.033378378378378e-05, + "loss": 0.4394, + "step": 37770 + }, + { + "epoch": 36.01, + "learning_rate": 5.0320270270270275e-05, + "loss": 0.3485, + "step": 37780 + }, + { + "epoch": 36.01, + "learning_rate": 5.0306756756756756e-05, + "loss": 0.4065, + "step": 37790 + }, + { + "epoch": 36.01, + "learning_rate": 5.029324324324325e-05, + "loss": 0.4752, + "step": 37800 + }, + { + "epoch": 36.01, + "learning_rate": 5.027972972972973e-05, + "loss": 0.3719, + "step": 37810 + }, + { + "epoch": 36.01, + "learning_rate": 5.026621621621622e-05, + "loss": 0.3917, + "step": 37820 + }, + { + "epoch": 36.01, + "learning_rate": 5.02527027027027e-05, + "loss": 0.4025, + "step": 37830 + }, + { + "epoch": 36.01, + "learning_rate": 5.0239189189189195e-05, + "loss": 0.3684, + "step": 37840 + }, + { + "epoch": 36.01, + "learning_rate": 5.0225675675675676e-05, + "loss": 0.5605, + "step": 37850 + }, + { + "epoch": 37.0, + "learning_rate": 5.021216216216217e-05, + "loss": 0.4325, + "step": 37860 + }, + { + "epoch": 37.0, + "learning_rate": 5.019864864864865e-05, + "loss": 0.3974, + "step": 37870 + }, + { + "epoch": 37.0, + "learning_rate": 5.018513513513514e-05, + "loss": 0.4614, + "step": 37880 + }, + { + "epoch": 37.0, + "learning_rate": 5.017162162162162e-05, + "loss": 0.3826, + "step": 37890 + }, + { + "epoch": 37.0, + "learning_rate": 5.0158108108108115e-05, + "loss": 0.3908, + "step": 37900 + }, + { + "epoch": 37.0, + "learning_rate": 5.0144594594594596e-05, + "loss": 0.4109, + "step": 37910 + }, + { + "epoch": 37.0, + "learning_rate": 5.013108108108109e-05, + "loss": 0.567, + "step": 37920 + }, + { + "epoch": 37.0, + "learning_rate": 5.011756756756757e-05, + "loss": 0.4053, + "step": 37930 + }, + { + "epoch": 37.0, + "learning_rate": 5.010405405405406e-05, + "loss": 0.4007, + "step": 37940 + }, + { + "epoch": 37.0, + "learning_rate": 5.009054054054054e-05, + "loss": 0.4384, + "step": 37950 + }, + { + "epoch": 37.0, + "learning_rate": 5.0077027027027035e-05, + "loss": 0.4026, + "step": 37960 + }, + { + "epoch": 37.0, + "learning_rate": 5.0063513513513516e-05, + "loss": 0.3603, + "step": 37970 + }, + { + "epoch": 37.0, + "learning_rate": 5.005e-05, + "loss": 0.2604, + "step": 37980 + }, + { + "epoch": 37.0, + "learning_rate": 5.003648648648649e-05, + "loss": 0.2457, + "step": 37990 + }, + { + "epoch": 37.0, + "learning_rate": 5.002297297297297e-05, + "loss": 0.2526, + "step": 38000 + }, + { + "epoch": 37.0, + "eval_loss": 0.11046508699655533, + "eval_runtime": 130.6991, + "eval_samples_per_second": 27.605, + "eval_steps_per_second": 3.451, + "eval_wer": 0.10567022317476588, + "step": 38000 + }, + { + "epoch": 37.0, + "learning_rate": 5.000945945945946e-05, + "loss": 0.304, + "step": 38010 + }, + { + "epoch": 37.0, + "learning_rate": 4.999594594594595e-05, + "loss": 1.1548, + "step": 38020 + }, + { + "epoch": 37.0, + "learning_rate": 4.9982432432432436e-05, + "loss": 1.6486, + "step": 38030 + }, + { + "epoch": 37.0, + "learning_rate": 4.9968918918918924e-05, + "loss": 2.5525, + "step": 38040 + }, + { + "epoch": 37.0, + "learning_rate": 4.995540540540541e-05, + "loss": 2.421, + "step": 38050 + }, + { + "epoch": 37.0, + "learning_rate": 4.994189189189189e-05, + "loss": 2.5466, + "step": 38060 + }, + { + "epoch": 37.0, + "learning_rate": 4.992837837837838e-05, + "loss": 2.0558, + "step": 38070 + }, + { + "epoch": 37.0, + "learning_rate": 4.991486486486487e-05, + "loss": 1.4931, + "step": 38080 + }, + { + "epoch": 37.0, + "learning_rate": 4.9901351351351356e-05, + "loss": 1.1443, + "step": 38090 + }, + { + "epoch": 37.0, + "learning_rate": 4.9887837837837844e-05, + "loss": 0.4145, + "step": 38100 + }, + { + "epoch": 37.0, + "learning_rate": 4.987432432432433e-05, + "loss": 0.1366, + "step": 38110 + }, + { + "epoch": 37.0, + "learning_rate": 4.986081081081081e-05, + "loss": 0.2218, + "step": 38120 + }, + { + "epoch": 37.0, + "learning_rate": 4.98472972972973e-05, + "loss": 0.205, + "step": 38130 + }, + { + "epoch": 37.0, + "learning_rate": 4.983378378378379e-05, + "loss": 0.2815, + "step": 38140 + }, + { + "epoch": 37.0, + "learning_rate": 4.9820270270270276e-05, + "loss": 0.4347, + "step": 38150 + }, + { + "epoch": 37.0, + "learning_rate": 4.9806756756756764e-05, + "loss": 0.2775, + "step": 38160 + }, + { + "epoch": 37.0, + "learning_rate": 4.979324324324325e-05, + "loss": 0.1446, + "step": 38170 + }, + { + "epoch": 37.0, + "learning_rate": 4.977972972972973e-05, + "loss": 0.1607, + "step": 38180 + }, + { + "epoch": 37.0, + "learning_rate": 4.9766216216216214e-05, + "loss": 0.2306, + "step": 38190 + }, + { + "epoch": 37.0, + "learning_rate": 4.97527027027027e-05, + "loss": 0.2261, + "step": 38200 + }, + { + "epoch": 37.0, + "learning_rate": 4.973918918918919e-05, + "loss": 0.2512, + "step": 38210 + }, + { + "epoch": 37.0, + "learning_rate": 4.972567567567568e-05, + "loss": 0.1864, + "step": 38220 + }, + { + "epoch": 37.01, + "learning_rate": 4.9712162162162165e-05, + "loss": 0.1791, + "step": 38230 + }, + { + "epoch": 37.01, + "learning_rate": 4.9698648648648646e-05, + "loss": 0.1188, + "step": 38240 + }, + { + "epoch": 37.01, + "learning_rate": 4.9685135135135134e-05, + "loss": 0.1459, + "step": 38250 + }, + { + "epoch": 37.01, + "learning_rate": 4.967162162162162e-05, + "loss": 0.2086, + "step": 38260 + }, + { + "epoch": 37.01, + "learning_rate": 4.965810810810811e-05, + "loss": 0.1262, + "step": 38270 + }, + { + "epoch": 37.01, + "learning_rate": 4.96445945945946e-05, + "loss": 0.2157, + "step": 38280 + }, + { + "epoch": 37.01, + "learning_rate": 4.9631081081081085e-05, + "loss": 0.2871, + "step": 38290 + }, + { + "epoch": 37.01, + "learning_rate": 4.9617567567567566e-05, + "loss": 0.22, + "step": 38300 + }, + { + "epoch": 37.01, + "learning_rate": 4.9604054054054054e-05, + "loss": 0.2494, + "step": 38310 + }, + { + "epoch": 37.01, + "learning_rate": 4.959054054054054e-05, + "loss": 0.3676, + "step": 38320 + }, + { + "epoch": 37.01, + "learning_rate": 4.957702702702703e-05, + "loss": 0.2873, + "step": 38330 + }, + { + "epoch": 37.01, + "learning_rate": 4.956351351351352e-05, + "loss": 0.3577, + "step": 38340 + }, + { + "epoch": 37.01, + "learning_rate": 4.9550000000000005e-05, + "loss": 0.3804, + "step": 38350 + }, + { + "epoch": 37.01, + "learning_rate": 4.9536486486486486e-05, + "loss": 0.2321, + "step": 38360 + }, + { + "epoch": 37.01, + "learning_rate": 4.9522972972972974e-05, + "loss": 0.5268, + "step": 38370 + }, + { + "epoch": 37.01, + "learning_rate": 4.950945945945946e-05, + "loss": 0.5626, + "step": 38380 + }, + { + "epoch": 37.01, + "learning_rate": 4.949594594594595e-05, + "loss": 0.33, + "step": 38390 + }, + { + "epoch": 37.01, + "learning_rate": 4.948243243243244e-05, + "loss": 0.1277, + "step": 38400 + }, + { + "epoch": 37.01, + "learning_rate": 4.9468918918918925e-05, + "loss": 0.2737, + "step": 38410 + }, + { + "epoch": 37.01, + "learning_rate": 4.9455405405405406e-05, + "loss": 0.1569, + "step": 38420 + }, + { + "epoch": 37.01, + "learning_rate": 4.9441891891891894e-05, + "loss": 0.1981, + "step": 38430 + }, + { + "epoch": 37.01, + "learning_rate": 4.942837837837838e-05, + "loss": 0.1693, + "step": 38440 + }, + { + "epoch": 37.01, + "learning_rate": 4.941486486486487e-05, + "loss": 0.1553, + "step": 38450 + }, + { + "epoch": 37.01, + "learning_rate": 4.940135135135136e-05, + "loss": 0.125, + "step": 38460 + }, + { + "epoch": 37.01, + "learning_rate": 4.938783783783784e-05, + "loss": 0.3543, + "step": 38470 + }, + { + "epoch": 37.01, + "learning_rate": 4.9374324324324326e-05, + "loss": 0.391, + "step": 38480 + }, + { + "epoch": 37.01, + "learning_rate": 4.9360810810810814e-05, + "loss": 0.3488, + "step": 38490 + }, + { + "epoch": 37.01, + "learning_rate": 4.93472972972973e-05, + "loss": 0.2479, + "step": 38500 + }, + { + "epoch": 37.01, + "eval_loss": 0.10067124664783478, + "eval_runtime": 147.2074, + "eval_samples_per_second": 24.51, + "eval_steps_per_second": 3.064, + "eval_wer": 0.10003261426641197, + "step": 38500 + }, + { + "epoch": 37.01, + "learning_rate": 4.933378378378379e-05, + "loss": 0.3906, + "step": 38510 + }, + { + "epoch": 37.01, + "learning_rate": 4.932027027027028e-05, + "loss": 0.3386, + "step": 38520 + }, + { + "epoch": 37.01, + "learning_rate": 4.930675675675676e-05, + "loss": 0.2292, + "step": 38530 + }, + { + "epoch": 37.01, + "learning_rate": 4.9293243243243246e-05, + "loss": 0.1887, + "step": 38540 + }, + { + "epoch": 37.01, + "learning_rate": 4.9279729729729734e-05, + "loss": 0.2276, + "step": 38550 + }, + { + "epoch": 37.01, + "learning_rate": 4.926621621621622e-05, + "loss": 0.3484, + "step": 38560 + }, + { + "epoch": 37.01, + "learning_rate": 4.925270270270271e-05, + "loss": 0.3599, + "step": 38570 + }, + { + "epoch": 37.01, + "learning_rate": 4.92391891891892e-05, + "loss": 0.2273, + "step": 38580 + }, + { + "epoch": 37.01, + "learning_rate": 4.922567567567568e-05, + "loss": 0.2874, + "step": 38590 + }, + { + "epoch": 37.01, + "learning_rate": 4.921216216216216e-05, + "loss": 0.2035, + "step": 38600 + }, + { + "epoch": 37.01, + "learning_rate": 4.919864864864865e-05, + "loss": 0.2087, + "step": 38610 + }, + { + "epoch": 37.01, + "learning_rate": 4.9185135135135135e-05, + "loss": 0.2593, + "step": 38620 + }, + { + "epoch": 37.01, + "learning_rate": 4.917162162162162e-05, + "loss": 0.1368, + "step": 38630 + }, + { + "epoch": 37.01, + "learning_rate": 4.915810810810811e-05, + "loss": 0.2374, + "step": 38640 + }, + { + "epoch": 37.01, + "learning_rate": 4.914459459459459e-05, + "loss": 0.4336, + "step": 38650 + }, + { + "epoch": 37.01, + "learning_rate": 4.913108108108108e-05, + "loss": 0.3787, + "step": 38660 + }, + { + "epoch": 37.01, + "learning_rate": 4.911756756756757e-05, + "loss": 0.1642, + "step": 38670 + }, + { + "epoch": 37.01, + "learning_rate": 4.9104054054054055e-05, + "loss": 0.2042, + "step": 38680 + }, + { + "epoch": 37.01, + "learning_rate": 4.909054054054054e-05, + "loss": 0.2375, + "step": 38690 + }, + { + "epoch": 37.01, + "learning_rate": 4.907702702702703e-05, + "loss": 0.242, + "step": 38700 + }, + { + "epoch": 37.01, + "learning_rate": 4.906351351351351e-05, + "loss": 0.3005, + "step": 38710 + }, + { + "epoch": 37.01, + "learning_rate": 4.905e-05, + "loss": 0.3465, + "step": 38720 + }, + { + "epoch": 37.01, + "learning_rate": 4.903648648648649e-05, + "loss": 0.1857, + "step": 38730 + }, + { + "epoch": 37.01, + "learning_rate": 4.9022972972972975e-05, + "loss": 0.2811, + "step": 38740 + }, + { + "epoch": 37.01, + "learning_rate": 4.900945945945946e-05, + "loss": 0.2565, + "step": 38750 + }, + { + "epoch": 37.01, + "learning_rate": 4.899594594594595e-05, + "loss": 0.4198, + "step": 38760 + }, + { + "epoch": 37.01, + "learning_rate": 4.898243243243243e-05, + "loss": 0.3974, + "step": 38770 + }, + { + "epoch": 37.01, + "learning_rate": 4.896891891891892e-05, + "loss": 0.3692, + "step": 38780 + }, + { + "epoch": 37.01, + "learning_rate": 4.895540540540541e-05, + "loss": 0.3503, + "step": 38790 + }, + { + "epoch": 37.01, + "learning_rate": 4.8941891891891895e-05, + "loss": 0.464, + "step": 38800 + }, + { + "epoch": 37.01, + "learning_rate": 4.892837837837838e-05, + "loss": 0.3673, + "step": 38810 + }, + { + "epoch": 37.01, + "learning_rate": 4.891486486486487e-05, + "loss": 0.5519, + "step": 38820 + }, + { + "epoch": 37.01, + "learning_rate": 4.890135135135135e-05, + "loss": 0.3952, + "step": 38830 + }, + { + "epoch": 37.01, + "learning_rate": 4.888783783783784e-05, + "loss": 0.4077, + "step": 38840 + }, + { + "epoch": 37.01, + "learning_rate": 4.887432432432433e-05, + "loss": 0.387, + "step": 38850 + }, + { + "epoch": 37.01, + "learning_rate": 4.8860810810810815e-05, + "loss": 0.3265, + "step": 38860 + }, + { + "epoch": 37.01, + "learning_rate": 4.88472972972973e-05, + "loss": 0.4806, + "step": 38870 + }, + { + "epoch": 38.0, + "learning_rate": 4.8833783783783784e-05, + "loss": 0.4373, + "step": 38880 + }, + { + "epoch": 38.0, + "learning_rate": 4.882027027027027e-05, + "loss": 0.3971, + "step": 38890 + }, + { + "epoch": 38.0, + "learning_rate": 4.880675675675676e-05, + "loss": 0.3982, + "step": 38900 + }, + { + "epoch": 38.0, + "learning_rate": 4.879324324324325e-05, + "loss": 0.4107, + "step": 38910 + }, + { + "epoch": 38.0, + "learning_rate": 4.8779729729729735e-05, + "loss": 0.4135, + "step": 38920 + }, + { + "epoch": 38.0, + "learning_rate": 4.876621621621622e-05, + "loss": 0.398, + "step": 38930 + }, + { + "epoch": 38.0, + "learning_rate": 4.8752702702702704e-05, + "loss": 0.5655, + "step": 38940 + }, + { + "epoch": 38.0, + "learning_rate": 4.873918918918919e-05, + "loss": 0.3716, + "step": 38950 + }, + { + "epoch": 38.0, + "learning_rate": 4.872567567567568e-05, + "loss": 0.4038, + "step": 38960 + }, + { + "epoch": 38.0, + "learning_rate": 4.871216216216217e-05, + "loss": 0.4223, + "step": 38970 + }, + { + "epoch": 38.0, + "learning_rate": 4.8698648648648655e-05, + "loss": 0.4088, + "step": 38980 + }, + { + "epoch": 38.0, + "learning_rate": 4.8685135135135137e-05, + "loss": 0.4165, + "step": 38990 + }, + { + "epoch": 38.0, + "learning_rate": 4.8671621621621624e-05, + "loss": 0.255, + "step": 39000 + }, + { + "epoch": 38.0, + "eval_loss": 0.10054945200681686, + "eval_runtime": 129.944, + "eval_samples_per_second": 27.766, + "eval_steps_per_second": 3.471, + "eval_wer": 0.09858826818245353, + "step": 39000 + }, + { + "epoch": 38.0, + "learning_rate": 4.8658108108108105e-05, + "loss": 0.2406, + "step": 39010 + }, + { + "epoch": 38.0, + "learning_rate": 4.864459459459459e-05, + "loss": 0.2423, + "step": 39020 + }, + { + "epoch": 38.0, + "learning_rate": 4.863108108108108e-05, + "loss": 0.2519, + "step": 39030 + }, + { + "epoch": 38.0, + "learning_rate": 4.861756756756757e-05, + "loss": 1.0583, + "step": 39040 + }, + { + "epoch": 38.0, + "learning_rate": 4.8604054054054057e-05, + "loss": 1.0773, + "step": 39050 + }, + { + "epoch": 38.0, + "learning_rate": 4.8590540540540544e-05, + "loss": 2.5696, + "step": 39060 + }, + { + "epoch": 38.0, + "learning_rate": 4.8577027027027025e-05, + "loss": 2.4098, + "step": 39070 + }, + { + "epoch": 38.0, + "learning_rate": 4.856351351351351e-05, + "loss": 2.5434, + "step": 39080 + }, + { + "epoch": 38.0, + "learning_rate": 4.855e-05, + "loss": 2.4176, + "step": 39090 + }, + { + "epoch": 38.0, + "learning_rate": 4.853648648648649e-05, + "loss": 1.2725, + "step": 39100 + }, + { + "epoch": 38.0, + "learning_rate": 4.852297297297298e-05, + "loss": 1.4104, + "step": 39110 + }, + { + "epoch": 38.0, + "learning_rate": 4.850945945945946e-05, + "loss": 0.6284, + "step": 39120 + }, + { + "epoch": 38.0, + "learning_rate": 4.8495945945945945e-05, + "loss": 0.2053, + "step": 39130 + }, + { + "epoch": 38.0, + "learning_rate": 4.848243243243243e-05, + "loss": 0.1738, + "step": 39140 + }, + { + "epoch": 38.0, + "learning_rate": 4.846891891891892e-05, + "loss": 0.1839, + "step": 39150 + }, + { + "epoch": 38.0, + "learning_rate": 4.845540540540541e-05, + "loss": 0.3016, + "step": 39160 + }, + { + "epoch": 38.0, + "learning_rate": 4.84418918918919e-05, + "loss": 0.3615, + "step": 39170 + }, + { + "epoch": 38.0, + "learning_rate": 4.842837837837838e-05, + "loss": 0.3683, + "step": 39180 + }, + { + "epoch": 38.0, + "learning_rate": 4.8414864864864866e-05, + "loss": 0.1825, + "step": 39190 + }, + { + "epoch": 38.0, + "learning_rate": 4.840135135135135e-05, + "loss": 0.1402, + "step": 39200 + }, + { + "epoch": 38.0, + "learning_rate": 4.838783783783784e-05, + "loss": 0.2444, + "step": 39210 + }, + { + "epoch": 38.0, + "learning_rate": 4.837432432432433e-05, + "loss": 0.2151, + "step": 39220 + }, + { + "epoch": 38.0, + "learning_rate": 4.836081081081082e-05, + "loss": 0.2731, + "step": 39230 + }, + { + "epoch": 38.0, + "learning_rate": 4.83472972972973e-05, + "loss": 0.1916, + "step": 39240 + }, + { + "epoch": 38.01, + "learning_rate": 4.8333783783783786e-05, + "loss": 0.1612, + "step": 39250 + }, + { + "epoch": 38.01, + "learning_rate": 4.8320270270270273e-05, + "loss": 0.1644, + "step": 39260 + }, + { + "epoch": 38.01, + "learning_rate": 4.830675675675676e-05, + "loss": 0.1327, + "step": 39270 + }, + { + "epoch": 38.01, + "learning_rate": 4.829324324324325e-05, + "loss": 0.208, + "step": 39280 + }, + { + "epoch": 38.01, + "learning_rate": 4.827972972972974e-05, + "loss": 0.1692, + "step": 39290 + }, + { + "epoch": 38.01, + "learning_rate": 4.826621621621622e-05, + "loss": 0.1748, + "step": 39300 + }, + { + "epoch": 38.01, + "learning_rate": 4.8252702702702706e-05, + "loss": 0.2403, + "step": 39310 + }, + { + "epoch": 38.01, + "learning_rate": 4.8239189189189193e-05, + "loss": 0.2865, + "step": 39320 + }, + { + "epoch": 38.01, + "learning_rate": 4.822567567567568e-05, + "loss": 0.1969, + "step": 39330 + }, + { + "epoch": 38.01, + "learning_rate": 4.821216216216217e-05, + "loss": 0.3008, + "step": 39340 + }, + { + "epoch": 38.01, + "learning_rate": 4.819864864864865e-05, + "loss": 0.2632, + "step": 39350 + }, + { + "epoch": 38.01, + "learning_rate": 4.818513513513514e-05, + "loss": 0.3058, + "step": 39360 + }, + { + "epoch": 38.01, + "learning_rate": 4.8171621621621626e-05, + "loss": 0.2898, + "step": 39370 + }, + { + "epoch": 38.01, + "learning_rate": 4.8158108108108114e-05, + "loss": 0.2453, + "step": 39380 + }, + { + "epoch": 38.01, + "learning_rate": 4.8144594594594595e-05, + "loss": 0.4112, + "step": 39390 + }, + { + "epoch": 38.01, + "learning_rate": 4.813108108108108e-05, + "loss": 0.5956, + "step": 39400 + }, + { + "epoch": 38.01, + "learning_rate": 4.811756756756757e-05, + "loss": 0.3809, + "step": 39410 + }, + { + "epoch": 38.01, + "learning_rate": 4.810405405405405e-05, + "loss": 0.1301, + "step": 39420 + }, + { + "epoch": 38.01, + "learning_rate": 4.809054054054054e-05, + "loss": 0.2316, + "step": 39430 + }, + { + "epoch": 38.01, + "learning_rate": 4.807702702702703e-05, + "loss": 0.2011, + "step": 39440 + }, + { + "epoch": 38.01, + "learning_rate": 4.8063513513513515e-05, + "loss": 0.1964, + "step": 39450 + }, + { + "epoch": 38.01, + "learning_rate": 4.805e-05, + "loss": 0.1679, + "step": 39460 + }, + { + "epoch": 38.01, + "learning_rate": 4.803648648648649e-05, + "loss": 0.1535, + "step": 39470 + }, + { + "epoch": 38.01, + "learning_rate": 4.802297297297297e-05, + "loss": 0.1692, + "step": 39480 + }, + { + "epoch": 38.01, + "learning_rate": 4.800945945945946e-05, + "loss": 0.2393, + "step": 39490 + }, + { + "epoch": 38.01, + "learning_rate": 4.799594594594595e-05, + "loss": 0.4181, + "step": 39500 + }, + { + "epoch": 38.01, + "eval_loss": 0.09583058953285217, + "eval_runtime": 129.5494, + "eval_samples_per_second": 27.85, + "eval_steps_per_second": 3.481, + "eval_wer": 0.09336998555653916, + "step": 39500 + }, + { + "epoch": 38.01, + "learning_rate": 4.7982432432432435e-05, + "loss": 0.3604, + "step": 39510 + }, + { + "epoch": 38.01, + "learning_rate": 4.796891891891892e-05, + "loss": 0.2281, + "step": 39520 + }, + { + "epoch": 38.01, + "learning_rate": 4.795540540540541e-05, + "loss": 0.3675, + "step": 39530 + }, + { + "epoch": 38.01, + "learning_rate": 4.794189189189189e-05, + "loss": 0.4595, + "step": 39540 + }, + { + "epoch": 38.01, + "learning_rate": 4.792837837837838e-05, + "loss": 0.196, + "step": 39550 + }, + { + "epoch": 38.01, + "learning_rate": 4.791486486486487e-05, + "loss": 0.1932, + "step": 39560 + }, + { + "epoch": 38.01, + "learning_rate": 4.7901351351351355e-05, + "loss": 0.2035, + "step": 39570 + }, + { + "epoch": 38.01, + "learning_rate": 4.788783783783784e-05, + "loss": 0.3432, + "step": 39580 + }, + { + "epoch": 38.01, + "learning_rate": 4.7874324324324324e-05, + "loss": 0.3209, + "step": 39590 + }, + { + "epoch": 38.01, + "learning_rate": 4.786081081081081e-05, + "loss": 0.2905, + "step": 39600 + }, + { + "epoch": 38.01, + "learning_rate": 4.78472972972973e-05, + "loss": 0.2589, + "step": 39610 + }, + { + "epoch": 38.01, + "learning_rate": 4.783378378378379e-05, + "loss": 0.2707, + "step": 39620 + }, + { + "epoch": 38.01, + "learning_rate": 4.7820270270270275e-05, + "loss": 0.2221, + "step": 39630 + }, + { + "epoch": 38.01, + "learning_rate": 4.780675675675676e-05, + "loss": 0.2414, + "step": 39640 + }, + { + "epoch": 38.01, + "learning_rate": 4.7793243243243244e-05, + "loss": 0.1362, + "step": 39650 + }, + { + "epoch": 38.01, + "learning_rate": 4.777972972972973e-05, + "loss": 0.2274, + "step": 39660 + }, + { + "epoch": 38.01, + "learning_rate": 4.776621621621622e-05, + "loss": 0.2903, + "step": 39670 + }, + { + "epoch": 38.01, + "learning_rate": 4.775270270270271e-05, + "loss": 0.5216, + "step": 39680 + }, + { + "epoch": 38.01, + "learning_rate": 4.7739189189189195e-05, + "loss": 0.1811, + "step": 39690 + }, + { + "epoch": 38.01, + "learning_rate": 4.772567567567568e-05, + "loss": 0.2041, + "step": 39700 + }, + { + "epoch": 38.01, + "learning_rate": 4.7712162162162164e-05, + "loss": 0.2172, + "step": 39710 + }, + { + "epoch": 38.01, + "learning_rate": 4.769864864864865e-05, + "loss": 0.2485, + "step": 39720 + }, + { + "epoch": 38.01, + "learning_rate": 4.768513513513514e-05, + "loss": 0.2403, + "step": 39730 + }, + { + "epoch": 38.01, + "learning_rate": 4.767162162162163e-05, + "loss": 0.3359, + "step": 39740 + }, + { + "epoch": 38.01, + "learning_rate": 4.7658108108108115e-05, + "loss": 0.2749, + "step": 39750 + }, + { + "epoch": 38.01, + "learning_rate": 4.7644594594594596e-05, + "loss": 0.2126, + "step": 39760 + }, + { + "epoch": 38.01, + "learning_rate": 4.7631081081081084e-05, + "loss": 0.2942, + "step": 39770 + }, + { + "epoch": 38.01, + "learning_rate": 4.761891891891892e-05, + "loss": 0.3603, + "step": 39780 + }, + { + "epoch": 38.01, + "learning_rate": 4.760540540540541e-05, + "loss": 0.343, + "step": 39790 + }, + { + "epoch": 38.01, + "learning_rate": 4.7591891891891896e-05, + "loss": 0.4541, + "step": 39800 + }, + { + "epoch": 38.01, + "learning_rate": 4.757837837837838e-05, + "loss": 0.3213, + "step": 39810 + }, + { + "epoch": 38.01, + "learning_rate": 4.7564864864864865e-05, + "loss": 0.4814, + "step": 39820 + }, + { + "epoch": 38.01, + "learning_rate": 4.755135135135135e-05, + "loss": 0.4323, + "step": 39830 + }, + { + "epoch": 38.01, + "learning_rate": 4.753783783783784e-05, + "loss": 0.4851, + "step": 39840 + }, + { + "epoch": 38.01, + "learning_rate": 4.752432432432433e-05, + "loss": 0.4075, + "step": 39850 + }, + { + "epoch": 38.01, + "learning_rate": 4.751081081081081e-05, + "loss": 0.3591, + "step": 39860 + }, + { + "epoch": 38.01, + "learning_rate": 4.74972972972973e-05, + "loss": 0.3597, + "step": 39870 + }, + { + "epoch": 38.01, + "learning_rate": 4.7483783783783785e-05, + "loss": 0.3409, + "step": 39880 + }, + { + "epoch": 38.01, + "learning_rate": 4.747027027027027e-05, + "loss": 0.3552, + "step": 39890 + }, + { + "epoch": 39.0, + "learning_rate": 4.745675675675676e-05, + "loss": 0.4719, + "step": 39900 + }, + { + "epoch": 39.0, + "learning_rate": 4.744324324324325e-05, + "loss": 0.3509, + "step": 39910 + }, + { + "epoch": 39.0, + "learning_rate": 4.742972972972973e-05, + "loss": 0.4332, + "step": 39920 + }, + { + "epoch": 39.0, + "learning_rate": 4.741621621621622e-05, + "loss": 0.4327, + "step": 39930 + }, + { + "epoch": 39.0, + "learning_rate": 4.7402702702702705e-05, + "loss": 0.3258, + "step": 39940 + }, + { + "epoch": 39.0, + "learning_rate": 4.738918918918919e-05, + "loss": 0.3986, + "step": 39950 + }, + { + "epoch": 39.0, + "learning_rate": 4.737567567567568e-05, + "loss": 0.4558, + "step": 39960 + }, + { + "epoch": 39.0, + "learning_rate": 4.736216216216217e-05, + "loss": 0.4462, + "step": 39970 + }, + { + "epoch": 39.0, + "learning_rate": 4.734864864864865e-05, + "loss": 0.381, + "step": 39980 + }, + { + "epoch": 39.0, + "learning_rate": 4.733513513513514e-05, + "loss": 0.3854, + "step": 39990 + }, + { + "epoch": 39.0, + "learning_rate": 4.7321621621621625e-05, + "loss": 0.4028, + "step": 40000 + }, + { + "epoch": 39.0, + "eval_loss": 0.09857729822397232, + "eval_runtime": 128.1124, + "eval_samples_per_second": 28.163, + "eval_steps_per_second": 3.52, + "eval_wer": 0.09742347295345478, + "step": 40000 + }, + { + "epoch": 39.0, + "learning_rate": 4.730810810810811e-05, + "loss": 0.392, + "step": 40010 + }, + { + "epoch": 39.0, + "learning_rate": 4.72945945945946e-05, + "loss": 0.3129, + "step": 40020 + }, + { + "epoch": 39.0, + "learning_rate": 4.728108108108109e-05, + "loss": 0.2381, + "step": 40030 + }, + { + "epoch": 39.0, + "learning_rate": 4.726756756756757e-05, + "loss": 0.2503, + "step": 40040 + }, + { + "epoch": 39.0, + "learning_rate": 4.725405405405406e-05, + "loss": 0.2286, + "step": 40050 + }, + { + "epoch": 39.0, + "learning_rate": 4.7240540540540545e-05, + "loss": 0.8035, + "step": 40060 + }, + { + "epoch": 39.0, + "learning_rate": 4.7227027027027026e-05, + "loss": 0.7912, + "step": 40070 + }, + { + "epoch": 39.0, + "learning_rate": 4.7213513513513514e-05, + "loss": 2.4603, + "step": 40080 + }, + { + "epoch": 39.0, + "learning_rate": 4.72e-05, + "loss": 2.5179, + "step": 40090 + }, + { + "epoch": 39.0, + "learning_rate": 4.718648648648648e-05, + "loss": 2.4242, + "step": 40100 + }, + { + "epoch": 39.0, + "learning_rate": 4.717297297297297e-05, + "loss": 2.5324, + "step": 40110 + }, + { + "epoch": 39.0, + "learning_rate": 4.715945945945946e-05, + "loss": 1.5058, + "step": 40120 + }, + { + "epoch": 39.0, + "learning_rate": 4.7145945945945947e-05, + "loss": 1.4186, + "step": 40130 + }, + { + "epoch": 39.0, + "learning_rate": 4.7132432432432434e-05, + "loss": 0.797, + "step": 40140 + }, + { + "epoch": 39.0, + "learning_rate": 4.711891891891892e-05, + "loss": 0.373, + "step": 40150 + }, + { + "epoch": 39.0, + "learning_rate": 4.71054054054054e-05, + "loss": 0.1378, + "step": 40160 + }, + { + "epoch": 39.0, + "learning_rate": 4.709189189189189e-05, + "loss": 0.2445, + "step": 40170 + }, + { + "epoch": 39.0, + "learning_rate": 4.707837837837838e-05, + "loss": 0.2223, + "step": 40180 + }, + { + "epoch": 39.0, + "learning_rate": 4.7064864864864867e-05, + "loss": 0.2858, + "step": 40190 + }, + { + "epoch": 39.0, + "learning_rate": 4.7051351351351354e-05, + "loss": 0.3567, + "step": 40200 + }, + { + "epoch": 39.0, + "learning_rate": 4.703783783783784e-05, + "loss": 0.2073, + "step": 40210 + }, + { + "epoch": 39.0, + "learning_rate": 4.702432432432432e-05, + "loss": 0.123, + "step": 40220 + }, + { + "epoch": 39.0, + "learning_rate": 4.701081081081081e-05, + "loss": 0.2488, + "step": 40230 + }, + { + "epoch": 39.0, + "learning_rate": 4.69972972972973e-05, + "loss": 0.1578, + "step": 40240 + }, + { + "epoch": 39.0, + "learning_rate": 4.698378378378379e-05, + "loss": 0.2795, + "step": 40250 + }, + { + "epoch": 39.0, + "learning_rate": 4.6970270270270274e-05, + "loss": 0.2399, + "step": 40260 + }, + { + "epoch": 39.0, + "learning_rate": 4.695675675675676e-05, + "loss": 0.1681, + "step": 40270 + }, + { + "epoch": 39.01, + "learning_rate": 4.694324324324324e-05, + "loss": 0.1703, + "step": 40280 + }, + { + "epoch": 39.01, + "learning_rate": 4.692972972972973e-05, + "loss": 0.1117, + "step": 40290 + }, + { + "epoch": 39.01, + "learning_rate": 4.691621621621622e-05, + "loss": 0.2058, + "step": 40300 + }, + { + "epoch": 39.01, + "learning_rate": 4.690270270270271e-05, + "loss": 0.1953, + "step": 40310 + }, + { + "epoch": 39.01, + "learning_rate": 4.6889189189189195e-05, + "loss": 0.1575, + "step": 40320 + }, + { + "epoch": 39.01, + "learning_rate": 4.6875675675675676e-05, + "loss": 0.2032, + "step": 40330 + }, + { + "epoch": 39.01, + "learning_rate": 4.686216216216216e-05, + "loss": 0.3437, + "step": 40340 + }, + { + "epoch": 39.01, + "learning_rate": 4.684864864864865e-05, + "loss": 0.1791, + "step": 40350 + }, + { + "epoch": 39.01, + "learning_rate": 4.683513513513514e-05, + "loss": 0.259, + "step": 40360 + }, + { + "epoch": 39.01, + "learning_rate": 4.682162162162163e-05, + "loss": 0.4001, + "step": 40370 + }, + { + "epoch": 39.01, + "learning_rate": 4.6808108108108115e-05, + "loss": 0.311, + "step": 40380 + }, + { + "epoch": 39.01, + "learning_rate": 4.6794594594594596e-05, + "loss": 0.3589, + "step": 40390 + }, + { + "epoch": 39.01, + "learning_rate": 4.6781081081081083e-05, + "loss": 0.2716, + "step": 40400 + }, + { + "epoch": 39.01, + "learning_rate": 4.676756756756757e-05, + "loss": 0.2779, + "step": 40410 + }, + { + "epoch": 39.01, + "learning_rate": 4.675405405405406e-05, + "loss": 0.6005, + "step": 40420 + }, + { + "epoch": 39.01, + "learning_rate": 4.674054054054055e-05, + "loss": 0.5114, + "step": 40430 + }, + { + "epoch": 39.01, + "learning_rate": 4.6727027027027035e-05, + "loss": 0.1299, + "step": 40440 + }, + { + "epoch": 39.01, + "learning_rate": 4.6713513513513516e-05, + "loss": 0.1591, + "step": 40450 + }, + { + "epoch": 39.01, + "learning_rate": 4.6700000000000003e-05, + "loss": 0.2197, + "step": 40460 + }, + { + "epoch": 39.01, + "learning_rate": 4.668648648648649e-05, + "loss": 0.1873, + "step": 40470 + }, + { + "epoch": 39.01, + "learning_rate": 4.667297297297297e-05, + "loss": 0.168, + "step": 40480 + }, + { + "epoch": 39.01, + "learning_rate": 4.665945945945946e-05, + "loss": 0.1849, + "step": 40490 + }, + { + "epoch": 39.01, + "learning_rate": 4.664594594594595e-05, + "loss": 0.1516, + "step": 40500 + }, + { + "epoch": 39.01, + "eval_loss": 0.09935334324836731, + "eval_runtime": 144.5017, + "eval_samples_per_second": 24.969, + "eval_steps_per_second": 3.121, + "eval_wer": 0.08968923263290314, + "step": 40500 + }, + { + "epoch": 39.01, + "learning_rate": 4.6632432432432436e-05, + "loss": 0.1728, + "step": 40510 + }, + { + "epoch": 39.01, + "learning_rate": 4.661891891891892e-05, + "loss": 0.4434, + "step": 40520 + }, + { + "epoch": 39.01, + "learning_rate": 4.6605405405405405e-05, + "loss": 0.3211, + "step": 40530 + }, + { + "epoch": 39.01, + "learning_rate": 4.659189189189189e-05, + "loss": 0.2202, + "step": 40540 + }, + { + "epoch": 39.01, + "learning_rate": 4.657837837837838e-05, + "loss": 0.2751, + "step": 40550 + }, + { + "epoch": 39.01, + "learning_rate": 4.656486486486487e-05, + "loss": 0.4397, + "step": 40560 + }, + { + "epoch": 39.01, + "learning_rate": 4.655135135135135e-05, + "loss": 0.2599, + "step": 40570 + }, + { + "epoch": 39.01, + "learning_rate": 4.653783783783784e-05, + "loss": 0.1575, + "step": 40580 + }, + { + "epoch": 39.01, + "learning_rate": 4.6524324324324325e-05, + "loss": 0.2326, + "step": 40590 + }, + { + "epoch": 39.01, + "learning_rate": 4.651081081081081e-05, + "loss": 0.3107, + "step": 40600 + }, + { + "epoch": 39.01, + "learning_rate": 4.64972972972973e-05, + "loss": 0.289, + "step": 40610 + }, + { + "epoch": 39.01, + "learning_rate": 4.648378378378379e-05, + "loss": 0.242, + "step": 40620 + }, + { + "epoch": 39.01, + "learning_rate": 4.647027027027027e-05, + "loss": 0.2267, + "step": 40630 + }, + { + "epoch": 39.01, + "learning_rate": 4.645675675675676e-05, + "loss": 0.2789, + "step": 40640 + }, + { + "epoch": 39.01, + "learning_rate": 4.6443243243243245e-05, + "loss": 0.2281, + "step": 40650 + }, + { + "epoch": 39.01, + "learning_rate": 4.642972972972973e-05, + "loss": 0.2264, + "step": 40660 + }, + { + "epoch": 39.01, + "learning_rate": 4.641621621621622e-05, + "loss": 0.1705, + "step": 40670 + }, + { + "epoch": 39.01, + "learning_rate": 4.640270270270271e-05, + "loss": 0.1101, + "step": 40680 + }, + { + "epoch": 39.01, + "learning_rate": 4.638918918918919e-05, + "loss": 0.2401, + "step": 40690 + }, + { + "epoch": 39.01, + "learning_rate": 4.637567567567568e-05, + "loss": 0.5144, + "step": 40700 + }, + { + "epoch": 39.01, + "learning_rate": 4.6362162162162165e-05, + "loss": 0.1643, + "step": 40710 + }, + { + "epoch": 39.01, + "learning_rate": 4.634864864864865e-05, + "loss": 0.1603, + "step": 40720 + }, + { + "epoch": 39.01, + "learning_rate": 4.633513513513514e-05, + "loss": 0.2264, + "step": 40730 + }, + { + "epoch": 39.01, + "learning_rate": 4.632162162162162e-05, + "loss": 0.2391, + "step": 40740 + }, + { + "epoch": 39.01, + "learning_rate": 4.630810810810811e-05, + "loss": 0.2784, + "step": 40750 + }, + { + "epoch": 39.01, + "learning_rate": 4.62945945945946e-05, + "loss": 0.3098, + "step": 40760 + }, + { + "epoch": 39.01, + "learning_rate": 4.6281081081081085e-05, + "loss": 0.2863, + "step": 40770 + }, + { + "epoch": 39.01, + "learning_rate": 4.626756756756757e-05, + "loss": 0.2079, + "step": 40780 + }, + { + "epoch": 39.01, + "learning_rate": 4.625405405405406e-05, + "loss": 0.2869, + "step": 40790 + }, + { + "epoch": 39.01, + "learning_rate": 4.624054054054054e-05, + "loss": 0.2515, + "step": 40800 + }, + { + "epoch": 39.01, + "learning_rate": 4.622702702702703e-05, + "loss": 0.3727, + "step": 40810 + }, + { + "epoch": 39.01, + "learning_rate": 4.621351351351352e-05, + "loss": 0.4502, + "step": 40820 + }, + { + "epoch": 39.01, + "learning_rate": 4.6200000000000005e-05, + "loss": 0.323, + "step": 40830 + }, + { + "epoch": 39.01, + "learning_rate": 4.618648648648649e-05, + "loss": 0.4423, + "step": 40840 + }, + { + "epoch": 39.01, + "learning_rate": 4.617297297297298e-05, + "loss": 0.3729, + "step": 40850 + }, + { + "epoch": 39.01, + "learning_rate": 4.615945945945946e-05, + "loss": 0.4564, + "step": 40860 + }, + { + "epoch": 39.01, + "learning_rate": 4.614594594594595e-05, + "loss": 0.4913, + "step": 40870 + }, + { + "epoch": 39.01, + "learning_rate": 4.613243243243243e-05, + "loss": 0.3305, + "step": 40880 + }, + { + "epoch": 39.01, + "learning_rate": 4.611891891891892e-05, + "loss": 0.3428, + "step": 40890 + }, + { + "epoch": 39.01, + "learning_rate": 4.6105405405405406e-05, + "loss": 0.3632, + "step": 40900 + }, + { + "epoch": 39.01, + "learning_rate": 4.6091891891891894e-05, + "loss": 0.3056, + "step": 40910 + }, + { + "epoch": 39.01, + "learning_rate": 4.607837837837838e-05, + "loss": 0.5013, + "step": 40920 + }, + { + "epoch": 40.0, + "learning_rate": 4.606486486486486e-05, + "loss": 0.3827, + "step": 40930 + }, + { + "epoch": 40.0, + "learning_rate": 4.605135135135135e-05, + "loss": 0.3923, + "step": 40940 + }, + { + "epoch": 40.0, + "learning_rate": 4.603783783783784e-05, + "loss": 0.437, + "step": 40950 + }, + { + "epoch": 40.0, + "learning_rate": 4.6024324324324326e-05, + "loss": 0.3304, + "step": 40960 + }, + { + "epoch": 40.0, + "learning_rate": 4.6010810810810814e-05, + "loss": 0.3907, + "step": 40970 + }, + { + "epoch": 40.0, + "learning_rate": 4.5997297297297295e-05, + "loss": 0.3918, + "step": 40980 + }, + { + "epoch": 40.0, + "learning_rate": 4.598378378378378e-05, + "loss": 0.5075, + "step": 40990 + }, + { + "epoch": 40.0, + "learning_rate": 4.597027027027027e-05, + "loss": 0.3648, + "step": 41000 + }, + { + "epoch": 40.0, + "eval_loss": 0.09911862760782242, + "eval_runtime": 130.7096, + "eval_samples_per_second": 27.603, + "eval_steps_per_second": 3.45, + "eval_wer": 0.09574616782369659, + "step": 41000 + }, + { + "epoch": 40.0, + "learning_rate": 4.595675675675676e-05, + "loss": 0.3935, + "step": 41010 + }, + { + "epoch": 40.0, + "learning_rate": 4.5943243243243246e-05, + "loss": 0.4591, + "step": 41020 + }, + { + "epoch": 40.0, + "learning_rate": 4.5929729729729734e-05, + "loss": 0.3737, + "step": 41030 + }, + { + "epoch": 40.0, + "learning_rate": 4.5916216216216215e-05, + "loss": 0.3652, + "step": 41040 + }, + { + "epoch": 40.0, + "learning_rate": 4.59027027027027e-05, + "loss": 0.2429, + "step": 41050 + }, + { + "epoch": 40.0, + "learning_rate": 4.588918918918919e-05, + "loss": 0.2307, + "step": 41060 + }, + { + "epoch": 40.0, + "learning_rate": 4.587567567567568e-05, + "loss": 0.2455, + "step": 41070 + }, + { + "epoch": 40.0, + "learning_rate": 4.5862162162162166e-05, + "loss": 0.422, + "step": 41080 + }, + { + "epoch": 40.0, + "learning_rate": 4.5848648648648654e-05, + "loss": 1.082, + "step": 41090 + }, + { + "epoch": 40.0, + "learning_rate": 4.5835135135135135e-05, + "loss": 1.7914, + "step": 41100 + }, + { + "epoch": 40.0, + "learning_rate": 4.582162162162162e-05, + "loss": 2.5427, + "step": 41110 + }, + { + "epoch": 40.0, + "learning_rate": 4.580810810810811e-05, + "loss": 2.3807, + "step": 41120 + }, + { + "epoch": 40.0, + "learning_rate": 4.57945945945946e-05, + "loss": 2.5046, + "step": 41130 + }, + { + "epoch": 40.0, + "learning_rate": 4.5781081081081086e-05, + "loss": 1.8208, + "step": 41140 + }, + { + "epoch": 40.0, + "learning_rate": 4.5767567567567574e-05, + "loss": 1.4926, + "step": 41150 + }, + { + "epoch": 40.0, + "learning_rate": 4.5754054054054055e-05, + "loss": 0.9988, + "step": 41160 + }, + { + "epoch": 40.0, + "learning_rate": 4.574054054054054e-05, + "loss": 0.4537, + "step": 41170 + }, + { + "epoch": 40.0, + "learning_rate": 4.572702702702703e-05, + "loss": 0.1425, + "step": 41180 + }, + { + "epoch": 40.0, + "learning_rate": 4.571351351351352e-05, + "loss": 0.2392, + "step": 41190 + }, + { + "epoch": 40.0, + "learning_rate": 4.5700000000000006e-05, + "loss": 0.2273, + "step": 41200 + }, + { + "epoch": 40.0, + "learning_rate": 4.568648648648649e-05, + "loss": 0.2598, + "step": 41210 + }, + { + "epoch": 40.0, + "learning_rate": 4.5672972972972975e-05, + "loss": 0.4169, + "step": 41220 + }, + { + "epoch": 40.0, + "learning_rate": 4.565945945945946e-05, + "loss": 0.2973, + "step": 41230 + }, + { + "epoch": 40.0, + "learning_rate": 4.564594594594595e-05, + "loss": 0.1357, + "step": 41240 + }, + { + "epoch": 40.0, + "learning_rate": 4.563243243243244e-05, + "loss": 0.202, + "step": 41250 + }, + { + "epoch": 40.0, + "learning_rate": 4.5618918918918926e-05, + "loss": 0.199, + "step": 41260 + }, + { + "epoch": 40.0, + "learning_rate": 4.560540540540541e-05, + "loss": 0.2044, + "step": 41270 + }, + { + "epoch": 40.0, + "learning_rate": 4.559189189189189e-05, + "loss": 0.2671, + "step": 41280 + }, + { + "epoch": 40.0, + "learning_rate": 4.5578378378378376e-05, + "loss": 0.1982, + "step": 41290 + }, + { + "epoch": 40.01, + "learning_rate": 4.5564864864864864e-05, + "loss": 0.1636, + "step": 41300 + }, + { + "epoch": 40.01, + "learning_rate": 4.555135135135135e-05, + "loss": 0.11, + "step": 41310 + }, + { + "epoch": 40.01, + "learning_rate": 4.553783783783784e-05, + "loss": 0.1573, + "step": 41320 + }, + { + "epoch": 40.01, + "learning_rate": 4.552432432432433e-05, + "loss": 0.1916, + "step": 41330 + }, + { + "epoch": 40.01, + "learning_rate": 4.551081081081081e-05, + "loss": 0.1159, + "step": 41340 + }, + { + "epoch": 40.01, + "learning_rate": 4.5497297297297296e-05, + "loss": 0.1966, + "step": 41350 + }, + { + "epoch": 40.01, + "learning_rate": 4.5483783783783784e-05, + "loss": 0.2923, + "step": 41360 + }, + { + "epoch": 40.01, + "learning_rate": 4.547027027027027e-05, + "loss": 0.2438, + "step": 41370 + }, + { + "epoch": 40.01, + "learning_rate": 4.545675675675676e-05, + "loss": 0.2073, + "step": 41380 + }, + { + "epoch": 40.01, + "learning_rate": 4.544324324324325e-05, + "loss": 0.2997, + "step": 41390 + }, + { + "epoch": 40.01, + "learning_rate": 4.542972972972973e-05, + "loss": 0.2623, + "step": 41400 + }, + { + "epoch": 40.01, + "learning_rate": 4.5416216216216216e-05, + "loss": 0.3155, + "step": 41410 + }, + { + "epoch": 40.01, + "learning_rate": 4.5402702702702704e-05, + "loss": 0.3187, + "step": 41420 + }, + { + "epoch": 40.01, + "learning_rate": 4.538918918918919e-05, + "loss": 0.1987, + "step": 41430 + }, + { + "epoch": 40.01, + "learning_rate": 4.537567567567568e-05, + "loss": 0.4986, + "step": 41440 + }, + { + "epoch": 40.01, + "learning_rate": 4.536216216216216e-05, + "loss": 0.4897, + "step": 41450 + }, + { + "epoch": 40.01, + "learning_rate": 4.534864864864865e-05, + "loss": 0.2298, + "step": 41460 + }, + { + "epoch": 40.01, + "learning_rate": 4.5335135135135136e-05, + "loss": 0.1239, + "step": 41470 + }, + { + "epoch": 40.01, + "learning_rate": 4.5321621621621624e-05, + "loss": 0.2293, + "step": 41480 + }, + { + "epoch": 40.01, + "learning_rate": 4.530810810810811e-05, + "loss": 0.1734, + "step": 41490 + }, + { + "epoch": 40.01, + "learning_rate": 4.52945945945946e-05, + "loss": 0.196, + "step": 41500 + }, + { + "epoch": 40.01, + "eval_loss": 0.09559222310781479, + "eval_runtime": 130.6006, + "eval_samples_per_second": 27.626, + "eval_steps_per_second": 3.453, + "eval_wer": 0.08950286539626334, + "step": 41500 + }, + { + "epoch": 40.01, + "learning_rate": 4.528108108108108e-05, + "loss": 0.1644, + "step": 41510 + }, + { + "epoch": 40.01, + "learning_rate": 4.526756756756757e-05, + "loss": 0.1579, + "step": 41520 + }, + { + "epoch": 40.01, + "learning_rate": 4.5254054054054056e-05, + "loss": 0.141, + "step": 41530 + }, + { + "epoch": 40.01, + "learning_rate": 4.5240540540540544e-05, + "loss": 0.3371, + "step": 41540 + }, + { + "epoch": 40.01, + "learning_rate": 4.522702702702703e-05, + "loss": 0.4138, + "step": 41550 + }, + { + "epoch": 40.01, + "learning_rate": 4.521351351351352e-05, + "loss": 0.3119, + "step": 41560 + }, + { + "epoch": 40.01, + "learning_rate": 4.52e-05, + "loss": 0.2322, + "step": 41570 + }, + { + "epoch": 40.01, + "learning_rate": 4.518648648648649e-05, + "loss": 0.3937, + "step": 41580 + }, + { + "epoch": 40.01, + "learning_rate": 4.5172972972972977e-05, + "loss": 0.3316, + "step": 41590 + }, + { + "epoch": 40.01, + "learning_rate": 4.5159459459459464e-05, + "loss": 0.1624, + "step": 41600 + }, + { + "epoch": 40.01, + "learning_rate": 4.514594594594595e-05, + "loss": 0.1795, + "step": 41610 + }, + { + "epoch": 40.01, + "learning_rate": 4.513243243243244e-05, + "loss": 0.2611, + "step": 41620 + }, + { + "epoch": 40.01, + "learning_rate": 4.511891891891892e-05, + "loss": 0.3387, + "step": 41630 + }, + { + "epoch": 40.01, + "learning_rate": 4.510540540540541e-05, + "loss": 0.3507, + "step": 41640 + }, + { + "epoch": 40.01, + "learning_rate": 4.5091891891891897e-05, + "loss": 0.2079, + "step": 41650 + }, + { + "epoch": 40.01, + "learning_rate": 4.5078378378378384e-05, + "loss": 0.2832, + "step": 41660 + }, + { + "epoch": 40.01, + "learning_rate": 4.506486486486487e-05, + "loss": 0.2423, + "step": 41670 + }, + { + "epoch": 40.01, + "learning_rate": 4.505135135135135e-05, + "loss": 0.1801, + "step": 41680 + }, + { + "epoch": 40.01, + "learning_rate": 4.5037837837837834e-05, + "loss": 0.2014, + "step": 41690 + }, + { + "epoch": 40.01, + "learning_rate": 4.502432432432432e-05, + "loss": 0.099, + "step": 41700 + }, + { + "epoch": 40.01, + "learning_rate": 4.501081081081081e-05, + "loss": 0.2002, + "step": 41710 + }, + { + "epoch": 40.01, + "learning_rate": 4.49972972972973e-05, + "loss": 0.4237, + "step": 41720 + }, + { + "epoch": 40.01, + "learning_rate": 4.4983783783783785e-05, + "loss": 0.2954, + "step": 41730 + }, + { + "epoch": 40.01, + "learning_rate": 4.497027027027027e-05, + "loss": 0.1806, + "step": 41740 + }, + { + "epoch": 40.01, + "learning_rate": 4.4956756756756754e-05, + "loss": 0.2095, + "step": 41750 + }, + { + "epoch": 40.01, + "learning_rate": 4.494324324324324e-05, + "loss": 0.214, + "step": 41760 + }, + { + "epoch": 40.01, + "learning_rate": 4.492972972972973e-05, + "loss": 0.2343, + "step": 41770 + }, + { + "epoch": 40.01, + "learning_rate": 4.491621621621622e-05, + "loss": 0.3027, + "step": 41780 + }, + { + "epoch": 40.01, + "learning_rate": 4.4902702702702706e-05, + "loss": 0.3232, + "step": 41790 + }, + { + "epoch": 40.01, + "learning_rate": 4.488918918918919e-05, + "loss": 0.1725, + "step": 41800 + }, + { + "epoch": 40.01, + "learning_rate": 4.4875675675675674e-05, + "loss": 0.2729, + "step": 41810 + }, + { + "epoch": 40.01, + "learning_rate": 4.486216216216216e-05, + "loss": 0.2277, + "step": 41820 + }, + { + "epoch": 40.01, + "learning_rate": 4.484864864864865e-05, + "loss": 0.3545, + "step": 41830 + }, + { + "epoch": 40.01, + "learning_rate": 4.483513513513514e-05, + "loss": 0.3855, + "step": 41840 + }, + { + "epoch": 40.01, + "learning_rate": 4.4821621621621626e-05, + "loss": 0.3347, + "step": 41850 + }, + { + "epoch": 40.01, + "learning_rate": 4.480810810810811e-05, + "loss": 0.3151, + "step": 41860 + }, + { + "epoch": 40.01, + "learning_rate": 4.4794594594594594e-05, + "loss": 0.4753, + "step": 41870 + }, + { + "epoch": 40.01, + "learning_rate": 4.478108108108108e-05, + "loss": 0.3593, + "step": 41880 + }, + { + "epoch": 40.01, + "learning_rate": 4.476756756756757e-05, + "loss": 0.4803, + "step": 41890 + }, + { + "epoch": 40.01, + "learning_rate": 4.475405405405406e-05, + "loss": 0.3857, + "step": 41900 + }, + { + "epoch": 40.01, + "learning_rate": 4.4740540540540546e-05, + "loss": 0.3792, + "step": 41910 + }, + { + "epoch": 40.01, + "learning_rate": 4.472702702702703e-05, + "loss": 0.3416, + "step": 41920 + }, + { + "epoch": 40.01, + "learning_rate": 4.4713513513513515e-05, + "loss": 0.3608, + "step": 41930 + }, + { + "epoch": 40.01, + "learning_rate": 4.47e-05, + "loss": 0.4811, + "step": 41940 + }, + { + "epoch": 41.0, + "learning_rate": 4.468648648648649e-05, + "loss": 0.438, + "step": 41950 + }, + { + "epoch": 41.0, + "learning_rate": 4.467297297297298e-05, + "loss": 0.3839, + "step": 41960 + }, + { + "epoch": 41.0, + "learning_rate": 4.4659459459459466e-05, + "loss": 0.4539, + "step": 41970 + }, + { + "epoch": 41.0, + "learning_rate": 4.464594594594595e-05, + "loss": 0.3643, + "step": 41980 + }, + { + "epoch": 41.0, + "learning_rate": 4.4632432432432435e-05, + "loss": 0.358, + "step": 41990 + }, + { + "epoch": 41.0, + "learning_rate": 4.461891891891892e-05, + "loss": 0.3855, + "step": 42000 + }, + { + "epoch": 41.0, + "eval_loss": 0.09052729606628418, + "eval_runtime": 145.0591, + "eval_samples_per_second": 24.873, + "eval_steps_per_second": 3.109, + "eval_wer": 0.09034151796114243, + "step": 42000 + }, + { + "epoch": 41.0, + "learning_rate": 4.460540540540541e-05, + "loss": 0.5687, + "step": 42010 + }, + { + "epoch": 41.0, + "learning_rate": 4.45918918918919e-05, + "loss": 0.3735, + "step": 42020 + }, + { + "epoch": 41.0, + "learning_rate": 4.4578378378378386e-05, + "loss": 0.3753, + "step": 42030 + }, + { + "epoch": 41.0, + "learning_rate": 4.456486486486487e-05, + "loss": 0.4309, + "step": 42040 + }, + { + "epoch": 41.0, + "learning_rate": 4.4551351351351355e-05, + "loss": 0.3759, + "step": 42050 + }, + { + "epoch": 41.0, + "learning_rate": 4.453783783783784e-05, + "loss": 0.4132, + "step": 42060 + }, + { + "epoch": 41.0, + "learning_rate": 4.452432432432433e-05, + "loss": 0.263, + "step": 42070 + }, + { + "epoch": 41.0, + "learning_rate": 4.451081081081081e-05, + "loss": 0.2316, + "step": 42080 + }, + { + "epoch": 41.0, + "learning_rate": 4.44972972972973e-05, + "loss": 0.2301, + "step": 42090 + }, + { + "epoch": 41.0, + "learning_rate": 4.448378378378378e-05, + "loss": 0.2523, + "step": 42100 + }, + { + "epoch": 41.0, + "learning_rate": 4.447027027027027e-05, + "loss": 1.0302, + "step": 42110 + }, + { + "epoch": 41.0, + "learning_rate": 4.4456756756756756e-05, + "loss": 1.2883, + "step": 42120 + }, + { + "epoch": 41.0, + "learning_rate": 4.4443243243243244e-05, + "loss": 2.5565, + "step": 42130 + }, + { + "epoch": 41.0, + "learning_rate": 4.442972972972973e-05, + "loss": 2.3677, + "step": 42140 + }, + { + "epoch": 41.0, + "learning_rate": 4.441621621621622e-05, + "loss": 2.5398, + "step": 42150 + }, + { + "epoch": 41.0, + "learning_rate": 4.4404054054054056e-05, + "loss": 2.2147, + "step": 42160 + }, + { + "epoch": 41.0, + "learning_rate": 4.4390540540540544e-05, + "loss": 1.3749, + "step": 42170 + }, + { + "epoch": 41.0, + "learning_rate": 4.437702702702703e-05, + "loss": 1.2438, + "step": 42180 + }, + { + "epoch": 41.0, + "learning_rate": 4.436351351351351e-05, + "loss": 0.5014, + "step": 42190 + }, + { + "epoch": 41.0, + "learning_rate": 4.435e-05, + "loss": 0.1625, + "step": 42200 + }, + { + "epoch": 41.0, + "learning_rate": 4.433648648648649e-05, + "loss": 0.2118, + "step": 42210 + }, + { + "epoch": 41.0, + "learning_rate": 4.4322972972972976e-05, + "loss": 0.1682, + "step": 42220 + }, + { + "epoch": 41.0, + "learning_rate": 4.4309459459459464e-05, + "loss": 0.3038, + "step": 42230 + }, + { + "epoch": 41.0, + "learning_rate": 4.429594594594595e-05, + "loss": 0.3445, + "step": 42240 + }, + { + "epoch": 41.0, + "learning_rate": 4.428243243243243e-05, + "loss": 0.3575, + "step": 42250 + }, + { + "epoch": 41.0, + "learning_rate": 4.426891891891892e-05, + "loss": 0.1621, + "step": 42260 + }, + { + "epoch": 41.0, + "learning_rate": 4.425540540540541e-05, + "loss": 0.1494, + "step": 42270 + }, + { + "epoch": 41.0, + "learning_rate": 4.4241891891891896e-05, + "loss": 0.1963, + "step": 42280 + }, + { + "epoch": 41.0, + "learning_rate": 4.4228378378378384e-05, + "loss": 0.1692, + "step": 42290 + }, + { + "epoch": 41.0, + "learning_rate": 4.421486486486487e-05, + "loss": 0.2282, + "step": 42300 + }, + { + "epoch": 41.0, + "learning_rate": 4.420135135135135e-05, + "loss": 0.204, + "step": 42310 + }, + { + "epoch": 41.01, + "learning_rate": 4.418783783783784e-05, + "loss": 0.1699, + "step": 42320 + }, + { + "epoch": 41.01, + "learning_rate": 4.417432432432433e-05, + "loss": 0.1299, + "step": 42330 + }, + { + "epoch": 41.01, + "learning_rate": 4.4160810810810816e-05, + "loss": 0.1074, + "step": 42340 + }, + { + "epoch": 41.01, + "learning_rate": 4.4147297297297304e-05, + "loss": 0.1972, + "step": 42350 + }, + { + "epoch": 41.01, + "learning_rate": 4.413378378378379e-05, + "loss": 0.1866, + "step": 42360 + }, + { + "epoch": 41.01, + "learning_rate": 4.412027027027027e-05, + "loss": 0.1515, + "step": 42370 + }, + { + "epoch": 41.01, + "learning_rate": 4.4106756756756754e-05, + "loss": 0.2415, + "step": 42380 + }, + { + "epoch": 41.01, + "learning_rate": 4.409324324324324e-05, + "loss": 0.2501, + "step": 42390 + }, + { + "epoch": 41.01, + "learning_rate": 4.407972972972973e-05, + "loss": 0.1913, + "step": 42400 + }, + { + "epoch": 41.01, + "learning_rate": 4.406621621621622e-05, + "loss": 0.2481, + "step": 42410 + }, + { + "epoch": 41.01, + "learning_rate": 4.4052702702702705e-05, + "loss": 0.2926, + "step": 42420 + }, + { + "epoch": 41.01, + "learning_rate": 4.4039189189189186e-05, + "loss": 0.2879, + "step": 42430 + }, + { + "epoch": 41.01, + "learning_rate": 4.4025675675675674e-05, + "loss": 0.3268, + "step": 42440 + }, + { + "epoch": 41.01, + "learning_rate": 4.401216216216216e-05, + "loss": 0.1705, + "step": 42450 + }, + { + "epoch": 41.01, + "learning_rate": 4.399864864864865e-05, + "loss": 0.3855, + "step": 42460 + }, + { + "epoch": 41.01, + "learning_rate": 4.398513513513514e-05, + "loss": 0.4648, + "step": 42470 + }, + { + "epoch": 41.01, + "learning_rate": 4.3971621621621625e-05, + "loss": 0.362, + "step": 42480 + }, + { + "epoch": 41.01, + "learning_rate": 4.3958108108108106e-05, + "loss": 0.1424, + "step": 42490 + }, + { + "epoch": 41.01, + "learning_rate": 4.3944594594594594e-05, + "loss": 0.2194, + "step": 42500 + }, + { + "epoch": 41.01, + "eval_loss": 0.10119093209505081, + "eval_runtime": 127.5053, + "eval_samples_per_second": 28.297, + "eval_steps_per_second": 3.537, + "eval_wer": 0.08992219167870288, + "step": 42500 + }, + { + "epoch": 41.01, + "learning_rate": 4.393108108108108e-05, + "loss": 0.1907, + "step": 42510 + }, + { + "epoch": 41.01, + "learning_rate": 4.391756756756757e-05, + "loss": 0.1553, + "step": 42520 + }, + { + "epoch": 41.01, + "learning_rate": 4.390405405405406e-05, + "loss": 0.1636, + "step": 42530 + }, + { + "epoch": 41.01, + "learning_rate": 4.3890540540540545e-05, + "loss": 0.1442, + "step": 42540 + }, + { + "epoch": 41.01, + "learning_rate": 4.3877027027027026e-05, + "loss": 0.1265, + "step": 42550 + }, + { + "epoch": 41.01, + "learning_rate": 4.3863513513513514e-05, + "loss": 0.2585, + "step": 42560 + }, + { + "epoch": 41.01, + "learning_rate": 4.385e-05, + "loss": 0.3801, + "step": 42570 + }, + { + "epoch": 41.01, + "learning_rate": 4.383648648648649e-05, + "loss": 0.336, + "step": 42580 + }, + { + "epoch": 41.01, + "learning_rate": 4.382297297297298e-05, + "loss": 0.224, + "step": 42590 + }, + { + "epoch": 41.01, + "learning_rate": 4.3809459459459465e-05, + "loss": 0.3605, + "step": 42600 + }, + { + "epoch": 41.01, + "learning_rate": 4.3795945945945946e-05, + "loss": 0.41, + "step": 42610 + }, + { + "epoch": 41.01, + "learning_rate": 4.3782432432432434e-05, + "loss": 0.1991, + "step": 42620 + }, + { + "epoch": 41.01, + "learning_rate": 4.376891891891892e-05, + "loss": 0.1794, + "step": 42630 + }, + { + "epoch": 41.01, + "learning_rate": 4.375540540540541e-05, + "loss": 0.237, + "step": 42640 + }, + { + "epoch": 41.01, + "learning_rate": 4.37418918918919e-05, + "loss": 0.321, + "step": 42650 + }, + { + "epoch": 41.01, + "learning_rate": 4.372837837837838e-05, + "loss": 0.3387, + "step": 42660 + }, + { + "epoch": 41.01, + "learning_rate": 4.3714864864864866e-05, + "loss": 0.2351, + "step": 42670 + }, + { + "epoch": 41.01, + "learning_rate": 4.3701351351351354e-05, + "loss": 0.2022, + "step": 42680 + }, + { + "epoch": 41.01, + "learning_rate": 4.368783783783784e-05, + "loss": 0.2149, + "step": 42690 + }, + { + "epoch": 41.01, + "learning_rate": 4.367432432432433e-05, + "loss": 0.2145, + "step": 42700 + }, + { + "epoch": 41.01, + "learning_rate": 4.366081081081082e-05, + "loss": 0.2327, + "step": 42710 + }, + { + "epoch": 41.01, + "learning_rate": 4.36472972972973e-05, + "loss": 0.1284, + "step": 42720 + }, + { + "epoch": 41.01, + "learning_rate": 4.3633783783783787e-05, + "loss": 0.2062, + "step": 42730 + }, + { + "epoch": 41.01, + "learning_rate": 4.3620270270270274e-05, + "loss": 0.3067, + "step": 42740 + }, + { + "epoch": 41.01, + "learning_rate": 4.360675675675676e-05, + "loss": 0.4646, + "step": 42750 + }, + { + "epoch": 41.01, + "learning_rate": 4.359324324324325e-05, + "loss": 0.1588, + "step": 42760 + }, + { + "epoch": 41.01, + "learning_rate": 4.357972972972973e-05, + "loss": 0.2105, + "step": 42770 + }, + { + "epoch": 41.01, + "learning_rate": 4.356621621621622e-05, + "loss": 0.27, + "step": 42780 + }, + { + "epoch": 41.01, + "learning_rate": 4.35527027027027e-05, + "loss": 0.2318, + "step": 42790 + }, + { + "epoch": 41.01, + "learning_rate": 4.353918918918919e-05, + "loss": 0.2519, + "step": 42800 + }, + { + "epoch": 41.01, + "learning_rate": 4.3525675675675675e-05, + "loss": 0.3298, + "step": 42810 + }, + { + "epoch": 41.01, + "learning_rate": 4.351216216216216e-05, + "loss": 0.2111, + "step": 42820 + }, + { + "epoch": 41.01, + "learning_rate": 4.349864864864865e-05, + "loss": 0.1957, + "step": 42830 + }, + { + "epoch": 41.01, + "learning_rate": 4.348513513513513e-05, + "loss": 0.2621, + "step": 42840 + }, + { + "epoch": 41.01, + "learning_rate": 4.347162162162162e-05, + "loss": 0.3247, + "step": 42850 + }, + { + "epoch": 41.01, + "learning_rate": 4.345810810810811e-05, + "loss": 0.2983, + "step": 42860 + }, + { + "epoch": 41.01, + "learning_rate": 4.3444594594594596e-05, + "loss": 0.4023, + "step": 42870 + }, + { + "epoch": 41.01, + "learning_rate": 4.343108108108108e-05, + "loss": 0.2747, + "step": 42880 + }, + { + "epoch": 41.01, + "learning_rate": 4.341756756756757e-05, + "loss": 0.4421, + "step": 42890 + }, + { + "epoch": 41.01, + "learning_rate": 4.340405405405405e-05, + "loss": 0.3011, + "step": 42900 + }, + { + "epoch": 41.01, + "learning_rate": 4.339054054054054e-05, + "loss": 0.4918, + "step": 42910 + }, + { + "epoch": 41.01, + "learning_rate": 4.337702702702703e-05, + "loss": 0.3922, + "step": 42920 + }, + { + "epoch": 41.01, + "learning_rate": 4.3363513513513516e-05, + "loss": 0.3435, + "step": 42930 + }, + { + "epoch": 41.01, + "learning_rate": 4.335e-05, + "loss": 0.3398, + "step": 42940 + }, + { + "epoch": 41.01, + "learning_rate": 4.333648648648649e-05, + "loss": 0.3595, + "step": 42950 + }, + { + "epoch": 41.01, + "learning_rate": 4.332297297297297e-05, + "loss": 0.4029, + "step": 42960 + }, + { + "epoch": 42.0, + "learning_rate": 4.330945945945946e-05, + "loss": 0.4439, + "step": 42970 + }, + { + "epoch": 42.0, + "learning_rate": 4.329594594594595e-05, + "loss": 0.3902, + "step": 42980 + }, + { + "epoch": 42.0, + "learning_rate": 4.3282432432432436e-05, + "loss": 0.3964, + "step": 42990 + }, + { + "epoch": 42.0, + "learning_rate": 4.3268918918918923e-05, + "loss": 0.3641, + "step": 43000 + }, + { + "epoch": 42.0, + "eval_loss": 0.09582129120826721, + "eval_runtime": 129.3202, + "eval_samples_per_second": 27.9, + "eval_steps_per_second": 3.487, + "eval_wer": 0.09020174253366259, + "step": 43000 + }, + { + "epoch": 42.0, + "learning_rate": 4.325540540540541e-05, + "loss": 0.3102, + "step": 43010 + }, + { + "epoch": 42.0, + "learning_rate": 4.324189189189189e-05, + "loss": 0.3859, + "step": 43020 + }, + { + "epoch": 42.0, + "learning_rate": 4.322837837837838e-05, + "loss": 0.5013, + "step": 43030 + }, + { + "epoch": 42.0, + "learning_rate": 4.321486486486487e-05, + "loss": 0.438, + "step": 43040 + }, + { + "epoch": 42.0, + "learning_rate": 4.3201351351351356e-05, + "loss": 0.3389, + "step": 43050 + }, + { + "epoch": 42.0, + "learning_rate": 4.3187837837837844e-05, + "loss": 0.4231, + "step": 43060 + }, + { + "epoch": 42.0, + "learning_rate": 4.3174324324324325e-05, + "loss": 0.37, + "step": 43070 + }, + { + "epoch": 42.0, + "learning_rate": 4.316081081081081e-05, + "loss": 0.4036, + "step": 43080 + }, + { + "epoch": 42.0, + "learning_rate": 4.31472972972973e-05, + "loss": 0.2621, + "step": 43090 + }, + { + "epoch": 42.0, + "learning_rate": 4.313378378378379e-05, + "loss": 0.2552, + "step": 43100 + }, + { + "epoch": 42.0, + "learning_rate": 4.3120270270270276e-05, + "loss": 0.2413, + "step": 43110 + }, + { + "epoch": 42.0, + "learning_rate": 4.3106756756756764e-05, + "loss": 0.2483, + "step": 43120 + }, + { + "epoch": 42.0, + "learning_rate": 4.3093243243243245e-05, + "loss": 0.9616, + "step": 43130 + }, + { + "epoch": 42.0, + "learning_rate": 4.307972972972973e-05, + "loss": 0.7057, + "step": 43140 + }, + { + "epoch": 42.0, + "learning_rate": 4.306621621621622e-05, + "loss": 2.5947, + "step": 43150 + }, + { + "epoch": 42.0, + "learning_rate": 4.305270270270271e-05, + "loss": 2.5186, + "step": 43160 + }, + { + "epoch": 42.0, + "learning_rate": 4.303918918918919e-05, + "loss": 2.3962, + "step": 43170 + }, + { + "epoch": 42.0, + "learning_rate": 4.302567567567568e-05, + "loss": 2.5149, + "step": 43180 + }, + { + "epoch": 42.0, + "learning_rate": 4.3012162162162165e-05, + "loss": 1.3386, + "step": 43190 + }, + { + "epoch": 42.0, + "learning_rate": 4.2998648648648646e-05, + "loss": 1.4029, + "step": 43200 + }, + { + "epoch": 42.0, + "learning_rate": 4.2985135135135133e-05, + "loss": 0.8061, + "step": 43210 + }, + { + "epoch": 42.0, + "learning_rate": 4.297162162162162e-05, + "loss": 0.2339, + "step": 43220 + }, + { + "epoch": 42.0, + "learning_rate": 4.295810810810811e-05, + "loss": 0.128, + "step": 43230 + }, + { + "epoch": 42.0, + "learning_rate": 4.29445945945946e-05, + "loss": 0.1989, + "step": 43240 + }, + { + "epoch": 42.0, + "learning_rate": 4.2931081081081085e-05, + "loss": 0.2474, + "step": 43250 + }, + { + "epoch": 42.0, + "learning_rate": 4.2917567567567566e-05, + "loss": 0.3087, + "step": 43260 + }, + { + "epoch": 42.0, + "learning_rate": 4.2904054054054054e-05, + "loss": 0.353, + "step": 43270 + }, + { + "epoch": 42.0, + "learning_rate": 4.289054054054054e-05, + "loss": 0.1931, + "step": 43280 + }, + { + "epoch": 42.0, + "learning_rate": 4.287702702702703e-05, + "loss": 0.1316, + "step": 43290 + }, + { + "epoch": 42.0, + "learning_rate": 4.286351351351352e-05, + "loss": 0.2194, + "step": 43300 + }, + { + "epoch": 42.0, + "learning_rate": 4.285e-05, + "loss": 0.1609, + "step": 43310 + }, + { + "epoch": 42.0, + "learning_rate": 4.2836486486486486e-05, + "loss": 0.2185, + "step": 43320 + }, + { + "epoch": 42.0, + "learning_rate": 4.2822972972972974e-05, + "loss": 0.2136, + "step": 43330 + }, + { + "epoch": 42.0, + "learning_rate": 4.280945945945946e-05, + "loss": 0.1409, + "step": 43340 + }, + { + "epoch": 42.01, + "learning_rate": 4.279594594594595e-05, + "loss": 0.1236, + "step": 43350 + }, + { + "epoch": 42.01, + "learning_rate": 4.278243243243244e-05, + "loss": 0.1052, + "step": 43360 + }, + { + "epoch": 42.01, + "learning_rate": 4.276891891891892e-05, + "loss": 0.1851, + "step": 43370 + }, + { + "epoch": 42.01, + "learning_rate": 4.2755405405405406e-05, + "loss": 0.1943, + "step": 43380 + }, + { + "epoch": 42.01, + "learning_rate": 4.2741891891891894e-05, + "loss": 0.138, + "step": 43390 + }, + { + "epoch": 42.01, + "learning_rate": 4.272837837837838e-05, + "loss": 0.1803, + "step": 43400 + }, + { + "epoch": 42.01, + "learning_rate": 4.271486486486487e-05, + "loss": 0.3332, + "step": 43410 + }, + { + "epoch": 42.01, + "learning_rate": 4.270135135135136e-05, + "loss": 0.2055, + "step": 43420 + }, + { + "epoch": 42.01, + "learning_rate": 4.268783783783784e-05, + "loss": 0.2296, + "step": 43430 + }, + { + "epoch": 42.01, + "learning_rate": 4.2674324324324326e-05, + "loss": 0.3068, + "step": 43440 + }, + { + "epoch": 42.01, + "learning_rate": 4.2660810810810814e-05, + "loss": 0.2913, + "step": 43450 + }, + { + "epoch": 42.01, + "learning_rate": 4.26472972972973e-05, + "loss": 0.3231, + "step": 43460 + }, + { + "epoch": 42.01, + "learning_rate": 4.263378378378379e-05, + "loss": 0.2129, + "step": 43470 + }, + { + "epoch": 42.01, + "learning_rate": 4.262027027027028e-05, + "loss": 0.312, + "step": 43480 + }, + { + "epoch": 42.01, + "learning_rate": 4.260675675675676e-05, + "loss": 0.5762, + "step": 43490 + }, + { + "epoch": 42.01, + "learning_rate": 4.2593243243243246e-05, + "loss": 0.4243, + "step": 43500 + }, + { + "epoch": 42.01, + "eval_loss": 0.0958673357963562, + "eval_runtime": 130.3617, + "eval_samples_per_second": 27.677, + "eval_steps_per_second": 3.46, + "eval_wer": 0.08847784559474445, + "step": 43500 + }, + { + "epoch": 42.01, + "learning_rate": 4.2579729729729734e-05, + "loss": 0.1496, + "step": 43510 + }, + { + "epoch": 42.01, + "learning_rate": 4.256621621621622e-05, + "loss": 0.2235, + "step": 43520 + }, + { + "epoch": 42.01, + "learning_rate": 4.255270270270271e-05, + "loss": 0.2026, + "step": 43530 + }, + { + "epoch": 42.01, + "learning_rate": 4.254054054054054e-05, + "loss": 0.1606, + "step": 43540 + }, + { + "epoch": 42.01, + "learning_rate": 4.252702702702703e-05, + "loss": 0.1474, + "step": 43550 + }, + { + "epoch": 42.01, + "learning_rate": 4.2513513513513515e-05, + "loss": 0.1306, + "step": 43560 + }, + { + "epoch": 42.01, + "learning_rate": 4.25e-05, + "loss": 0.1593, + "step": 43570 + }, + { + "epoch": 42.01, + "learning_rate": 4.248648648648649e-05, + "loss": 0.1555, + "step": 43580 + }, + { + "epoch": 42.01, + "learning_rate": 4.247297297297297e-05, + "loss": 0.375, + "step": 43590 + }, + { + "epoch": 42.01, + "learning_rate": 4.245945945945946e-05, + "loss": 0.3234, + "step": 43600 + }, + { + "epoch": 42.01, + "learning_rate": 4.244594594594595e-05, + "loss": 0.2624, + "step": 43610 + }, + { + "epoch": 42.01, + "learning_rate": 4.2432432432432435e-05, + "loss": 0.314, + "step": 43620 + }, + { + "epoch": 42.01, + "learning_rate": 4.241891891891892e-05, + "loss": 0.3979, + "step": 43630 + }, + { + "epoch": 42.01, + "learning_rate": 4.2405405405405404e-05, + "loss": 0.1912, + "step": 43640 + }, + { + "epoch": 42.01, + "learning_rate": 4.239189189189189e-05, + "loss": 0.1712, + "step": 43650 + }, + { + "epoch": 42.01, + "learning_rate": 4.237837837837838e-05, + "loss": 0.2257, + "step": 43660 + }, + { + "epoch": 42.01, + "learning_rate": 4.236486486486487e-05, + "loss": 0.3325, + "step": 43670 + }, + { + "epoch": 42.01, + "learning_rate": 4.2351351351351355e-05, + "loss": 0.3389, + "step": 43680 + }, + { + "epoch": 42.01, + "learning_rate": 4.233783783783784e-05, + "loss": 0.2607, + "step": 43690 + }, + { + "epoch": 42.01, + "learning_rate": 4.2324324324324324e-05, + "loss": 0.2262, + "step": 43700 + }, + { + "epoch": 42.01, + "learning_rate": 4.231081081081081e-05, + "loss": 0.2579, + "step": 43710 + }, + { + "epoch": 42.01, + "learning_rate": 4.22972972972973e-05, + "loss": 0.1988, + "step": 43720 + }, + { + "epoch": 42.01, + "learning_rate": 4.228378378378379e-05, + "loss": 0.2246, + "step": 43730 + }, + { + "epoch": 42.01, + "learning_rate": 4.2270270270270275e-05, + "loss": 0.122, + "step": 43740 + }, + { + "epoch": 42.01, + "learning_rate": 4.225675675675676e-05, + "loss": 0.152, + "step": 43750 + }, + { + "epoch": 42.01, + "learning_rate": 4.2243243243243244e-05, + "loss": 0.2208, + "step": 43760 + }, + { + "epoch": 42.01, + "learning_rate": 4.222972972972973e-05, + "loss": 0.5191, + "step": 43770 + }, + { + "epoch": 42.01, + "learning_rate": 4.221621621621622e-05, + "loss": 0.1307, + "step": 43780 + }, + { + "epoch": 42.01, + "learning_rate": 4.220270270270271e-05, + "loss": 0.1529, + "step": 43790 + }, + { + "epoch": 42.01, + "learning_rate": 4.2189189189189195e-05, + "loss": 0.2111, + "step": 43800 + }, + { + "epoch": 42.01, + "learning_rate": 4.2175675675675677e-05, + "loss": 0.2983, + "step": 43810 + }, + { + "epoch": 42.01, + "learning_rate": 4.2162162162162164e-05, + "loss": 0.2601, + "step": 43820 + }, + { + "epoch": 42.01, + "learning_rate": 4.214864864864865e-05, + "loss": 0.2807, + "step": 43830 + }, + { + "epoch": 42.01, + "learning_rate": 4.213513513513514e-05, + "loss": 0.2978, + "step": 43840 + }, + { + "epoch": 42.01, + "learning_rate": 4.212162162162163e-05, + "loss": 0.1497, + "step": 43850 + }, + { + "epoch": 42.01, + "learning_rate": 4.210810810810811e-05, + "loss": 0.2591, + "step": 43860 + }, + { + "epoch": 42.01, + "learning_rate": 4.2094594594594597e-05, + "loss": 0.339, + "step": 43870 + }, + { + "epoch": 42.01, + "learning_rate": 4.208108108108108e-05, + "loss": 0.3348, + "step": 43880 + }, + { + "epoch": 42.01, + "learning_rate": 4.2067567567567565e-05, + "loss": 0.3923, + "step": 43890 + }, + { + "epoch": 42.01, + "learning_rate": 4.205405405405405e-05, + "loss": 0.3054, + "step": 43900 + }, + { + "epoch": 42.01, + "learning_rate": 4.204054054054054e-05, + "loss": 0.4436, + "step": 43910 + }, + { + "epoch": 42.01, + "learning_rate": 4.202702702702703e-05, + "loss": 0.3197, + "step": 43920 + }, + { + "epoch": 42.01, + "learning_rate": 4.201351351351352e-05, + "loss": 0.4081, + "step": 43930 + }, + { + "epoch": 42.01, + "learning_rate": 4.2e-05, + "loss": 0.4114, + "step": 43940 + }, + { + "epoch": 42.01, + "learning_rate": 4.1986486486486485e-05, + "loss": 0.3258, + "step": 43950 + }, + { + "epoch": 42.01, + "learning_rate": 4.197297297297297e-05, + "loss": 0.334, + "step": 43960 + }, + { + "epoch": 42.01, + "learning_rate": 4.195945945945946e-05, + "loss": 0.3812, + "step": 43970 + }, + { + "epoch": 42.01, + "learning_rate": 4.194594594594595e-05, + "loss": 0.3087, + "step": 43980 + }, + { + "epoch": 43.0, + "learning_rate": 4.193243243243244e-05, + "loss": 0.5303, + "step": 43990 + }, + { + "epoch": 43.0, + "learning_rate": 4.191891891891892e-05, + "loss": 0.3872, + "step": 44000 + }, + { + "epoch": 43.0, + "eval_loss": 0.09279397130012512, + "eval_runtime": 130.5683, + "eval_samples_per_second": 27.633, + "eval_steps_per_second": 3.454, + "eval_wer": 0.08698690770162605, + "step": 44000 + }, + { + "epoch": 43.0, + "learning_rate": 4.1905405405405406e-05, + "loss": 0.3703, + "step": 44010 + }, + { + "epoch": 43.0, + "learning_rate": 4.189189189189189e-05, + "loss": 0.3922, + "step": 44020 + }, + { + "epoch": 43.0, + "learning_rate": 4.187837837837838e-05, + "loss": 0.3323, + "step": 44030 + }, + { + "epoch": 43.0, + "learning_rate": 4.186486486486487e-05, + "loss": 0.3564, + "step": 44040 + }, + { + "epoch": 43.0, + "learning_rate": 4.185135135135135e-05, + "loss": 0.4071, + "step": 44050 + }, + { + "epoch": 43.0, + "learning_rate": 4.183783783783784e-05, + "loss": 0.4919, + "step": 44060 + }, + { + "epoch": 43.0, + "learning_rate": 4.1824324324324326e-05, + "loss": 0.3605, + "step": 44070 + }, + { + "epoch": 43.0, + "learning_rate": 4.1810810810810813e-05, + "loss": 0.3773, + "step": 44080 + }, + { + "epoch": 43.0, + "learning_rate": 4.17972972972973e-05, + "loss": 0.3988, + "step": 44090 + }, + { + "epoch": 43.0, + "learning_rate": 4.178378378378379e-05, + "loss": 0.3873, + "step": 44100 + }, + { + "epoch": 43.0, + "learning_rate": 4.177027027027027e-05, + "loss": 0.3284, + "step": 44110 + }, + { + "epoch": 43.0, + "learning_rate": 4.175675675675676e-05, + "loss": 0.226, + "step": 44120 + }, + { + "epoch": 43.0, + "learning_rate": 4.1743243243243246e-05, + "loss": 0.2315, + "step": 44130 + }, + { + "epoch": 43.0, + "learning_rate": 4.1729729729729733e-05, + "loss": 0.2244, + "step": 44140 + }, + { + "epoch": 43.0, + "learning_rate": 4.171621621621622e-05, + "loss": 0.5274, + "step": 44150 + }, + { + "epoch": 43.0, + "learning_rate": 4.170270270270271e-05, + "loss": 0.9033, + "step": 44160 + }, + { + "epoch": 43.0, + "learning_rate": 4.168918918918919e-05, + "loss": 1.9995, + "step": 44170 + }, + { + "epoch": 43.0, + "learning_rate": 4.167567567567568e-05, + "loss": 2.5217, + "step": 44180 + }, + { + "epoch": 43.0, + "learning_rate": 4.1662162162162166e-05, + "loss": 2.3984, + "step": 44190 + }, + { + "epoch": 43.0, + "learning_rate": 4.1648648648648654e-05, + "loss": 2.5036, + "step": 44200 + }, + { + "epoch": 43.0, + "learning_rate": 4.163513513513514e-05, + "loss": 1.7018, + "step": 44210 + }, + { + "epoch": 43.0, + "learning_rate": 4.162162162162163e-05, + "loss": 1.4427, + "step": 44220 + }, + { + "epoch": 43.0, + "learning_rate": 4.160810810810811e-05, + "loss": 0.9233, + "step": 44230 + }, + { + "epoch": 43.0, + "learning_rate": 4.15945945945946e-05, + "loss": 0.3393, + "step": 44240 + }, + { + "epoch": 43.0, + "learning_rate": 4.1581081081081086e-05, + "loss": 0.1368, + "step": 44250 + }, + { + "epoch": 43.0, + "learning_rate": 4.156756756756757e-05, + "loss": 0.2123, + "step": 44260 + }, + { + "epoch": 43.0, + "learning_rate": 4.1554054054054055e-05, + "loss": 0.2089, + "step": 44270 + }, + { + "epoch": 43.0, + "learning_rate": 4.154054054054054e-05, + "loss": 0.2461, + "step": 44280 + }, + { + "epoch": 43.0, + "learning_rate": 4.1527027027027023e-05, + "loss": 0.4092, + "step": 44290 + }, + { + "epoch": 43.0, + "learning_rate": 4.151351351351351e-05, + "loss": 0.2067, + "step": 44300 + }, + { + "epoch": 43.0, + "learning_rate": 4.15e-05, + "loss": 0.1168, + "step": 44310 + }, + { + "epoch": 43.0, + "learning_rate": 4.148648648648649e-05, + "loss": 0.1996, + "step": 44320 + }, + { + "epoch": 43.0, + "learning_rate": 4.1472972972972975e-05, + "loss": 0.1529, + "step": 44330 + }, + { + "epoch": 43.0, + "learning_rate": 4.145945945945946e-05, + "loss": 0.2234, + "step": 44340 + }, + { + "epoch": 43.0, + "learning_rate": 4.1445945945945944e-05, + "loss": 0.2254, + "step": 44350 + }, + { + "epoch": 43.0, + "learning_rate": 4.143243243243243e-05, + "loss": 0.1762, + "step": 44360 + }, + { + "epoch": 43.01, + "learning_rate": 4.141891891891892e-05, + "loss": 0.1678, + "step": 44370 + }, + { + "epoch": 43.01, + "learning_rate": 4.140540540540541e-05, + "loss": 0.1022, + "step": 44380 + }, + { + "epoch": 43.01, + "learning_rate": 4.1391891891891895e-05, + "loss": 0.1201, + "step": 44390 + }, + { + "epoch": 43.01, + "learning_rate": 4.137837837837838e-05, + "loss": 0.2226, + "step": 44400 + }, + { + "epoch": 43.01, + "learning_rate": 4.1364864864864864e-05, + "loss": 0.1169, + "step": 44410 + }, + { + "epoch": 43.01, + "learning_rate": 4.135135135135135e-05, + "loss": 0.2128, + "step": 44420 + }, + { + "epoch": 43.01, + "learning_rate": 4.133783783783784e-05, + "loss": 0.2889, + "step": 44430 + }, + { + "epoch": 43.01, + "learning_rate": 4.132432432432433e-05, + "loss": 0.1994, + "step": 44440 + }, + { + "epoch": 43.01, + "learning_rate": 4.1310810810810815e-05, + "loss": 0.2082, + "step": 44450 + }, + { + "epoch": 43.01, + "learning_rate": 4.12972972972973e-05, + "loss": 0.2767, + "step": 44460 + }, + { + "epoch": 43.01, + "learning_rate": 4.1283783783783784e-05, + "loss": 0.2622, + "step": 44470 + }, + { + "epoch": 43.01, + "learning_rate": 4.127027027027027e-05, + "loss": 0.3341, + "step": 44480 + }, + { + "epoch": 43.01, + "learning_rate": 4.125675675675676e-05, + "loss": 0.2453, + "step": 44490 + }, + { + "epoch": 43.01, + "learning_rate": 4.124324324324325e-05, + "loss": 0.2174, + "step": 44500 + }, + { + "epoch": 43.01, + "eval_loss": 0.09941111505031586, + "eval_runtime": 130.0294, + "eval_samples_per_second": 27.748, + "eval_steps_per_second": 3.468, + "eval_wer": 0.08428458277034898, + "step": 44500 + }, + { + "epoch": 43.01, + "learning_rate": 4.1229729729729735e-05, + "loss": 0.4317, + "step": 44510 + }, + { + "epoch": 43.01, + "learning_rate": 4.1216216216216216e-05, + "loss": 0.4934, + "step": 44520 + }, + { + "epoch": 43.01, + "learning_rate": 4.1202702702702704e-05, + "loss": 0.1917, + "step": 44530 + }, + { + "epoch": 43.01, + "learning_rate": 4.118918918918919e-05, + "loss": 0.1409, + "step": 44540 + }, + { + "epoch": 43.01, + "learning_rate": 4.117567567567568e-05, + "loss": 0.2066, + "step": 44550 + }, + { + "epoch": 43.01, + "learning_rate": 4.116216216216217e-05, + "loss": 0.1832, + "step": 44560 + }, + { + "epoch": 43.01, + "learning_rate": 4.1148648648648655e-05, + "loss": 0.1527, + "step": 44570 + }, + { + "epoch": 43.01, + "learning_rate": 4.1135135135135136e-05, + "loss": 0.1458, + "step": 44580 + }, + { + "epoch": 43.01, + "learning_rate": 4.1121621621621624e-05, + "loss": 0.1438, + "step": 44590 + }, + { + "epoch": 43.01, + "learning_rate": 4.110810810810811e-05, + "loss": 0.1257, + "step": 44600 + }, + { + "epoch": 43.01, + "learning_rate": 4.10945945945946e-05, + "loss": 0.3531, + "step": 44610 + }, + { + "epoch": 43.01, + "learning_rate": 4.108108108108109e-05, + "loss": 0.3863, + "step": 44620 + }, + { + "epoch": 43.01, + "learning_rate": 4.1067567567567575e-05, + "loss": 0.2936, + "step": 44630 + }, + { + "epoch": 43.01, + "learning_rate": 4.1054054054054056e-05, + "loss": 0.2748, + "step": 44640 + }, + { + "epoch": 43.01, + "learning_rate": 4.1040540540540544e-05, + "loss": 0.3572, + "step": 44650 + }, + { + "epoch": 43.01, + "learning_rate": 4.1027027027027025e-05, + "loss": 0.3151, + "step": 44660 + }, + { + "epoch": 43.01, + "learning_rate": 4.101351351351351e-05, + "loss": 0.1525, + "step": 44670 + }, + { + "epoch": 43.01, + "learning_rate": 4.1e-05, + "loss": 0.206, + "step": 44680 + }, + { + "epoch": 43.01, + "learning_rate": 4.098648648648649e-05, + "loss": 0.2578, + "step": 44690 + }, + { + "epoch": 43.01, + "learning_rate": 4.0972972972972976e-05, + "loss": 0.3185, + "step": 44700 + }, + { + "epoch": 43.01, + "learning_rate": 4.095945945945946e-05, + "loss": 0.246, + "step": 44710 + }, + { + "epoch": 43.01, + "learning_rate": 4.0945945945945945e-05, + "loss": 0.2197, + "step": 44720 + }, + { + "epoch": 43.01, + "learning_rate": 4.093243243243243e-05, + "loss": 0.2433, + "step": 44730 + }, + { + "epoch": 43.01, + "learning_rate": 4.091891891891892e-05, + "loss": 0.194, + "step": 44740 + }, + { + "epoch": 43.01, + "learning_rate": 4.090540540540541e-05, + "loss": 0.1778, + "step": 44750 + }, + { + "epoch": 43.01, + "learning_rate": 4.089189189189189e-05, + "loss": 0.1741, + "step": 44760 + }, + { + "epoch": 43.01, + "learning_rate": 4.087837837837838e-05, + "loss": 0.1135, + "step": 44770 + }, + { + "epoch": 43.01, + "learning_rate": 4.0864864864864865e-05, + "loss": 0.2327, + "step": 44780 + }, + { + "epoch": 43.01, + "learning_rate": 4.085135135135135e-05, + "loss": 0.4914, + "step": 44790 + }, + { + "epoch": 43.01, + "learning_rate": 4.083783783783784e-05, + "loss": 0.2466, + "step": 44800 + }, + { + "epoch": 43.01, + "learning_rate": 4.082432432432433e-05, + "loss": 0.163, + "step": 44810 + }, + { + "epoch": 43.01, + "learning_rate": 4.081081081081081e-05, + "loss": 0.2267, + "step": 44820 + }, + { + "epoch": 43.01, + "learning_rate": 4.07972972972973e-05, + "loss": 0.1973, + "step": 44830 + }, + { + "epoch": 43.01, + "learning_rate": 4.0783783783783785e-05, + "loss": 0.2017, + "step": 44840 + }, + { + "epoch": 43.01, + "learning_rate": 4.077027027027027e-05, + "loss": 0.2717, + "step": 44850 + }, + { + "epoch": 43.01, + "learning_rate": 4.075675675675676e-05, + "loss": 0.3405, + "step": 44860 + }, + { + "epoch": 43.01, + "learning_rate": 4.074324324324325e-05, + "loss": 0.1743, + "step": 44870 + }, + { + "epoch": 43.01, + "learning_rate": 4.072972972972973e-05, + "loss": 0.2227, + "step": 44880 + }, + { + "epoch": 43.01, + "learning_rate": 4.071621621621622e-05, + "loss": 0.2077, + "step": 44890 + }, + { + "epoch": 43.01, + "learning_rate": 4.0702702702702705e-05, + "loss": 0.358, + "step": 44900 + }, + { + "epoch": 43.01, + "learning_rate": 4.068918918918919e-05, + "loss": 0.3254, + "step": 44910 + }, + { + "epoch": 43.01, + "learning_rate": 4.067567567567568e-05, + "loss": 0.2914, + "step": 44920 + }, + { + "epoch": 43.01, + "learning_rate": 4.066216216216216e-05, + "loss": 0.3435, + "step": 44930 + }, + { + "epoch": 43.01, + "learning_rate": 4.064864864864865e-05, + "loss": 0.4235, + "step": 44940 + }, + { + "epoch": 43.01, + "learning_rate": 4.063513513513514e-05, + "loss": 0.3204, + "step": 44950 + }, + { + "epoch": 43.01, + "learning_rate": 4.0621621621621625e-05, + "loss": 0.4168, + "step": 44960 + }, + { + "epoch": 43.01, + "learning_rate": 4.060810810810811e-05, + "loss": 0.3445, + "step": 44970 + }, + { + "epoch": 43.01, + "learning_rate": 4.05945945945946e-05, + "loss": 0.2937, + "step": 44980 + }, + { + "epoch": 43.01, + "learning_rate": 4.058108108108108e-05, + "loss": 0.2895, + "step": 44990 + }, + { + "epoch": 43.01, + "learning_rate": 4.056756756756757e-05, + "loss": 0.2875, + "step": 45000 + }, + { + "epoch": 43.01, + "eval_loss": 0.09440000355243683, + "eval_runtime": 132.6391, + "eval_samples_per_second": 27.202, + "eval_steps_per_second": 3.4, + "eval_wer": 0.08652098961002656, + "step": 45000 + }, + { + "epoch": 43.01, + "learning_rate": 4.055405405405406e-05, + "loss": 0.4197, + "step": 45010 + }, + { + "epoch": 44.0, + "learning_rate": 4.0540540540540545e-05, + "loss": 0.3951, + "step": 45020 + }, + { + "epoch": 44.0, + "learning_rate": 4.052702702702703e-05, + "loss": 0.3543, + "step": 45030 + }, + { + "epoch": 44.0, + "learning_rate": 4.051351351351352e-05, + "loss": 0.4458, + "step": 45040 + }, + { + "epoch": 44.0, + "learning_rate": 4.05e-05, + "loss": 0.3303, + "step": 45050 + }, + { + "epoch": 44.0, + "learning_rate": 4.048648648648648e-05, + "loss": 0.3648, + "step": 45060 + }, + { + "epoch": 44.0, + "learning_rate": 4.047297297297297e-05, + "loss": 0.353, + "step": 45070 + }, + { + "epoch": 44.0, + "learning_rate": 4.045945945945946e-05, + "loss": 0.5643, + "step": 45080 + }, + { + "epoch": 44.0, + "learning_rate": 4.0445945945945946e-05, + "loss": 0.3946, + "step": 45090 + }, + { + "epoch": 44.0, + "learning_rate": 4.0432432432432434e-05, + "loss": 0.3674, + "step": 45100 + }, + { + "epoch": 44.0, + "learning_rate": 4.041891891891892e-05, + "loss": 0.422, + "step": 45110 + }, + { + "epoch": 44.0, + "learning_rate": 4.04054054054054e-05, + "loss": 0.3512, + "step": 45120 + }, + { + "epoch": 44.0, + "learning_rate": 4.039189189189189e-05, + "loss": 0.3553, + "step": 45130 + }, + { + "epoch": 44.0, + "learning_rate": 4.037837837837838e-05, + "loss": 0.2412, + "step": 45140 + }, + { + "epoch": 44.0, + "learning_rate": 4.0364864864864866e-05, + "loss": 0.2252, + "step": 45150 + }, + { + "epoch": 44.0, + "learning_rate": 4.0351351351351354e-05, + "loss": 0.2083, + "step": 45160 + }, + { + "epoch": 44.0, + "learning_rate": 4.0337837837837835e-05, + "loss": 0.2562, + "step": 45170 + }, + { + "epoch": 44.0, + "learning_rate": 4.032432432432432e-05, + "loss": 1.1443, + "step": 45180 + }, + { + "epoch": 44.0, + "learning_rate": 4.031081081081081e-05, + "loss": 1.4649, + "step": 45190 + }, + { + "epoch": 44.0, + "learning_rate": 4.02972972972973e-05, + "loss": 2.5439, + "step": 45200 + }, + { + "epoch": 44.0, + "learning_rate": 4.0283783783783786e-05, + "loss": 2.3745, + "step": 45210 + }, + { + "epoch": 44.0, + "learning_rate": 4.0270270270270274e-05, + "loss": 2.5129, + "step": 45220 + }, + { + "epoch": 44.0, + "learning_rate": 4.0256756756756755e-05, + "loss": 2.0636, + "step": 45230 + }, + { + "epoch": 44.0, + "learning_rate": 4.024324324324324e-05, + "loss": 1.3607, + "step": 45240 + }, + { + "epoch": 44.0, + "learning_rate": 4.022972972972973e-05, + "loss": 1.2888, + "step": 45250 + }, + { + "epoch": 44.0, + "learning_rate": 4.021621621621622e-05, + "loss": 0.4008, + "step": 45260 + }, + { + "epoch": 44.0, + "learning_rate": 4.0202702702702707e-05, + "loss": 0.1347, + "step": 45270 + }, + { + "epoch": 44.0, + "learning_rate": 4.0189189189189194e-05, + "loss": 0.1663, + "step": 45280 + }, + { + "epoch": 44.0, + "learning_rate": 4.0175675675675675e-05, + "loss": 0.1447, + "step": 45290 + }, + { + "epoch": 44.0, + "learning_rate": 4.016216216216216e-05, + "loss": 0.2749, + "step": 45300 + }, + { + "epoch": 44.0, + "learning_rate": 4.014864864864865e-05, + "loss": 0.3467, + "step": 45310 + }, + { + "epoch": 44.0, + "learning_rate": 4.013513513513514e-05, + "loss": 0.2483, + "step": 45320 + }, + { + "epoch": 44.0, + "learning_rate": 4.0121621621621627e-05, + "loss": 0.1631, + "step": 45330 + }, + { + "epoch": 44.0, + "learning_rate": 4.0108108108108114e-05, + "loss": 0.1699, + "step": 45340 + }, + { + "epoch": 44.0, + "learning_rate": 4.0094594594594595e-05, + "loss": 0.1755, + "step": 45350 + }, + { + "epoch": 44.0, + "learning_rate": 4.008108108108108e-05, + "loss": 0.2381, + "step": 45360 + }, + { + "epoch": 44.0, + "learning_rate": 4.006756756756757e-05, + "loss": 0.2325, + "step": 45370 + }, + { + "epoch": 44.0, + "learning_rate": 4.005405405405406e-05, + "loss": 0.1774, + "step": 45380 + }, + { + "epoch": 44.01, + "learning_rate": 4.004054054054055e-05, + "loss": 0.1441, + "step": 45390 + }, + { + "epoch": 44.01, + "learning_rate": 4.002702702702703e-05, + "loss": 0.1001, + "step": 45400 + }, + { + "epoch": 44.01, + "learning_rate": 4.0013513513513515e-05, + "loss": 0.1021, + "step": 45410 + }, + { + "epoch": 44.01, + "learning_rate": 4e-05, + "loss": 0.2263, + "step": 45420 + }, + { + "epoch": 44.01, + "learning_rate": 3.998648648648649e-05, + "loss": 0.1503, + "step": 45430 + }, + { + "epoch": 44.01, + "learning_rate": 3.997297297297298e-05, + "loss": 0.1775, + "step": 45440 + }, + { + "epoch": 44.01, + "learning_rate": 3.995945945945947e-05, + "loss": 0.2493, + "step": 45450 + }, + { + "epoch": 44.01, + "learning_rate": 3.994594594594595e-05, + "loss": 0.2651, + "step": 45460 + }, + { + "epoch": 44.01, + "learning_rate": 3.993243243243243e-05, + "loss": 0.1885, + "step": 45470 + }, + { + "epoch": 44.01, + "learning_rate": 3.9918918918918917e-05, + "loss": 0.2859, + "step": 45480 + }, + { + "epoch": 44.01, + "learning_rate": 3.9905405405405404e-05, + "loss": 0.2491, + "step": 45490 + }, + { + "epoch": 44.01, + "learning_rate": 3.989189189189189e-05, + "loss": 0.3295, + "step": 45500 + }, + { + "epoch": 44.01, + "eval_loss": 0.09721682220697403, + "eval_runtime": 127.7359, + "eval_samples_per_second": 28.246, + "eval_steps_per_second": 3.531, + "eval_wer": 0.08386525648790942, + "step": 45500 + }, + { + "epoch": 44.01, + "learning_rate": 3.987837837837838e-05, + "loss": 0.3309, + "step": 45510 + }, + { + "epoch": 44.01, + "learning_rate": 3.986486486486487e-05, + "loss": 0.1995, + "step": 45520 + }, + { + "epoch": 44.01, + "learning_rate": 3.985135135135135e-05, + "loss": 0.4523, + "step": 45530 + }, + { + "epoch": 44.01, + "learning_rate": 3.983783783783784e-05, + "loss": 0.5104, + "step": 45540 + }, + { + "epoch": 44.01, + "learning_rate": 3.9824324324324324e-05, + "loss": 0.2859, + "step": 45550 + }, + { + "epoch": 44.01, + "learning_rate": 3.981081081081081e-05, + "loss": 0.1025, + "step": 45560 + }, + { + "epoch": 44.01, + "learning_rate": 3.97972972972973e-05, + "loss": 0.202, + "step": 45570 + }, + { + "epoch": 44.01, + "learning_rate": 3.978378378378379e-05, + "loss": 0.1934, + "step": 45580 + }, + { + "epoch": 44.01, + "learning_rate": 3.977027027027027e-05, + "loss": 0.1433, + "step": 45590 + }, + { + "epoch": 44.01, + "learning_rate": 3.975675675675676e-05, + "loss": 0.1385, + "step": 45600 + }, + { + "epoch": 44.01, + "learning_rate": 3.9743243243243244e-05, + "loss": 0.1526, + "step": 45610 + }, + { + "epoch": 44.01, + "learning_rate": 3.972972972972973e-05, + "loss": 0.1363, + "step": 45620 + }, + { + "epoch": 44.01, + "learning_rate": 3.971621621621622e-05, + "loss": 0.3119, + "step": 45630 + }, + { + "epoch": 44.01, + "learning_rate": 3.97027027027027e-05, + "loss": 0.3627, + "step": 45640 + }, + { + "epoch": 44.01, + "learning_rate": 3.968918918918919e-05, + "loss": 0.3268, + "step": 45650 + }, + { + "epoch": 44.01, + "learning_rate": 3.967567567567568e-05, + "loss": 0.1989, + "step": 45660 + }, + { + "epoch": 44.01, + "learning_rate": 3.9662162162162165e-05, + "loss": 0.369, + "step": 45670 + }, + { + "epoch": 44.01, + "learning_rate": 3.964864864864865e-05, + "loss": 0.3889, + "step": 45680 + }, + { + "epoch": 44.01, + "learning_rate": 3.963513513513514e-05, + "loss": 0.1991, + "step": 45690 + }, + { + "epoch": 44.01, + "learning_rate": 3.962162162162162e-05, + "loss": 0.1818, + "step": 45700 + }, + { + "epoch": 44.01, + "learning_rate": 3.960810810810811e-05, + "loss": 0.2263, + "step": 45710 + }, + { + "epoch": 44.01, + "learning_rate": 3.95945945945946e-05, + "loss": 0.281, + "step": 45720 + }, + { + "epoch": 44.01, + "learning_rate": 3.9581081081081085e-05, + "loss": 0.3241, + "step": 45730 + }, + { + "epoch": 44.01, + "learning_rate": 3.956756756756757e-05, + "loss": 0.2423, + "step": 45740 + }, + { + "epoch": 44.01, + "learning_rate": 3.955405405405406e-05, + "loss": 0.2431, + "step": 45750 + }, + { + "epoch": 44.01, + "learning_rate": 3.954054054054054e-05, + "loss": 0.1825, + "step": 45760 + }, + { + "epoch": 44.01, + "learning_rate": 3.952702702702703e-05, + "loss": 0.1922, + "step": 45770 + }, + { + "epoch": 44.01, + "learning_rate": 3.951351351351352e-05, + "loss": 0.2298, + "step": 45780 + }, + { + "epoch": 44.01, + "learning_rate": 3.9500000000000005e-05, + "loss": 0.0919, + "step": 45790 + }, + { + "epoch": 44.01, + "learning_rate": 3.948648648648649e-05, + "loss": 0.2257, + "step": 45800 + }, + { + "epoch": 44.01, + "learning_rate": 3.947297297297298e-05, + "loss": 0.3062, + "step": 45810 + }, + { + "epoch": 44.01, + "learning_rate": 3.945945945945946e-05, + "loss": 0.3576, + "step": 45820 + }, + { + "epoch": 44.01, + "learning_rate": 3.944594594594595e-05, + "loss": 0.1537, + "step": 45830 + }, + { + "epoch": 44.01, + "learning_rate": 3.943243243243244e-05, + "loss": 0.1631, + "step": 45840 + }, + { + "epoch": 44.01, + "learning_rate": 3.9418918918918925e-05, + "loss": 0.2358, + "step": 45850 + }, + { + "epoch": 44.01, + "learning_rate": 3.940540540540541e-05, + "loss": 0.2071, + "step": 45860 + }, + { + "epoch": 44.01, + "learning_rate": 3.9391891891891894e-05, + "loss": 0.2361, + "step": 45870 + }, + { + "epoch": 44.01, + "learning_rate": 3.9378378378378375e-05, + "loss": 0.2978, + "step": 45880 + }, + { + "epoch": 44.01, + "learning_rate": 3.936486486486486e-05, + "loss": 0.1769, + "step": 45890 + }, + { + "epoch": 44.01, + "learning_rate": 3.935135135135135e-05, + "loss": 0.1973, + "step": 45900 + }, + { + "epoch": 44.01, + "learning_rate": 3.933783783783784e-05, + "loss": 0.2161, + "step": 45910 + }, + { + "epoch": 44.01, + "learning_rate": 3.9324324324324326e-05, + "loss": 0.3595, + "step": 45920 + }, + { + "epoch": 44.01, + "learning_rate": 3.9310810810810814e-05, + "loss": 0.2697, + "step": 45930 + }, + { + "epoch": 44.01, + "learning_rate": 3.9297297297297295e-05, + "loss": 0.371, + "step": 45940 + }, + { + "epoch": 44.01, + "learning_rate": 3.928378378378378e-05, + "loss": 0.259, + "step": 45950 + }, + { + "epoch": 44.01, + "learning_rate": 3.927027027027027e-05, + "loss": 0.5754, + "step": 45960 + }, + { + "epoch": 44.01, + "learning_rate": 3.925675675675676e-05, + "loss": 0.3042, + "step": 45970 + }, + { + "epoch": 44.01, + "learning_rate": 3.9243243243243246e-05, + "loss": 0.4424, + "step": 45980 + }, + { + "epoch": 44.01, + "learning_rate": 3.9229729729729734e-05, + "loss": 0.3648, + "step": 45990 + }, + { + "epoch": 44.01, + "learning_rate": 3.9216216216216215e-05, + "loss": 0.3715, + "step": 46000 + }, + { + "epoch": 44.01, + "eval_loss": 0.089134082198143, + "eval_runtime": 128.0512, + "eval_samples_per_second": 28.176, + "eval_steps_per_second": 3.522, + "eval_wer": 0.08325956296883008, + "step": 46000 + }, + { + "epoch": 44.01, + "learning_rate": 3.92027027027027e-05, + "loss": 0.308, + "step": 46010 + }, + { + "epoch": 44.01, + "learning_rate": 3.918918918918919e-05, + "loss": 0.3302, + "step": 46020 + }, + { + "epoch": 44.01, + "learning_rate": 3.917567567567568e-05, + "loss": 0.3732, + "step": 46030 + }, + { + "epoch": 45.0, + "learning_rate": 3.9162162162162166e-05, + "loss": 0.3696, + "step": 46040 + }, + { + "epoch": 45.0, + "learning_rate": 3.914864864864865e-05, + "loss": 0.3865, + "step": 46050 + }, + { + "epoch": 45.0, + "learning_rate": 3.9135135135135135e-05, + "loss": 0.4097, + "step": 46060 + }, + { + "epoch": 45.0, + "learning_rate": 3.912162162162162e-05, + "loss": 0.357, + "step": 46070 + }, + { + "epoch": 45.0, + "learning_rate": 3.910810810810811e-05, + "loss": 0.3259, + "step": 46080 + }, + { + "epoch": 45.0, + "learning_rate": 3.90945945945946e-05, + "loss": 0.3619, + "step": 46090 + }, + { + "epoch": 45.0, + "learning_rate": 3.9081081081081086e-05, + "loss": 0.5642, + "step": 46100 + }, + { + "epoch": 45.0, + "learning_rate": 3.906756756756757e-05, + "loss": 0.3747, + "step": 46110 + }, + { + "epoch": 45.0, + "learning_rate": 3.9054054054054055e-05, + "loss": 0.3525, + "step": 46120 + }, + { + "epoch": 45.0, + "learning_rate": 3.904054054054054e-05, + "loss": 0.4092, + "step": 46130 + }, + { + "epoch": 45.0, + "learning_rate": 3.902702702702703e-05, + "loss": 0.3947, + "step": 46140 + }, + { + "epoch": 45.0, + "learning_rate": 3.901351351351352e-05, + "loss": 0.3678, + "step": 46150 + }, + { + "epoch": 45.0, + "learning_rate": 3.9000000000000006e-05, + "loss": 0.243, + "step": 46160 + }, + { + "epoch": 45.0, + "learning_rate": 3.898648648648649e-05, + "loss": 0.2171, + "step": 46170 + }, + { + "epoch": 45.0, + "learning_rate": 3.8972972972972975e-05, + "loss": 0.2256, + "step": 46180 + }, + { + "epoch": 45.0, + "learning_rate": 3.895945945945946e-05, + "loss": 0.2338, + "step": 46190 + }, + { + "epoch": 45.0, + "learning_rate": 3.894594594594595e-05, + "loss": 0.8821, + "step": 46200 + }, + { + "epoch": 45.0, + "learning_rate": 3.893243243243244e-05, + "loss": 0.9021, + "step": 46210 + }, + { + "epoch": 45.0, + "learning_rate": 3.8918918918918926e-05, + "loss": 2.5876, + "step": 46220 + }, + { + "epoch": 45.0, + "learning_rate": 3.890540540540541e-05, + "loss": 2.3508, + "step": 46230 + }, + { + "epoch": 45.0, + "learning_rate": 3.8891891891891895e-05, + "loss": 2.533, + "step": 46240 + }, + { + "epoch": 45.0, + "learning_rate": 3.887837837837838e-05, + "loss": 2.5077, + "step": 46250 + }, + { + "epoch": 45.0, + "learning_rate": 3.886486486486487e-05, + "loss": 1.1271, + "step": 46260 + }, + { + "epoch": 45.0, + "learning_rate": 3.885135135135135e-05, + "loss": 1.442, + "step": 46270 + }, + { + "epoch": 45.0, + "learning_rate": 3.883783783783784e-05, + "loss": 0.6055, + "step": 46280 + }, + { + "epoch": 45.0, + "learning_rate": 3.882432432432432e-05, + "loss": 0.2262, + "step": 46290 + }, + { + "epoch": 45.0, + "learning_rate": 3.881081081081081e-05, + "loss": 0.1464, + "step": 46300 + }, + { + "epoch": 45.0, + "learning_rate": 3.8797297297297296e-05, + "loss": 0.1678, + "step": 46310 + }, + { + "epoch": 45.0, + "learning_rate": 3.8783783783783784e-05, + "loss": 0.2585, + "step": 46320 + }, + { + "epoch": 45.0, + "learning_rate": 3.877027027027027e-05, + "loss": 0.2762, + "step": 46330 + }, + { + "epoch": 45.0, + "learning_rate": 3.875675675675676e-05, + "loss": 0.3225, + "step": 46340 + }, + { + "epoch": 45.0, + "learning_rate": 3.874324324324324e-05, + "loss": 0.1766, + "step": 46350 + }, + { + "epoch": 45.0, + "learning_rate": 3.872972972972973e-05, + "loss": 0.1287, + "step": 46360 + }, + { + "epoch": 45.0, + "learning_rate": 3.8716216216216216e-05, + "loss": 0.2403, + "step": 46370 + }, + { + "epoch": 45.0, + "learning_rate": 3.8702702702702704e-05, + "loss": 0.1981, + "step": 46380 + }, + { + "epoch": 45.0, + "learning_rate": 3.868918918918919e-05, + "loss": 0.2417, + "step": 46390 + }, + { + "epoch": 45.0, + "learning_rate": 3.867567567567568e-05, + "loss": 0.212, + "step": 46400 + }, + { + "epoch": 45.01, + "learning_rate": 3.866216216216216e-05, + "loss": 0.1858, + "step": 46410 + }, + { + "epoch": 45.01, + "learning_rate": 3.864864864864865e-05, + "loss": 0.1219, + "step": 46420 + }, + { + "epoch": 45.01, + "learning_rate": 3.8635135135135136e-05, + "loss": 0.1173, + "step": 46430 + }, + { + "epoch": 45.01, + "learning_rate": 3.8621621621621624e-05, + "loss": 0.1728, + "step": 46440 + }, + { + "epoch": 45.01, + "learning_rate": 3.860810810810811e-05, + "loss": 0.1882, + "step": 46450 + }, + { + "epoch": 45.01, + "learning_rate": 3.85945945945946e-05, + "loss": 0.1219, + "step": 46460 + }, + { + "epoch": 45.01, + "learning_rate": 3.858108108108108e-05, + "loss": 0.2, + "step": 46470 + }, + { + "epoch": 45.01, + "learning_rate": 3.856756756756757e-05, + "loss": 0.2736, + "step": 46480 + }, + { + "epoch": 45.01, + "learning_rate": 3.8554054054054056e-05, + "loss": 0.1744, + "step": 46490 + }, + { + "epoch": 45.01, + "learning_rate": 3.8540540540540544e-05, + "loss": 0.2301, + "step": 46500 + }, + { + "epoch": 45.01, + "eval_loss": 0.09711813181638718, + "eval_runtime": 144.3674, + "eval_samples_per_second": 24.992, + "eval_steps_per_second": 3.124, + "eval_wer": 0.08619484694590691, + "step": 46500 + }, + { + "epoch": 45.01, + "learning_rate": 3.852702702702703e-05, + "loss": 0.2794, + "step": 46510 + }, + { + "epoch": 45.01, + "learning_rate": 3.851351351351351e-05, + "loss": 0.3053, + "step": 46520 + }, + { + "epoch": 45.01, + "learning_rate": 3.85e-05, + "loss": 0.2952, + "step": 46530 + }, + { + "epoch": 45.01, + "learning_rate": 3.848648648648649e-05, + "loss": 0.2074, + "step": 46540 + }, + { + "epoch": 45.01, + "learning_rate": 3.8472972972972976e-05, + "loss": 0.3224, + "step": 46550 + }, + { + "epoch": 45.01, + "learning_rate": 3.8459459459459464e-05, + "loss": 0.5013, + "step": 46560 + }, + { + "epoch": 45.01, + "learning_rate": 3.844594594594595e-05, + "loss": 0.3831, + "step": 46570 + }, + { + "epoch": 45.01, + "learning_rate": 3.843243243243243e-05, + "loss": 0.1292, + "step": 46580 + }, + { + "epoch": 45.01, + "learning_rate": 3.841891891891892e-05, + "loss": 0.2393, + "step": 46590 + }, + { + "epoch": 45.01, + "learning_rate": 3.840540540540541e-05, + "loss": 0.1689, + "step": 46600 + }, + { + "epoch": 45.01, + "learning_rate": 3.8391891891891896e-05, + "loss": 0.1684, + "step": 46610 + }, + { + "epoch": 45.01, + "learning_rate": 3.8378378378378384e-05, + "loss": 0.1294, + "step": 46620 + }, + { + "epoch": 45.01, + "learning_rate": 3.836486486486487e-05, + "loss": 0.1157, + "step": 46630 + }, + { + "epoch": 45.01, + "learning_rate": 3.835135135135135e-05, + "loss": 0.1538, + "step": 46640 + }, + { + "epoch": 45.01, + "learning_rate": 3.833783783783784e-05, + "loss": 0.1995, + "step": 46650 + }, + { + "epoch": 45.01, + "learning_rate": 3.832432432432433e-05, + "loss": 0.4104, + "step": 46660 + }, + { + "epoch": 45.01, + "learning_rate": 3.831081081081081e-05, + "loss": 0.3252, + "step": 46670 + }, + { + "epoch": 45.01, + "learning_rate": 3.82972972972973e-05, + "loss": 0.2181, + "step": 46680 + }, + { + "epoch": 45.01, + "learning_rate": 3.8283783783783785e-05, + "loss": 0.2833, + "step": 46690 + }, + { + "epoch": 45.01, + "learning_rate": 3.827027027027027e-05, + "loss": 0.3926, + "step": 46700 + }, + { + "epoch": 45.01, + "learning_rate": 3.8256756756756754e-05, + "loss": 0.1901, + "step": 46710 + }, + { + "epoch": 45.01, + "learning_rate": 3.824324324324324e-05, + "loss": 0.1504, + "step": 46720 + }, + { + "epoch": 45.01, + "learning_rate": 3.822972972972973e-05, + "loss": 0.2557, + "step": 46730 + }, + { + "epoch": 45.01, + "learning_rate": 3.821621621621622e-05, + "loss": 0.3076, + "step": 46740 + }, + { + "epoch": 45.01, + "learning_rate": 3.8202702702702705e-05, + "loss": 0.3166, + "step": 46750 + }, + { + "epoch": 45.01, + "learning_rate": 3.8189189189189186e-05, + "loss": 0.2327, + "step": 46760 + }, + { + "epoch": 45.01, + "learning_rate": 3.8175675675675674e-05, + "loss": 0.1855, + "step": 46770 + }, + { + "epoch": 45.01, + "learning_rate": 3.816216216216216e-05, + "loss": 0.2292, + "step": 46780 + }, + { + "epoch": 45.01, + "learning_rate": 3.814864864864865e-05, + "loss": 0.2079, + "step": 46790 + }, + { + "epoch": 45.01, + "learning_rate": 3.813513513513514e-05, + "loss": 0.2658, + "step": 46800 + }, + { + "epoch": 45.01, + "learning_rate": 3.8121621621621625e-05, + "loss": 0.1162, + "step": 46810 + }, + { + "epoch": 45.01, + "learning_rate": 3.8108108108108106e-05, + "loss": 0.1482, + "step": 46820 + }, + { + "epoch": 45.01, + "learning_rate": 3.809594594594595e-05, + "loss": 0.2635, + "step": 46830 + }, + { + "epoch": 45.01, + "learning_rate": 3.808243243243244e-05, + "loss": 0.503, + "step": 46840 + }, + { + "epoch": 45.01, + "learning_rate": 3.806891891891892e-05, + "loss": 0.1289, + "step": 46850 + }, + { + "epoch": 45.01, + "learning_rate": 3.805540540540541e-05, + "loss": 0.17, + "step": 46860 + }, + { + "epoch": 45.01, + "learning_rate": 3.8041891891891895e-05, + "loss": 0.2214, + "step": 46870 + }, + { + "epoch": 45.01, + "learning_rate": 3.802837837837838e-05, + "loss": 0.2447, + "step": 46880 + }, + { + "epoch": 45.01, + "learning_rate": 3.801486486486487e-05, + "loss": 0.2374, + "step": 46890 + }, + { + "epoch": 45.01, + "learning_rate": 3.800135135135136e-05, + "loss": 0.293, + "step": 46900 + }, + { + "epoch": 45.01, + "learning_rate": 3.798783783783784e-05, + "loss": 0.2591, + "step": 46910 + }, + { + "epoch": 45.01, + "learning_rate": 3.797432432432433e-05, + "loss": 0.1812, + "step": 46920 + }, + { + "epoch": 45.01, + "learning_rate": 3.7960810810810815e-05, + "loss": 0.217, + "step": 46930 + }, + { + "epoch": 45.01, + "learning_rate": 3.79472972972973e-05, + "loss": 0.2868, + "step": 46940 + }, + { + "epoch": 45.01, + "learning_rate": 3.7933783783783784e-05, + "loss": 0.3347, + "step": 46950 + }, + { + "epoch": 45.01, + "learning_rate": 3.792027027027027e-05, + "loss": 0.3876, + "step": 46960 + }, + { + "epoch": 45.01, + "learning_rate": 3.790675675675676e-05, + "loss": 0.2931, + "step": 46970 + }, + { + "epoch": 45.01, + "learning_rate": 3.789324324324324e-05, + "loss": 0.5081, + "step": 46980 + }, + { + "epoch": 45.01, + "learning_rate": 3.787972972972973e-05, + "loss": 0.3756, + "step": 46990 + }, + { + "epoch": 45.01, + "learning_rate": 3.7866216216216216e-05, + "loss": 0.4165, + "step": 47000 + }, + { + "epoch": 45.01, + "eval_loss": 0.08795155584812164, + "eval_runtime": 128.4046, + "eval_samples_per_second": 28.099, + "eval_steps_per_second": 3.512, + "eval_wer": 0.08260727764059078, + "step": 47000 + }, + { + "epoch": 45.01, + "learning_rate": 3.7852702702702704e-05, + "loss": 0.4541, + "step": 47010 + }, + { + "epoch": 45.01, + "learning_rate": 3.783918918918919e-05, + "loss": 0.31, + "step": 47020 + }, + { + "epoch": 45.01, + "learning_rate": 3.782567567567568e-05, + "loss": 0.3087, + "step": 47030 + }, + { + "epoch": 45.01, + "learning_rate": 3.781216216216216e-05, + "loss": 0.2767, + "step": 47040 + }, + { + "epoch": 45.01, + "learning_rate": 3.779864864864865e-05, + "loss": 0.324, + "step": 47050 + }, + { + "epoch": 46.0, + "learning_rate": 3.7785135135135136e-05, + "loss": 0.4754, + "step": 47060 + }, + { + "epoch": 46.0, + "learning_rate": 3.7771621621621624e-05, + "loss": 0.3796, + "step": 47070 + }, + { + "epoch": 46.0, + "learning_rate": 3.775810810810811e-05, + "loss": 0.3982, + "step": 47080 + }, + { + "epoch": 46.0, + "learning_rate": 3.774459459459459e-05, + "loss": 0.4084, + "step": 47090 + }, + { + "epoch": 46.0, + "learning_rate": 3.773108108108108e-05, + "loss": 0.3349, + "step": 47100 + }, + { + "epoch": 46.0, + "learning_rate": 3.771756756756757e-05, + "loss": 0.3662, + "step": 47110 + }, + { + "epoch": 46.0, + "learning_rate": 3.7704054054054056e-05, + "loss": 0.427, + "step": 47120 + }, + { + "epoch": 46.0, + "learning_rate": 3.7690540540540544e-05, + "loss": 0.4521, + "step": 47130 + }, + { + "epoch": 46.0, + "learning_rate": 3.767702702702703e-05, + "loss": 0.3436, + "step": 47140 + }, + { + "epoch": 46.0, + "learning_rate": 3.766351351351351e-05, + "loss": 0.4284, + "step": 47150 + }, + { + "epoch": 46.0, + "learning_rate": 3.765e-05, + "loss": 0.391, + "step": 47160 + }, + { + "epoch": 46.0, + "learning_rate": 3.763648648648649e-05, + "loss": 0.3624, + "step": 47170 + }, + { + "epoch": 46.0, + "learning_rate": 3.7622972972972976e-05, + "loss": 0.3379, + "step": 47180 + }, + { + "epoch": 46.0, + "learning_rate": 3.7609459459459464e-05, + "loss": 0.2458, + "step": 47190 + }, + { + "epoch": 46.0, + "learning_rate": 3.759594594594595e-05, + "loss": 0.2313, + "step": 47200 + }, + { + "epoch": 46.0, + "learning_rate": 3.758243243243243e-05, + "loss": 0.2575, + "step": 47210 + }, + { + "epoch": 46.0, + "learning_rate": 3.756891891891892e-05, + "loss": 0.6112, + "step": 47220 + }, + { + "epoch": 46.0, + "learning_rate": 3.755540540540541e-05, + "loss": 0.821, + "step": 47230 + }, + { + "epoch": 46.0, + "learning_rate": 3.7541891891891896e-05, + "loss": 2.2442, + "step": 47240 + }, + { + "epoch": 46.0, + "learning_rate": 3.7528378378378384e-05, + "loss": 2.5167, + "step": 47250 + }, + { + "epoch": 46.0, + "learning_rate": 3.7514864864864865e-05, + "loss": 2.4079, + "step": 47260 + }, + { + "epoch": 46.0, + "learning_rate": 3.750135135135135e-05, + "loss": 2.5069, + "step": 47270 + }, + { + "epoch": 46.0, + "learning_rate": 3.748783783783784e-05, + "loss": 1.6121, + "step": 47280 + }, + { + "epoch": 46.0, + "learning_rate": 3.747432432432433e-05, + "loss": 1.4228, + "step": 47290 + }, + { + "epoch": 46.0, + "learning_rate": 3.7460810810810816e-05, + "loss": 0.8605, + "step": 47300 + }, + { + "epoch": 46.0, + "learning_rate": 3.7447297297297304e-05, + "loss": 0.3082, + "step": 47310 + }, + { + "epoch": 46.0, + "learning_rate": 3.7433783783783785e-05, + "loss": 0.1124, + "step": 47320 + }, + { + "epoch": 46.0, + "learning_rate": 3.742027027027027e-05, + "loss": 0.18, + "step": 47330 + }, + { + "epoch": 46.0, + "learning_rate": 3.740675675675676e-05, + "loss": 0.2075, + "step": 47340 + }, + { + "epoch": 46.0, + "learning_rate": 3.739324324324325e-05, + "loss": 0.219, + "step": 47350 + }, + { + "epoch": 46.0, + "learning_rate": 3.737972972972973e-05, + "loss": 0.3659, + "step": 47360 + }, + { + "epoch": 46.0, + "learning_rate": 3.736621621621622e-05, + "loss": 0.2046, + "step": 47370 + }, + { + "epoch": 46.0, + "learning_rate": 3.7352702702702705e-05, + "loss": 0.0989, + "step": 47380 + }, + { + "epoch": 46.0, + "learning_rate": 3.7339189189189186e-05, + "loss": 0.2178, + "step": 47390 + }, + { + "epoch": 46.0, + "learning_rate": 3.7325675675675674e-05, + "loss": 0.1496, + "step": 47400 + }, + { + "epoch": 46.0, + "learning_rate": 3.731216216216216e-05, + "loss": 0.2311, + "step": 47410 + }, + { + "epoch": 46.0, + "learning_rate": 3.729864864864865e-05, + "loss": 0.1724, + "step": 47420 + }, + { + "epoch": 46.0, + "learning_rate": 3.728513513513514e-05, + "loss": 0.1766, + "step": 47430 + }, + { + "epoch": 46.01, + "learning_rate": 3.7271621621621625e-05, + "loss": 0.1405, + "step": 47440 + }, + { + "epoch": 46.01, + "learning_rate": 3.7258108108108106e-05, + "loss": 0.0983, + "step": 47450 + }, + { + "epoch": 46.01, + "learning_rate": 3.7244594594594594e-05, + "loss": 0.139, + "step": 47460 + }, + { + "epoch": 46.01, + "learning_rate": 3.723108108108108e-05, + "loss": 0.1532, + "step": 47470 + }, + { + "epoch": 46.01, + "learning_rate": 3.721756756756757e-05, + "loss": 0.0983, + "step": 47480 + }, + { + "epoch": 46.01, + "learning_rate": 3.720405405405406e-05, + "loss": 0.206, + "step": 47490 + }, + { + "epoch": 46.01, + "learning_rate": 3.719054054054054e-05, + "loss": 0.2719, + "step": 47500 + }, + { + "epoch": 46.01, + "eval_loss": 0.1005823090672493, + "eval_runtime": 129.6959, + "eval_samples_per_second": 27.819, + "eval_steps_per_second": 3.477, + "eval_wer": 0.08437776638866887, + "step": 47500 + }, + { + "epoch": 46.01, + "learning_rate": 3.7177027027027026e-05, + "loss": 0.227, + "step": 47510 + }, + { + "epoch": 46.01, + "learning_rate": 3.7163513513513514e-05, + "loss": 0.1928, + "step": 47520 + }, + { + "epoch": 46.01, + "learning_rate": 3.715e-05, + "loss": 0.2971, + "step": 47530 + }, + { + "epoch": 46.01, + "learning_rate": 3.713648648648649e-05, + "loss": 0.2347, + "step": 47540 + }, + { + "epoch": 46.01, + "learning_rate": 3.712297297297298e-05, + "loss": 0.3108, + "step": 47550 + }, + { + "epoch": 46.01, + "learning_rate": 3.710945945945946e-05, + "loss": 0.2274, + "step": 47560 + }, + { + "epoch": 46.01, + "learning_rate": 3.7095945945945946e-05, + "loss": 0.239, + "step": 47570 + }, + { + "epoch": 46.01, + "learning_rate": 3.7082432432432434e-05, + "loss": 0.5165, + "step": 47580 + }, + { + "epoch": 46.01, + "learning_rate": 3.706891891891892e-05, + "loss": 0.4152, + "step": 47590 + }, + { + "epoch": 46.01, + "learning_rate": 3.705540540540541e-05, + "loss": 0.167, + "step": 47600 + }, + { + "epoch": 46.01, + "learning_rate": 3.70418918918919e-05, + "loss": 0.1419, + "step": 47610 + }, + { + "epoch": 46.01, + "learning_rate": 3.702837837837838e-05, + "loss": 0.204, + "step": 47620 + }, + { + "epoch": 46.01, + "learning_rate": 3.7014864864864866e-05, + "loss": 0.1832, + "step": 47630 + }, + { + "epoch": 46.01, + "learning_rate": 3.7001351351351354e-05, + "loss": 0.1797, + "step": 47640 + }, + { + "epoch": 46.01, + "learning_rate": 3.698783783783784e-05, + "loss": 0.1246, + "step": 47650 + }, + { + "epoch": 46.01, + "learning_rate": 3.697432432432433e-05, + "loss": 0.1185, + "step": 47660 + }, + { + "epoch": 46.01, + "learning_rate": 3.696081081081082e-05, + "loss": 0.1418, + "step": 47670 + }, + { + "epoch": 46.01, + "learning_rate": 3.69472972972973e-05, + "loss": 0.3633, + "step": 47680 + }, + { + "epoch": 46.01, + "learning_rate": 3.6933783783783786e-05, + "loss": 0.3734, + "step": 47690 + }, + { + "epoch": 46.01, + "learning_rate": 3.6920270270270274e-05, + "loss": 0.2258, + "step": 47700 + }, + { + "epoch": 46.01, + "learning_rate": 3.690675675675676e-05, + "loss": 0.2207, + "step": 47710 + }, + { + "epoch": 46.01, + "learning_rate": 3.689324324324325e-05, + "loss": 0.367, + "step": 47720 + }, + { + "epoch": 46.01, + "learning_rate": 3.687972972972973e-05, + "loss": 0.2815, + "step": 47730 + }, + { + "epoch": 46.01, + "learning_rate": 3.686621621621622e-05, + "loss": 0.1588, + "step": 47740 + }, + { + "epoch": 46.01, + "learning_rate": 3.6852702702702706e-05, + "loss": 0.1939, + "step": 47750 + }, + { + "epoch": 46.01, + "learning_rate": 3.683918918918919e-05, + "loss": 0.2616, + "step": 47760 + }, + { + "epoch": 46.01, + "learning_rate": 3.6825675675675675e-05, + "loss": 0.3356, + "step": 47770 + }, + { + "epoch": 46.01, + "learning_rate": 3.681216216216216e-05, + "loss": 0.2211, + "step": 47780 + }, + { + "epoch": 46.01, + "learning_rate": 3.679864864864865e-05, + "loss": 0.1888, + "step": 47790 + }, + { + "epoch": 46.01, + "learning_rate": 3.678513513513513e-05, + "loss": 0.2165, + "step": 47800 + }, + { + "epoch": 46.01, + "learning_rate": 3.677162162162162e-05, + "loss": 0.1771, + "step": 47810 + }, + { + "epoch": 46.01, + "learning_rate": 3.675810810810811e-05, + "loss": 0.172, + "step": 47820 + }, + { + "epoch": 46.01, + "learning_rate": 3.6744594594594595e-05, + "loss": 0.1858, + "step": 47830 + }, + { + "epoch": 46.01, + "learning_rate": 3.673108108108108e-05, + "loss": 0.106, + "step": 47840 + }, + { + "epoch": 46.01, + "learning_rate": 3.671756756756757e-05, + "loss": 0.2276, + "step": 47850 + }, + { + "epoch": 46.01, + "learning_rate": 3.670405405405405e-05, + "loss": 0.5311, + "step": 47860 + }, + { + "epoch": 46.01, + "learning_rate": 3.669054054054054e-05, + "loss": 0.1809, + "step": 47870 + }, + { + "epoch": 46.01, + "learning_rate": 3.667702702702703e-05, + "loss": 0.1418, + "step": 47880 + }, + { + "epoch": 46.01, + "learning_rate": 3.6663513513513515e-05, + "loss": 0.1978, + "step": 47890 + }, + { + "epoch": 46.01, + "learning_rate": 3.665e-05, + "loss": 0.1816, + "step": 47900 + }, + { + "epoch": 46.01, + "learning_rate": 3.663648648648649e-05, + "loss": 0.1914, + "step": 47910 + }, + { + "epoch": 46.01, + "learning_rate": 3.662297297297297e-05, + "loss": 0.2816, + "step": 47920 + }, + { + "epoch": 46.01, + "learning_rate": 3.660945945945946e-05, + "loss": 0.2979, + "step": 47930 + }, + { + "epoch": 46.01, + "learning_rate": 3.659594594594595e-05, + "loss": 0.1591, + "step": 47940 + }, + { + "epoch": 46.01, + "learning_rate": 3.6582432432432435e-05, + "loss": 0.2642, + "step": 47950 + }, + { + "epoch": 46.01, + "learning_rate": 3.656891891891892e-05, + "loss": 0.2017, + "step": 47960 + }, + { + "epoch": 46.01, + "learning_rate": 3.6555405405405404e-05, + "loss": 0.3524, + "step": 47970 + }, + { + "epoch": 46.01, + "learning_rate": 3.654189189189189e-05, + "loss": 0.387, + "step": 47980 + }, + { + "epoch": 46.01, + "learning_rate": 3.652837837837838e-05, + "loss": 0.2673, + "step": 47990 + }, + { + "epoch": 46.01, + "learning_rate": 3.651486486486487e-05, + "loss": 0.3737, + "step": 48000 + }, + { + "epoch": 46.01, + "eval_loss": 0.09164793789386749, + "eval_runtime": 128.1299, + "eval_samples_per_second": 28.159, + "eval_steps_per_second": 3.52, + "eval_wer": 0.08120952336579229, + "step": 48000 + }, + { + "epoch": 46.01, + "learning_rate": 3.6501351351351355e-05, + "loss": 0.3706, + "step": 48010 + }, + { + "epoch": 46.01, + "learning_rate": 3.648783783783784e-05, + "loss": 0.3264, + "step": 48020 + }, + { + "epoch": 46.01, + "learning_rate": 3.6474324324324324e-05, + "loss": 0.4092, + "step": 48030 + }, + { + "epoch": 46.01, + "learning_rate": 3.646081081081081e-05, + "loss": 0.3574, + "step": 48040 + }, + { + "epoch": 46.01, + "learning_rate": 3.64472972972973e-05, + "loss": 0.3271, + "step": 48050 + }, + { + "epoch": 46.01, + "learning_rate": 3.643378378378379e-05, + "loss": 0.298, + "step": 48060 + }, + { + "epoch": 46.01, + "learning_rate": 3.6420270270270276e-05, + "loss": 0.3063, + "step": 48070 + }, + { + "epoch": 46.01, + "learning_rate": 3.640675675675676e-05, + "loss": 0.4557, + "step": 48080 + }, + { + "epoch": 47.0, + "learning_rate": 3.6393243243243244e-05, + "loss": 0.3721, + "step": 48090 + }, + { + "epoch": 47.0, + "learning_rate": 3.637972972972973e-05, + "loss": 0.3934, + "step": 48100 + }, + { + "epoch": 47.0, + "learning_rate": 3.636621621621622e-05, + "loss": 0.4283, + "step": 48110 + }, + { + "epoch": 47.0, + "learning_rate": 3.635270270270271e-05, + "loss": 0.3125, + "step": 48120 + }, + { + "epoch": 47.0, + "learning_rate": 3.6339189189189196e-05, + "loss": 0.3716, + "step": 48130 + }, + { + "epoch": 47.0, + "learning_rate": 3.632567567567568e-05, + "loss": 0.3586, + "step": 48140 + }, + { + "epoch": 47.0, + "learning_rate": 3.6312162162162164e-05, + "loss": 0.5219, + "step": 48150 + }, + { + "epoch": 47.0, + "learning_rate": 3.6298648648648645e-05, + "loss": 0.35, + "step": 48160 + }, + { + "epoch": 47.0, + "learning_rate": 3.628513513513513e-05, + "loss": 0.3801, + "step": 48170 + }, + { + "epoch": 47.0, + "learning_rate": 3.627162162162162e-05, + "loss": 0.3749, + "step": 48180 + }, + { + "epoch": 47.0, + "learning_rate": 3.625810810810811e-05, + "loss": 0.3563, + "step": 48190 + }, + { + "epoch": 47.0, + "learning_rate": 3.62445945945946e-05, + "loss": 0.3491, + "step": 48200 + }, + { + "epoch": 47.0, + "learning_rate": 3.623108108108108e-05, + "loss": 0.2518, + "step": 48210 + }, + { + "epoch": 47.0, + "learning_rate": 3.6217567567567566e-05, + "loss": 0.2162, + "step": 48220 + }, + { + "epoch": 47.0, + "learning_rate": 3.620405405405405e-05, + "loss": 0.2421, + "step": 48230 + }, + { + "epoch": 47.0, + "learning_rate": 3.619054054054054e-05, + "loss": 0.2783, + "step": 48240 + }, + { + "epoch": 47.0, + "learning_rate": 3.617702702702703e-05, + "loss": 1.0657, + "step": 48250 + }, + { + "epoch": 47.0, + "learning_rate": 3.616351351351352e-05, + "loss": 1.5973, + "step": 48260 + }, + { + "epoch": 47.0, + "learning_rate": 3.615e-05, + "loss": 2.5262, + "step": 48270 + }, + { + "epoch": 47.0, + "learning_rate": 3.6136486486486486e-05, + "loss": 2.3457, + "step": 48280 + }, + { + "epoch": 47.0, + "learning_rate": 3.6122972972972973e-05, + "loss": 2.4966, + "step": 48290 + }, + { + "epoch": 47.0, + "learning_rate": 3.610945945945946e-05, + "loss": 2.0486, + "step": 48300 + }, + { + "epoch": 47.0, + "learning_rate": 3.609594594594595e-05, + "loss": 1.3731, + "step": 48310 + }, + { + "epoch": 47.0, + "learning_rate": 3.608243243243244e-05, + "loss": 1.1086, + "step": 48320 + }, + { + "epoch": 47.0, + "learning_rate": 3.606891891891892e-05, + "loss": 0.3956, + "step": 48330 + }, + { + "epoch": 47.0, + "learning_rate": 3.6055405405405406e-05, + "loss": 0.1156, + "step": 48340 + }, + { + "epoch": 47.0, + "learning_rate": 3.6041891891891893e-05, + "loss": 0.2278, + "step": 48350 + }, + { + "epoch": 47.0, + "learning_rate": 3.602837837837838e-05, + "loss": 0.1407, + "step": 48360 + }, + { + "epoch": 47.0, + "learning_rate": 3.601486486486487e-05, + "loss": 0.2438, + "step": 48370 + }, + { + "epoch": 47.0, + "learning_rate": 3.600135135135135e-05, + "loss": 0.3965, + "step": 48380 + }, + { + "epoch": 47.0, + "learning_rate": 3.598783783783784e-05, + "loss": 0.2354, + "step": 48390 + }, + { + "epoch": 47.0, + "learning_rate": 3.597567567567568e-05, + "loss": 0.1362, + "step": 48400 + }, + { + "epoch": 47.0, + "learning_rate": 3.596216216216217e-05, + "loss": 0.1684, + "step": 48410 + }, + { + "epoch": 47.0, + "learning_rate": 3.594864864864865e-05, + "loss": 0.2044, + "step": 48420 + }, + { + "epoch": 47.0, + "learning_rate": 3.593513513513514e-05, + "loss": 0.2043, + "step": 48430 + }, + { + "epoch": 47.0, + "learning_rate": 3.592162162162162e-05, + "loss": 0.2055, + "step": 48440 + }, + { + "epoch": 47.0, + "learning_rate": 3.590810810810811e-05, + "loss": 0.1579, + "step": 48450 + }, + { + "epoch": 47.01, + "learning_rate": 3.5894594594594595e-05, + "loss": 0.128, + "step": 48460 + }, + { + "epoch": 47.01, + "learning_rate": 3.588108108108108e-05, + "loss": 0.0987, + "step": 48470 + }, + { + "epoch": 47.01, + "learning_rate": 3.5867567567567564e-05, + "loss": 0.1193, + "step": 48480 + }, + { + "epoch": 47.01, + "learning_rate": 3.585405405405405e-05, + "loss": 0.2226, + "step": 48490 + }, + { + "epoch": 47.01, + "learning_rate": 3.584054054054054e-05, + "loss": 0.1377, + "step": 48500 + }, + { + "epoch": 47.01, + "eval_loss": 0.09414780884981155, + "eval_runtime": 132.8533, + "eval_samples_per_second": 27.158, + "eval_steps_per_second": 3.395, + "eval_wer": 0.08372548106042958, + "step": 48500 + }, + { + "epoch": 47.01, + "learning_rate": 3.582702702702703e-05, + "loss": 0.1886, + "step": 48510 + }, + { + "epoch": 47.01, + "learning_rate": 3.5813513513513515e-05, + "loss": 0.2285, + "step": 48520 + }, + { + "epoch": 47.01, + "learning_rate": 3.58e-05, + "loss": 0.2305, + "step": 48530 + }, + { + "epoch": 47.01, + "learning_rate": 3.5786486486486484e-05, + "loss": 0.1978, + "step": 48540 + }, + { + "epoch": 47.01, + "learning_rate": 3.577297297297297e-05, + "loss": 0.2612, + "step": 48550 + }, + { + "epoch": 47.01, + "learning_rate": 3.575945945945946e-05, + "loss": 0.2046, + "step": 48560 + }, + { + "epoch": 47.01, + "learning_rate": 3.574594594594595e-05, + "loss": 0.2802, + "step": 48570 + }, + { + "epoch": 47.01, + "learning_rate": 3.5732432432432435e-05, + "loss": 0.3047, + "step": 48580 + }, + { + "epoch": 47.01, + "learning_rate": 3.571891891891892e-05, + "loss": 0.1875, + "step": 48590 + }, + { + "epoch": 47.01, + "learning_rate": 3.5705405405405404e-05, + "loss": 0.4238, + "step": 48600 + }, + { + "epoch": 47.01, + "learning_rate": 3.569189189189189e-05, + "loss": 0.4021, + "step": 48610 + }, + { + "epoch": 47.01, + "learning_rate": 3.567837837837838e-05, + "loss": 0.249, + "step": 48620 + }, + { + "epoch": 47.01, + "learning_rate": 3.566486486486487e-05, + "loss": 0.1301, + "step": 48630 + }, + { + "epoch": 47.01, + "learning_rate": 3.5651351351351355e-05, + "loss": 0.1791, + "step": 48640 + }, + { + "epoch": 47.01, + "learning_rate": 3.563783783783784e-05, + "loss": 0.1644, + "step": 48650 + }, + { + "epoch": 47.01, + "learning_rate": 3.5624324324324324e-05, + "loss": 0.1716, + "step": 48660 + }, + { + "epoch": 47.01, + "learning_rate": 3.561081081081081e-05, + "loss": 0.1623, + "step": 48670 + }, + { + "epoch": 47.01, + "learning_rate": 3.55972972972973e-05, + "loss": 0.1506, + "step": 48680 + }, + { + "epoch": 47.01, + "learning_rate": 3.558378378378379e-05, + "loss": 0.1085, + "step": 48690 + }, + { + "epoch": 47.01, + "learning_rate": 3.5570270270270275e-05, + "loss": 0.3293, + "step": 48700 + }, + { + "epoch": 47.01, + "learning_rate": 3.5556756756756756e-05, + "loss": 0.332, + "step": 48710 + }, + { + "epoch": 47.01, + "learning_rate": 3.5543243243243244e-05, + "loss": 0.261, + "step": 48720 + }, + { + "epoch": 47.01, + "learning_rate": 3.552972972972973e-05, + "loss": 0.2245, + "step": 48730 + }, + { + "epoch": 47.01, + "learning_rate": 3.551621621621622e-05, + "loss": 0.3092, + "step": 48740 + }, + { + "epoch": 47.01, + "learning_rate": 3.550270270270271e-05, + "loss": 0.2655, + "step": 48750 + }, + { + "epoch": 47.01, + "learning_rate": 3.5489189189189195e-05, + "loss": 0.1676, + "step": 48760 + }, + { + "epoch": 47.01, + "learning_rate": 3.5475675675675676e-05, + "loss": 0.1691, + "step": 48770 + }, + { + "epoch": 47.01, + "learning_rate": 3.5462162162162164e-05, + "loss": 0.213, + "step": 48780 + }, + { + "epoch": 47.01, + "learning_rate": 3.544864864864865e-05, + "loss": 0.2831, + "step": 48790 + }, + { + "epoch": 47.01, + "learning_rate": 3.543513513513514e-05, + "loss": 0.2796, + "step": 48800 + }, + { + "epoch": 47.01, + "learning_rate": 3.542162162162163e-05, + "loss": 0.2123, + "step": 48810 + }, + { + "epoch": 47.01, + "learning_rate": 3.5408108108108115e-05, + "loss": 0.2332, + "step": 48820 + }, + { + "epoch": 47.01, + "learning_rate": 3.5394594594594596e-05, + "loss": 0.1867, + "step": 48830 + }, + { + "epoch": 47.01, + "learning_rate": 3.5381081081081084e-05, + "loss": 0.1737, + "step": 48840 + }, + { + "epoch": 47.01, + "learning_rate": 3.5367567567567565e-05, + "loss": 0.1851, + "step": 48850 + }, + { + "epoch": 47.01, + "learning_rate": 3.535405405405405e-05, + "loss": 0.1017, + "step": 48860 + }, + { + "epoch": 47.01, + "learning_rate": 3.534054054054054e-05, + "loss": 0.206, + "step": 48870 + }, + { + "epoch": 47.01, + "learning_rate": 3.532702702702703e-05, + "loss": 0.3654, + "step": 48880 + }, + { + "epoch": 47.01, + "learning_rate": 3.5313513513513516e-05, + "loss": 0.3235, + "step": 48890 + }, + { + "epoch": 47.01, + "learning_rate": 3.53e-05, + "loss": 0.1375, + "step": 48900 + }, + { + "epoch": 47.01, + "learning_rate": 3.5286486486486485e-05, + "loss": 0.2166, + "step": 48910 + }, + { + "epoch": 47.01, + "learning_rate": 3.527297297297297e-05, + "loss": 0.2274, + "step": 48920 + }, + { + "epoch": 47.01, + "learning_rate": 3.525945945945946e-05, + "loss": 0.1719, + "step": 48930 + }, + { + "epoch": 47.01, + "learning_rate": 3.524594594594595e-05, + "loss": 0.2959, + "step": 48940 + }, + { + "epoch": 47.01, + "learning_rate": 3.523243243243243e-05, + "loss": 0.3384, + "step": 48950 + }, + { + "epoch": 47.01, + "learning_rate": 3.521891891891892e-05, + "loss": 0.1502, + "step": 48960 + }, + { + "epoch": 47.01, + "learning_rate": 3.5205405405405405e-05, + "loss": 0.2754, + "step": 48970 + }, + { + "epoch": 47.01, + "learning_rate": 3.519189189189189e-05, + "loss": 0.1974, + "step": 48980 + }, + { + "epoch": 47.01, + "learning_rate": 3.517837837837838e-05, + "loss": 0.338, + "step": 48990 + }, + { + "epoch": 47.01, + "learning_rate": 3.516486486486487e-05, + "loss": 0.2985, + "step": 49000 + }, + { + "epoch": 47.01, + "eval_loss": 0.09127405285835266, + "eval_runtime": 128.9461, + "eval_samples_per_second": 27.981, + "eval_steps_per_second": 3.498, + "eval_wer": 0.0804640544192331, + "step": 49000 + }, + { + "epoch": 47.01, + "learning_rate": 3.515135135135135e-05, + "loss": 0.2895, + "step": 49010 + }, + { + "epoch": 47.01, + "learning_rate": 3.513783783783784e-05, + "loss": 0.3001, + "step": 49020 + }, + { + "epoch": 47.01, + "learning_rate": 3.5124324324324325e-05, + "loss": 0.3651, + "step": 49030 + }, + { + "epoch": 47.01, + "learning_rate": 3.511081081081081e-05, + "loss": 0.301, + "step": 49040 + }, + { + "epoch": 47.01, + "learning_rate": 3.50972972972973e-05, + "loss": 0.3921, + "step": 49050 + }, + { + "epoch": 47.01, + "learning_rate": 3.508378378378379e-05, + "loss": 0.3411, + "step": 49060 + }, + { + "epoch": 47.01, + "learning_rate": 3.507027027027027e-05, + "loss": 0.3234, + "step": 49070 + }, + { + "epoch": 47.01, + "learning_rate": 3.505675675675676e-05, + "loss": 0.3235, + "step": 49080 + }, + { + "epoch": 47.01, + "learning_rate": 3.5043243243243245e-05, + "loss": 0.2846, + "step": 49090 + }, + { + "epoch": 47.01, + "learning_rate": 3.502972972972973e-05, + "loss": 0.3977, + "step": 49100 + }, + { + "epoch": 48.0, + "learning_rate": 3.501621621621622e-05, + "loss": 0.3864, + "step": 49110 + }, + { + "epoch": 48.0, + "learning_rate": 3.50027027027027e-05, + "loss": 0.3428, + "step": 49120 + }, + { + "epoch": 48.0, + "learning_rate": 3.498918918918919e-05, + "loss": 0.4337, + "step": 49130 + }, + { + "epoch": 48.0, + "learning_rate": 3.497567567567568e-05, + "loss": 0.3343, + "step": 49140 + }, + { + "epoch": 48.0, + "learning_rate": 3.4962162162162166e-05, + "loss": 0.3486, + "step": 49150 + }, + { + "epoch": 48.0, + "learning_rate": 3.494864864864865e-05, + "loss": 0.3565, + "step": 49160 + }, + { + "epoch": 48.0, + "learning_rate": 3.493513513513514e-05, + "loss": 0.5544, + "step": 49170 + }, + { + "epoch": 48.0, + "learning_rate": 3.492162162162162e-05, + "loss": 0.3493, + "step": 49180 + }, + { + "epoch": 48.0, + "learning_rate": 3.490810810810811e-05, + "loss": 0.3575, + "step": 49190 + }, + { + "epoch": 48.0, + "learning_rate": 3.48945945945946e-05, + "loss": 0.3959, + "step": 49200 + }, + { + "epoch": 48.0, + "learning_rate": 3.4881081081081086e-05, + "loss": 0.3508, + "step": 49210 + }, + { + "epoch": 48.0, + "learning_rate": 3.486756756756757e-05, + "loss": 0.3644, + "step": 49220 + }, + { + "epoch": 48.0, + "learning_rate": 3.485405405405406e-05, + "loss": 0.2489, + "step": 49230 + }, + { + "epoch": 48.0, + "learning_rate": 3.484054054054054e-05, + "loss": 0.2127, + "step": 49240 + }, + { + "epoch": 48.0, + "learning_rate": 3.482702702702702e-05, + "loss": 0.2104, + "step": 49250 + }, + { + "epoch": 48.0, + "learning_rate": 3.481351351351351e-05, + "loss": 0.2197, + "step": 49260 + }, + { + "epoch": 48.0, + "learning_rate": 3.48e-05, + "loss": 0.9705, + "step": 49270 + }, + { + "epoch": 48.0, + "learning_rate": 3.478648648648649e-05, + "loss": 1.078, + "step": 49280 + }, + { + "epoch": 48.0, + "learning_rate": 3.4772972972972974e-05, + "loss": 2.5376, + "step": 49290 + }, + { + "epoch": 48.0, + "learning_rate": 3.475945945945946e-05, + "loss": 2.3896, + "step": 49300 + }, + { + "epoch": 48.0, + "learning_rate": 3.474594594594594e-05, + "loss": 2.4904, + "step": 49310 + }, + { + "epoch": 48.0, + "learning_rate": 3.473243243243243e-05, + "loss": 2.3604, + "step": 49320 + }, + { + "epoch": 48.0, + "learning_rate": 3.471891891891892e-05, + "loss": 1.1387, + "step": 49330 + }, + { + "epoch": 48.0, + "learning_rate": 3.470540540540541e-05, + "loss": 1.3633, + "step": 49340 + }, + { + "epoch": 48.0, + "learning_rate": 3.4691891891891895e-05, + "loss": 0.596, + "step": 49350 + }, + { + "epoch": 48.0, + "learning_rate": 3.4678378378378376e-05, + "loss": 0.181, + "step": 49360 + }, + { + "epoch": 48.0, + "learning_rate": 3.466486486486486e-05, + "loss": 0.1424, + "step": 49370 + }, + { + "epoch": 48.0, + "learning_rate": 3.465135135135135e-05, + "loss": 0.1585, + "step": 49380 + }, + { + "epoch": 48.0, + "learning_rate": 3.463783783783784e-05, + "loss": 0.2811, + "step": 49390 + }, + { + "epoch": 48.0, + "learning_rate": 3.462432432432433e-05, + "loss": 0.3083, + "step": 49400 + }, + { + "epoch": 48.0, + "learning_rate": 3.4610810810810815e-05, + "loss": 0.3204, + "step": 49410 + }, + { + "epoch": 48.0, + "learning_rate": 3.4597297297297296e-05, + "loss": 0.1474, + "step": 49420 + }, + { + "epoch": 48.0, + "learning_rate": 3.4583783783783783e-05, + "loss": 0.1248, + "step": 49430 + }, + { + "epoch": 48.0, + "learning_rate": 3.457027027027027e-05, + "loss": 0.2261, + "step": 49440 + }, + { + "epoch": 48.0, + "learning_rate": 3.455675675675676e-05, + "loss": 0.1731, + "step": 49450 + }, + { + "epoch": 48.0, + "learning_rate": 3.454324324324325e-05, + "loss": 0.1886, + "step": 49460 + }, + { + "epoch": 48.0, + "learning_rate": 3.4529729729729735e-05, + "loss": 0.1922, + "step": 49470 + }, + { + "epoch": 48.01, + "learning_rate": 3.4516216216216216e-05, + "loss": 0.152, + "step": 49480 + }, + { + "epoch": 48.01, + "learning_rate": 3.4502702702702703e-05, + "loss": 0.1205, + "step": 49490 + }, + { + "epoch": 48.01, + "learning_rate": 3.448918918918919e-05, + "loss": 0.1017, + "step": 49500 + }, + { + "epoch": 48.01, + "eval_loss": 0.09043174982070923, + "eval_runtime": 129.6214, + "eval_samples_per_second": 27.835, + "eval_steps_per_second": 3.479, + "eval_wer": 0.08079019708335275, + "step": 49500 + }, + { + "epoch": 48.01, + "learning_rate": 3.447567567567568e-05, + "loss": 0.1974, + "step": 49510 + }, + { + "epoch": 48.01, + "learning_rate": 3.446216216216217e-05, + "loss": 0.1492, + "step": 49520 + }, + { + "epoch": 48.01, + "learning_rate": 3.4448648648648655e-05, + "loss": 0.1492, + "step": 49530 + }, + { + "epoch": 48.01, + "learning_rate": 3.4435135135135136e-05, + "loss": 0.2186, + "step": 49540 + }, + { + "epoch": 48.01, + "learning_rate": 3.4421621621621624e-05, + "loss": 0.2605, + "step": 49550 + }, + { + "epoch": 48.01, + "learning_rate": 3.440810810810811e-05, + "loss": 0.156, + "step": 49560 + }, + { + "epoch": 48.01, + "learning_rate": 3.43945945945946e-05, + "loss": 0.2315, + "step": 49570 + }, + { + "epoch": 48.01, + "learning_rate": 3.438108108108109e-05, + "loss": 0.2444, + "step": 49580 + }, + { + "epoch": 48.01, + "learning_rate": 3.436756756756757e-05, + "loss": 0.3251, + "step": 49590 + }, + { + "epoch": 48.01, + "learning_rate": 3.4354054054054056e-05, + "loss": 0.2869, + "step": 49600 + }, + { + "epoch": 48.01, + "learning_rate": 3.4340540540540544e-05, + "loss": 0.2008, + "step": 49610 + }, + { + "epoch": 48.01, + "learning_rate": 3.432702702702703e-05, + "loss": 0.296, + "step": 49620 + }, + { + "epoch": 48.01, + "learning_rate": 3.431351351351352e-05, + "loss": 0.4529, + "step": 49630 + }, + { + "epoch": 48.01, + "learning_rate": 3.430000000000001e-05, + "loss": 0.3276, + "step": 49640 + }, + { + "epoch": 48.01, + "learning_rate": 3.428648648648649e-05, + "loss": 0.1253, + "step": 49650 + }, + { + "epoch": 48.01, + "learning_rate": 3.427297297297297e-05, + "loss": 0.199, + "step": 49660 + }, + { + "epoch": 48.01, + "learning_rate": 3.425945945945946e-05, + "loss": 0.1675, + "step": 49670 + }, + { + "epoch": 48.01, + "learning_rate": 3.4245945945945945e-05, + "loss": 0.1331, + "step": 49680 + }, + { + "epoch": 48.01, + "learning_rate": 3.423243243243243e-05, + "loss": 0.1617, + "step": 49690 + }, + { + "epoch": 48.01, + "learning_rate": 3.421891891891892e-05, + "loss": 0.1267, + "step": 49700 + }, + { + "epoch": 48.01, + "learning_rate": 3.420540540540541e-05, + "loss": 0.1322, + "step": 49710 + }, + { + "epoch": 48.01, + "learning_rate": 3.419189189189189e-05, + "loss": 0.2035, + "step": 49720 + }, + { + "epoch": 48.01, + "learning_rate": 3.417837837837838e-05, + "loss": 0.3709, + "step": 49730 + }, + { + "epoch": 48.01, + "learning_rate": 3.4164864864864865e-05, + "loss": 0.2847, + "step": 49740 + }, + { + "epoch": 48.01, + "learning_rate": 3.415135135135135e-05, + "loss": 0.1699, + "step": 49750 + }, + { + "epoch": 48.01, + "learning_rate": 3.413783783783784e-05, + "loss": 0.3028, + "step": 49760 + }, + { + "epoch": 48.01, + "learning_rate": 3.412432432432433e-05, + "loss": 0.375, + "step": 49770 + }, + { + "epoch": 48.01, + "learning_rate": 3.411081081081081e-05, + "loss": 0.1886, + "step": 49780 + }, + { + "epoch": 48.01, + "learning_rate": 3.40972972972973e-05, + "loss": 0.1331, + "step": 49790 + }, + { + "epoch": 48.01, + "learning_rate": 3.4083783783783785e-05, + "loss": 0.1729, + "step": 49800 + }, + { + "epoch": 48.01, + "learning_rate": 3.407027027027027e-05, + "loss": 0.3216, + "step": 49810 + }, + { + "epoch": 48.01, + "learning_rate": 3.405675675675676e-05, + "loss": 0.3178, + "step": 49820 + }, + { + "epoch": 48.01, + "learning_rate": 3.404324324324324e-05, + "loss": 0.2315, + "step": 49830 + }, + { + "epoch": 48.01, + "learning_rate": 3.402972972972973e-05, + "loss": 0.1847, + "step": 49840 + }, + { + "epoch": 48.01, + "learning_rate": 3.401621621621622e-05, + "loss": 0.2241, + "step": 49850 + }, + { + "epoch": 48.01, + "learning_rate": 3.4002702702702705e-05, + "loss": 0.1669, + "step": 49860 + }, + { + "epoch": 48.01, + "learning_rate": 3.398918918918919e-05, + "loss": 0.2202, + "step": 49870 + }, + { + "epoch": 48.01, + "learning_rate": 3.397567567567568e-05, + "loss": 0.1052, + "step": 49880 + }, + { + "epoch": 48.01, + "learning_rate": 3.396216216216216e-05, + "loss": 0.1627, + "step": 49890 + }, + { + "epoch": 48.01, + "learning_rate": 3.394864864864865e-05, + "loss": 0.2284, + "step": 49900 + }, + { + "epoch": 48.01, + "learning_rate": 3.393513513513514e-05, + "loss": 0.4815, + "step": 49910 + }, + { + "epoch": 48.01, + "learning_rate": 3.3921621621621625e-05, + "loss": 0.1208, + "step": 49920 + }, + { + "epoch": 48.01, + "learning_rate": 3.390810810810811e-05, + "loss": 0.1843, + "step": 49930 + }, + { + "epoch": 48.01, + "learning_rate": 3.38945945945946e-05, + "loss": 0.2176, + "step": 49940 + }, + { + "epoch": 48.01, + "learning_rate": 3.388108108108108e-05, + "loss": 0.2126, + "step": 49950 + }, + { + "epoch": 48.01, + "learning_rate": 3.386756756756757e-05, + "loss": 0.2181, + "step": 49960 + }, + { + "epoch": 48.01, + "learning_rate": 3.385405405405406e-05, + "loss": 0.3203, + "step": 49970 + }, + { + "epoch": 48.01, + "learning_rate": 3.3840540540540545e-05, + "loss": 0.2227, + "step": 49980 + }, + { + "epoch": 48.01, + "learning_rate": 3.382702702702703e-05, + "loss": 0.1738, + "step": 49990 + }, + { + "epoch": 48.01, + "learning_rate": 3.381351351351352e-05, + "loss": 0.2294, + "step": 50000 + }, + { + "epoch": 48.01, + "eval_loss": 0.09008501470088959, + "eval_runtime": 136.0591, + "eval_samples_per_second": 26.518, + "eval_steps_per_second": 3.315, + "eval_wer": 0.07776172948795601, + "step": 50000 + }, + { + "epoch": 48.01, + "learning_rate": 3.38e-05, + "loss": 0.334, + "step": 50010 + }, + { + "epoch": 48.01, + "learning_rate": 3.378648648648649e-05, + "loss": 0.3074, + "step": 50020 + }, + { + "epoch": 48.01, + "learning_rate": 3.377297297297298e-05, + "loss": 0.384, + "step": 50030 + }, + { + "epoch": 48.01, + "learning_rate": 3.3759459459459465e-05, + "loss": 0.2595, + "step": 50040 + }, + { + "epoch": 48.01, + "learning_rate": 3.3745945945945946e-05, + "loss": 0.4065, + "step": 50050 + }, + { + "epoch": 48.01, + "learning_rate": 3.3732432432432434e-05, + "loss": 0.3045, + "step": 50060 + }, + { + "epoch": 48.01, + "learning_rate": 3.3718918918918915e-05, + "loss": 0.4214, + "step": 50070 + }, + { + "epoch": 48.01, + "learning_rate": 3.37054054054054e-05, + "loss": 0.335, + "step": 50080 + }, + { + "epoch": 48.01, + "learning_rate": 3.369189189189189e-05, + "loss": 0.3031, + "step": 50090 + }, + { + "epoch": 48.01, + "learning_rate": 3.367837837837838e-05, + "loss": 0.2963, + "step": 50100 + }, + { + "epoch": 48.01, + "learning_rate": 3.3664864864864866e-05, + "loss": 0.2766, + "step": 50110 + }, + { + "epoch": 48.01, + "learning_rate": 3.3651351351351354e-05, + "loss": 0.3341, + "step": 50120 + }, + { + "epoch": 49.0, + "learning_rate": 3.3637837837837835e-05, + "loss": 0.4365, + "step": 50130 + }, + { + "epoch": 49.0, + "learning_rate": 3.362432432432432e-05, + "loss": 0.376, + "step": 50140 + }, + { + "epoch": 49.0, + "learning_rate": 3.361081081081081e-05, + "loss": 0.4255, + "step": 50150 + }, + { + "epoch": 49.0, + "learning_rate": 3.35972972972973e-05, + "loss": 0.3855, + "step": 50160 + }, + { + "epoch": 49.0, + "learning_rate": 3.3583783783783786e-05, + "loss": 0.3143, + "step": 50170 + }, + { + "epoch": 49.0, + "learning_rate": 3.3570270270270274e-05, + "loss": 0.3363, + "step": 50180 + }, + { + "epoch": 49.0, + "learning_rate": 3.3556756756756755e-05, + "loss": 0.4061, + "step": 50190 + }, + { + "epoch": 49.0, + "learning_rate": 3.354324324324324e-05, + "loss": 0.4451, + "step": 50200 + }, + { + "epoch": 49.0, + "learning_rate": 3.352972972972973e-05, + "loss": 0.3298, + "step": 50210 + }, + { + "epoch": 49.0, + "learning_rate": 3.351621621621622e-05, + "loss": 0.3668, + "step": 50220 + }, + { + "epoch": 49.0, + "learning_rate": 3.3502702702702706e-05, + "loss": 0.409, + "step": 50230 + }, + { + "epoch": 49.0, + "learning_rate": 3.348918918918919e-05, + "loss": 0.3763, + "step": 50240 + }, + { + "epoch": 49.0, + "learning_rate": 3.3475675675675675e-05, + "loss": 0.2772, + "step": 50250 + }, + { + "epoch": 49.0, + "learning_rate": 3.346216216216216e-05, + "loss": 0.2248, + "step": 50260 + }, + { + "epoch": 49.0, + "learning_rate": 3.344864864864865e-05, + "loss": 0.2062, + "step": 50270 + }, + { + "epoch": 49.0, + "learning_rate": 3.343513513513514e-05, + "loss": 0.2328, + "step": 50280 + }, + { + "epoch": 49.0, + "learning_rate": 3.3421621621621626e-05, + "loss": 0.7652, + "step": 50290 + }, + { + "epoch": 49.0, + "learning_rate": 3.340810810810811e-05, + "loss": 0.6703, + "step": 50300 + }, + { + "epoch": 49.0, + "learning_rate": 3.3394594594594595e-05, + "loss": 2.4157, + "step": 50310 + }, + { + "epoch": 49.0, + "learning_rate": 3.338108108108108e-05, + "loss": 2.4865, + "step": 50320 + }, + { + "epoch": 49.0, + "learning_rate": 3.336756756756757e-05, + "loss": 2.3704, + "step": 50330 + }, + { + "epoch": 49.0, + "learning_rate": 3.335405405405406e-05, + "loss": 2.491, + "step": 50340 + }, + { + "epoch": 49.0, + "learning_rate": 3.3340540540540546e-05, + "loss": 1.4851, + "step": 50350 + }, + { + "epoch": 49.0, + "learning_rate": 3.332702702702703e-05, + "loss": 1.373, + "step": 50360 + }, + { + "epoch": 49.0, + "learning_rate": 3.3313513513513515e-05, + "loss": 0.7444, + "step": 50370 + }, + { + "epoch": 49.0, + "learning_rate": 3.33e-05, + "loss": 0.2335, + "step": 50380 + }, + { + "epoch": 49.0, + "learning_rate": 3.328648648648649e-05, + "loss": 0.1002, + "step": 50390 + }, + { + "epoch": 49.0, + "learning_rate": 3.327297297297298e-05, + "loss": 0.185, + "step": 50400 + }, + { + "epoch": 49.0, + "learning_rate": 3.3259459459459466e-05, + "loss": 0.2323, + "step": 50410 + }, + { + "epoch": 49.0, + "learning_rate": 3.324594594594595e-05, + "loss": 0.2246, + "step": 50420 + }, + { + "epoch": 49.0, + "learning_rate": 3.3232432432432435e-05, + "loss": 0.3547, + "step": 50430 + }, + { + "epoch": 49.0, + "learning_rate": 3.321891891891892e-05, + "loss": 0.1731, + "step": 50440 + }, + { + "epoch": 49.0, + "learning_rate": 3.3205405405405404e-05, + "loss": 0.1171, + "step": 50450 + }, + { + "epoch": 49.0, + "learning_rate": 3.319189189189189e-05, + "loss": 0.2515, + "step": 50460 + }, + { + "epoch": 49.0, + "learning_rate": 3.317837837837838e-05, + "loss": 0.1396, + "step": 50470 + }, + { + "epoch": 49.0, + "learning_rate": 3.316486486486486e-05, + "loss": 0.2552, + "step": 50480 + }, + { + "epoch": 49.0, + "learning_rate": 3.315135135135135e-05, + "loss": 0.2026, + "step": 50490 + }, + { + "epoch": 49.0, + "learning_rate": 3.3137837837837836e-05, + "loss": 0.1298, + "step": 50500 + }, + { + "epoch": 49.0, + "eval_loss": 0.09423606842756271, + "eval_runtime": 128.1185, + "eval_samples_per_second": 28.161, + "eval_steps_per_second": 3.52, + "eval_wer": 0.07906630014443461, + "step": 50500 + }, + { + "epoch": 49.01, + "learning_rate": 3.3124324324324324e-05, + "loss": 0.1508, + "step": 50510 + }, + { + "epoch": 49.01, + "learning_rate": 3.311081081081081e-05, + "loss": 0.077, + "step": 50520 + }, + { + "epoch": 49.01, + "learning_rate": 3.30972972972973e-05, + "loss": 0.1559, + "step": 50530 + }, + { + "epoch": 49.01, + "learning_rate": 3.308378378378378e-05, + "loss": 0.1836, + "step": 50540 + }, + { + "epoch": 49.01, + "learning_rate": 3.307027027027027e-05, + "loss": 0.1109, + "step": 50550 + }, + { + "epoch": 49.01, + "learning_rate": 3.3056756756756756e-05, + "loss": 0.16, + "step": 50560 + }, + { + "epoch": 49.01, + "learning_rate": 3.3043243243243244e-05, + "loss": 0.2502, + "step": 50570 + }, + { + "epoch": 49.01, + "learning_rate": 3.302972972972973e-05, + "loss": 0.1789, + "step": 50580 + }, + { + "epoch": 49.01, + "learning_rate": 3.301621621621622e-05, + "loss": 0.221, + "step": 50590 + }, + { + "epoch": 49.01, + "learning_rate": 3.30027027027027e-05, + "loss": 0.2615, + "step": 50600 + }, + { + "epoch": 49.01, + "learning_rate": 3.298918918918919e-05, + "loss": 0.2421, + "step": 50610 + }, + { + "epoch": 49.01, + "learning_rate": 3.2975675675675677e-05, + "loss": 0.3025, + "step": 50620 + }, + { + "epoch": 49.01, + "learning_rate": 3.2962162162162164e-05, + "loss": 0.2153, + "step": 50630 + }, + { + "epoch": 49.01, + "learning_rate": 3.294864864864865e-05, + "loss": 0.2293, + "step": 50640 + }, + { + "epoch": 49.01, + "learning_rate": 3.293513513513514e-05, + "loss": 0.411, + "step": 50650 + }, + { + "epoch": 49.01, + "learning_rate": 3.292162162162162e-05, + "loss": 0.3581, + "step": 50660 + }, + { + "epoch": 49.01, + "learning_rate": 3.290810810810811e-05, + "loss": 0.1376, + "step": 50670 + }, + { + "epoch": 49.01, + "learning_rate": 3.2894594594594597e-05, + "loss": 0.1336, + "step": 50680 + }, + { + "epoch": 49.01, + "learning_rate": 3.2881081081081084e-05, + "loss": 0.2133, + "step": 50690 + }, + { + "epoch": 49.01, + "learning_rate": 3.286756756756757e-05, + "loss": 0.151, + "step": 50700 + }, + { + "epoch": 49.01, + "learning_rate": 3.285405405405405e-05, + "loss": 0.1749, + "step": 50710 + }, + { + "epoch": 49.01, + "learning_rate": 3.284054054054054e-05, + "loss": 0.1156, + "step": 50720 + }, + { + "epoch": 49.01, + "learning_rate": 3.282702702702703e-05, + "loss": 0.1349, + "step": 50730 + }, + { + "epoch": 49.01, + "learning_rate": 3.281351351351352e-05, + "loss": 0.1411, + "step": 50740 + }, + { + "epoch": 49.01, + "learning_rate": 3.2800000000000004e-05, + "loss": 0.3796, + "step": 50750 + }, + { + "epoch": 49.01, + "learning_rate": 3.278648648648649e-05, + "loss": 0.2848, + "step": 50760 + }, + { + "epoch": 49.01, + "learning_rate": 3.277297297297297e-05, + "loss": 0.2241, + "step": 50770 + }, + { + "epoch": 49.01, + "learning_rate": 3.275945945945946e-05, + "loss": 0.2523, + "step": 50780 + }, + { + "epoch": 49.01, + "learning_rate": 3.274594594594595e-05, + "loss": 0.377, + "step": 50790 + }, + { + "epoch": 49.01, + "learning_rate": 3.273243243243244e-05, + "loss": 0.2417, + "step": 50800 + }, + { + "epoch": 49.01, + "learning_rate": 3.2718918918918925e-05, + "loss": 0.1423, + "step": 50810 + }, + { + "epoch": 49.01, + "learning_rate": 3.270540540540541e-05, + "loss": 0.1873, + "step": 50820 + }, + { + "epoch": 49.01, + "learning_rate": 3.269189189189189e-05, + "loss": 0.3386, + "step": 50830 + }, + { + "epoch": 49.01, + "learning_rate": 3.267837837837838e-05, + "loss": 0.2704, + "step": 50840 + }, + { + "epoch": 49.01, + "learning_rate": 3.266486486486487e-05, + "loss": 0.2048, + "step": 50850 + }, + { + "epoch": 49.01, + "learning_rate": 3.265135135135135e-05, + "loss": 0.1882, + "step": 50860 + }, + { + "epoch": 49.01, + "learning_rate": 3.263783783783784e-05, + "loss": 0.1956, + "step": 50870 + }, + { + "epoch": 49.01, + "learning_rate": 3.2624324324324326e-05, + "loss": 0.1969, + "step": 50880 + }, + { + "epoch": 49.01, + "learning_rate": 3.2610810810810813e-05, + "loss": 0.1884, + "step": 50890 + }, + { + "epoch": 49.01, + "learning_rate": 3.2597297297297294e-05, + "loss": 0.1354, + "step": 50900 + }, + { + "epoch": 49.01, + "learning_rate": 3.258378378378378e-05, + "loss": 0.1069, + "step": 50910 + }, + { + "epoch": 49.01, + "learning_rate": 3.257027027027027e-05, + "loss": 0.224, + "step": 50920 + }, + { + "epoch": 49.01, + "learning_rate": 3.255675675675676e-05, + "loss": 0.5704, + "step": 50930 + }, + { + "epoch": 49.01, + "learning_rate": 3.2543243243243246e-05, + "loss": 0.1371, + "step": 50940 + }, + { + "epoch": 49.01, + "learning_rate": 3.252972972972973e-05, + "loss": 0.1403, + "step": 50950 + }, + { + "epoch": 49.01, + "learning_rate": 3.2516216216216214e-05, + "loss": 0.2126, + "step": 50960 + }, + { + "epoch": 49.01, + "learning_rate": 3.25027027027027e-05, + "loss": 0.2152, + "step": 50970 + }, + { + "epoch": 49.01, + "learning_rate": 3.248918918918919e-05, + "loss": 0.2315, + "step": 50980 + }, + { + "epoch": 49.01, + "learning_rate": 3.247567567567568e-05, + "loss": 0.2679, + "step": 50990 + }, + { + "epoch": 49.01, + "learning_rate": 3.2462162162162166e-05, + "loss": 0.2617, + "step": 51000 + }, + { + "epoch": 49.01, + "eval_loss": 0.0904531478881836, + "eval_runtime": 131.4675, + "eval_samples_per_second": 27.444, + "eval_steps_per_second": 3.431, + "eval_wer": 0.07804128034291571, + "step": 51000 + }, + { + "epoch": 49.01, + "learning_rate": 3.244864864864865e-05, + "loss": 0.1524, + "step": 51010 + }, + { + "epoch": 49.01, + "learning_rate": 3.2435135135135135e-05, + "loss": 0.2374, + "step": 51020 + }, + { + "epoch": 49.01, + "learning_rate": 3.242162162162162e-05, + "loss": 0.2449, + "step": 51030 + }, + { + "epoch": 49.01, + "learning_rate": 3.240810810810811e-05, + "loss": 0.3003, + "step": 51040 + }, + { + "epoch": 49.01, + "learning_rate": 3.23945945945946e-05, + "loss": 0.3048, + "step": 51050 + }, + { + "epoch": 49.01, + "learning_rate": 3.2381081081081086e-05, + "loss": 0.2471, + "step": 51060 + }, + { + "epoch": 49.01, + "learning_rate": 3.236756756756757e-05, + "loss": 0.413, + "step": 51070 + }, + { + "epoch": 49.01, + "learning_rate": 3.2354054054054055e-05, + "loss": 0.2757, + "step": 51080 + }, + { + "epoch": 49.01, + "learning_rate": 3.234054054054054e-05, + "loss": 0.3533, + "step": 51090 + }, + { + "epoch": 49.01, + "learning_rate": 3.232702702702703e-05, + "loss": 0.4407, + "step": 51100 + }, + { + "epoch": 49.01, + "learning_rate": 3.231351351351352e-05, + "loss": 0.3301, + "step": 51110 + }, + { + "epoch": 49.01, + "learning_rate": 3.2300000000000006e-05, + "loss": 0.3471, + "step": 51120 + }, + { + "epoch": 49.01, + "learning_rate": 3.228648648648649e-05, + "loss": 0.2651, + "step": 51130 + }, + { + "epoch": 49.01, + "learning_rate": 3.2272972972972975e-05, + "loss": 0.3555, + "step": 51140 + }, + { + "epoch": 49.01, + "learning_rate": 3.225945945945946e-05, + "loss": 0.4817, + "step": 51150 + }, + { + "epoch": 50.0, + "learning_rate": 3.224594594594595e-05, + "loss": 0.3558, + "step": 51160 + }, + { + "epoch": 50.0, + "learning_rate": 3.223243243243244e-05, + "loss": 0.3453, + "step": 51170 + }, + { + "epoch": 50.0, + "learning_rate": 3.221891891891892e-05, + "loss": 0.4019, + "step": 51180 + }, + { + "epoch": 50.0, + "learning_rate": 3.220540540540541e-05, + "loss": 0.2968, + "step": 51190 + }, + { + "epoch": 50.0, + "learning_rate": 3.2191891891891895e-05, + "loss": 0.3726, + "step": 51200 + }, + { + "epoch": 50.0, + "learning_rate": 3.217837837837838e-05, + "loss": 0.3453, + "step": 51210 + }, + { + "epoch": 50.0, + "learning_rate": 3.216486486486487e-05, + "loss": 0.4807, + "step": 51220 + }, + { + "epoch": 50.0, + "learning_rate": 3.215135135135136e-05, + "loss": 0.3318, + "step": 51230 + }, + { + "epoch": 50.0, + "learning_rate": 3.213783783783784e-05, + "loss": 0.4055, + "step": 51240 + }, + { + "epoch": 50.0, + "learning_rate": 3.212432432432433e-05, + "loss": 0.3748, + "step": 51250 + }, + { + "epoch": 50.0, + "learning_rate": 3.211081081081081e-05, + "loss": 0.3317, + "step": 51260 + }, + { + "epoch": 50.0, + "learning_rate": 3.2097297297297296e-05, + "loss": 0.3683, + "step": 51270 + }, + { + "epoch": 50.0, + "learning_rate": 3.2083783783783784e-05, + "loss": 0.2049, + "step": 51280 + }, + { + "epoch": 50.0, + "learning_rate": 3.207027027027027e-05, + "loss": 0.2035, + "step": 51290 + }, + { + "epoch": 50.0, + "learning_rate": 3.205675675675676e-05, + "loss": 0.2353, + "step": 51300 + }, + { + "epoch": 50.0, + "learning_rate": 3.204324324324324e-05, + "loss": 0.3832, + "step": 51310 + }, + { + "epoch": 50.0, + "learning_rate": 3.202972972972973e-05, + "loss": 0.9489, + "step": 51320 + }, + { + "epoch": 50.0, + "learning_rate": 3.2016216216216216e-05, + "loss": 1.7588, + "step": 51330 + }, + { + "epoch": 50.0, + "learning_rate": 3.2002702702702704e-05, + "loss": 2.5184, + "step": 51340 + }, + { + "epoch": 50.0, + "learning_rate": 3.198918918918919e-05, + "loss": 2.3408, + "step": 51350 + }, + { + "epoch": 50.0, + "learning_rate": 3.197567567567567e-05, + "loss": 2.4892, + "step": 51360 + }, + { + "epoch": 50.0, + "learning_rate": 3.196216216216216e-05, + "loss": 1.7632, + "step": 51370 + }, + { + "epoch": 50.0, + "learning_rate": 3.194864864864865e-05, + "loss": 1.4124, + "step": 51380 + }, + { + "epoch": 50.0, + "learning_rate": 3.1935135135135136e-05, + "loss": 0.9859, + "step": 51390 + }, + { + "epoch": 50.0, + "learning_rate": 3.1921621621621624e-05, + "loss": 0.3514, + "step": 51400 + }, + { + "epoch": 50.0, + "learning_rate": 3.190810810810811e-05, + "loss": 0.1082, + "step": 51410 + }, + { + "epoch": 50.0, + "learning_rate": 3.189459459459459e-05, + "loss": 0.2006, + "step": 51420 + }, + { + "epoch": 50.0, + "learning_rate": 3.188108108108108e-05, + "loss": 0.2026, + "step": 51430 + }, + { + "epoch": 50.0, + "learning_rate": 3.186756756756757e-05, + "loss": 0.2203, + "step": 51440 + }, + { + "epoch": 50.0, + "learning_rate": 3.1854054054054056e-05, + "loss": 0.3725, + "step": 51450 + }, + { + "epoch": 50.0, + "learning_rate": 3.1840540540540544e-05, + "loss": 0.2214, + "step": 51460 + }, + { + "epoch": 50.0, + "learning_rate": 3.182702702702703e-05, + "loss": 0.1127, + "step": 51470 + }, + { + "epoch": 50.0, + "learning_rate": 3.181351351351351e-05, + "loss": 0.151, + "step": 51480 + }, + { + "epoch": 50.0, + "learning_rate": 3.18e-05, + "loss": 0.1568, + "step": 51490 + }, + { + "epoch": 50.0, + "learning_rate": 3.178648648648649e-05, + "loss": 0.1712, + "step": 51500 + }, + { + "epoch": 50.0, + "eval_loss": 0.0938711166381836, + "eval_runtime": 138.1197, + "eval_samples_per_second": 26.122, + "eval_steps_per_second": 3.265, + "eval_wer": 0.07790150491543586, + "step": 51500 + }, + { + "epoch": 50.0, + "learning_rate": 3.1772972972972976e-05, + "loss": 0.2062, + "step": 51510 + }, + { + "epoch": 50.0, + "learning_rate": 3.1759459459459464e-05, + "loss": 0.157, + "step": 51520 + }, + { + "epoch": 50.01, + "learning_rate": 3.174594594594595e-05, + "loss": 0.162, + "step": 51530 + }, + { + "epoch": 50.01, + "learning_rate": 3.173243243243243e-05, + "loss": 0.104, + "step": 51540 + }, + { + "epoch": 50.01, + "learning_rate": 3.171891891891892e-05, + "loss": 0.107, + "step": 51550 + }, + { + "epoch": 50.01, + "learning_rate": 3.170540540540541e-05, + "loss": 0.2008, + "step": 51560 + }, + { + "epoch": 50.01, + "learning_rate": 3.1691891891891896e-05, + "loss": 0.1046, + "step": 51570 + }, + { + "epoch": 50.01, + "learning_rate": 3.1678378378378384e-05, + "loss": 0.1656, + "step": 51580 + }, + { + "epoch": 50.01, + "learning_rate": 3.1664864864864865e-05, + "loss": 0.237, + "step": 51590 + }, + { + "epoch": 50.01, + "learning_rate": 3.165135135135135e-05, + "loss": 0.1949, + "step": 51600 + }, + { + "epoch": 50.01, + "learning_rate": 3.163783783783784e-05, + "loss": 0.2065, + "step": 51610 + }, + { + "epoch": 50.01, + "learning_rate": 3.162432432432433e-05, + "loss": 0.3188, + "step": 51620 + }, + { + "epoch": 50.01, + "learning_rate": 3.1610810810810816e-05, + "loss": 0.2218, + "step": 51630 + }, + { + "epoch": 50.01, + "learning_rate": 3.1597297297297304e-05, + "loss": 0.2895, + "step": 51640 + }, + { + "epoch": 50.01, + "learning_rate": 3.1583783783783785e-05, + "loss": 0.2436, + "step": 51650 + }, + { + "epoch": 50.01, + "learning_rate": 3.1570270270270266e-05, + "loss": 0.1814, + "step": 51660 + }, + { + "epoch": 50.01, + "learning_rate": 3.1556756756756754e-05, + "loss": 0.461, + "step": 51670 + }, + { + "epoch": 50.01, + "learning_rate": 3.154324324324324e-05, + "loss": 0.4188, + "step": 51680 + }, + { + "epoch": 50.01, + "learning_rate": 3.152972972972973e-05, + "loss": 0.2005, + "step": 51690 + }, + { + "epoch": 50.01, + "learning_rate": 3.151621621621622e-05, + "loss": 0.1248, + "step": 51700 + }, + { + "epoch": 50.01, + "learning_rate": 3.1502702702702705e-05, + "loss": 0.1956, + "step": 51710 + }, + { + "epoch": 50.01, + "learning_rate": 3.1489189189189186e-05, + "loss": 0.1579, + "step": 51720 + }, + { + "epoch": 50.01, + "learning_rate": 3.1475675675675674e-05, + "loss": 0.155, + "step": 51730 + }, + { + "epoch": 50.01, + "learning_rate": 3.146216216216216e-05, + "loss": 0.1527, + "step": 51740 + }, + { + "epoch": 50.01, + "learning_rate": 3.144864864864865e-05, + "loss": 0.1314, + "step": 51750 + }, + { + "epoch": 50.01, + "learning_rate": 3.143513513513514e-05, + "loss": 0.0944, + "step": 51760 + }, + { + "epoch": 50.01, + "learning_rate": 3.1421621621621625e-05, + "loss": 0.3177, + "step": 51770 + }, + { + "epoch": 50.01, + "learning_rate": 3.1408108108108106e-05, + "loss": 0.3018, + "step": 51780 + }, + { + "epoch": 50.01, + "learning_rate": 3.1394594594594594e-05, + "loss": 0.2886, + "step": 51790 + }, + { + "epoch": 50.01, + "learning_rate": 3.138108108108108e-05, + "loss": 0.2039, + "step": 51800 + }, + { + "epoch": 50.01, + "learning_rate": 3.136756756756757e-05, + "loss": 0.3076, + "step": 51810 + }, + { + "epoch": 50.01, + "learning_rate": 3.135405405405406e-05, + "loss": 0.2956, + "step": 51820 + }, + { + "epoch": 50.01, + "learning_rate": 3.134054054054054e-05, + "loss": 0.1757, + "step": 51830 + }, + { + "epoch": 50.01, + "learning_rate": 3.1327027027027026e-05, + "loss": 0.1662, + "step": 51840 + }, + { + "epoch": 50.01, + "learning_rate": 3.1313513513513514e-05, + "loss": 0.2502, + "step": 51850 + }, + { + "epoch": 50.01, + "learning_rate": 3.13e-05, + "loss": 0.312, + "step": 51860 + }, + { + "epoch": 50.01, + "learning_rate": 3.128648648648649e-05, + "loss": 0.2509, + "step": 51870 + }, + { + "epoch": 50.01, + "learning_rate": 3.127297297297298e-05, + "loss": 0.192, + "step": 51880 + }, + { + "epoch": 50.01, + "learning_rate": 3.125945945945946e-05, + "loss": 0.2161, + "step": 51890 + }, + { + "epoch": 50.01, + "learning_rate": 3.1245945945945946e-05, + "loss": 0.1975, + "step": 51900 + }, + { + "epoch": 50.01, + "learning_rate": 3.1232432432432434e-05, + "loss": 0.2062, + "step": 51910 + }, + { + "epoch": 50.01, + "learning_rate": 3.121891891891892e-05, + "loss": 0.1865, + "step": 51920 + }, + { + "epoch": 50.01, + "learning_rate": 3.120540540540541e-05, + "loss": 0.0912, + "step": 51930 + }, + { + "epoch": 50.01, + "learning_rate": 3.11918918918919e-05, + "loss": 0.2214, + "step": 51940 + }, + { + "epoch": 50.01, + "learning_rate": 3.117837837837838e-05, + "loss": 0.3985, + "step": 51950 + }, + { + "epoch": 50.01, + "learning_rate": 3.1164864864864866e-05, + "loss": 0.3051, + "step": 51960 + }, + { + "epoch": 50.01, + "learning_rate": 3.1151351351351354e-05, + "loss": 0.13, + "step": 51970 + }, + { + "epoch": 50.01, + "learning_rate": 3.113783783783784e-05, + "loss": 0.1786, + "step": 51980 + }, + { + "epoch": 50.01, + "learning_rate": 3.112432432432433e-05, + "loss": 0.1825, + "step": 51990 + }, + { + "epoch": 50.01, + "learning_rate": 3.111081081081082e-05, + "loss": 0.2058, + "step": 52000 + }, + { + "epoch": 50.01, + "eval_loss": 0.0881146490573883, + "eval_runtime": 129.6639, + "eval_samples_per_second": 27.826, + "eval_steps_per_second": 3.478, + "eval_wer": 0.07720262777803662, + "step": 52000 + }, + { + "epoch": 50.01, + "learning_rate": 3.10972972972973e-05, + "loss": 0.2599, + "step": 52010 + }, + { + "epoch": 50.01, + "learning_rate": 3.1083783783783786e-05, + "loss": 0.2987, + "step": 52020 + }, + { + "epoch": 50.01, + "learning_rate": 3.1070270270270274e-05, + "loss": 0.1365, + "step": 52030 + }, + { + "epoch": 50.01, + "learning_rate": 3.105675675675676e-05, + "loss": 0.2472, + "step": 52040 + }, + { + "epoch": 50.01, + "learning_rate": 3.104324324324325e-05, + "loss": 0.1825, + "step": 52050 + }, + { + "epoch": 50.01, + "learning_rate": 3.102972972972973e-05, + "loss": 0.3603, + "step": 52060 + }, + { + "epoch": 50.01, + "learning_rate": 3.101621621621621e-05, + "loss": 0.3417, + "step": 52070 + }, + { + "epoch": 50.01, + "learning_rate": 3.10027027027027e-05, + "loss": 0.2939, + "step": 52080 + }, + { + "epoch": 50.01, + "learning_rate": 3.098918918918919e-05, + "loss": 0.305, + "step": 52090 + }, + { + "epoch": 50.01, + "learning_rate": 3.0975675675675675e-05, + "loss": 0.3692, + "step": 52100 + }, + { + "epoch": 50.01, + "learning_rate": 3.096216216216216e-05, + "loss": 0.3029, + "step": 52110 + }, + { + "epoch": 50.01, + "learning_rate": 3.094864864864865e-05, + "loss": 0.4304, + "step": 52120 + }, + { + "epoch": 50.01, + "learning_rate": 3.093513513513513e-05, + "loss": 0.3517, + "step": 52130 + }, + { + "epoch": 50.01, + "learning_rate": 3.092162162162162e-05, + "loss": 0.291, + "step": 52140 + }, + { + "epoch": 50.01, + "learning_rate": 3.090810810810811e-05, + "loss": 0.298, + "step": 52150 + }, + { + "epoch": 50.01, + "learning_rate": 3.0894594594594595e-05, + "loss": 0.3083, + "step": 52160 + }, + { + "epoch": 50.01, + "learning_rate": 3.088108108108108e-05, + "loss": 0.3744, + "step": 52170 + }, + { + "epoch": 51.0, + "learning_rate": 3.086756756756757e-05, + "loss": 0.3519, + "step": 52180 + }, + { + "epoch": 51.0, + "learning_rate": 3.085405405405405e-05, + "loss": 0.3355, + "step": 52190 + }, + { + "epoch": 51.0, + "learning_rate": 3.084054054054054e-05, + "loss": 0.3945, + "step": 52200 + }, + { + "epoch": 51.0, + "learning_rate": 3.082702702702703e-05, + "loss": 0.3311, + "step": 52210 + }, + { + "epoch": 51.0, + "learning_rate": 3.0813513513513515e-05, + "loss": 0.3268, + "step": 52220 + }, + { + "epoch": 51.0, + "learning_rate": 3.08e-05, + "loss": 0.362, + "step": 52230 + }, + { + "epoch": 51.0, + "learning_rate": 3.078648648648649e-05, + "loss": 0.4899, + "step": 52240 + }, + { + "epoch": 51.0, + "learning_rate": 3.077297297297297e-05, + "loss": 0.3432, + "step": 52250 + }, + { + "epoch": 51.0, + "learning_rate": 3.075945945945946e-05, + "loss": 0.3157, + "step": 52260 + }, + { + "epoch": 51.0, + "learning_rate": 3.074594594594595e-05, + "loss": 0.3628, + "step": 52270 + }, + { + "epoch": 51.0, + "learning_rate": 3.0732432432432436e-05, + "loss": 0.3155, + "step": 52280 + }, + { + "epoch": 51.0, + "learning_rate": 3.071891891891892e-05, + "loss": 0.3881, + "step": 52290 + }, + { + "epoch": 51.0, + "learning_rate": 3.0705405405405404e-05, + "loss": 0.2325, + "step": 52300 + }, + { + "epoch": 51.0, + "learning_rate": 3.069189189189189e-05, + "loss": 0.2092, + "step": 52310 + }, + { + "epoch": 51.0, + "learning_rate": 3.067837837837838e-05, + "loss": 0.219, + "step": 52320 + }, + { + "epoch": 51.0, + "learning_rate": 3.066486486486487e-05, + "loss": 0.2239, + "step": 52330 + }, + { + "epoch": 51.0, + "learning_rate": 3.0651351351351356e-05, + "loss": 0.951, + "step": 52340 + }, + { + "epoch": 51.0, + "learning_rate": 3.063783783783784e-05, + "loss": 1.2077, + "step": 52350 + }, + { + "epoch": 51.0, + "learning_rate": 3.0624324324324324e-05, + "loss": 2.5539, + "step": 52360 + }, + { + "epoch": 51.0, + "learning_rate": 3.061081081081081e-05, + "loss": 2.3532, + "step": 52370 + }, + { + "epoch": 51.0, + "learning_rate": 3.05972972972973e-05, + "loss": 2.5038, + "step": 52380 + }, + { + "epoch": 51.0, + "learning_rate": 3.058378378378379e-05, + "loss": 2.1864, + "step": 52390 + }, + { + "epoch": 51.0, + "learning_rate": 3.0570270270270276e-05, + "loss": 1.288, + "step": 52400 + }, + { + "epoch": 51.0, + "learning_rate": 3.0556756756756763e-05, + "loss": 1.1868, + "step": 52410 + }, + { + "epoch": 51.0, + "learning_rate": 3.0543243243243244e-05, + "loss": 0.5183, + "step": 52420 + }, + { + "epoch": 51.0, + "learning_rate": 3.052972972972973e-05, + "loss": 0.1401, + "step": 52430 + }, + { + "epoch": 51.0, + "learning_rate": 3.051621621621622e-05, + "loss": 0.1862, + "step": 52440 + }, + { + "epoch": 51.0, + "learning_rate": 3.0502702702702708e-05, + "loss": 0.1435, + "step": 52450 + }, + { + "epoch": 51.0, + "learning_rate": 3.0489189189189192e-05, + "loss": 0.2449, + "step": 52460 + }, + { + "epoch": 51.0, + "learning_rate": 3.0475675675675673e-05, + "loss": 0.3046, + "step": 52470 + }, + { + "epoch": 51.0, + "learning_rate": 3.046216216216216e-05, + "loss": 0.279, + "step": 52480 + }, + { + "epoch": 51.0, + "learning_rate": 3.044864864864865e-05, + "loss": 0.1488, + "step": 52490 + }, + { + "epoch": 51.0, + "learning_rate": 3.0435135135135133e-05, + "loss": 0.126, + "step": 52500 + }, + { + "epoch": 51.0, + "eval_loss": 0.09489134699106216, + "eval_runtime": 129.2723, + "eval_samples_per_second": 27.91, + "eval_steps_per_second": 3.489, + "eval_wer": 0.07836742300703536, + "step": 52500 + }, + { + "epoch": 51.0, + "learning_rate": 3.042162162162162e-05, + "loss": 0.1863, + "step": 52510 + }, + { + "epoch": 51.0, + "learning_rate": 3.040810810810811e-05, + "loss": 0.1857, + "step": 52520 + }, + { + "epoch": 51.0, + "learning_rate": 3.0394594594594593e-05, + "loss": 0.197, + "step": 52530 + }, + { + "epoch": 51.0, + "learning_rate": 3.038108108108108e-05, + "loss": 0.1723, + "step": 52540 + }, + { + "epoch": 51.01, + "learning_rate": 3.036756756756757e-05, + "loss": 0.1602, + "step": 52550 + }, + { + "epoch": 51.01, + "learning_rate": 3.0354054054054053e-05, + "loss": 0.1036, + "step": 52560 + }, + { + "epoch": 51.01, + "learning_rate": 3.034054054054054e-05, + "loss": 0.093, + "step": 52570 + }, + { + "epoch": 51.01, + "learning_rate": 3.032702702702703e-05, + "loss": 0.1507, + "step": 52580 + }, + { + "epoch": 51.01, + "learning_rate": 3.0313513513513513e-05, + "loss": 0.1508, + "step": 52590 + }, + { + "epoch": 51.01, + "learning_rate": 3.03e-05, + "loss": 0.1912, + "step": 52600 + }, + { + "epoch": 51.01, + "learning_rate": 3.0286486486486486e-05, + "loss": 0.2153, + "step": 52610 + }, + { + "epoch": 51.01, + "learning_rate": 3.0272972972972974e-05, + "loss": 0.2069, + "step": 52620 + }, + { + "epoch": 51.01, + "learning_rate": 3.025945945945946e-05, + "loss": 0.1805, + "step": 52630 + }, + { + "epoch": 51.01, + "learning_rate": 3.0245945945945946e-05, + "loss": 0.1997, + "step": 52640 + }, + { + "epoch": 51.01, + "learning_rate": 3.0232432432432434e-05, + "loss": 0.2472, + "step": 52650 + }, + { + "epoch": 51.01, + "learning_rate": 3.021891891891892e-05, + "loss": 0.35, + "step": 52660 + }, + { + "epoch": 51.01, + "learning_rate": 3.0205405405405406e-05, + "loss": 0.3078, + "step": 52670 + }, + { + "epoch": 51.01, + "learning_rate": 3.0191891891891894e-05, + "loss": 0.1834, + "step": 52680 + }, + { + "epoch": 51.01, + "learning_rate": 3.017837837837838e-05, + "loss": 0.3464, + "step": 52690 + }, + { + "epoch": 51.01, + "learning_rate": 3.0164864864864866e-05, + "loss": 0.4192, + "step": 52700 + }, + { + "epoch": 51.01, + "learning_rate": 3.0151351351351354e-05, + "loss": 0.3343, + "step": 52710 + }, + { + "epoch": 51.01, + "learning_rate": 3.013783783783784e-05, + "loss": 0.1057, + "step": 52720 + }, + { + "epoch": 51.01, + "learning_rate": 3.0124324324324326e-05, + "loss": 0.1643, + "step": 52730 + }, + { + "epoch": 51.01, + "learning_rate": 3.0110810810810814e-05, + "loss": 0.1711, + "step": 52740 + }, + { + "epoch": 51.01, + "learning_rate": 3.00972972972973e-05, + "loss": 0.139, + "step": 52750 + }, + { + "epoch": 51.01, + "learning_rate": 3.0083783783783786e-05, + "loss": 0.142, + "step": 52760 + }, + { + "epoch": 51.01, + "learning_rate": 3.0070270270270274e-05, + "loss": 0.1192, + "step": 52770 + }, + { + "epoch": 51.01, + "learning_rate": 3.005675675675676e-05, + "loss": 0.1019, + "step": 52780 + }, + { + "epoch": 51.01, + "learning_rate": 3.0043243243243246e-05, + "loss": 0.2414, + "step": 52790 + }, + { + "epoch": 51.01, + "learning_rate": 3.0029729729729734e-05, + "loss": 0.3565, + "step": 52800 + }, + { + "epoch": 51.01, + "learning_rate": 3.0016216216216218e-05, + "loss": 0.2765, + "step": 52810 + }, + { + "epoch": 51.01, + "learning_rate": 3.0002702702702706e-05, + "loss": 0.191, + "step": 52820 + }, + { + "epoch": 51.01, + "learning_rate": 2.9989189189189194e-05, + "loss": 0.2801, + "step": 52830 + }, + { + "epoch": 51.01, + "learning_rate": 2.9975675675675678e-05, + "loss": 0.3102, + "step": 52840 + }, + { + "epoch": 51.01, + "learning_rate": 2.9962162162162166e-05, + "loss": 0.1769, + "step": 52850 + }, + { + "epoch": 51.01, + "learning_rate": 2.9948648648648654e-05, + "loss": 0.1285, + "step": 52860 + }, + { + "epoch": 51.01, + "learning_rate": 2.9935135135135135e-05, + "loss": 0.2132, + "step": 52870 + }, + { + "epoch": 51.01, + "learning_rate": 2.992162162162162e-05, + "loss": 0.263, + "step": 52880 + }, + { + "epoch": 51.01, + "learning_rate": 2.9908108108108107e-05, + "loss": 0.2607, + "step": 52890 + }, + { + "epoch": 51.01, + "learning_rate": 2.9894594594594595e-05, + "loss": 0.2076, + "step": 52900 + }, + { + "epoch": 51.01, + "learning_rate": 2.988108108108108e-05, + "loss": 0.1826, + "step": 52910 + }, + { + "epoch": 51.01, + "learning_rate": 2.9867567567567567e-05, + "loss": 0.199, + "step": 52920 + }, + { + "epoch": 51.01, + "learning_rate": 2.9854054054054055e-05, + "loss": 0.182, + "step": 52930 + }, + { + "epoch": 51.01, + "learning_rate": 2.984054054054054e-05, + "loss": 0.2206, + "step": 52940 + }, + { + "epoch": 51.01, + "learning_rate": 2.9827027027027027e-05, + "loss": 0.1121, + "step": 52950 + }, + { + "epoch": 51.01, + "learning_rate": 2.9813513513513515e-05, + "loss": 0.1813, + "step": 52960 + }, + { + "epoch": 51.01, + "learning_rate": 2.98e-05, + "loss": 0.2668, + "step": 52970 + }, + { + "epoch": 51.01, + "learning_rate": 2.9786486486486487e-05, + "loss": 0.3536, + "step": 52980 + }, + { + "epoch": 51.01, + "learning_rate": 2.9772972972972975e-05, + "loss": 0.1511, + "step": 52990 + }, + { + "epoch": 51.01, + "learning_rate": 2.975945945945946e-05, + "loss": 0.1738, + "step": 53000 + }, + { + "epoch": 51.01, + "eval_loss": 0.08920902013778687, + "eval_runtime": 130.0159, + "eval_samples_per_second": 27.75, + "eval_steps_per_second": 3.469, + "eval_wer": 0.07729581139635652, + "step": 53000 + }, + { + "epoch": 51.01, + "learning_rate": 2.9745945945945947e-05, + "loss": 0.1849, + "step": 53010 + }, + { + "epoch": 51.01, + "learning_rate": 2.9732432432432435e-05, + "loss": 0.2016, + "step": 53020 + }, + { + "epoch": 51.01, + "learning_rate": 2.971891891891892e-05, + "loss": 0.2394, + "step": 53030 + }, + { + "epoch": 51.01, + "learning_rate": 2.9705405405405407e-05, + "loss": 0.2703, + "step": 53040 + }, + { + "epoch": 51.01, + "learning_rate": 2.969189189189189e-05, + "loss": 0.1736, + "step": 53050 + }, + { + "epoch": 51.01, + "learning_rate": 2.967837837837838e-05, + "loss": 0.1742, + "step": 53060 + }, + { + "epoch": 51.01, + "learning_rate": 2.9664864864864867e-05, + "loss": 0.1935, + "step": 53070 + }, + { + "epoch": 51.01, + "learning_rate": 2.965135135135135e-05, + "loss": 0.3296, + "step": 53080 + }, + { + "epoch": 51.01, + "learning_rate": 2.963783783783784e-05, + "loss": 0.2653, + "step": 53090 + }, + { + "epoch": 51.01, + "learning_rate": 2.9624324324324327e-05, + "loss": 0.3966, + "step": 53100 + }, + { + "epoch": 51.01, + "learning_rate": 2.961081081081081e-05, + "loss": 0.3014, + "step": 53110 + }, + { + "epoch": 51.01, + "learning_rate": 2.95972972972973e-05, + "loss": 0.3767, + "step": 53120 + }, + { + "epoch": 51.01, + "learning_rate": 2.9583783783783787e-05, + "loss": 0.2841, + "step": 53130 + }, + { + "epoch": 51.01, + "learning_rate": 2.957027027027027e-05, + "loss": 0.4306, + "step": 53140 + }, + { + "epoch": 51.01, + "learning_rate": 2.955675675675676e-05, + "loss": 0.329, + "step": 53150 + }, + { + "epoch": 51.01, + "learning_rate": 2.9543243243243247e-05, + "loss": 0.308, + "step": 53160 + }, + { + "epoch": 51.01, + "learning_rate": 2.9529729729729732e-05, + "loss": 0.3054, + "step": 53170 + }, + { + "epoch": 51.01, + "learning_rate": 2.951621621621622e-05, + "loss": 0.2743, + "step": 53180 + }, + { + "epoch": 51.01, + "learning_rate": 2.9502702702702707e-05, + "loss": 0.3338, + "step": 53190 + }, + { + "epoch": 52.0, + "learning_rate": 2.9489189189189192e-05, + "loss": 0.3646, + "step": 53200 + }, + { + "epoch": 52.0, + "learning_rate": 2.947567567567568e-05, + "loss": 0.3877, + "step": 53210 + }, + { + "epoch": 52.0, + "learning_rate": 2.9462162162162167e-05, + "loss": 0.3522, + "step": 53220 + }, + { + "epoch": 52.0, + "learning_rate": 2.9448648648648652e-05, + "loss": 0.3459, + "step": 53230 + }, + { + "epoch": 52.0, + "learning_rate": 2.943513513513514e-05, + "loss": 0.286, + "step": 53240 + }, + { + "epoch": 52.0, + "learning_rate": 2.9421621621621624e-05, + "loss": 0.3481, + "step": 53250 + }, + { + "epoch": 52.0, + "learning_rate": 2.9408108108108112e-05, + "loss": 0.4797, + "step": 53260 + }, + { + "epoch": 52.0, + "learning_rate": 2.9394594594594593e-05, + "loss": 0.4221, + "step": 53270 + }, + { + "epoch": 52.0, + "learning_rate": 2.938108108108108e-05, + "loss": 0.3209, + "step": 53280 + }, + { + "epoch": 52.0, + "learning_rate": 2.9367567567567565e-05, + "loss": 0.3523, + "step": 53290 + }, + { + "epoch": 52.0, + "learning_rate": 2.9354054054054053e-05, + "loss": 0.3828, + "step": 53300 + }, + { + "epoch": 52.0, + "learning_rate": 2.934054054054054e-05, + "loss": 0.3788, + "step": 53310 + }, + { + "epoch": 52.0, + "learning_rate": 2.9327027027027025e-05, + "loss": 0.2301, + "step": 53320 + }, + { + "epoch": 52.0, + "learning_rate": 2.9313513513513513e-05, + "loss": 0.1999, + "step": 53330 + }, + { + "epoch": 52.0, + "learning_rate": 2.93e-05, + "loss": 0.2132, + "step": 53340 + }, + { + "epoch": 52.0, + "learning_rate": 2.9286486486486485e-05, + "loss": 0.2008, + "step": 53350 + }, + { + "epoch": 52.0, + "learning_rate": 2.9272972972972973e-05, + "loss": 0.7753, + "step": 53360 + }, + { + "epoch": 52.0, + "learning_rate": 2.925945945945946e-05, + "loss": 0.6527, + "step": 53370 + }, + { + "epoch": 52.0, + "learning_rate": 2.9245945945945945e-05, + "loss": 2.5558, + "step": 53380 + }, + { + "epoch": 52.0, + "learning_rate": 2.9232432432432433e-05, + "loss": 2.4903, + "step": 53390 + }, + { + "epoch": 52.0, + "learning_rate": 2.921891891891892e-05, + "loss": 2.3606, + "step": 53400 + }, + { + "epoch": 52.0, + "learning_rate": 2.9205405405405405e-05, + "loss": 2.4788, + "step": 53410 + }, + { + "epoch": 52.0, + "learning_rate": 2.9191891891891893e-05, + "loss": 1.2184, + "step": 53420 + }, + { + "epoch": 52.0, + "learning_rate": 2.917837837837838e-05, + "loss": 1.2998, + "step": 53430 + }, + { + "epoch": 52.0, + "learning_rate": 2.9164864864864865e-05, + "loss": 0.7338, + "step": 53440 + }, + { + "epoch": 52.0, + "learning_rate": 2.9151351351351353e-05, + "loss": 0.1864, + "step": 53450 + }, + { + "epoch": 52.0, + "learning_rate": 2.913783783783784e-05, + "loss": 0.1399, + "step": 53460 + }, + { + "epoch": 52.0, + "learning_rate": 2.9124324324324325e-05, + "loss": 0.2138, + "step": 53470 + }, + { + "epoch": 52.0, + "learning_rate": 2.9110810810810813e-05, + "loss": 0.2282, + "step": 53480 + }, + { + "epoch": 52.0, + "learning_rate": 2.9097297297297297e-05, + "loss": 0.3056, + "step": 53490 + }, + { + "epoch": 52.0, + "learning_rate": 2.9083783783783785e-05, + "loss": 0.3389, + "step": 53500 + }, + { + "epoch": 52.0, + "eval_loss": 0.08907531201839447, + "eval_runtime": 130.887, + "eval_samples_per_second": 27.566, + "eval_steps_per_second": 3.446, + "eval_wer": 0.07836742300703536, + "step": 53500 + }, + { + "epoch": 52.0, + "learning_rate": 2.9070270270270273e-05, + "loss": 0.1747, + "step": 53510 + }, + { + "epoch": 52.0, + "learning_rate": 2.9056756756756757e-05, + "loss": 0.093, + "step": 53520 + }, + { + "epoch": 52.0, + "learning_rate": 2.9043243243243245e-05, + "loss": 0.2136, + "step": 53530 + }, + { + "epoch": 52.0, + "learning_rate": 2.9029729729729733e-05, + "loss": 0.1496, + "step": 53540 + }, + { + "epoch": 52.0, + "learning_rate": 2.9016216216216218e-05, + "loss": 0.1979, + "step": 53550 + }, + { + "epoch": 52.0, + "learning_rate": 2.9002702702702705e-05, + "loss": 0.1927, + "step": 53560 + }, + { + "epoch": 52.0, + "learning_rate": 2.8989189189189193e-05, + "loss": 0.1406, + "step": 53570 + }, + { + "epoch": 52.01, + "learning_rate": 2.8975675675675678e-05, + "loss": 0.1378, + "step": 53580 + }, + { + "epoch": 52.01, + "learning_rate": 2.8962162162162165e-05, + "loss": 0.0703, + "step": 53590 + }, + { + "epoch": 52.01, + "learning_rate": 2.8948648648648653e-05, + "loss": 0.1842, + "step": 53600 + }, + { + "epoch": 52.01, + "learning_rate": 2.8935135135135138e-05, + "loss": 0.1538, + "step": 53610 + }, + { + "epoch": 52.01, + "learning_rate": 2.892297297297297e-05, + "loss": 0.1254, + "step": 53620 + }, + { + "epoch": 52.01, + "learning_rate": 2.890945945945946e-05, + "loss": 0.159, + "step": 53630 + }, + { + "epoch": 52.01, + "learning_rate": 2.8895945945945947e-05, + "loss": 0.2631, + "step": 53640 + }, + { + "epoch": 52.01, + "learning_rate": 2.888243243243243e-05, + "loss": 0.1506, + "step": 53650 + }, + { + "epoch": 52.01, + "learning_rate": 2.886891891891892e-05, + "loss": 0.2273, + "step": 53660 + }, + { + "epoch": 52.01, + "learning_rate": 2.8855405405405407e-05, + "loss": 0.242, + "step": 53670 + }, + { + "epoch": 52.01, + "learning_rate": 2.884189189189189e-05, + "loss": 0.2324, + "step": 53680 + }, + { + "epoch": 52.01, + "learning_rate": 2.882837837837838e-05, + "loss": 0.305, + "step": 53690 + }, + { + "epoch": 52.01, + "learning_rate": 2.8814864864864867e-05, + "loss": 0.2243, + "step": 53700 + }, + { + "epoch": 52.01, + "learning_rate": 2.880135135135135e-05, + "loss": 0.2405, + "step": 53710 + }, + { + "epoch": 52.01, + "learning_rate": 2.878783783783784e-05, + "loss": 0.4322, + "step": 53720 + }, + { + "epoch": 52.01, + "learning_rate": 2.8774324324324327e-05, + "loss": 0.397, + "step": 53730 + }, + { + "epoch": 52.01, + "learning_rate": 2.876081081081081e-05, + "loss": 0.1335, + "step": 53740 + }, + { + "epoch": 52.01, + "learning_rate": 2.87472972972973e-05, + "loss": 0.1825, + "step": 53750 + }, + { + "epoch": 52.01, + "learning_rate": 2.8733783783783787e-05, + "loss": 0.1909, + "step": 53760 + }, + { + "epoch": 52.01, + "learning_rate": 2.872027027027027e-05, + "loss": 0.1377, + "step": 53770 + }, + { + "epoch": 52.01, + "learning_rate": 2.870675675675676e-05, + "loss": 0.1419, + "step": 53780 + }, + { + "epoch": 52.01, + "learning_rate": 2.8693243243243244e-05, + "loss": 0.1174, + "step": 53790 + }, + { + "epoch": 52.01, + "learning_rate": 2.867972972972973e-05, + "loss": 0.1375, + "step": 53800 + }, + { + "epoch": 52.01, + "learning_rate": 2.866621621621622e-05, + "loss": 0.157, + "step": 53810 + }, + { + "epoch": 52.01, + "learning_rate": 2.8652702702702704e-05, + "loss": 0.3725, + "step": 53820 + }, + { + "epoch": 52.01, + "learning_rate": 2.863918918918919e-05, + "loss": 0.293, + "step": 53830 + }, + { + "epoch": 52.01, + "learning_rate": 2.862567567567568e-05, + "loss": 0.2275, + "step": 53840 + }, + { + "epoch": 52.01, + "learning_rate": 2.8612162162162164e-05, + "loss": 0.2485, + "step": 53850 + }, + { + "epoch": 52.01, + "learning_rate": 2.859864864864865e-05, + "loss": 0.4084, + "step": 53860 + }, + { + "epoch": 52.01, + "learning_rate": 2.858513513513514e-05, + "loss": 0.1471, + "step": 53870 + }, + { + "epoch": 52.01, + "learning_rate": 2.8571621621621624e-05, + "loss": 0.144, + "step": 53880 + }, + { + "epoch": 52.01, + "learning_rate": 2.855810810810811e-05, + "loss": 0.2286, + "step": 53890 + }, + { + "epoch": 52.01, + "learning_rate": 2.85445945945946e-05, + "loss": 0.2792, + "step": 53900 + }, + { + "epoch": 52.01, + "learning_rate": 2.8531081081081084e-05, + "loss": 0.2652, + "step": 53910 + }, + { + "epoch": 52.01, + "learning_rate": 2.851756756756757e-05, + "loss": 0.2452, + "step": 53920 + }, + { + "epoch": 52.01, + "learning_rate": 2.850405405405406e-05, + "loss": 0.2022, + "step": 53930 + }, + { + "epoch": 52.01, + "learning_rate": 2.8490540540540544e-05, + "loss": 0.2246, + "step": 53940 + }, + { + "epoch": 52.01, + "learning_rate": 2.8477027027027025e-05, + "loss": 0.2011, + "step": 53950 + }, + { + "epoch": 52.01, + "learning_rate": 2.8463513513513513e-05, + "loss": 0.2299, + "step": 53960 + }, + { + "epoch": 52.01, + "learning_rate": 2.845e-05, + "loss": 0.0974, + "step": 53970 + }, + { + "epoch": 52.01, + "learning_rate": 2.8436486486486485e-05, + "loss": 0.1269, + "step": 53980 + }, + { + "epoch": 52.01, + "learning_rate": 2.8422972972972973e-05, + "loss": 0.2349, + "step": 53990 + }, + { + "epoch": 52.01, + "learning_rate": 2.840945945945946e-05, + "loss": 0.5195, + "step": 54000 + }, + { + "epoch": 52.01, + "eval_loss": 0.08595506846904755, + "eval_runtime": 132.3913, + "eval_samples_per_second": 27.253, + "eval_steps_per_second": 3.407, + "eval_wer": 0.07752877044215627, + "step": 54000 + }, + { + "epoch": 52.01, + "learning_rate": 2.8395945945945945e-05, + "loss": 0.1201, + "step": 54010 + }, + { + "epoch": 52.01, + "learning_rate": 2.8382432432432433e-05, + "loss": 0.1195, + "step": 54020 + }, + { + "epoch": 52.01, + "learning_rate": 2.8368918918918917e-05, + "loss": 0.1904, + "step": 54030 + }, + { + "epoch": 52.01, + "learning_rate": 2.8355405405405405e-05, + "loss": 0.2436, + "step": 54040 + }, + { + "epoch": 52.01, + "learning_rate": 2.8341891891891893e-05, + "loss": 0.2594, + "step": 54050 + }, + { + "epoch": 52.01, + "learning_rate": 2.8328378378378377e-05, + "loss": 0.2994, + "step": 54060 + }, + { + "epoch": 52.01, + "learning_rate": 2.8314864864864865e-05, + "loss": 0.2382, + "step": 54070 + }, + { + "epoch": 52.01, + "learning_rate": 2.8301351351351353e-05, + "loss": 0.1418, + "step": 54080 + }, + { + "epoch": 52.01, + "learning_rate": 2.8287837837837837e-05, + "loss": 0.2193, + "step": 54090 + }, + { + "epoch": 52.01, + "learning_rate": 2.8274324324324325e-05, + "loss": 0.2381, + "step": 54100 + }, + { + "epoch": 52.01, + "learning_rate": 2.8260810810810813e-05, + "loss": 0.2814, + "step": 54110 + }, + { + "epoch": 52.01, + "learning_rate": 2.8247297297297297e-05, + "loss": 0.3662, + "step": 54120 + }, + { + "epoch": 52.01, + "learning_rate": 2.8233783783783785e-05, + "loss": 0.2648, + "step": 54130 + }, + { + "epoch": 52.01, + "learning_rate": 2.8220270270270273e-05, + "loss": 0.3762, + "step": 54140 + }, + { + "epoch": 52.01, + "learning_rate": 2.8206756756756757e-05, + "loss": 0.2639, + "step": 54150 + }, + { + "epoch": 52.01, + "learning_rate": 2.8193243243243245e-05, + "loss": 0.39, + "step": 54160 + }, + { + "epoch": 52.01, + "learning_rate": 2.8179729729729733e-05, + "loss": 0.3977, + "step": 54170 + }, + { + "epoch": 52.01, + "learning_rate": 2.8166216216216217e-05, + "loss": 0.251, + "step": 54180 + }, + { + "epoch": 52.01, + "learning_rate": 2.8152702702702705e-05, + "loss": 0.3103, + "step": 54190 + }, + { + "epoch": 52.01, + "learning_rate": 2.8139189189189193e-05, + "loss": 0.3142, + "step": 54200 + }, + { + "epoch": 52.01, + "learning_rate": 2.8125675675675677e-05, + "loss": 0.2584, + "step": 54210 + }, + { + "epoch": 53.0, + "learning_rate": 2.8112162162162165e-05, + "loss": 0.4059, + "step": 54220 + }, + { + "epoch": 53.0, + "learning_rate": 2.809864864864865e-05, + "loss": 0.3863, + "step": 54230 + }, + { + "epoch": 53.0, + "learning_rate": 2.8085135135135137e-05, + "loss": 0.3608, + "step": 54240 + }, + { + "epoch": 53.0, + "learning_rate": 2.8071621621621625e-05, + "loss": 0.3663, + "step": 54250 + }, + { + "epoch": 53.0, + "learning_rate": 2.805810810810811e-05, + "loss": 0.3034, + "step": 54260 + }, + { + "epoch": 53.0, + "learning_rate": 2.8044594594594597e-05, + "loss": 0.3347, + "step": 54270 + }, + { + "epoch": 53.0, + "learning_rate": 2.8031081081081085e-05, + "loss": 0.3622, + "step": 54280 + }, + { + "epoch": 53.0, + "learning_rate": 2.801756756756757e-05, + "loss": 0.4849, + "step": 54290 + }, + { + "epoch": 53.0, + "learning_rate": 2.8004054054054057e-05, + "loss": 0.3233, + "step": 54300 + }, + { + "epoch": 53.0, + "learning_rate": 2.7990540540540545e-05, + "loss": 0.3647, + "step": 54310 + }, + { + "epoch": 53.0, + "learning_rate": 2.797702702702703e-05, + "loss": 0.3879, + "step": 54320 + }, + { + "epoch": 53.0, + "learning_rate": 2.7963513513513517e-05, + "loss": 0.2899, + "step": 54330 + }, + { + "epoch": 53.0, + "learning_rate": 2.7950000000000005e-05, + "loss": 0.3245, + "step": 54340 + }, + { + "epoch": 53.0, + "learning_rate": 2.793648648648649e-05, + "loss": 0.1877, + "step": 54350 + }, + { + "epoch": 53.0, + "learning_rate": 2.792297297297297e-05, + "loss": 0.2435, + "step": 54360 + }, + { + "epoch": 53.0, + "learning_rate": 2.790945945945946e-05, + "loss": 0.2031, + "step": 54370 + }, + { + "epoch": 53.0, + "learning_rate": 2.7895945945945946e-05, + "loss": 0.4888, + "step": 54380 + }, + { + "epoch": 53.0, + "learning_rate": 2.788243243243243e-05, + "loss": 0.8564, + "step": 54390 + }, + { + "epoch": 53.0, + "learning_rate": 2.786891891891892e-05, + "loss": 2.0108, + "step": 54400 + }, + { + "epoch": 53.0, + "learning_rate": 2.7855405405405406e-05, + "loss": 2.4881, + "step": 54410 + }, + { + "epoch": 53.0, + "learning_rate": 2.784189189189189e-05, + "loss": 2.3665, + "step": 54420 + }, + { + "epoch": 53.0, + "learning_rate": 2.782837837837838e-05, + "loss": 2.4833, + "step": 54430 + }, + { + "epoch": 53.0, + "learning_rate": 2.7814864864864866e-05, + "loss": 1.6849, + "step": 54440 + }, + { + "epoch": 53.0, + "learning_rate": 2.780135135135135e-05, + "loss": 1.3753, + "step": 54450 + }, + { + "epoch": 53.0, + "learning_rate": 2.778783783783784e-05, + "loss": 0.8854, + "step": 54460 + }, + { + "epoch": 53.0, + "learning_rate": 2.7774324324324323e-05, + "loss": 0.3523, + "step": 54470 + }, + { + "epoch": 53.0, + "learning_rate": 2.776081081081081e-05, + "loss": 0.1074, + "step": 54480 + }, + { + "epoch": 53.0, + "learning_rate": 2.77472972972973e-05, + "loss": 0.2016, + "step": 54490 + }, + { + "epoch": 53.0, + "learning_rate": 2.7733783783783783e-05, + "loss": 0.1749, + "step": 54500 + }, + { + "epoch": 53.0, + "eval_loss": 0.09646682441234589, + "eval_runtime": 143.7194, + "eval_samples_per_second": 25.104, + "eval_steps_per_second": 3.138, + "eval_wer": 0.07869356567115501, + "step": 54500 + }, + { + "epoch": 53.0, + "learning_rate": 2.772027027027027e-05, + "loss": 0.1723, + "step": 54510 + }, + { + "epoch": 53.0, + "learning_rate": 2.770675675675676e-05, + "loss": 0.3489, + "step": 54520 + }, + { + "epoch": 53.0, + "learning_rate": 2.7693243243243243e-05, + "loss": 0.211, + "step": 54530 + }, + { + "epoch": 53.0, + "learning_rate": 2.767972972972973e-05, + "loss": 0.1005, + "step": 54540 + }, + { + "epoch": 53.0, + "learning_rate": 2.766621621621622e-05, + "loss": 0.174, + "step": 54550 + }, + { + "epoch": 53.0, + "learning_rate": 2.7652702702702703e-05, + "loss": 0.1717, + "step": 54560 + }, + { + "epoch": 53.0, + "learning_rate": 2.763918918918919e-05, + "loss": 0.1953, + "step": 54570 + }, + { + "epoch": 53.0, + "learning_rate": 2.762567567567568e-05, + "loss": 0.1862, + "step": 54580 + }, + { + "epoch": 53.0, + "learning_rate": 2.7612162162162163e-05, + "loss": 0.158, + "step": 54590 + }, + { + "epoch": 53.01, + "learning_rate": 2.759864864864865e-05, + "loss": 0.1156, + "step": 54600 + }, + { + "epoch": 53.01, + "learning_rate": 2.758513513513514e-05, + "loss": 0.1131, + "step": 54610 + }, + { + "epoch": 53.01, + "learning_rate": 2.7571621621621623e-05, + "loss": 0.1276, + "step": 54620 + }, + { + "epoch": 53.01, + "learning_rate": 2.755810810810811e-05, + "loss": 0.1689, + "step": 54630 + }, + { + "epoch": 53.01, + "learning_rate": 2.75445945945946e-05, + "loss": 0.0729, + "step": 54640 + }, + { + "epoch": 53.01, + "learning_rate": 2.7531081081081083e-05, + "loss": 0.1637, + "step": 54650 + }, + { + "epoch": 53.01, + "learning_rate": 2.751756756756757e-05, + "loss": 0.2228, + "step": 54660 + }, + { + "epoch": 53.01, + "learning_rate": 2.7504054054054055e-05, + "loss": 0.2376, + "step": 54670 + }, + { + "epoch": 53.01, + "learning_rate": 2.7490540540540543e-05, + "loss": 0.1885, + "step": 54680 + }, + { + "epoch": 53.01, + "learning_rate": 2.747702702702703e-05, + "loss": 0.2498, + "step": 54690 + }, + { + "epoch": 53.01, + "learning_rate": 2.7463513513513515e-05, + "loss": 0.218, + "step": 54700 + }, + { + "epoch": 53.01, + "learning_rate": 2.7450000000000003e-05, + "loss": 0.3416, + "step": 54710 + }, + { + "epoch": 53.01, + "learning_rate": 2.743648648648649e-05, + "loss": 0.2622, + "step": 54720 + }, + { + "epoch": 53.01, + "learning_rate": 2.7422972972972975e-05, + "loss": 0.2006, + "step": 54730 + }, + { + "epoch": 53.01, + "learning_rate": 2.7409459459459463e-05, + "loss": 0.4478, + "step": 54740 + }, + { + "epoch": 53.01, + "learning_rate": 2.739594594594595e-05, + "loss": 0.4487, + "step": 54750 + }, + { + "epoch": 53.01, + "learning_rate": 2.7382432432432432e-05, + "loss": 0.1762, + "step": 54760 + }, + { + "epoch": 53.01, + "learning_rate": 2.7368918918918916e-05, + "loss": 0.1262, + "step": 54770 + }, + { + "epoch": 53.01, + "learning_rate": 2.7355405405405404e-05, + "loss": 0.1791, + "step": 54780 + }, + { + "epoch": 53.01, + "learning_rate": 2.7341891891891892e-05, + "loss": 0.1319, + "step": 54790 + }, + { + "epoch": 53.01, + "learning_rate": 2.7328378378378376e-05, + "loss": 0.142, + "step": 54800 + }, + { + "epoch": 53.01, + "learning_rate": 2.7314864864864864e-05, + "loss": 0.1358, + "step": 54810 + }, + { + "epoch": 53.01, + "learning_rate": 2.7301351351351352e-05, + "loss": 0.1396, + "step": 54820 + }, + { + "epoch": 53.01, + "learning_rate": 2.7287837837837836e-05, + "loss": 0.1357, + "step": 54830 + }, + { + "epoch": 53.01, + "learning_rate": 2.7274324324324324e-05, + "loss": 0.2958, + "step": 54840 + }, + { + "epoch": 53.01, + "learning_rate": 2.7260810810810812e-05, + "loss": 0.3281, + "step": 54850 + }, + { + "epoch": 53.01, + "learning_rate": 2.7247297297297297e-05, + "loss": 0.2358, + "step": 54860 + }, + { + "epoch": 53.01, + "learning_rate": 2.7233783783783784e-05, + "loss": 0.2077, + "step": 54870 + }, + { + "epoch": 53.01, + "learning_rate": 2.7220270270270272e-05, + "loss": 0.3434, + "step": 54880 + }, + { + "epoch": 53.01, + "learning_rate": 2.7206756756756757e-05, + "loss": 0.239, + "step": 54890 + }, + { + "epoch": 53.01, + "learning_rate": 2.7193243243243244e-05, + "loss": 0.1372, + "step": 54900 + }, + { + "epoch": 53.01, + "learning_rate": 2.717972972972973e-05, + "loss": 0.1629, + "step": 54910 + }, + { + "epoch": 53.01, + "learning_rate": 2.7166216216216217e-05, + "loss": 0.2211, + "step": 54920 + }, + { + "epoch": 53.01, + "learning_rate": 2.7152702702702704e-05, + "loss": 0.2534, + "step": 54930 + }, + { + "epoch": 53.01, + "learning_rate": 2.713918918918919e-05, + "loss": 0.2061, + "step": 54940 + }, + { + "epoch": 53.01, + "learning_rate": 2.7125675675675677e-05, + "loss": 0.1878, + "step": 54950 + }, + { + "epoch": 53.01, + "learning_rate": 2.7112162162162164e-05, + "loss": 0.2288, + "step": 54960 + }, + { + "epoch": 53.01, + "learning_rate": 2.709864864864865e-05, + "loss": 0.1918, + "step": 54970 + }, + { + "epoch": 53.01, + "learning_rate": 2.7085135135135137e-05, + "loss": 0.1654, + "step": 54980 + }, + { + "epoch": 53.01, + "learning_rate": 2.7071621621621624e-05, + "loss": 0.161, + "step": 54990 + }, + { + "epoch": 53.01, + "learning_rate": 2.705810810810811e-05, + "loss": 0.0958, + "step": 55000 + }, + { + "epoch": 53.01, + "eval_loss": 0.08691856265068054, + "eval_runtime": 131.1087, + "eval_samples_per_second": 27.519, + "eval_steps_per_second": 3.44, + "eval_wer": 0.07519917998415879, + "step": 55000 + }, + { + "epoch": 53.01, + "learning_rate": 2.7044594594594597e-05, + "loss": 0.198, + "step": 55010 + }, + { + "epoch": 53.01, + "learning_rate": 2.7031081081081084e-05, + "loss": 0.4401, + "step": 55020 + }, + { + "epoch": 53.01, + "learning_rate": 2.701756756756757e-05, + "loss": 0.2558, + "step": 55030 + }, + { + "epoch": 53.01, + "learning_rate": 2.7004054054054057e-05, + "loss": 0.1541, + "step": 55040 + }, + { + "epoch": 53.01, + "learning_rate": 2.6990540540540545e-05, + "loss": 0.1831, + "step": 55050 + }, + { + "epoch": 53.01, + "learning_rate": 2.697702702702703e-05, + "loss": 0.2156, + "step": 55060 + }, + { + "epoch": 53.01, + "learning_rate": 2.6963513513513517e-05, + "loss": 0.1788, + "step": 55070 + }, + { + "epoch": 53.01, + "learning_rate": 2.6950000000000005e-05, + "loss": 0.2546, + "step": 55080 + }, + { + "epoch": 53.01, + "learning_rate": 2.693648648648649e-05, + "loss": 0.2855, + "step": 55090 + }, + { + "epoch": 53.01, + "learning_rate": 2.6922972972972977e-05, + "loss": 0.151, + "step": 55100 + }, + { + "epoch": 53.01, + "learning_rate": 2.6909459459459465e-05, + "loss": 0.1885, + "step": 55110 + }, + { + "epoch": 53.01, + "learning_rate": 2.689594594594595e-05, + "loss": 0.2073, + "step": 55120 + }, + { + "epoch": 53.01, + "learning_rate": 2.6882432432432437e-05, + "loss": 0.3426, + "step": 55130 + }, + { + "epoch": 53.01, + "learning_rate": 2.686891891891892e-05, + "loss": 0.3297, + "step": 55140 + }, + { + "epoch": 53.01, + "learning_rate": 2.685540540540541e-05, + "loss": 0.2916, + "step": 55150 + }, + { + "epoch": 53.01, + "learning_rate": 2.684189189189189e-05, + "loss": 0.3281, + "step": 55160 + }, + { + "epoch": 53.01, + "learning_rate": 2.6828378378378378e-05, + "loss": 0.2836, + "step": 55170 + }, + { + "epoch": 53.01, + "learning_rate": 2.6814864864864862e-05, + "loss": 0.2929, + "step": 55180 + }, + { + "epoch": 53.01, + "learning_rate": 2.680135135135135e-05, + "loss": 0.4115, + "step": 55190 + }, + { + "epoch": 53.01, + "learning_rate": 2.6787837837837838e-05, + "loss": 0.2936, + "step": 55200 + }, + { + "epoch": 53.01, + "learning_rate": 2.6774324324324322e-05, + "loss": 0.2782, + "step": 55210 + }, + { + "epoch": 53.01, + "learning_rate": 2.676081081081081e-05, + "loss": 0.279, + "step": 55220 + }, + { + "epoch": 53.01, + "learning_rate": 2.6747297297297298e-05, + "loss": 0.225, + "step": 55230 + }, + { + "epoch": 53.01, + "learning_rate": 2.6733783783783782e-05, + "loss": 0.3997, + "step": 55240 + }, + { + "epoch": 54.0, + "learning_rate": 2.672027027027027e-05, + "loss": 0.3348, + "step": 55250 + }, + { + "epoch": 54.0, + "learning_rate": 2.6706756756756758e-05, + "loss": 0.3253, + "step": 55260 + }, + { + "epoch": 54.0, + "learning_rate": 2.6693243243243242e-05, + "loss": 0.417, + "step": 55270 + }, + { + "epoch": 54.0, + "learning_rate": 2.667972972972973e-05, + "loss": 0.2924, + "step": 55280 + }, + { + "epoch": 54.0, + "learning_rate": 2.6666216216216218e-05, + "loss": 0.3033, + "step": 55290 + }, + { + "epoch": 54.0, + "learning_rate": 2.6652702702702702e-05, + "loss": 0.2976, + "step": 55300 + }, + { + "epoch": 54.0, + "learning_rate": 2.663918918918919e-05, + "loss": 0.5006, + "step": 55310 + }, + { + "epoch": 54.0, + "learning_rate": 2.6625675675675678e-05, + "loss": 0.3299, + "step": 55320 + }, + { + "epoch": 54.0, + "learning_rate": 2.6612162162162162e-05, + "loss": 0.3282, + "step": 55330 + }, + { + "epoch": 54.0, + "learning_rate": 2.659864864864865e-05, + "loss": 0.3936, + "step": 55340 + }, + { + "epoch": 54.0, + "learning_rate": 2.6585135135135135e-05, + "loss": 0.3417, + "step": 55350 + }, + { + "epoch": 54.0, + "learning_rate": 2.6571621621621622e-05, + "loss": 0.3433, + "step": 55360 + }, + { + "epoch": 54.0, + "learning_rate": 2.655810810810811e-05, + "loss": 0.2242, + "step": 55370 + }, + { + "epoch": 54.0, + "learning_rate": 2.6544594594594595e-05, + "loss": 0.1959, + "step": 55380 + }, + { + "epoch": 54.0, + "learning_rate": 2.6531081081081083e-05, + "loss": 0.2085, + "step": 55390 + }, + { + "epoch": 54.0, + "learning_rate": 2.651756756756757e-05, + "loss": 0.2433, + "step": 55400 + }, + { + "epoch": 54.0, + "learning_rate": 2.6504054054054055e-05, + "loss": 0.9811, + "step": 55410 + }, + { + "epoch": 54.0, + "learning_rate": 2.6490540540540543e-05, + "loss": 1.3555, + "step": 55420 + }, + { + "epoch": 54.0, + "learning_rate": 2.647702702702703e-05, + "loss": 2.5176, + "step": 55430 + }, + { + "epoch": 54.0, + "learning_rate": 2.6463513513513515e-05, + "loss": 2.3345, + "step": 55440 + }, + { + "epoch": 54.0, + "learning_rate": 2.6450000000000003e-05, + "loss": 2.4774, + "step": 55450 + }, + { + "epoch": 54.0, + "learning_rate": 2.643648648648649e-05, + "loss": 2.0216, + "step": 55460 + }, + { + "epoch": 54.0, + "learning_rate": 2.6422972972972975e-05, + "loss": 1.2743, + "step": 55470 + }, + { + "epoch": 54.0, + "learning_rate": 2.6409459459459463e-05, + "loss": 1.2256, + "step": 55480 + }, + { + "epoch": 54.0, + "learning_rate": 2.639594594594595e-05, + "loss": 0.4296, + "step": 55490 + }, + { + "epoch": 54.0, + "learning_rate": 2.6382432432432435e-05, + "loss": 0.1284, + "step": 55500 + }, + { + "epoch": 54.0, + "eval_loss": 0.0935041531920433, + "eval_runtime": 137.1907, + "eval_samples_per_second": 26.299, + "eval_steps_per_second": 3.287, + "eval_wer": 0.08167544145739179, + "step": 55500 + }, + { + "epoch": 54.0, + "learning_rate": 2.6368918918918923e-05, + "loss": 0.157, + "step": 55510 + }, + { + "epoch": 54.0, + "learning_rate": 2.635540540540541e-05, + "loss": 0.1274, + "step": 55520 + }, + { + "epoch": 54.0, + "learning_rate": 2.6341891891891895e-05, + "loss": 0.2415, + "step": 55530 + }, + { + "epoch": 54.0, + "learning_rate": 2.6328378378378383e-05, + "loss": 0.3106, + "step": 55540 + }, + { + "epoch": 54.0, + "learning_rate": 2.631486486486487e-05, + "loss": 0.2582, + "step": 55550 + }, + { + "epoch": 54.0, + "learning_rate": 2.630135135135135e-05, + "loss": 0.1225, + "step": 55560 + }, + { + "epoch": 54.0, + "learning_rate": 2.6287837837837836e-05, + "loss": 0.1435, + "step": 55570 + }, + { + "epoch": 54.0, + "learning_rate": 2.6274324324324324e-05, + "loss": 0.1758, + "step": 55580 + }, + { + "epoch": 54.0, + "learning_rate": 2.6260810810810808e-05, + "loss": 0.1642, + "step": 55590 + }, + { + "epoch": 54.0, + "learning_rate": 2.6247297297297296e-05, + "loss": 0.1608, + "step": 55600 + }, + { + "epoch": 54.0, + "learning_rate": 2.6233783783783784e-05, + "loss": 0.1645, + "step": 55610 + }, + { + "epoch": 54.01, + "learning_rate": 2.6220270270270268e-05, + "loss": 0.1279, + "step": 55620 + }, + { + "epoch": 54.01, + "learning_rate": 2.6206756756756756e-05, + "loss": 0.0917, + "step": 55630 + }, + { + "epoch": 54.01, + "learning_rate": 2.6193243243243244e-05, + "loss": 0.1183, + "step": 55640 + }, + { + "epoch": 54.01, + "learning_rate": 2.6179729729729728e-05, + "loss": 0.1755, + "step": 55650 + }, + { + "epoch": 54.01, + "learning_rate": 2.6166216216216216e-05, + "loss": 0.1111, + "step": 55660 + }, + { + "epoch": 54.01, + "learning_rate": 2.6152702702702704e-05, + "loss": 0.1483, + "step": 55670 + }, + { + "epoch": 54.01, + "learning_rate": 2.6139189189189188e-05, + "loss": 0.1925, + "step": 55680 + }, + { + "epoch": 54.01, + "learning_rate": 2.6125675675675676e-05, + "loss": 0.2262, + "step": 55690 + }, + { + "epoch": 54.01, + "learning_rate": 2.6112162162162164e-05, + "loss": 0.1742, + "step": 55700 + }, + { + "epoch": 54.01, + "learning_rate": 2.6098648648648648e-05, + "loss": 0.255, + "step": 55710 + }, + { + "epoch": 54.01, + "learning_rate": 2.6085135135135136e-05, + "loss": 0.2327, + "step": 55720 + }, + { + "epoch": 54.01, + "learning_rate": 2.6071621621621624e-05, + "loss": 0.2748, + "step": 55730 + }, + { + "epoch": 54.01, + "learning_rate": 2.6058108108108108e-05, + "loss": 0.2561, + "step": 55740 + }, + { + "epoch": 54.01, + "learning_rate": 2.6044594594594596e-05, + "loss": 0.1823, + "step": 55750 + }, + { + "epoch": 54.01, + "learning_rate": 2.6031081081081084e-05, + "loss": 0.3989, + "step": 55760 + }, + { + "epoch": 54.01, + "learning_rate": 2.601756756756757e-05, + "loss": 0.4244, + "step": 55770 + }, + { + "epoch": 54.01, + "learning_rate": 2.6004054054054056e-05, + "loss": 0.2954, + "step": 55780 + }, + { + "epoch": 54.01, + "learning_rate": 2.599054054054054e-05, + "loss": 0.1038, + "step": 55790 + }, + { + "epoch": 54.01, + "learning_rate": 2.597702702702703e-05, + "loss": 0.1924, + "step": 55800 + }, + { + "epoch": 54.01, + "learning_rate": 2.5963513513513516e-05, + "loss": 0.1729, + "step": 55810 + }, + { + "epoch": 54.01, + "learning_rate": 2.595e-05, + "loss": 0.1277, + "step": 55820 + }, + { + "epoch": 54.01, + "learning_rate": 2.593648648648649e-05, + "loss": 0.1346, + "step": 55830 + }, + { + "epoch": 54.01, + "learning_rate": 2.5922972972972976e-05, + "loss": 0.1121, + "step": 55840 + }, + { + "epoch": 54.01, + "learning_rate": 2.590945945945946e-05, + "loss": 0.0965, + "step": 55850 + }, + { + "epoch": 54.01, + "learning_rate": 2.589594594594595e-05, + "loss": 0.2489, + "step": 55860 + }, + { + "epoch": 54.01, + "learning_rate": 2.5882432432432436e-05, + "loss": 0.3472, + "step": 55870 + }, + { + "epoch": 54.01, + "learning_rate": 2.586891891891892e-05, + "loss": 0.2602, + "step": 55880 + }, + { + "epoch": 54.01, + "learning_rate": 2.585540540540541e-05, + "loss": 0.185, + "step": 55890 + }, + { + "epoch": 54.01, + "learning_rate": 2.5841891891891896e-05, + "loss": 0.2498, + "step": 55900 + }, + { + "epoch": 54.01, + "learning_rate": 2.582837837837838e-05, + "loss": 0.2814, + "step": 55910 + }, + { + "epoch": 54.01, + "learning_rate": 2.581486486486487e-05, + "loss": 0.1642, + "step": 55920 + }, + { + "epoch": 54.01, + "learning_rate": 2.5801351351351356e-05, + "loss": 0.1564, + "step": 55930 + }, + { + "epoch": 54.01, + "learning_rate": 2.578783783783784e-05, + "loss": 0.2391, + "step": 55940 + }, + { + "epoch": 54.01, + "learning_rate": 2.577432432432433e-05, + "loss": 0.2739, + "step": 55950 + }, + { + "epoch": 54.01, + "learning_rate": 2.576081081081081e-05, + "loss": 0.2587, + "step": 55960 + }, + { + "epoch": 54.01, + "learning_rate": 2.5747297297297297e-05, + "loss": 0.2192, + "step": 55970 + }, + { + "epoch": 54.01, + "learning_rate": 2.5733783783783782e-05, + "loss": 0.175, + "step": 55980 + }, + { + "epoch": 54.01, + "learning_rate": 2.572027027027027e-05, + "loss": 0.1586, + "step": 55990 + }, + { + "epoch": 54.01, + "learning_rate": 2.5706756756756757e-05, + "loss": 0.1592, + "step": 56000 + }, + { + "epoch": 54.01, + "eval_loss": 0.08834712207317352, + "eval_runtime": 132.3991, + "eval_samples_per_second": 27.251, + "eval_steps_per_second": 3.406, + "eval_wer": 0.07310254857196105, + "step": 56000 + }, + { + "epoch": 54.01, + "learning_rate": 2.5693243243243242e-05, + "loss": 0.1942, + "step": 56010 + }, + { + "epoch": 54.01, + "learning_rate": 2.567972972972973e-05, + "loss": 0.0881, + "step": 56020 + }, + { + "epoch": 54.01, + "learning_rate": 2.5666216216216214e-05, + "loss": 0.1987, + "step": 56030 + }, + { + "epoch": 54.01, + "learning_rate": 2.5652702702702702e-05, + "loss": 0.2933, + "step": 56040 + }, + { + "epoch": 54.01, + "learning_rate": 2.563918918918919e-05, + "loss": 0.3283, + "step": 56050 + }, + { + "epoch": 54.01, + "learning_rate": 2.5625675675675674e-05, + "loss": 0.1148, + "step": 56060 + }, + { + "epoch": 54.01, + "learning_rate": 2.5612162162162162e-05, + "loss": 0.1263, + "step": 56070 + }, + { + "epoch": 54.01, + "learning_rate": 2.559864864864865e-05, + "loss": 0.1901, + "step": 56080 + }, + { + "epoch": 54.01, + "learning_rate": 2.5585135135135134e-05, + "loss": 0.1775, + "step": 56090 + }, + { + "epoch": 54.01, + "learning_rate": 2.5571621621621622e-05, + "loss": 0.2051, + "step": 56100 + }, + { + "epoch": 54.01, + "learning_rate": 2.555810810810811e-05, + "loss": 0.2923, + "step": 56110 + }, + { + "epoch": 54.01, + "learning_rate": 2.5544594594594594e-05, + "loss": 0.1802, + "step": 56120 + }, + { + "epoch": 54.01, + "learning_rate": 2.5531081081081082e-05, + "loss": 0.1901, + "step": 56130 + }, + { + "epoch": 54.01, + "learning_rate": 2.551756756756757e-05, + "loss": 0.1841, + "step": 56140 + }, + { + "epoch": 54.01, + "learning_rate": 2.5504054054054054e-05, + "loss": 0.3016, + "step": 56150 + }, + { + "epoch": 54.01, + "learning_rate": 2.5490540540540542e-05, + "loss": 0.2425, + "step": 56160 + }, + { + "epoch": 54.01, + "learning_rate": 2.547702702702703e-05, + "loss": 0.3339, + "step": 56170 + }, + { + "epoch": 54.01, + "learning_rate": 2.5463513513513514e-05, + "loss": 0.2584, + "step": 56180 + }, + { + "epoch": 54.01, + "learning_rate": 2.5450000000000002e-05, + "loss": 0.3178, + "step": 56190 + }, + { + "epoch": 54.01, + "learning_rate": 2.543648648648649e-05, + "loss": 0.2749, + "step": 56200 + }, + { + "epoch": 54.01, + "learning_rate": 2.5422972972972974e-05, + "loss": 0.3794, + "step": 56210 + }, + { + "epoch": 54.01, + "learning_rate": 2.5409459459459462e-05, + "loss": 0.3208, + "step": 56220 + }, + { + "epoch": 54.01, + "learning_rate": 2.539594594594595e-05, + "loss": 0.2769, + "step": 56230 + }, + { + "epoch": 54.01, + "learning_rate": 2.5382432432432434e-05, + "loss": 0.282, + "step": 56240 + }, + { + "epoch": 54.01, + "learning_rate": 2.5368918918918922e-05, + "loss": 0.2892, + "step": 56250 + }, + { + "epoch": 54.01, + "learning_rate": 2.5355405405405406e-05, + "loss": 0.3469, + "step": 56260 + }, + { + "epoch": 55.0, + "learning_rate": 2.5341891891891894e-05, + "loss": 0.3425, + "step": 56270 + }, + { + "epoch": 55.0, + "learning_rate": 2.5328378378378382e-05, + "loss": 0.3743, + "step": 56280 + }, + { + "epoch": 55.0, + "learning_rate": 2.5314864864864866e-05, + "loss": 0.3608, + "step": 56290 + }, + { + "epoch": 55.0, + "learning_rate": 2.5301351351351354e-05, + "loss": 0.3748, + "step": 56300 + }, + { + "epoch": 55.0, + "learning_rate": 2.5287837837837842e-05, + "loss": 0.3204, + "step": 56310 + }, + { + "epoch": 55.0, + "learning_rate": 2.5274324324324327e-05, + "loss": 0.3525, + "step": 56320 + }, + { + "epoch": 55.0, + "learning_rate": 2.5260810810810814e-05, + "loss": 0.5141, + "step": 56330 + }, + { + "epoch": 55.0, + "learning_rate": 2.5247297297297302e-05, + "loss": 0.3374, + "step": 56340 + }, + { + "epoch": 55.0, + "learning_rate": 2.5233783783783787e-05, + "loss": 0.3383, + "step": 56350 + }, + { + "epoch": 55.0, + "learning_rate": 2.5220270270270274e-05, + "loss": 0.3588, + "step": 56360 + }, + { + "epoch": 55.0, + "learning_rate": 2.5206756756756755e-05, + "loss": 0.3512, + "step": 56370 + }, + { + "epoch": 55.0, + "learning_rate": 2.5193243243243243e-05, + "loss": 0.3785, + "step": 56380 + }, + { + "epoch": 55.0, + "learning_rate": 2.5179729729729728e-05, + "loss": 0.2198, + "step": 56390 + }, + { + "epoch": 55.0, + "learning_rate": 2.5166216216216215e-05, + "loss": 0.2061, + "step": 56400 + }, + { + "epoch": 55.0, + "learning_rate": 2.5152702702702703e-05, + "loss": 0.2216, + "step": 56410 + }, + { + "epoch": 55.0, + "learning_rate": 2.5139189189189188e-05, + "loss": 0.2079, + "step": 56420 + }, + { + "epoch": 55.0, + "learning_rate": 2.5125675675675675e-05, + "loss": 0.93, + "step": 56430 + }, + { + "epoch": 55.0, + "learning_rate": 2.5112162162162163e-05, + "loss": 0.8218, + "step": 56440 + }, + { + "epoch": 55.0, + "learning_rate": 2.5098648648648648e-05, + "loss": 2.5442, + "step": 56450 + }, + { + "epoch": 55.0, + "learning_rate": 2.5085135135135135e-05, + "loss": 2.3191, + "step": 56460 + }, + { + "epoch": 55.0, + "learning_rate": 2.507162162162162e-05, + "loss": 2.4763, + "step": 56470 + }, + { + "epoch": 55.0, + "learning_rate": 2.5058108108108108e-05, + "loss": 2.4666, + "step": 56480 + }, + { + "epoch": 55.0, + "learning_rate": 2.5044594594594596e-05, + "loss": 1.1196, + "step": 56490 + }, + { + "epoch": 55.0, + "learning_rate": 2.503108108108108e-05, + "loss": 1.3825, + "step": 56500 + }, + { + "epoch": 55.0, + "eval_loss": 0.08699646592140198, + "eval_runtime": 133.9229, + "eval_samples_per_second": 26.941, + "eval_steps_per_second": 3.368, + "eval_wer": 0.08489027628942832, + "step": 56500 + }, + { + "epoch": 55.0, + "learning_rate": 2.5017567567567568e-05, + "loss": 0.5523, + "step": 56510 + }, + { + "epoch": 55.0, + "learning_rate": 2.5004054054054056e-05, + "loss": 0.1611, + "step": 56520 + }, + { + "epoch": 55.0, + "learning_rate": 2.499054054054054e-05, + "loss": 0.1079, + "step": 56530 + }, + { + "epoch": 55.0, + "learning_rate": 2.4977027027027028e-05, + "loss": 0.1633, + "step": 56540 + }, + { + "epoch": 55.0, + "learning_rate": 2.4963513513513516e-05, + "loss": 0.1832, + "step": 56550 + }, + { + "epoch": 55.0, + "learning_rate": 2.495e-05, + "loss": 0.2574, + "step": 56560 + }, + { + "epoch": 55.0, + "learning_rate": 2.4936486486486488e-05, + "loss": 0.2943, + "step": 56570 + }, + { + "epoch": 55.0, + "learning_rate": 2.4922972972972976e-05, + "loss": 0.141, + "step": 56580 + }, + { + "epoch": 55.0, + "learning_rate": 2.490945945945946e-05, + "loss": 0.1038, + "step": 56590 + }, + { + "epoch": 55.0, + "learning_rate": 2.4895945945945948e-05, + "loss": 0.196, + "step": 56600 + }, + { + "epoch": 55.0, + "learning_rate": 2.4882432432432436e-05, + "loss": 0.15, + "step": 56610 + }, + { + "epoch": 55.0, + "learning_rate": 2.486891891891892e-05, + "loss": 0.2123, + "step": 56620 + }, + { + "epoch": 55.0, + "learning_rate": 2.4855405405405408e-05, + "loss": 0.1981, + "step": 56630 + }, + { + "epoch": 55.01, + "learning_rate": 2.4841891891891896e-05, + "loss": 0.1498, + "step": 56640 + }, + { + "epoch": 55.01, + "learning_rate": 2.482837837837838e-05, + "loss": 0.1228, + "step": 56650 + }, + { + "epoch": 55.01, + "learning_rate": 2.4814864864864868e-05, + "loss": 0.0815, + "step": 56660 + }, + { + "epoch": 55.01, + "learning_rate": 2.4801351351351352e-05, + "loss": 0.1448, + "step": 56670 + }, + { + "epoch": 55.01, + "learning_rate": 2.4787837837837837e-05, + "loss": 0.1571, + "step": 56680 + }, + { + "epoch": 55.01, + "learning_rate": 2.4774324324324325e-05, + "loss": 0.1621, + "step": 56690 + }, + { + "epoch": 55.01, + "learning_rate": 2.4760810810810812e-05, + "loss": 0.1626, + "step": 56700 + }, + { + "epoch": 55.01, + "learning_rate": 2.4747297297297297e-05, + "loss": 0.2495, + "step": 56710 + }, + { + "epoch": 55.01, + "learning_rate": 2.4733783783783785e-05, + "loss": 0.1429, + "step": 56720 + }, + { + "epoch": 55.01, + "learning_rate": 2.4720270270270272e-05, + "loss": 0.2152, + "step": 56730 + }, + { + "epoch": 55.01, + "learning_rate": 2.4706756756756757e-05, + "loss": 0.1957, + "step": 56740 + }, + { + "epoch": 55.01, + "learning_rate": 2.4693243243243245e-05, + "loss": 0.2888, + "step": 56750 + }, + { + "epoch": 55.01, + "learning_rate": 2.4679729729729732e-05, + "loss": 0.2732, + "step": 56760 + }, + { + "epoch": 55.01, + "learning_rate": 2.4666216216216217e-05, + "loss": 0.1757, + "step": 56770 + }, + { + "epoch": 55.01, + "learning_rate": 2.4652702702702705e-05, + "loss": 0.3099, + "step": 56780 + }, + { + "epoch": 55.01, + "learning_rate": 2.463918918918919e-05, + "loss": 0.4297, + "step": 56790 + }, + { + "epoch": 55.01, + "learning_rate": 2.4625675675675677e-05, + "loss": 0.3222, + "step": 56800 + }, + { + "epoch": 55.01, + "learning_rate": 2.4612162162162165e-05, + "loss": 0.1122, + "step": 56810 + }, + { + "epoch": 55.01, + "learning_rate": 2.459864864864865e-05, + "loss": 0.1517, + "step": 56820 + }, + { + "epoch": 55.01, + "learning_rate": 2.4585135135135137e-05, + "loss": 0.1723, + "step": 56830 + }, + { + "epoch": 55.01, + "learning_rate": 2.4571621621621625e-05, + "loss": 0.1117, + "step": 56840 + }, + { + "epoch": 55.01, + "learning_rate": 2.455810810810811e-05, + "loss": 0.1072, + "step": 56850 + }, + { + "epoch": 55.01, + "learning_rate": 2.4544594594594597e-05, + "loss": 0.1242, + "step": 56860 + }, + { + "epoch": 55.01, + "learning_rate": 2.453108108108108e-05, + "loss": 0.1242, + "step": 56870 + }, + { + "epoch": 55.01, + "learning_rate": 2.451756756756757e-05, + "loss": 0.1512, + "step": 56880 + }, + { + "epoch": 55.01, + "learning_rate": 2.4504054054054054e-05, + "loss": 0.3986, + "step": 56890 + }, + { + "epoch": 55.01, + "learning_rate": 2.449054054054054e-05, + "loss": 0.2794, + "step": 56900 + }, + { + "epoch": 55.01, + "learning_rate": 2.4477027027027026e-05, + "loss": 0.1646, + "step": 56910 + }, + { + "epoch": 55.01, + "learning_rate": 2.4463513513513514e-05, + "loss": 0.213, + "step": 56920 + }, + { + "epoch": 55.01, + "learning_rate": 2.445e-05, + "loss": 0.3527, + "step": 56930 + }, + { + "epoch": 55.01, + "learning_rate": 2.4436486486486486e-05, + "loss": 0.1352, + "step": 56940 + }, + { + "epoch": 55.01, + "learning_rate": 2.4422972972972974e-05, + "loss": 0.1208, + "step": 56950 + }, + { + "epoch": 55.01, + "learning_rate": 2.440945945945946e-05, + "loss": 0.1822, + "step": 56960 + }, + { + "epoch": 55.01, + "learning_rate": 2.4395945945945946e-05, + "loss": 0.3093, + "step": 56970 + }, + { + "epoch": 55.01, + "learning_rate": 2.4382432432432434e-05, + "loss": 0.2311, + "step": 56980 + }, + { + "epoch": 55.01, + "learning_rate": 2.436891891891892e-05, + "loss": 0.1938, + "step": 56990 + }, + { + "epoch": 55.01, + "learning_rate": 2.4355405405405406e-05, + "loss": 0.1956, + "step": 57000 + }, + { + "epoch": 55.01, + "eval_loss": 0.0833604708313942, + "eval_runtime": 130.1421, + "eval_samples_per_second": 27.724, + "eval_steps_per_second": 3.465, + "eval_wer": 0.0726832222895215, + "step": 57000 + }, + { + "epoch": 55.01, + "learning_rate": 2.4341891891891894e-05, + "loss": 0.2095, + "step": 57010 + }, + { + "epoch": 55.01, + "learning_rate": 2.432837837837838e-05, + "loss": 0.179, + "step": 57020 + }, + { + "epoch": 55.01, + "learning_rate": 2.4314864864864866e-05, + "loss": 0.2167, + "step": 57030 + }, + { + "epoch": 55.01, + "learning_rate": 2.4301351351351354e-05, + "loss": 0.1004, + "step": 57040 + }, + { + "epoch": 55.01, + "learning_rate": 2.428783783783784e-05, + "loss": 0.1139, + "step": 57050 + }, + { + "epoch": 55.01, + "learning_rate": 2.4274324324324326e-05, + "loss": 0.223, + "step": 57060 + }, + { + "epoch": 55.01, + "learning_rate": 2.426081081081081e-05, + "loss": 0.4315, + "step": 57070 + }, + { + "epoch": 55.01, + "learning_rate": 2.4247297297297298e-05, + "loss": 0.1342, + "step": 57080 + }, + { + "epoch": 55.01, + "learning_rate": 2.4233783783783783e-05, + "loss": 0.145, + "step": 57090 + }, + { + "epoch": 55.01, + "learning_rate": 2.422027027027027e-05, + "loss": 0.2103, + "step": 57100 + }, + { + "epoch": 55.01, + "learning_rate": 2.4206756756756758e-05, + "loss": 0.2039, + "step": 57110 + }, + { + "epoch": 55.01, + "learning_rate": 2.4193243243243243e-05, + "loss": 0.1827, + "step": 57120 + }, + { + "epoch": 55.01, + "learning_rate": 2.417972972972973e-05, + "loss": 0.2463, + "step": 57130 + }, + { + "epoch": 55.01, + "learning_rate": 2.4166216216216218e-05, + "loss": 0.2168, + "step": 57140 + }, + { + "epoch": 55.01, + "learning_rate": 2.4152702702702703e-05, + "loss": 0.1486, + "step": 57150 + }, + { + "epoch": 55.01, + "learning_rate": 2.413918918918919e-05, + "loss": 0.1878, + "step": 57160 + }, + { + "epoch": 55.01, + "learning_rate": 2.4125675675675678e-05, + "loss": 0.2544, + "step": 57170 + }, + { + "epoch": 55.01, + "learning_rate": 2.4112162162162163e-05, + "loss": 0.2435, + "step": 57180 + }, + { + "epoch": 55.01, + "learning_rate": 2.409864864864865e-05, + "loss": 0.3812, + "step": 57190 + }, + { + "epoch": 55.01, + "learning_rate": 2.4085135135135138e-05, + "loss": 0.2824, + "step": 57200 + }, + { + "epoch": 55.01, + "learning_rate": 2.4071621621621623e-05, + "loss": 0.3808, + "step": 57210 + }, + { + "epoch": 55.01, + "learning_rate": 2.405810810810811e-05, + "loss": 0.323, + "step": 57220 + }, + { + "epoch": 55.01, + "learning_rate": 2.4044594594594598e-05, + "loss": 0.3917, + "step": 57230 + }, + { + "epoch": 55.01, + "learning_rate": 2.4031081081081083e-05, + "loss": 0.339, + "step": 57240 + }, + { + "epoch": 55.01, + "learning_rate": 2.401756756756757e-05, + "loss": 0.2448, + "step": 57250 + }, + { + "epoch": 55.01, + "learning_rate": 2.4005405405405408e-05, + "loss": 0.2597, + "step": 57260 + }, + { + "epoch": 55.01, + "learning_rate": 2.3991891891891892e-05, + "loss": 0.3101, + "step": 57270 + }, + { + "epoch": 55.01, + "learning_rate": 2.397837837837838e-05, + "loss": 0.2709, + "step": 57280 + }, + { + "epoch": 56.0, + "learning_rate": 2.3964864864864868e-05, + "loss": 0.339, + "step": 57290 + }, + { + "epoch": 56.0, + "learning_rate": 2.3951351351351352e-05, + "loss": 0.3359, + "step": 57300 + }, + { + "epoch": 56.0, + "learning_rate": 2.393783783783784e-05, + "loss": 0.3377, + "step": 57310 + }, + { + "epoch": 56.0, + "learning_rate": 2.3924324324324328e-05, + "loss": 0.3551, + "step": 57320 + }, + { + "epoch": 56.0, + "learning_rate": 2.3910810810810812e-05, + "loss": 0.288, + "step": 57330 + }, + { + "epoch": 56.0, + "learning_rate": 2.38972972972973e-05, + "loss": 0.3581, + "step": 57340 + }, + { + "epoch": 56.0, + "learning_rate": 2.3883783783783784e-05, + "loss": 0.4098, + "step": 57350 + }, + { + "epoch": 56.0, + "learning_rate": 2.387027027027027e-05, + "loss": 0.446, + "step": 57360 + }, + { + "epoch": 56.0, + "learning_rate": 2.3856756756756756e-05, + "loss": 0.3027, + "step": 57370 + }, + { + "epoch": 56.0, + "learning_rate": 2.3843243243243244e-05, + "loss": 0.3397, + "step": 57380 + }, + { + "epoch": 56.0, + "learning_rate": 2.382972972972973e-05, + "loss": 0.3555, + "step": 57390 + }, + { + "epoch": 56.0, + "learning_rate": 2.3816216216216216e-05, + "loss": 0.3326, + "step": 57400 + }, + { + "epoch": 56.0, + "learning_rate": 2.3802702702702704e-05, + "loss": 0.282, + "step": 57410 + }, + { + "epoch": 56.0, + "learning_rate": 2.378918918918919e-05, + "loss": 0.2117, + "step": 57420 + }, + { + "epoch": 56.0, + "learning_rate": 2.3775675675675677e-05, + "loss": 0.2099, + "step": 57430 + }, + { + "epoch": 56.0, + "learning_rate": 2.3762162162162164e-05, + "loss": 0.2177, + "step": 57440 + }, + { + "epoch": 56.0, + "learning_rate": 2.374864864864865e-05, + "loss": 0.5614, + "step": 57450 + }, + { + "epoch": 56.0, + "learning_rate": 2.3735135135135137e-05, + "loss": 0.7639, + "step": 57460 + }, + { + "epoch": 56.0, + "learning_rate": 2.3721621621621624e-05, + "loss": 2.1767, + "step": 57470 + }, + { + "epoch": 56.0, + "learning_rate": 2.370810810810811e-05, + "loss": 2.4718, + "step": 57480 + }, + { + "epoch": 56.0, + "learning_rate": 2.3694594594594597e-05, + "loss": 2.3706, + "step": 57490 + }, + { + "epoch": 56.0, + "learning_rate": 2.3681081081081084e-05, + "loss": 2.4653, + "step": 57500 + }, + { + "epoch": 56.0, + "eval_loss": 0.08348675817251205, + "eval_runtime": 129.2168, + "eval_samples_per_second": 27.922, + "eval_steps_per_second": 3.49, + "eval_wer": 0.0811163397474724, + "step": 57500 } ], "max_steps": 75000, "num_train_epochs": 9223372036854775807, - "total_flos": 1.3193673854990254e+20, + "total_flos": 3.790378322257517e+20, "trial_name": null, "trial_params": null }