diff --git "a/trainer_state.json" "b/trainer_state.json" --- "a/trainer_state.json" +++ "b/trainer_state.json" @@ -1,18205 +1,5245 @@ { - "best_metric": 0.4693412184715271, - "best_model_checkpoint": "ai-light-dance_singing3_ft_wav2vec2-large-xlsr-53-v1-5gram/checkpoint-288", - "epoch": 99.9974025974026, - "global_step": 28800, + "best_metric": 0.45630136132240295, + "best_model_checkpoint": "ai-light-dance_singing3_ft_wav2vec2-large-xlsr-53-v1-5gram/checkpoint-504", + "epoch": 99.99653979238754, + "global_step": 7200, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { - "epoch": 0.03, - "learning_rate": 8e-08, - "loss": 0.3037, + "epoch": 0.14, + "learning_rate": 5e-06, + "loss": 0.48, "step": 10 }, { - "epoch": 0.07, - "learning_rate": 1.6e-07, - "loss": 0.3044, + "epoch": 0.28, + "learning_rate": 1e-05, + "loss": 0.4916, "step": 20 }, { - "epoch": 0.1, - "learning_rate": 2.32e-07, - "loss": 0.2922, + "epoch": 0.42, + "learning_rate": 1.45e-05, + "loss": 0.4674, "step": 30 }, { - "epoch": 0.14, - "learning_rate": 3.12e-07, - "loss": 0.3287, + "epoch": 0.55, + "learning_rate": 1.9500000000000003e-05, + "loss": 0.4695, "step": 40 }, { - "epoch": 0.17, - "learning_rate": 3.92e-07, - "loss": 0.3189, + "epoch": 0.69, + "learning_rate": 2.45e-05, + "loss": 0.4717, "step": 50 }, { - "epoch": 0.21, - "learning_rate": 4.64e-07, - "loss": 0.2791, + "epoch": 0.83, + "learning_rate": 2.95e-05, + "loss": 0.4723, "step": 60 }, { - "epoch": 0.24, - "learning_rate": 5.44e-07, - "loss": 0.2892, + "epoch": 0.97, + "learning_rate": 3.45e-05, + "loss": 0.504, "step": 70 }, { - "epoch": 0.28, - "learning_rate": 6.24e-07, - "loss": 0.3011, + "epoch": 1.0, + "eval_loss": 0.48100385069847107, + "eval_runtime": 127.9947, + "eval_samples_per_second": 4.156, + "eval_steps_per_second": 0.523, + "eval_wer": 0.23127852413704442, + "step": 72 + }, + { + "epoch": 1.11, + "learning_rate": 3.9500000000000005e-05, + "loss": 0.4949, "step": 80 }, { - "epoch": 0.31, - "learning_rate": 7.04e-07, - "loss": 0.3154, + "epoch": 1.25, + "learning_rate": 4.4500000000000004e-05, + "loss": 0.4909, "step": 90 }, { - "epoch": 0.35, - "learning_rate": 7.84e-07, - "loss": 0.3242, + "epoch": 1.39, + "learning_rate": 4.9500000000000004e-05, + "loss": 0.4735, "step": 100 }, { - "epoch": 0.38, - "learning_rate": 8.639999999999999e-07, - "loss": 0.2931, + "epoch": 1.53, + "learning_rate": 4.993661971830986e-05, + "loss": 0.5011, "step": 110 }, { - "epoch": 0.42, - "learning_rate": 9.439999999999999e-07, - "loss": 0.2822, + "epoch": 1.66, + "learning_rate": 4.98661971830986e-05, + "loss": 0.5118, "step": 120 }, { - "epoch": 0.45, - "learning_rate": 1.024e-06, - "loss": 0.3186, + "epoch": 1.8, + "learning_rate": 4.9795774647887327e-05, + "loss": 0.5348, "step": 130 }, { - "epoch": 0.48, - "learning_rate": 1.1040000000000001e-06, - "loss": 0.3111, + "epoch": 1.94, + "learning_rate": 4.972535211267606e-05, + "loss": 0.5274, "step": 140 }, { - "epoch": 0.52, - "learning_rate": 1.1839999999999998e-06, - "loss": 0.2909, + "epoch": 2.0, + "eval_loss": 0.4828048348426819, + "eval_runtime": 129.7646, + "eval_samples_per_second": 4.1, + "eval_steps_per_second": 0.516, + "eval_wer": 0.23879925435495275, + "step": 144 + }, + { + "epoch": 2.08, + "learning_rate": 4.965492957746479e-05, + "loss": 0.5455, "step": 150 }, { - "epoch": 0.55, - "learning_rate": 1.2639999999999999e-06, - "loss": 0.299, + "epoch": 2.22, + "learning_rate": 4.9584507042253526e-05, + "loss": 0.518, "step": 160 }, { - "epoch": 0.59, - "learning_rate": 1.344e-06, - "loss": 0.3338, + "epoch": 2.36, + "learning_rate": 4.951408450704226e-05, + "loss": 0.5118, "step": 170 }, { - "epoch": 0.62, - "learning_rate": 1.4239999999999998e-06, - "loss": 0.2607, + "epoch": 2.5, + "learning_rate": 4.944366197183099e-05, + "loss": 0.5116, "step": 180 }, { - "epoch": 0.66, - "learning_rate": 1.504e-06, - "loss": 0.2763, + "epoch": 2.64, + "learning_rate": 4.9373239436619725e-05, + "loss": 0.4943, "step": 190 }, { - "epoch": 0.69, - "learning_rate": 1.584e-06, - "loss": 0.296, + "epoch": 2.78, + "learning_rate": 4.930281690140845e-05, + "loss": 0.5187, "step": 200 }, { - "epoch": 0.73, - "learning_rate": 1.6639999999999999e-06, - "loss": 0.2896, + "epoch": 2.91, + "learning_rate": 4.923239436619719e-05, + "loss": 0.5021, "step": 210 }, { - "epoch": 0.76, - "learning_rate": 1.744e-06, - "loss": 0.2852, + "epoch": 3.0, + "eval_loss": 0.5007606744766235, + "eval_runtime": 129.4059, + "eval_samples_per_second": 4.111, + "eval_steps_per_second": 0.518, + "eval_wer": 0.2408562062094234, + "step": 216 + }, + { + "epoch": 3.06, + "learning_rate": 4.916901408450704e-05, + "loss": 0.5289, "step": 220 }, { - "epoch": 0.8, - "learning_rate": 1.824e-06, - "loss": 0.2691, + "epoch": 3.19, + "learning_rate": 4.909859154929578e-05, + "loss": 0.4999, "step": 230 }, { - "epoch": 0.83, - "learning_rate": 1.904e-06, - "loss": 0.3116, + "epoch": 3.33, + "learning_rate": 4.9028169014084506e-05, + "loss": 0.535, "step": 240 }, { - "epoch": 0.87, - "learning_rate": 1.976e-06, - "loss": 0.3348, + "epoch": 3.47, + "learning_rate": 4.895774647887324e-05, + "loss": 0.5052, "step": 250 }, { - "epoch": 0.9, - "learning_rate": 2.056e-06, - "loss": 0.2831, + "epoch": 3.61, + "learning_rate": 4.888732394366197e-05, + "loss": 0.5107, "step": 260 }, { - "epoch": 0.94, - "learning_rate": 2.136e-06, - "loss": 0.2814, + "epoch": 3.75, + "learning_rate": 4.8816901408450705e-05, + "loss": 0.5191, "step": 270 }, { - "epoch": 0.97, - "learning_rate": 2.216e-06, - "loss": 0.3028, + "epoch": 3.89, + "learning_rate": 4.874647887323944e-05, + "loss": 0.4956, "step": 280 }, { - "epoch": 1.0, - "eval_loss": 0.4693412184715271, - "eval_runtime": 130.2494, - "eval_samples_per_second": 4.084, - "eval_steps_per_second": 1.021, - "eval_wer": 0.2046024297743781, + "epoch": 4.0, + "eval_loss": 0.48966091871261597, + "eval_runtime": 127.0197, + "eval_samples_per_second": 4.188, + "eval_steps_per_second": 0.527, + "eval_wer": 0.24008484926399692, "step": 288 }, { - "epoch": 1.01, - "learning_rate": 2.2959999999999997e-06, - "loss": 0.3338, + "epoch": 4.03, + "learning_rate": 4.867605633802817e-05, + "loss": 0.5342, "step": 290 }, { - "epoch": 1.04, - "learning_rate": 2.3759999999999998e-06, - "loss": 0.2803, + "epoch": 4.17, + "learning_rate": 4.8605633802816904e-05, + "loss": 0.4984, "step": 300 }, { - "epoch": 1.08, - "learning_rate": 2.456e-06, - "loss": 0.2859, + "epoch": 4.3, + "learning_rate": 4.853521126760563e-05, + "loss": 0.4968, "step": 310 }, { - "epoch": 1.11, - "learning_rate": 2.536e-06, - "loss": 0.282, + "epoch": 4.44, + "learning_rate": 4.846478873239437e-05, + "loss": 0.5207, "step": 320 }, { - "epoch": 1.15, - "learning_rate": 2.616e-06, - "loss": 0.2971, + "epoch": 4.58, + "learning_rate": 4.83943661971831e-05, + "loss": 0.5271, "step": 330 }, { - "epoch": 1.18, - "learning_rate": 2.696e-06, - "loss": 0.2832, + "epoch": 4.72, + "learning_rate": 4.832394366197183e-05, + "loss": 0.5277, "step": 340 }, { - "epoch": 1.21, - "learning_rate": 2.7759999999999998e-06, - "loss": 0.2776, + "epoch": 4.86, + "learning_rate": 4.8253521126760566e-05, + "loss": 0.5238, "step": 350 }, { - "epoch": 1.25, - "learning_rate": 2.856e-06, - "loss": 0.2812, + "epoch": 5.0, + "learning_rate": 4.8183098591549295e-05, + "loss": 0.543, + "step": 360 + }, + { + "epoch": 5.0, + "eval_loss": 0.5795093774795532, + "eval_runtime": 130.2268, + "eval_samples_per_second": 4.085, + "eval_steps_per_second": 0.514, + "eval_wer": 0.24734846050009643, "step": 360 }, { - "epoch": 1.28, - "learning_rate": 2.936e-06, - "loss": 0.2765, + "epoch": 5.14, + "learning_rate": 4.811267605633803e-05, + "loss": 0.5184, "step": 370 }, { - "epoch": 1.32, - "learning_rate": 3.016e-06, - "loss": 0.2905, + "epoch": 5.28, + "learning_rate": 4.8042253521126765e-05, + "loss": 0.543, "step": 380 }, { - "epoch": 1.35, - "learning_rate": 3.096e-06, - "loss": 0.2992, + "epoch": 5.42, + "learning_rate": 4.7971830985915494e-05, + "loss": 0.5174, "step": 390 }, { - "epoch": 1.39, - "learning_rate": 3.176e-06, - "loss": 0.2972, + "epoch": 5.55, + "learning_rate": 4.790140845070423e-05, + "loss": 0.5021, "step": 400 }, { - "epoch": 1.42, - "learning_rate": 3.256e-06, - "loss": 0.2884, + "epoch": 5.69, + "learning_rate": 4.783098591549296e-05, + "loss": 0.5295, "step": 410 }, { - "epoch": 1.46, - "learning_rate": 3.336e-06, - "loss": 0.2667, + "epoch": 5.83, + "learning_rate": 4.776056338028169e-05, + "loss": 0.534, "step": 420 }, { - "epoch": 1.49, - "learning_rate": 3.4159999999999996e-06, - "loss": 0.3059, + "epoch": 5.97, + "learning_rate": 4.769014084507042e-05, + "loss": 0.5239, "step": 430 }, { - "epoch": 1.53, - "learning_rate": 3.4959999999999996e-06, - "loss": 0.2853, + "epoch": 6.0, + "eval_loss": 0.5018669366836548, + "eval_runtime": 126.6372, + "eval_samples_per_second": 4.201, + "eval_steps_per_second": 0.529, + "eval_wer": 0.24901973388185383, + "step": 432 + }, + { + "epoch": 6.11, + "learning_rate": 4.761971830985916e-05, + "loss": 0.5529, "step": 440 }, { - "epoch": 1.56, - "learning_rate": 3.5759999999999997e-06, - "loss": 0.2775, + "epoch": 6.25, + "learning_rate": 4.754929577464789e-05, + "loss": 0.5127, "step": 450 }, { - "epoch": 1.6, - "learning_rate": 3.656e-06, - "loss": 0.2873, + "epoch": 6.39, + "learning_rate": 4.747887323943662e-05, + "loss": 0.5299, "step": 460 }, { - "epoch": 1.63, - "learning_rate": 3.736e-06, - "loss": 0.2874, + "epoch": 6.53, + "learning_rate": 4.7408450704225356e-05, + "loss": 0.5447, "step": 470 }, { - "epoch": 1.66, - "learning_rate": 3.8159999999999995e-06, - "loss": 0.2988, + "epoch": 6.66, + "learning_rate": 4.7338028169014084e-05, + "loss": 0.5173, "step": 480 }, { - "epoch": 1.7, - "learning_rate": 3.896e-06, - "loss": 0.2957, + "epoch": 6.8, + "learning_rate": 4.726760563380282e-05, + "loss": 0.5003, "step": 490 }, { - "epoch": 1.73, - "learning_rate": 3.976e-06, - "loss": 0.3037, + "epoch": 6.94, + "learning_rate": 4.7197183098591555e-05, + "loss": 0.4928, "step": 500 }, { - "epoch": 1.77, - "learning_rate": 3.999010600706714e-06, - "loss": 0.2873, + "epoch": 7.0, + "eval_loss": 0.45630136132240295, + "eval_runtime": 126.0852, + "eval_samples_per_second": 4.219, + "eval_steps_per_second": 0.531, + "eval_wer": 0.23121424439159222, + "step": 504 + }, + { + "epoch": 7.08, + "learning_rate": 4.7133802816901415e-05, + "loss": 0.534, "step": 510 }, { - "epoch": 1.8, - "learning_rate": 3.997597173144876e-06, - "loss": 0.2904, + "epoch": 7.22, + "learning_rate": 4.7063380281690144e-05, + "loss": 0.5019, "step": 520 }, { - "epoch": 1.84, - "learning_rate": 3.996183745583039e-06, - "loss": 0.3108, + "epoch": 7.36, + "learning_rate": 4.699295774647888e-05, + "loss": 0.5234, "step": 530 }, { - "epoch": 1.87, - "learning_rate": 3.994770318021201e-06, - "loss": 0.3071, + "epoch": 7.5, + "learning_rate": 4.692253521126761e-05, + "loss": 0.5523, "step": 540 }, { - "epoch": 1.91, - "learning_rate": 3.993356890459364e-06, - "loss": 0.2944, + "epoch": 7.64, + "learning_rate": 4.685211267605634e-05, + "loss": 0.5048, "step": 550 }, { - "epoch": 1.94, - "learning_rate": 3.9919434628975264e-06, - "loss": 0.2848, + "epoch": 7.78, + "learning_rate": 4.678169014084508e-05, + "loss": 0.5298, "step": 560 }, { - "epoch": 1.98, - "learning_rate": 3.990530035335689e-06, - "loss": 0.2986, + "epoch": 7.91, + "learning_rate": 4.6711267605633806e-05, + "loss": 0.5236, "step": 570 }, { - "epoch": 2.0, - "eval_loss": 0.48284950852394104, - "eval_runtime": 130.0663, - "eval_samples_per_second": 4.09, - "eval_steps_per_second": 1.023, - "eval_wer": 0.20575946519251784, + "epoch": 8.0, + "eval_loss": 0.5311173796653748, + "eval_runtime": 132.2426, + "eval_samples_per_second": 4.023, + "eval_steps_per_second": 0.507, + "eval_wer": 0.2647682715176448, "step": 576 }, { - "epoch": 2.01, - "learning_rate": 3.989116607773851e-06, - "loss": 0.3048, + "epoch": 8.06, + "learning_rate": 4.664084507042254e-05, + "loss": 0.5346, "step": 580 }, { - "epoch": 2.05, - "learning_rate": 3.987703180212014e-06, - "loss": 0.2977, + "epoch": 8.19, + "learning_rate": 4.657042253521127e-05, + "loss": 0.5205, "step": 590 }, { - "epoch": 2.08, - "learning_rate": 3.986289752650176e-06, - "loss": 0.2796, + "epoch": 8.33, + "learning_rate": 4.6500000000000005e-05, + "loss": 0.5074, "step": 600 }, { - "epoch": 2.12, - "learning_rate": 3.984876325088339e-06, - "loss": 0.2934, + "epoch": 8.47, + "learning_rate": 4.6429577464788734e-05, + "loss": 0.5188, "step": 610 }, { - "epoch": 2.15, - "learning_rate": 3.983462897526502e-06, - "loss": 0.3091, + "epoch": 8.61, + "learning_rate": 4.635915492957747e-05, + "loss": 0.5274, "step": 620 }, { - "epoch": 2.19, - "learning_rate": 3.982049469964665e-06, - "loss": 0.2864, + "epoch": 8.75, + "learning_rate": 4.6288732394366204e-05, + "loss": 0.5385, "step": 630 }, { - "epoch": 2.22, - "learning_rate": 3.9806360424028266e-06, - "loss": 0.2948, + "epoch": 8.89, + "learning_rate": 4.6218309859154926e-05, + "loss": 0.5059, "step": 640 }, { - "epoch": 2.26, - "learning_rate": 3.979222614840989e-06, - "loss": 0.3012, + "epoch": 9.0, + "eval_loss": 0.4728511869907379, + "eval_runtime": 125.7839, + "eval_samples_per_second": 4.229, + "eval_steps_per_second": 0.533, + "eval_wer": 0.22935013177347818, + "step": 648 + }, + { + "epoch": 9.03, + "learning_rate": 4.614788732394366e-05, + "loss": 0.5293, "step": 650 }, { - "epoch": 2.29, - "learning_rate": 3.977809187279151e-06, - "loss": 0.2824, + "epoch": 9.17, + "learning_rate": 4.60774647887324e-05, + "loss": 0.5124, "step": 660 }, { - "epoch": 2.33, - "learning_rate": 3.976395759717314e-06, - "loss": 0.3008, + "epoch": 9.3, + "learning_rate": 4.6007042253521125e-05, + "loss": 0.5266, "step": 670 }, { - "epoch": 2.36, - "learning_rate": 3.974982332155477e-06, - "loss": 0.3, + "epoch": 9.44, + "learning_rate": 4.593661971830986e-05, + "loss": 0.5256, "step": 680 }, { - "epoch": 2.39, - "learning_rate": 3.97356890459364e-06, - "loss": 0.2641, + "epoch": 9.58, + "learning_rate": 4.586619718309859e-05, + "loss": 0.517, "step": 690 }, { - "epoch": 2.43, - "learning_rate": 3.972155477031802e-06, - "loss": 0.2677, + "epoch": 9.72, + "learning_rate": 4.5795774647887324e-05, + "loss": 0.5001, "step": 700 }, { - "epoch": 2.46, - "learning_rate": 3.970742049469965e-06, - "loss": 0.2851, + "epoch": 9.86, + "learning_rate": 4.572535211267606e-05, + "loss": 0.4924, "step": 710 }, { - "epoch": 2.5, - "learning_rate": 3.969328621908127e-06, - "loss": 0.2923, + "epoch": 10.0, + "learning_rate": 4.565492957746479e-05, + "loss": 0.5064, + "step": 720 + }, + { + "epoch": 10.0, + "eval_loss": 0.5000531673431396, + "eval_runtime": 126.1137, + "eval_samples_per_second": 4.218, + "eval_steps_per_second": 0.531, + "eval_wer": 0.2464485440637655, "step": 720 }, { - "epoch": 2.53, - "learning_rate": 3.9679151943462895e-06, - "loss": 0.2957, + "epoch": 10.14, + "learning_rate": 4.558450704225352e-05, + "loss": 0.5004, "step": 730 }, { - "epoch": 2.57, - "learning_rate": 3.966501766784452e-06, - "loss": 0.2915, + "epoch": 10.28, + "learning_rate": 4.551408450704225e-05, + "loss": 0.522, "step": 740 }, { - "epoch": 2.6, - "learning_rate": 3.965088339222615e-06, - "loss": 0.2786, + "epoch": 10.42, + "learning_rate": 4.544366197183099e-05, + "loss": 0.5214, "step": 750 }, { - "epoch": 2.64, - "learning_rate": 3.963674911660777e-06, - "loss": 0.3032, + "epoch": 10.55, + "learning_rate": 4.537323943661972e-05, + "loss": 0.5257, "step": 760 }, { - "epoch": 2.67, - "learning_rate": 3.96226148409894e-06, - "loss": 0.3004, + "epoch": 10.69, + "learning_rate": 4.530281690140845e-05, + "loss": 0.5166, "step": 770 }, { - "epoch": 2.71, - "learning_rate": 3.960848056537102e-06, - "loss": 0.2904, + "epoch": 10.83, + "learning_rate": 4.5232394366197186e-05, + "loss": 0.516, "step": 780 }, { - "epoch": 2.74, - "learning_rate": 3.959434628975265e-06, - "loss": 0.2702, + "epoch": 10.97, + "learning_rate": 4.5161971830985914e-05, + "loss": 0.5032, "step": 790 }, { - "epoch": 2.78, - "learning_rate": 3.958021201413428e-06, - "loss": 0.2831, + "epoch": 11.0, + "eval_loss": 0.4968065619468689, + "eval_runtime": 127.6202, + "eval_samples_per_second": 4.169, + "eval_steps_per_second": 0.525, + "eval_wer": 0.2335283152278717, + "step": 792 + }, + { + "epoch": 11.11, + "learning_rate": 4.509154929577465e-05, + "loss": 0.5208, "step": 800 }, { - "epoch": 2.81, - "learning_rate": 3.95660777385159e-06, - "loss": 0.2874, + "epoch": 11.25, + "learning_rate": 4.502112676056338e-05, + "loss": 0.5148, "step": 810 }, { - "epoch": 2.85, - "learning_rate": 3.9551943462897525e-06, - "loss": 0.2791, + "epoch": 11.39, + "learning_rate": 4.4950704225352113e-05, + "loss": 0.5035, "step": 820 }, { - "epoch": 2.88, - "learning_rate": 3.953780918727915e-06, - "loss": 0.2896, + "epoch": 11.53, + "learning_rate": 4.488028169014085e-05, + "loss": 0.5137, "step": 830 }, { - "epoch": 2.91, - "learning_rate": 3.952367491166077e-06, - "loss": 0.2694, + "epoch": 11.66, + "learning_rate": 4.480985915492958e-05, + "loss": 0.4974, "step": 840 }, { - "epoch": 2.95, - "learning_rate": 3.95095406360424e-06, - "loss": 0.277, + "epoch": 11.8, + "learning_rate": 4.473943661971831e-05, + "loss": 0.513, "step": 850 }, { - "epoch": 2.98, - "learning_rate": 3.949540636042403e-06, - "loss": 0.297, + "epoch": 11.94, + "learning_rate": 4.466901408450704e-05, + "loss": 0.5064, "step": 860 }, { - "epoch": 3.0, - "eval_loss": 0.5019953846931458, - "eval_runtime": 130.2566, - "eval_samples_per_second": 4.084, - "eval_steps_per_second": 1.021, - "eval_wer": 0.2038310728289516, + "epoch": 12.0, + "eval_loss": 0.5237506031990051, + "eval_runtime": 128.1921, + "eval_samples_per_second": 4.15, + "eval_steps_per_second": 0.523, + "eval_wer": 0.23648518351867326, "step": 864 }, { - "epoch": 3.02, - "learning_rate": 3.948127208480565e-06, - "loss": 0.2977, + "epoch": 12.08, + "learning_rate": 4.4598591549295776e-05, + "loss": 0.5065, "step": 870 }, { - "epoch": 3.06, - "learning_rate": 3.946713780918728e-06, - "loss": 0.3039, + "epoch": 12.22, + "learning_rate": 4.452816901408451e-05, + "loss": 0.4883, "step": 880 }, { - "epoch": 3.09, - "learning_rate": 3.945300353356891e-06, - "loss": 0.2913, + "epoch": 12.36, + "learning_rate": 4.445774647887324e-05, + "loss": 0.5032, "step": 890 }, { - "epoch": 3.12, - "learning_rate": 3.943886925795053e-06, - "loss": 0.307, + "epoch": 12.5, + "learning_rate": 4.4387323943661975e-05, + "loss": 0.4986, "step": 900 }, { - "epoch": 3.16, - "learning_rate": 3.9424734982332154e-06, - "loss": 0.3053, + "epoch": 12.64, + "learning_rate": 4.4316901408450704e-05, + "loss": 0.4756, "step": 910 }, { - "epoch": 3.19, - "learning_rate": 3.941060070671378e-06, - "loss": 0.2781, + "epoch": 12.78, + "learning_rate": 4.424647887323944e-05, + "loss": 0.5002, "step": 920 }, { - "epoch": 3.23, - "learning_rate": 3.93964664310954e-06, - "loss": 0.2978, + "epoch": 12.91, + "learning_rate": 4.4176056338028174e-05, + "loss": 0.5001, "step": 930 }, { - "epoch": 3.26, - "learning_rate": 3.938233215547703e-06, - "loss": 0.2859, + "epoch": 13.0, + "eval_loss": 0.477408230304718, + "eval_runtime": 129.9607, + "eval_samples_per_second": 4.094, + "eval_steps_per_second": 0.516, + "eval_wer": 0.23249983930063636, + "step": 936 + }, + { + "epoch": 13.06, + "learning_rate": 4.41056338028169e-05, + "loss": 0.5252, "step": 940 }, { - "epoch": 3.3, - "learning_rate": 3.936819787985866e-06, - "loss": 0.3001, + "epoch": 13.19, + "learning_rate": 4.403521126760564e-05, + "loss": 0.4894, "step": 950 }, { - "epoch": 3.33, - "learning_rate": 3.935406360424028e-06, - "loss": 0.3167, + "epoch": 13.33, + "learning_rate": 4.3964788732394366e-05, + "loss": 0.5057, "step": 960 }, { - "epoch": 3.37, - "learning_rate": 3.933992932862191e-06, - "loss": 0.307, + "epoch": 13.47, + "learning_rate": 4.38943661971831e-05, + "loss": 0.5051, "step": 970 }, { - "epoch": 3.4, - "learning_rate": 3.932579505300353e-06, - "loss": 0.3129, + "epoch": 13.61, + "learning_rate": 4.382394366197183e-05, + "loss": 0.4997, "step": 980 }, { - "epoch": 3.44, - "learning_rate": 3.9311660777385156e-06, - "loss": 0.2694, + "epoch": 13.75, + "learning_rate": 4.3753521126760566e-05, + "loss": 0.5206, "step": 990 }, { - "epoch": 3.47, - "learning_rate": 3.929752650176678e-06, - "loss": 0.3088, + "epoch": 13.89, + "learning_rate": 4.36830985915493e-05, + "loss": 0.5003, "step": 1000 }, { - "epoch": 3.51, - "learning_rate": 3.928339222614841e-06, - "loss": 0.2849, + "epoch": 14.0, + "eval_loss": 0.4961102604866028, + "eval_runtime": 125.9234, + "eval_samples_per_second": 4.225, + "eval_steps_per_second": 0.532, + "eval_wer": 0.23391399370058494, + "step": 1008 + }, + { + "epoch": 14.03, + "learning_rate": 4.361267605633803e-05, + "loss": 0.5108, "step": 1010 }, { - "epoch": 3.54, - "learning_rate": 3.926925795053003e-06, - "loss": 0.3203, + "epoch": 14.17, + "learning_rate": 4.3542253521126765e-05, + "loss": 0.4982, "step": 1020 }, { - "epoch": 3.57, - "learning_rate": 3.925512367491166e-06, - "loss": 0.3022, + "epoch": 14.3, + "learning_rate": 4.347183098591549e-05, + "loss": 0.5178, "step": 1030 }, { - "epoch": 3.61, - "learning_rate": 3.924098939929328e-06, - "loss": 0.2711, + "epoch": 14.44, + "learning_rate": 4.340140845070423e-05, + "loss": 0.5131, "step": 1040 }, { - "epoch": 3.64, - "learning_rate": 3.922685512367491e-06, - "loss": 0.2765, + "epoch": 14.58, + "learning_rate": 4.3330985915492964e-05, + "loss": 0.523, "step": 1050 }, { - "epoch": 3.68, - "learning_rate": 3.921272084805654e-06, - "loss": 0.2897, + "epoch": 14.72, + "learning_rate": 4.326056338028169e-05, + "loss": 0.5054, "step": 1060 }, { - "epoch": 3.71, - "learning_rate": 3.9198586572438165e-06, - "loss": 0.2561, + "epoch": 14.86, + "learning_rate": 4.319014084507043e-05, + "loss": 0.4994, "step": 1070 }, { - "epoch": 3.75, - "learning_rate": 3.9184452296819785e-06, - "loss": 0.2596, + "epoch": 15.0, + "learning_rate": 4.3119718309859156e-05, + "loss": 0.5085, + "step": 1080 + }, + { + "epoch": 15.0, + "eval_loss": 0.46455711126327515, + "eval_runtime": 125.665, + "eval_samples_per_second": 4.233, + "eval_steps_per_second": 0.533, + "eval_wer": 0.2271003406826509, "step": 1080 }, { - "epoch": 3.78, - "learning_rate": 3.917031802120141e-06, - "loss": 0.2759, + "epoch": 15.14, + "learning_rate": 4.304929577464789e-05, + "loss": 0.5079, "step": 1090 }, { - "epoch": 3.82, - "learning_rate": 3.915618374558303e-06, - "loss": 0.3017, + "epoch": 15.28, + "learning_rate": 4.2978873239436626e-05, + "loss": 0.5114, "step": 1100 }, { - "epoch": 3.85, - "learning_rate": 3.914204946996466e-06, - "loss": 0.2668, + "epoch": 15.42, + "learning_rate": 4.2908450704225355e-05, + "loss": 0.4859, "step": 1110 }, { - "epoch": 3.89, - "learning_rate": 3.912791519434629e-06, - "loss": 0.284, + "epoch": 15.55, + "learning_rate": 4.283802816901409e-05, + "loss": 0.4951, "step": 1120 }, { - "epoch": 3.92, - "learning_rate": 3.911378091872792e-06, - "loss": 0.2808, + "epoch": 15.69, + "learning_rate": 4.276760563380282e-05, + "loss": 0.4861, "step": 1130 }, { - "epoch": 3.96, - "learning_rate": 3.909964664310954e-06, - "loss": 0.2801, + "epoch": 15.83, + "learning_rate": 4.2697183098591554e-05, + "loss": 0.5128, "step": 1140 }, { - "epoch": 3.99, - "learning_rate": 3.908551236749117e-06, - "loss": 0.2863, + "epoch": 15.97, + "learning_rate": 4.263380281690141e-05, + "loss": 0.4931, "step": 1150 }, { - "epoch": 4.0, - "eval_loss": 0.5215898752212524, - "eval_runtime": 130.8056, - "eval_samples_per_second": 4.067, - "eval_steps_per_second": 1.017, - "eval_wer": 0.20203123995628977, + "epoch": 16.0, + "eval_loss": 0.5006607174873352, + "eval_runtime": 126.1174, + "eval_samples_per_second": 4.218, + "eval_steps_per_second": 0.531, + "eval_wer": 0.2320498810824709, "step": 1152 }, { - "epoch": 4.03, - "learning_rate": 3.907137809187279e-06, - "loss": 0.2845, + "epoch": 16.11, + "learning_rate": 4.256338028169014e-05, + "loss": 0.5034, "step": 1160 }, { - "epoch": 4.06, - "learning_rate": 3.9057243816254415e-06, - "loss": 0.2787, + "epoch": 16.25, + "learning_rate": 4.249295774647887e-05, + "loss": 0.4863, "step": 1170 }, { - "epoch": 4.1, - "learning_rate": 3.904310954063604e-06, - "loss": 0.2562, + "epoch": 16.39, + "learning_rate": 4.2422535211267606e-05, + "loss": 0.4821, "step": 1180 }, { - "epoch": 4.13, - "learning_rate": 3.902897526501767e-06, - "loss": 0.2833, + "epoch": 16.53, + "learning_rate": 4.2352112676056335e-05, + "loss": 0.5075, "step": 1190 }, { - "epoch": 4.17, - "learning_rate": 3.901484098939929e-06, - "loss": 0.2655, + "epoch": 16.66, + "learning_rate": 4.228169014084507e-05, + "loss": 0.5022, "step": 1200 }, { - "epoch": 4.2, - "learning_rate": 3.900070671378092e-06, - "loss": 0.2865, + "epoch": 16.8, + "learning_rate": 4.2211267605633805e-05, + "loss": 0.4698, "step": 1210 }, { - "epoch": 4.24, - "learning_rate": 3.898657243816254e-06, - "loss": 0.2702, + "epoch": 16.94, + "learning_rate": 4.2140845070422534e-05, + "loss": 0.4807, "step": 1220 }, { - "epoch": 4.27, - "learning_rate": 3.897243816254417e-06, - "loss": 0.2733, + "epoch": 17.0, + "eval_loss": 0.4817637503147125, + "eval_runtime": 125.5305, + "eval_samples_per_second": 4.238, + "eval_steps_per_second": 0.534, + "eval_wer": 0.22581474577360675, + "step": 1224 + }, + { + "epoch": 17.08, + "learning_rate": 4.207042253521127e-05, + "loss": 0.5367, "step": 1230 }, { - "epoch": 4.3, - "learning_rate": 3.89583038869258e-06, - "loss": 0.3136, + "epoch": 17.22, + "learning_rate": 4.2e-05, + "loss": 0.4781, "step": 1240 }, { - "epoch": 4.34, - "learning_rate": 3.8944169611307424e-06, - "loss": 0.2846, + "epoch": 17.36, + "learning_rate": 4.192957746478873e-05, + "loss": 0.4866, "step": 1250 }, { - "epoch": 4.37, - "learning_rate": 3.8930035335689044e-06, - "loss": 0.2756, + "epoch": 17.5, + "learning_rate": 4.185915492957747e-05, + "loss": 0.5144, "step": 1260 }, { - "epoch": 4.41, - "learning_rate": 3.891590106007066e-06, - "loss": 0.2934, + "epoch": 17.64, + "learning_rate": 4.17887323943662e-05, + "loss": 0.4789, "step": 1270 }, { - "epoch": 4.44, - "learning_rate": 3.890176678445229e-06, - "loss": 0.2851, + "epoch": 17.78, + "learning_rate": 4.171830985915493e-05, + "loss": 0.5048, "step": 1280 }, { - "epoch": 4.48, - "learning_rate": 3.888763250883392e-06, - "loss": 0.2979, + "epoch": 17.91, + "learning_rate": 4.164788732394366e-05, + "loss": 0.4894, "step": 1290 }, { - "epoch": 4.51, - "learning_rate": 3.887349823321555e-06, - "loss": 0.2944, + "epoch": 18.0, + "eval_loss": 0.49539196491241455, + "eval_runtime": 126.545, + "eval_samples_per_second": 4.204, + "eval_steps_per_second": 0.529, + "eval_wer": 0.2310856849006878, + "step": 1296 + }, + { + "epoch": 18.06, + "learning_rate": 4.1577464788732396e-05, + "loss": 0.5086, "step": 1300 }, { - "epoch": 4.55, - "learning_rate": 3.885936395759717e-06, - "loss": 0.2839, + "epoch": 18.19, + "learning_rate": 4.150704225352113e-05, + "loss": 0.4923, "step": 1310 }, { - "epoch": 4.58, - "learning_rate": 3.88452296819788e-06, - "loss": 0.287, + "epoch": 18.33, + "learning_rate": 4.143661971830986e-05, + "loss": 0.509, "step": 1320 }, { - "epoch": 4.62, - "learning_rate": 3.883109540636042e-06, - "loss": 0.2757, + "epoch": 18.47, + "learning_rate": 4.1366197183098595e-05, + "loss": 0.4926, "step": 1330 }, { - "epoch": 4.65, - "learning_rate": 3.8816961130742046e-06, - "loss": 0.3039, + "epoch": 18.61, + "learning_rate": 4.129577464788732e-05, + "loss": 0.5059, "step": 1340 }, { - "epoch": 4.69, - "learning_rate": 3.880282685512367e-06, - "loss": 0.2852, + "epoch": 18.75, + "learning_rate": 4.122535211267606e-05, + "loss": 0.4753, "step": 1350 }, { - "epoch": 4.72, - "learning_rate": 3.87886925795053e-06, - "loss": 0.2655, + "epoch": 18.89, + "learning_rate": 4.115492957746479e-05, + "loss": 0.4746, "step": 1360 }, { - "epoch": 4.75, - "learning_rate": 3.877455830388692e-06, - "loss": 0.2777, + "epoch": 19.0, + "eval_loss": 0.4951326847076416, + "eval_runtime": 126.1102, + "eval_samples_per_second": 4.219, + "eval_steps_per_second": 0.531, + "eval_wer": 0.22928585202802598, + "step": 1368 + }, + { + "epoch": 19.03, + "learning_rate": 4.108450704225352e-05, + "loss": 0.4928, "step": 1370 }, { - "epoch": 4.79, - "learning_rate": 3.876042402826855e-06, - "loss": 0.2714, + "epoch": 19.17, + "learning_rate": 4.101408450704226e-05, + "loss": 0.4758, "step": 1380 }, { - "epoch": 4.82, - "learning_rate": 3.874628975265017e-06, - "loss": 0.2803, + "epoch": 19.3, + "learning_rate": 4.0943661971830986e-05, + "loss": 0.4898, "step": 1390 }, { - "epoch": 4.86, - "learning_rate": 3.87321554770318e-06, - "loss": 0.3032, + "epoch": 19.44, + "learning_rate": 4.087323943661972e-05, + "loss": 0.4933, "step": 1400 }, { - "epoch": 4.89, - "learning_rate": 3.871802120141343e-06, - "loss": 0.2808, + "epoch": 19.58, + "learning_rate": 4.080281690140845e-05, + "loss": 0.5012, "step": 1410 }, { - "epoch": 4.93, - "learning_rate": 3.8703886925795055e-06, - "loss": 0.2795, + "epoch": 19.72, + "learning_rate": 4.0732394366197185e-05, + "loss": 0.4911, "step": 1420 }, { - "epoch": 4.96, - "learning_rate": 3.8689752650176675e-06, - "loss": 0.2664, + "epoch": 19.86, + "learning_rate": 4.066197183098592e-05, + "loss": 0.5053, "step": 1430 }, { - "epoch": 5.0, - "learning_rate": 3.86756183745583e-06, - "loss": 0.3036, + "epoch": 20.0, + "learning_rate": 4.059154929577465e-05, + "loss": 0.4795, "step": 1440 }, { - "epoch": 5.0, - "eval_loss": 0.49630099534988403, - "eval_runtime": 131.2377, - "eval_samples_per_second": 4.054, - "eval_steps_per_second": 1.013, - "eval_wer": 0.20080992479269782, + "epoch": 20.0, + "eval_loss": 0.48727360367774963, + "eval_runtime": 126.1522, + "eval_samples_per_second": 4.217, + "eval_steps_per_second": 0.531, + "eval_wer": 0.2304428874461657, "step": 1440 }, { - "epoch": 5.03, - "learning_rate": 3.866148409893992e-06, - "loss": 0.2955, + "epoch": 20.14, + "learning_rate": 4.0521126760563384e-05, + "loss": 0.4929, "step": 1450 }, { - "epoch": 5.07, - "learning_rate": 3.864734982332155e-06, - "loss": 0.2806, + "epoch": 20.28, + "learning_rate": 4.045070422535211e-05, + "loss": 0.481, "step": 1460 }, { - "epoch": 5.1, - "learning_rate": 3.863321554770318e-06, - "loss": 0.2625, + "epoch": 20.42, + "learning_rate": 4.038028169014085e-05, + "loss": 0.4819, "step": 1470 }, { - "epoch": 5.14, - "learning_rate": 3.861908127208481e-06, - "loss": 0.2775, + "epoch": 20.55, + "learning_rate": 4.030985915492958e-05, + "loss": 0.4814, "step": 1480 }, { - "epoch": 5.17, - "learning_rate": 3.860494699646643e-06, - "loss": 0.2916, + "epoch": 20.69, + "learning_rate": 4.023943661971831e-05, + "loss": 0.4871, "step": 1490 }, { - "epoch": 5.21, - "learning_rate": 3.859081272084806e-06, - "loss": 0.2783, + "epoch": 20.83, + "learning_rate": 4.016901408450705e-05, + "loss": 0.4934, "step": 1500 }, { - "epoch": 5.24, - "learning_rate": 3.857667844522968e-06, - "loss": 0.2728, + "epoch": 20.97, + "learning_rate": 4.0098591549295775e-05, + "loss": 0.4964, "step": 1510 }, { - "epoch": 5.28, - "learning_rate": 3.8562544169611305e-06, - "loss": 0.2706, + "epoch": 21.0, + "eval_loss": 0.49976399540901184, + "eval_runtime": 126.0303, + "eval_samples_per_second": 4.221, + "eval_steps_per_second": 0.532, + "eval_wer": 0.2431059973002507, + "step": 1512 + }, + { + "epoch": 21.11, + "learning_rate": 4.002816901408451e-05, + "loss": 0.4966, "step": 1520 }, { - "epoch": 5.31, - "learning_rate": 3.854840989399293e-06, - "loss": 0.2857, + "epoch": 21.25, + "learning_rate": 3.9957746478873246e-05, + "loss": 0.5021, "step": 1530 }, { - "epoch": 5.35, - "learning_rate": 3.853427561837456e-06, - "loss": 0.2956, + "epoch": 21.39, + "learning_rate": 3.9887323943661974e-05, + "loss": 0.4965, "step": 1540 }, { - "epoch": 5.38, - "learning_rate": 3.852014134275618e-06, - "loss": 0.2629, + "epoch": 21.53, + "learning_rate": 3.981690140845071e-05, + "loss": 0.4876, "step": 1550 }, { - "epoch": 5.42, - "learning_rate": 3.850600706713781e-06, - "loss": 0.2656, + "epoch": 21.66, + "learning_rate": 3.974647887323944e-05, + "loss": 0.4755, "step": 1560 }, { - "epoch": 5.45, - "learning_rate": 3.849187279151943e-06, - "loss": 0.2842, + "epoch": 21.8, + "learning_rate": 3.967605633802817e-05, + "loss": 0.479, "step": 1570 }, { - "epoch": 5.48, - "learning_rate": 3.847773851590106e-06, - "loss": 0.3061, + "epoch": 21.94, + "learning_rate": 3.96056338028169e-05, + "loss": 0.4947, "step": 1580 }, { - "epoch": 5.52, - "learning_rate": 3.846360424028269e-06, - "loss": 0.2755, + "epoch": 22.0, + "eval_loss": 0.498555451631546, + "eval_runtime": 126.1675, + "eval_samples_per_second": 4.217, + "eval_steps_per_second": 0.531, + "eval_wer": 0.23237127980973196, + "step": 1584 + }, + { + "epoch": 22.08, + "learning_rate": 3.953521126760564e-05, + "loss": 0.5085, "step": 1590 }, { - "epoch": 5.55, - "learning_rate": 3.844946996466431e-06, - "loss": 0.2695, + "epoch": 22.22, + "learning_rate": 3.946478873239437e-05, + "loss": 0.4862, "step": 1600 }, { - "epoch": 5.59, - "learning_rate": 3.843533568904593e-06, - "loss": 0.2636, + "epoch": 22.36, + "learning_rate": 3.93943661971831e-05, + "loss": 0.4888, "step": 1610 }, { - "epoch": 5.62, - "learning_rate": 3.842120141342756e-06, - "loss": 0.2822, + "epoch": 22.5, + "learning_rate": 3.9323943661971836e-05, + "loss": 0.4954, "step": 1620 }, { - "epoch": 5.66, - "learning_rate": 3.840706713780918e-06, - "loss": 0.2815, + "epoch": 22.64, + "learning_rate": 3.9253521126760565e-05, + "loss": 0.4826, "step": 1630 }, { - "epoch": 5.69, - "learning_rate": 3.839293286219081e-06, - "loss": 0.3095, + "epoch": 22.78, + "learning_rate": 3.91830985915493e-05, + "loss": 0.477, "step": 1640 }, { - "epoch": 5.73, - "learning_rate": 3.837879858657244e-06, - "loss": 0.2825, + "epoch": 22.91, + "learning_rate": 3.9112676056338035e-05, + "loss": 0.4789, "step": 1650 }, { - "epoch": 5.76, - "learning_rate": 3.836466431095406e-06, - "loss": 0.2883, + "epoch": 23.0, + "eval_loss": 0.5379728078842163, + "eval_runtime": 126.405, + "eval_samples_per_second": 4.209, + "eval_steps_per_second": 0.53, + "eval_wer": 0.23809217715497846, + "step": 1656 + }, + { + "epoch": 23.06, + "learning_rate": 3.9042253521126764e-05, + "loss": 0.4964, "step": 1660 }, { - "epoch": 5.8, - "learning_rate": 3.835053003533569e-06, - "loss": 0.2781, + "epoch": 23.19, + "learning_rate": 3.89718309859155e-05, + "loss": 0.4926, "step": 1670 }, { - "epoch": 5.83, - "learning_rate": 3.8336395759717316e-06, - "loss": 0.3046, + "epoch": 23.33, + "learning_rate": 3.890140845070423e-05, + "loss": 0.4901, "step": 1680 }, { - "epoch": 5.87, - "learning_rate": 3.8322261484098935e-06, - "loss": 0.2752, + "epoch": 23.47, + "learning_rate": 3.883098591549296e-05, + "loss": 0.4879, "step": 1690 }, { - "epoch": 5.9, - "learning_rate": 3.830812720848056e-06, - "loss": 0.2571, + "epoch": 23.61, + "learning_rate": 3.87605633802817e-05, + "loss": 0.4833, "step": 1700 }, { - "epoch": 5.94, - "learning_rate": 3.829399293286218e-06, - "loss": 0.2836, + "epoch": 23.75, + "learning_rate": 3.869014084507042e-05, + "loss": 0.4752, "step": 1710 }, { - "epoch": 5.97, - "learning_rate": 3.827985865724381e-06, - "loss": 0.3141, + "epoch": 23.89, + "learning_rate": 3.8619718309859155e-05, + "loss": 0.4603, "step": 1720 }, { - "epoch": 6.0, - "eval_loss": 0.5004593729972839, - "eval_runtime": 130.6889, - "eval_samples_per_second": 4.071, - "eval_steps_per_second": 1.018, - "eval_wer": 0.20203123995628977, + "epoch": 24.0, + "eval_loss": 0.4818807542324066, + "eval_runtime": 125.9972, + "eval_samples_per_second": 4.222, + "eval_steps_per_second": 0.532, + "eval_wer": 0.23391399370058494, "step": 1728 }, { - "epoch": 6.01, - "learning_rate": 3.826572438162544e-06, - "loss": 0.299, + "epoch": 24.03, + "learning_rate": 3.854929577464788e-05, + "loss": 0.4808, "step": 1730 }, { - "epoch": 6.04, - "learning_rate": 3.825159010600707e-06, - "loss": 0.3013, + "epoch": 24.17, + "learning_rate": 3.847887323943662e-05, + "loss": 0.4693, "step": 1740 }, { - "epoch": 6.08, - "learning_rate": 3.823745583038869e-06, - "loss": 0.2818, + "epoch": 24.3, + "learning_rate": 3.8408450704225354e-05, + "loss": 0.4729, "step": 1750 }, { - "epoch": 6.11, - "learning_rate": 3.822332155477032e-06, - "loss": 0.2743, + "epoch": 24.44, + "learning_rate": 3.833802816901408e-05, + "loss": 0.4722, "step": 1760 }, { - "epoch": 6.15, - "learning_rate": 3.820918727915194e-06, - "loss": 0.2774, + "epoch": 24.58, + "learning_rate": 3.826760563380282e-05, + "loss": 0.4687, "step": 1770 }, { - "epoch": 6.18, - "learning_rate": 3.8195053003533565e-06, - "loss": 0.2833, + "epoch": 24.72, + "learning_rate": 3.8197183098591546e-05, + "loss": 0.4682, "step": 1780 }, { - "epoch": 6.21, - "learning_rate": 3.818091872791519e-06, - "loss": 0.2895, + "epoch": 24.86, + "learning_rate": 3.812676056338028e-05, + "loss": 0.4694, "step": 1790 }, { - "epoch": 6.25, - "learning_rate": 3.816678445229682e-06, - "loss": 0.2511, + "epoch": 25.0, + "learning_rate": 3.8056338028169017e-05, + "loss": 0.4591, "step": 1800 }, { - "epoch": 6.28, - "learning_rate": 3.815265017667844e-06, - "loss": 0.2567, + "epoch": 25.0, + "eval_loss": 0.4868641793727875, + "eval_runtime": 126.1227, + "eval_samples_per_second": 4.218, + "eval_steps_per_second": 0.531, + "eval_wer": 0.22022240791926465, + "step": 1800 + }, + { + "epoch": 25.14, + "learning_rate": 3.7985915492957745e-05, + "loss": 0.4893, "step": 1810 }, { - "epoch": 6.32, - "learning_rate": 3.813851590106007e-06, - "loss": 0.3127, + "epoch": 25.28, + "learning_rate": 3.791549295774648e-05, + "loss": 0.4773, "step": 1820 }, { - "epoch": 6.35, - "learning_rate": 3.8124381625441694e-06, - "loss": 0.3125, + "epoch": 25.42, + "learning_rate": 3.784507042253521e-05, + "loss": 0.4635, "step": 1830 }, { - "epoch": 6.39, - "learning_rate": 3.811024734982332e-06, - "loss": 0.2699, + "epoch": 25.55, + "learning_rate": 3.7774647887323944e-05, + "loss": 0.4789, "step": 1840 }, { - "epoch": 6.42, - "learning_rate": 3.8096113074204946e-06, - "loss": 0.2896, + "epoch": 25.69, + "learning_rate": 3.770422535211268e-05, + "loss": 0.4857, "step": 1850 }, { - "epoch": 6.46, - "learning_rate": 3.808197879858657e-06, - "loss": 0.3067, + "epoch": 25.83, + "learning_rate": 3.763380281690141e-05, + "loss": 0.4734, "step": 1860 }, { - "epoch": 6.49, - "learning_rate": 3.80678445229682e-06, - "loss": 0.2647, + "epoch": 25.97, + "learning_rate": 3.756338028169014e-05, + "loss": 0.4675, "step": 1870 }, { - "epoch": 6.53, - "learning_rate": 3.805371024734982e-06, - "loss": 0.2916, + "epoch": 26.0, + "eval_loss": 0.48727670311927795, + "eval_runtime": 125.7599, + "eval_samples_per_second": 4.23, + "eval_steps_per_second": 0.533, + "eval_wer": 0.2213794433374044, + "step": 1872 + }, + { + "epoch": 26.11, + "learning_rate": 3.749295774647887e-05, + "loss": 0.486, "step": 1880 }, { - "epoch": 6.56, - "learning_rate": 3.8039575971731447e-06, - "loss": 0.2825, + "epoch": 26.25, + "learning_rate": 3.742253521126761e-05, + "loss": 0.482, "step": 1890 }, { - "epoch": 6.6, - "learning_rate": 3.802544169611307e-06, - "loss": 0.283, + "epoch": 26.39, + "learning_rate": 3.735211267605634e-05, + "loss": 0.4778, "step": 1900 }, { - "epoch": 6.63, - "learning_rate": 3.80113074204947e-06, - "loss": 0.2913, + "epoch": 26.53, + "learning_rate": 3.728169014084507e-05, + "loss": 0.4825, "step": 1910 }, { - "epoch": 6.66, - "learning_rate": 3.7997173144876324e-06, - "loss": 0.2937, + "epoch": 26.66, + "learning_rate": 3.7211267605633806e-05, + "loss": 0.4717, "step": 1920 }, { - "epoch": 6.7, - "learning_rate": 3.798303886925795e-06, - "loss": 0.2815, + "epoch": 26.8, + "learning_rate": 3.7140845070422534e-05, + "loss": 0.4944, "step": 1930 }, { - "epoch": 6.73, - "learning_rate": 3.796890459363957e-06, - "loss": 0.261, + "epoch": 26.94, + "learning_rate": 3.707042253521127e-05, + "loss": 0.4777, "step": 1940 }, { - "epoch": 6.77, - "learning_rate": 3.79547703180212e-06, - "loss": 0.2883, + "epoch": 27.0, + "eval_loss": 0.4872089922428131, + "eval_runtime": 126.537, + "eval_samples_per_second": 4.204, + "eval_steps_per_second": 0.529, + "eval_wer": 0.22909301279166935, + "step": 1944 + }, + { + "epoch": 27.08, + "learning_rate": 3.7e-05, + "loss": 0.4797, "step": 1950 }, { - "epoch": 6.8, - "learning_rate": 3.7940636042402824e-06, - "loss": 0.2678, + "epoch": 27.22, + "learning_rate": 3.692957746478873e-05, + "loss": 0.4747, "step": 1960 }, { - "epoch": 6.84, - "learning_rate": 3.7926501766784452e-06, - "loss": 0.2959, + "epoch": 27.36, + "learning_rate": 3.685915492957747e-05, + "loss": 0.4834, "step": 1970 }, { - "epoch": 6.87, - "learning_rate": 3.7912367491166077e-06, - "loss": 0.2933, + "epoch": 27.5, + "learning_rate": 3.67887323943662e-05, + "loss": 0.495, "step": 1980 }, { - "epoch": 6.91, - "learning_rate": 3.7898233215547705e-06, - "loss": 0.2634, + "epoch": 27.64, + "learning_rate": 3.671830985915493e-05, + "loss": 0.4811, "step": 1990 }, { - "epoch": 6.94, - "learning_rate": 3.7884098939929325e-06, - "loss": 0.2767, + "epoch": 27.78, + "learning_rate": 3.664788732394366e-05, + "loss": 0.5012, "step": 2000 }, { - "epoch": 6.98, - "learning_rate": 3.7869964664310953e-06, - "loss": 0.2898, + "epoch": 27.91, + "learning_rate": 3.6577464788732396e-05, + "loss": 0.475, "step": 2010 }, { - "epoch": 7.0, - "eval_loss": 0.4961535334587097, - "eval_runtime": 131.6974, - "eval_samples_per_second": 4.04, - "eval_steps_per_second": 1.01, - "eval_wer": 0.2029311563926207, + "epoch": 28.0, + "eval_loss": 0.4919745624065399, + "eval_runtime": 126.8079, + "eval_samples_per_second": 4.195, + "eval_steps_per_second": 0.528, + "eval_wer": 0.22851449508259947, "step": 2016 }, { - "epoch": 7.01, - "learning_rate": 3.7855830388692577e-06, - "loss": 0.295, + "epoch": 28.06, + "learning_rate": 3.650704225352113e-05, + "loss": 0.4946, "step": 2020 }, { - "epoch": 7.05, - "learning_rate": 3.7841696113074206e-06, - "loss": 0.2862, + "epoch": 28.19, + "learning_rate": 3.643661971830986e-05, + "loss": 0.4748, "step": 2030 }, { - "epoch": 7.08, - "learning_rate": 3.782756183745583e-06, - "loss": 0.2683, + "epoch": 28.33, + "learning_rate": 3.6366197183098595e-05, + "loss": 0.4808, "step": 2040 }, { - "epoch": 7.12, - "learning_rate": 3.7813427561837454e-06, - "loss": 0.2845, + "epoch": 28.47, + "learning_rate": 3.6295774647887324e-05, + "loss": 0.4753, "step": 2050 }, { - "epoch": 7.15, - "learning_rate": 3.7799293286219078e-06, - "loss": 0.2863, + "epoch": 28.61, + "learning_rate": 3.622535211267606e-05, + "loss": 0.4885, "step": 2060 }, { - "epoch": 7.19, - "learning_rate": 3.7785159010600706e-06, - "loss": 0.2889, + "epoch": 28.75, + "learning_rate": 3.6154929577464794e-05, + "loss": 0.4905, "step": 2070 }, { - "epoch": 7.22, - "learning_rate": 3.777102473498233e-06, - "loss": 0.2837, + "epoch": 28.89, + "learning_rate": 3.608450704225352e-05, + "loss": 0.4921, "step": 2080 }, { - "epoch": 7.26, - "learning_rate": 3.775689045936396e-06, - "loss": 0.2816, + "epoch": 29.0, + "eval_loss": 0.48551997542381287, + "eval_runtime": 125.816, + "eval_samples_per_second": 4.228, + "eval_steps_per_second": 0.533, + "eval_wer": 0.2222793597737353, + "step": 2088 + }, + { + "epoch": 29.03, + "learning_rate": 3.601408450704226e-05, + "loss": 0.499, "step": 2090 }, { - "epoch": 7.29, - "learning_rate": 3.7742756183745583e-06, - "loss": 0.2938, + "epoch": 29.17, + "learning_rate": 3.5943661971830986e-05, + "loss": 0.4763, "step": 2100 }, { - "epoch": 7.33, - "learning_rate": 3.7728621908127207e-06, - "loss": 0.3051, + "epoch": 29.3, + "learning_rate": 3.587323943661972e-05, + "loss": 0.4753, "step": 2110 }, { - "epoch": 7.36, - "learning_rate": 3.771448763250883e-06, - "loss": 0.2662, + "epoch": 29.44, + "learning_rate": 3.580281690140846e-05, + "loss": 0.4754, "step": 2120 }, { - "epoch": 7.39, - "learning_rate": 3.770035335689046e-06, - "loss": 0.26, + "epoch": 29.58, + "learning_rate": 3.5732394366197185e-05, + "loss": 0.4753, "step": 2130 }, { - "epoch": 7.43, - "learning_rate": 3.7686219081272083e-06, - "loss": 0.2823, + "epoch": 29.72, + "learning_rate": 3.566197183098592e-05, + "loss": 0.4807, "step": 2140 }, { - "epoch": 7.46, - "learning_rate": 3.767208480565371e-06, - "loss": 0.2766, + "epoch": 29.86, + "learning_rate": 3.559154929577465e-05, + "loss": 0.4899, "step": 2150 }, { - "epoch": 7.5, - "learning_rate": 3.7657950530035336e-06, - "loss": 0.275, + "epoch": 30.0, + "learning_rate": 3.5521126760563384e-05, + "loss": 0.4875, + "step": 2160 + }, + { + "epoch": 30.0, + "eval_loss": 0.4977600574493408, + "eval_runtime": 126.131, + "eval_samples_per_second": 4.218, + "eval_steps_per_second": 0.531, + "eval_wer": 0.22112232435559556, "step": 2160 }, { - "epoch": 7.53, - "learning_rate": 3.764381625441696e-06, - "loss": 0.2968, + "epoch": 30.14, + "learning_rate": 3.545070422535211e-05, + "loss": 0.4823, "step": 2170 }, { - "epoch": 7.57, - "learning_rate": 3.7629681978798584e-06, - "loss": 0.2965, + "epoch": 30.28, + "learning_rate": 3.538028169014085e-05, + "loss": 0.4903, "step": 2180 }, { - "epoch": 7.6, - "learning_rate": 3.7615547703180212e-06, - "loss": 0.2724, + "epoch": 30.42, + "learning_rate": 3.5309859154929583e-05, + "loss": 0.4813, "step": 2190 }, { - "epoch": 7.64, - "learning_rate": 3.7601413427561836e-06, - "loss": 0.2829, + "epoch": 30.55, + "learning_rate": 3.523943661971831e-05, + "loss": 0.4825, "step": 2200 }, { - "epoch": 7.67, - "learning_rate": 3.7587279151943465e-06, - "loss": 0.2952, + "epoch": 30.69, + "learning_rate": 3.516901408450705e-05, + "loss": 0.4799, "step": 2210 }, { - "epoch": 7.71, - "learning_rate": 3.7573144876325085e-06, - "loss": 0.2675, + "epoch": 30.83, + "learning_rate": 3.5098591549295776e-05, + "loss": 0.4729, "step": 2220 }, { - "epoch": 7.74, - "learning_rate": 3.7559010600706713e-06, - "loss": 0.2608, + "epoch": 30.97, + "learning_rate": 3.502816901408451e-05, + "loss": 0.4699, "step": 2230 }, { - "epoch": 7.78, - "learning_rate": 3.7544876325088337e-06, - "loss": 0.2701, + "epoch": 31.0, + "eval_loss": 0.4961602985858917, + "eval_runtime": 127.3244, + "eval_samples_per_second": 4.178, + "eval_steps_per_second": 0.526, + "eval_wer": 0.2335925949733239, + "step": 2232 + }, + { + "epoch": 31.11, + "learning_rate": 3.4957746478873246e-05, + "loss": 0.486, "step": 2240 }, { - "epoch": 7.81, - "learning_rate": 3.7530742049469965e-06, - "loss": 0.2797, + "epoch": 31.25, + "learning_rate": 3.4887323943661975e-05, + "loss": 0.4742, "step": 2250 }, { - "epoch": 7.85, - "learning_rate": 3.7518021201413426e-06, - "loss": 0.2733, + "epoch": 31.39, + "learning_rate": 3.481690140845071e-05, + "loss": 0.4563, "step": 2260 }, { - "epoch": 7.88, - "learning_rate": 3.750388692579505e-06, - "loss": 0.3008, + "epoch": 31.53, + "learning_rate": 3.474647887323944e-05, + "loss": 0.4764, "step": 2270 }, { - "epoch": 7.91, - "learning_rate": 3.748975265017668e-06, - "loss": 0.2855, + "epoch": 31.66, + "learning_rate": 3.4676056338028174e-05, + "loss": 0.486, "step": 2280 }, { - "epoch": 7.95, - "learning_rate": 3.7475618374558306e-06, - "loss": 0.2587, + "epoch": 31.8, + "learning_rate": 3.460563380281691e-05, + "loss": 0.4868, "step": 2290 }, { - "epoch": 7.98, - "learning_rate": 3.7461484098939926e-06, - "loss": 0.2922, + "epoch": 31.94, + "learning_rate": 3.453521126760563e-05, + "loss": 0.4787, "step": 2300 }, { - "epoch": 8.0, - "eval_loss": 0.507337212562561, - "eval_runtime": 130.1898, - "eval_samples_per_second": 4.086, - "eval_steps_per_second": 1.022, - "eval_wer": 0.2030597158835251, + "epoch": 32.0, + "eval_loss": 0.5129938721656799, + "eval_runtime": 127.1535, + "eval_samples_per_second": 4.184, + "eval_steps_per_second": 0.527, + "eval_wer": 0.22755029890081635, "step": 2304 }, { - "epoch": 8.02, - "learning_rate": 3.744734982332155e-06, - "loss": 0.2721, + "epoch": 32.08, + "learning_rate": 3.4464788732394366e-05, + "loss": 0.511, "step": 2310 }, { - "epoch": 8.06, - "learning_rate": 3.743321554770318e-06, - "loss": 0.305, + "epoch": 32.22, + "learning_rate": 3.4394366197183094e-05, + "loss": 0.4869, "step": 2320 }, { - "epoch": 8.09, - "learning_rate": 3.7419081272084803e-06, - "loss": 0.2736, + "epoch": 32.36, + "learning_rate": 3.432394366197183e-05, + "loss": 0.488, "step": 2330 }, { - "epoch": 8.12, - "learning_rate": 3.740494699646643e-06, - "loss": 0.2865, + "epoch": 32.5, + "learning_rate": 3.4253521126760565e-05, + "loss": 0.4946, "step": 2340 }, { - "epoch": 8.16, - "learning_rate": 3.739081272084805e-06, - "loss": 0.2774, + "epoch": 32.64, + "learning_rate": 3.4183098591549293e-05, + "loss": 0.4724, "step": 2350 }, { - "epoch": 8.19, - "learning_rate": 3.737667844522968e-06, - "loss": 0.2621, + "epoch": 32.78, + "learning_rate": 3.411267605633803e-05, + "loss": 0.4761, "step": 2360 }, { - "epoch": 8.23, - "learning_rate": 3.7362544169611303e-06, - "loss": 0.2849, + "epoch": 32.91, + "learning_rate": 3.404225352112676e-05, + "loss": 0.4631, "step": 2370 }, { - "epoch": 8.26, - "learning_rate": 3.734840989399293e-06, - "loss": 0.2744, + "epoch": 33.0, + "eval_loss": 0.5091267228126526, + "eval_runtime": 126.3003, + "eval_samples_per_second": 4.212, + "eval_steps_per_second": 0.53, + "eval_wer": 0.22575046602815452, + "step": 2376 + }, + { + "epoch": 33.06, + "learning_rate": 3.397887323943662e-05, + "loss": 0.4953, "step": 2380 }, { - "epoch": 8.3, - "learning_rate": 3.7334275618374556e-06, - "loss": 0.3042, + "epoch": 33.19, + "learning_rate": 3.390845070422535e-05, + "loss": 0.4811, "step": 2390 }, { - "epoch": 8.33, - "learning_rate": 3.7320141342756184e-06, - "loss": 0.2861, + "epoch": 33.33, + "learning_rate": 3.383802816901409e-05, + "loss": 0.4829, "step": 2400 }, { - "epoch": 8.37, - "learning_rate": 3.7306007067137804e-06, - "loss": 0.2774, + "epoch": 33.47, + "learning_rate": 3.376760563380282e-05, + "loss": 0.4882, "step": 2410 }, { - "epoch": 8.4, - "learning_rate": 3.7291872791519432e-06, - "loss": 0.2846, + "epoch": 33.61, + "learning_rate": 3.369718309859155e-05, + "loss": 0.4766, "step": 2420 }, { - "epoch": 8.44, - "learning_rate": 3.7277738515901056e-06, - "loss": 0.2448, + "epoch": 33.75, + "learning_rate": 3.362676056338028e-05, + "loss": 0.4811, "step": 2430 }, { - "epoch": 8.47, - "learning_rate": 3.7263604240282685e-06, - "loss": 0.2937, + "epoch": 33.89, + "learning_rate": 3.3556338028169016e-05, + "loss": 0.4697, "step": 2440 }, { - "epoch": 8.51, - "learning_rate": 3.724946996466431e-06, - "loss": 0.2963, + "epoch": 34.0, + "eval_loss": 0.5217466354370117, + "eval_runtime": 126.2747, + "eval_samples_per_second": 4.213, + "eval_steps_per_second": 0.531, + "eval_wer": 0.2479912579546185, + "step": 2448 + }, + { + "epoch": 34.03, + "learning_rate": 3.348591549295775e-05, + "loss": 0.5069, "step": 2450 }, { - "epoch": 8.54, - "learning_rate": 3.7235335689045937e-06, - "loss": 0.2583, + "epoch": 34.17, + "learning_rate": 3.341549295774648e-05, + "loss": 0.4806, "step": 2460 }, { - "epoch": 8.57, - "learning_rate": 3.7221201413427557e-06, - "loss": 0.2691, + "epoch": 34.3, + "learning_rate": 3.3345070422535215e-05, + "loss": 0.4772, "step": 2470 }, { - "epoch": 8.61, - "learning_rate": 3.7207067137809185e-06, - "loss": 0.2798, + "epoch": 34.44, + "learning_rate": 3.327464788732394e-05, + "loss": 0.5008, "step": 2480 }, { - "epoch": 8.64, - "learning_rate": 3.719293286219081e-06, - "loss": 0.2915, + "epoch": 34.58, + "learning_rate": 3.320422535211268e-05, + "loss": 0.4682, "step": 2490 }, { - "epoch": 8.68, - "learning_rate": 3.7178798586572438e-06, - "loss": 0.2906, + "epoch": 34.72, + "learning_rate": 3.3133802816901414e-05, + "loss": 0.4793, "step": 2500 }, { - "epoch": 8.71, - "learning_rate": 3.716466431095406e-06, - "loss": 0.2885, + "epoch": 34.86, + "learning_rate": 3.306338028169014e-05, + "loss": 0.4784, "step": 2510 }, { - "epoch": 8.75, - "learning_rate": 3.7150530035335686e-06, - "loss": 0.2899, + "epoch": 35.0, + "learning_rate": 3.299295774647888e-05, + "loss": 0.4677, "step": 2520 }, { - "epoch": 8.78, - "learning_rate": 3.713639575971731e-06, - "loss": 0.2726, + "epoch": 35.0, + "eval_loss": 0.485178142786026, + "eval_runtime": 125.8332, + "eval_samples_per_second": 4.228, + "eval_steps_per_second": 0.532, + "eval_wer": 0.2253647875554413, + "step": 2520 + }, + { + "epoch": 35.14, + "learning_rate": 3.2922535211267606e-05, + "loss": 0.4711, "step": 2530 }, { - "epoch": 8.82, - "learning_rate": 3.712226148409894e-06, - "loss": 0.2824, + "epoch": 35.28, + "learning_rate": 3.285211267605634e-05, + "loss": 0.4639, "step": 2540 }, { - "epoch": 8.85, - "learning_rate": 3.7108127208480563e-06, - "loss": 0.2846, + "epoch": 35.42, + "learning_rate": 3.278169014084507e-05, + "loss": 0.4555, "step": 2550 }, { - "epoch": 8.89, - "learning_rate": 3.709399293286219e-06, - "loss": 0.2734, + "epoch": 35.55, + "learning_rate": 3.2711267605633805e-05, + "loss": 0.4617, "step": 2560 }, { - "epoch": 8.92, - "learning_rate": 3.7079858657243815e-06, - "loss": 0.2696, + "epoch": 35.69, + "learning_rate": 3.264084507042254e-05, + "loss": 0.4641, "step": 2570 }, { - "epoch": 8.96, - "learning_rate": 3.706572438162544e-06, - "loss": 0.2703, + "epoch": 35.83, + "learning_rate": 3.257042253521127e-05, + "loss": 0.4723, "step": 2580 }, { - "epoch": 8.99, - "learning_rate": 3.7051590106007063e-06, - "loss": 0.266, + "epoch": 35.97, + "learning_rate": 3.2500000000000004e-05, + "loss": 0.4644, "step": 2590 }, { - "epoch": 9.0, - "eval_loss": 0.5159009695053101, - "eval_runtime": 130.5433, - "eval_samples_per_second": 4.075, - "eval_steps_per_second": 1.019, - "eval_wer": 0.2023526386835508, + "epoch": 36.0, + "eval_loss": 0.5170550346374512, + "eval_runtime": 126.7812, + "eval_samples_per_second": 4.196, + "eval_steps_per_second": 0.528, + "eval_wer": 0.23333547599151508, "step": 2592 }, { - "epoch": 9.03, - "learning_rate": 3.703745583038869e-06, - "loss": 0.2807, + "epoch": 36.11, + "learning_rate": 3.242957746478873e-05, + "loss": 0.481, "step": 2600 }, { - "epoch": 9.06, - "learning_rate": 3.7023321554770316e-06, - "loss": 0.2772, + "epoch": 36.25, + "learning_rate": 3.235915492957747e-05, + "loss": 0.4733, "step": 2610 }, { - "epoch": 9.1, - "learning_rate": 3.7009187279151944e-06, - "loss": 0.2813, + "epoch": 36.39, + "learning_rate": 3.22887323943662e-05, + "loss": 0.4548, "step": 2620 }, { - "epoch": 9.13, - "learning_rate": 3.6995053003533564e-06, - "loss": 0.2878, + "epoch": 36.53, + "learning_rate": 3.221830985915493e-05, + "loss": 0.4983, "step": 2630 }, { - "epoch": 9.17, - "learning_rate": 3.6980918727915192e-06, - "loss": 0.2934, + "epoch": 36.66, + "learning_rate": 3.214788732394367e-05, + "loss": 0.4708, "step": 2640 }, { - "epoch": 9.2, - "learning_rate": 3.6966784452296816e-06, - "loss": 0.2755, + "epoch": 36.8, + "learning_rate": 3.2077464788732395e-05, + "loss": 0.4757, "step": 2650 }, { - "epoch": 9.24, - "learning_rate": 3.6952650176678445e-06, - "loss": 0.2921, + "epoch": 36.94, + "learning_rate": 3.200704225352113e-05, + "loss": 0.476, "step": 2660 }, { - "epoch": 9.27, - "learning_rate": 3.693851590106007e-06, - "loss": 0.2499, + "epoch": 37.0, + "eval_loss": 0.4745345115661621, + "eval_runtime": 125.9959, + "eval_samples_per_second": 4.222, + "eval_steps_per_second": 0.532, + "eval_wer": 0.22086520537378673, + "step": 2664 + }, + { + "epoch": 37.08, + "learning_rate": 3.1936619718309866e-05, + "loss": 0.4848, "step": 2670 }, { - "epoch": 9.3, - "learning_rate": 3.6924381625441697e-06, - "loss": 0.2904, + "epoch": 37.22, + "learning_rate": 3.1866197183098594e-05, + "loss": 0.4821, "step": 2680 }, { - "epoch": 9.34, - "learning_rate": 3.6910247349823317e-06, - "loss": 0.2853, + "epoch": 37.36, + "learning_rate": 3.179577464788733e-05, + "loss": 0.4646, "step": 2690 }, { - "epoch": 9.37, - "learning_rate": 3.6896113074204945e-06, - "loss": 0.2855, + "epoch": 37.5, + "learning_rate": 3.172535211267606e-05, + "loss": 0.4606, "step": 2700 }, { - "epoch": 9.41, - "learning_rate": 3.688197879858657e-06, - "loss": 0.2839, + "epoch": 37.64, + "learning_rate": 3.165492957746479e-05, + "loss": 0.4373, "step": 2710 }, { - "epoch": 9.44, - "learning_rate": 3.6867844522968198e-06, - "loss": 0.2615, + "epoch": 37.78, + "learning_rate": 3.158450704225352e-05, + "loss": 0.4681, "step": 2720 }, { - "epoch": 9.48, - "learning_rate": 3.685371024734982e-06, - "loss": 0.3092, + "epoch": 37.91, + "learning_rate": 3.151408450704226e-05, + "loss": 0.4491, "step": 2730 }, { - "epoch": 9.51, - "learning_rate": 3.683957597173145e-06, - "loss": 0.2576, + "epoch": 38.0, + "eval_loss": 0.4898006319999695, + "eval_runtime": 126.7104, + "eval_samples_per_second": 4.199, + "eval_steps_per_second": 0.529, + "eval_wer": 0.22819309635533844, + "step": 2736 + }, + { + "epoch": 38.06, + "learning_rate": 3.144366197183099e-05, + "loss": 0.4659, "step": 2740 }, { - "epoch": 9.55, - "learning_rate": 3.682544169611307e-06, - "loss": 0.2947, + "epoch": 38.19, + "learning_rate": 3.137323943661972e-05, + "loss": 0.459, "step": 2750 }, { - "epoch": 9.58, - "learning_rate": 3.68113074204947e-06, - "loss": 0.2769, + "epoch": 38.33, + "learning_rate": 3.1302816901408456e-05, + "loss": 0.4414, "step": 2760 }, { - "epoch": 9.62, - "learning_rate": 3.6797173144876322e-06, - "loss": 0.2569, + "epoch": 38.47, + "learning_rate": 3.1232394366197184e-05, + "loss": 0.4677, "step": 2770 }, { - "epoch": 9.65, - "learning_rate": 3.678303886925795e-06, - "loss": 0.2908, + "epoch": 38.61, + "learning_rate": 3.116197183098591e-05, + "loss": 0.4553, "step": 2780 }, { - "epoch": 9.69, - "learning_rate": 3.6768904593639575e-06, - "loss": 0.2975, + "epoch": 38.75, + "learning_rate": 3.109154929577465e-05, + "loss": 0.4586, "step": 2790 }, { - "epoch": 9.72, - "learning_rate": 3.67547703180212e-06, - "loss": 0.26, + "epoch": 38.89, + "learning_rate": 3.102112676056338e-05, + "loss": 0.4432, "step": 2800 }, { - "epoch": 9.75, - "learning_rate": 3.6740636042402823e-06, - "loss": 0.2551, + "epoch": 39.0, + "eval_loss": 0.4738123416900635, + "eval_runtime": 126.1855, + "eval_samples_per_second": 4.216, + "eval_steps_per_second": 0.531, + "eval_wer": 0.22369351417368388, + "step": 2808 + }, + { + "epoch": 39.03, + "learning_rate": 3.095070422535211e-05, + "loss": 0.4937, "step": 2810 }, { - "epoch": 9.79, - "learning_rate": 3.672650176678445e-06, - "loss": 0.2701, + "epoch": 39.17, + "learning_rate": 3.088028169014085e-05, + "loss": 0.4637, "step": 2820 }, { - "epoch": 9.82, - "learning_rate": 3.6712367491166075e-06, - "loss": 0.2922, + "epoch": 39.3, + "learning_rate": 3.0809859154929576e-05, + "loss": 0.4711, "step": 2830 }, { - "epoch": 9.86, - "learning_rate": 3.6698233215547704e-06, - "loss": 0.2951, + "epoch": 39.44, + "learning_rate": 3.073943661971831e-05, + "loss": 0.4621, "step": 2840 }, { - "epoch": 9.89, - "learning_rate": 3.6684098939929328e-06, - "loss": 0.2508, + "epoch": 39.58, + "learning_rate": 3.066901408450704e-05, + "loss": 0.4702, "step": 2850 }, { - "epoch": 9.93, - "learning_rate": 3.666996466431095e-06, - "loss": 0.2844, + "epoch": 39.72, + "learning_rate": 3.0598591549295775e-05, + "loss": 0.4849, "step": 2860 }, { - "epoch": 9.96, - "learning_rate": 3.6655830388692576e-06, - "loss": 0.2914, + "epoch": 39.86, + "learning_rate": 3.052816901408451e-05, + "loss": 0.4627, "step": 2870 }, { - "epoch": 10.0, - "learning_rate": 3.6641696113074204e-06, - "loss": 0.2817, + "epoch": 40.0, + "learning_rate": 3.045774647887324e-05, + "loss": 0.4804, "step": 2880 }, { - "epoch": 10.0, - "eval_loss": 0.523847222328186, - "eval_runtime": 131.2872, - "eval_samples_per_second": 4.052, - "eval_steps_per_second": 1.013, - "eval_wer": 0.20106704377450665, + "epoch": 40.0, + "eval_loss": 0.47442981600761414, + "eval_runtime": 126.0003, + "eval_samples_per_second": 4.222, + "eval_steps_per_second": 0.532, + "eval_wer": 0.22452915086456257, "step": 2880 }, { - "epoch": 10.03, - "learning_rate": 3.662756183745583e-06, - "loss": 0.2805, + "epoch": 40.14, + "learning_rate": 3.038732394366197e-05, + "loss": 0.4869, "step": 2890 }, { - "epoch": 10.07, - "learning_rate": 3.6613427561837457e-06, - "loss": 0.2565, + "epoch": 40.28, + "learning_rate": 3.0316901408450706e-05, + "loss": 0.4599, "step": 2900 }, { - "epoch": 10.1, - "learning_rate": 3.659929328621908e-06, - "loss": 0.2575, + "epoch": 40.42, + "learning_rate": 3.0246478873239438e-05, + "loss": 0.4565, "step": 2910 }, { - "epoch": 10.14, - "learning_rate": 3.6585159010600705e-06, - "loss": 0.2875, + "epoch": 40.55, + "learning_rate": 3.017605633802817e-05, + "loss": 0.4611, "step": 2920 }, { - "epoch": 10.17, - "learning_rate": 3.657102473498233e-06, - "loss": 0.2961, + "epoch": 40.69, + "learning_rate": 3.01056338028169e-05, + "loss": 0.4487, "step": 2930 }, { - "epoch": 10.21, - "learning_rate": 3.6556890459363957e-06, - "loss": 0.2588, + "epoch": 40.83, + "learning_rate": 3.0035211267605633e-05, + "loss": 0.46, "step": 2940 }, { - "epoch": 10.24, - "learning_rate": 3.654275618374558e-06, - "loss": 0.2574, + "epoch": 40.97, + "learning_rate": 2.9964788732394365e-05, + "loss": 0.4479, "step": 2950 }, { - "epoch": 10.28, - "learning_rate": 3.652862190812721e-06, - "loss": 0.269, + "epoch": 41.0, + "eval_loss": 0.5006310939788818, + "eval_runtime": 125.9565, + "eval_samples_per_second": 4.224, + "eval_steps_per_second": 0.532, + "eval_wer": 0.22022240791926465, + "step": 2952 + }, + { + "epoch": 41.11, + "learning_rate": 2.98943661971831e-05, + "loss": 0.4604, "step": 2960 }, { - "epoch": 10.31, - "learning_rate": 3.651448763250883e-06, - "loss": 0.281, + "epoch": 41.25, + "learning_rate": 2.9823943661971832e-05, + "loss": 0.4544, "step": 2970 }, { - "epoch": 10.35, - "learning_rate": 3.650035335689046e-06, - "loss": 0.2859, + "epoch": 41.39, + "learning_rate": 2.9753521126760564e-05, + "loss": 0.4427, "step": 2980 }, { - "epoch": 10.38, - "learning_rate": 3.648621908127208e-06, - "loss": 0.2844, + "epoch": 41.53, + "learning_rate": 2.9683098591549296e-05, + "loss": 0.4401, "step": 2990 }, { - "epoch": 10.42, - "learning_rate": 3.647208480565371e-06, - "loss": 0.3113, + "epoch": 41.66, + "learning_rate": 2.9612676056338028e-05, + "loss": 0.4672, "step": 3000 }, { - "epoch": 10.45, - "learning_rate": 3.6457950530035334e-06, - "loss": 0.2806, + "epoch": 41.8, + "learning_rate": 2.9542253521126763e-05, + "loss": 0.4618, "step": 3010 }, { - "epoch": 10.48, - "learning_rate": 3.6443816254416963e-06, - "loss": 0.2926, + "epoch": 41.94, + "learning_rate": 2.9471830985915495e-05, + "loss": 0.4379, "step": 3020 }, { - "epoch": 10.52, - "learning_rate": 3.6429681978798583e-06, - "loss": 0.3066, + "epoch": 42.0, + "eval_loss": 0.475214421749115, + "eval_runtime": 126.1342, + "eval_samples_per_second": 4.218, + "eval_steps_per_second": 0.531, + "eval_wer": 0.2213794433374044, + "step": 3024 + }, + { + "epoch": 42.08, + "learning_rate": 2.9401408450704227e-05, + "loss": 0.4655, "step": 3030 }, { - "epoch": 10.55, - "learning_rate": 3.641554770318021e-06, - "loss": 0.278, + "epoch": 42.22, + "learning_rate": 2.933098591549296e-05, + "loss": 0.437, "step": 3040 }, { - "epoch": 10.59, - "learning_rate": 3.6401413427561835e-06, - "loss": 0.276, + "epoch": 42.36, + "learning_rate": 2.926056338028169e-05, + "loss": 0.454, "step": 3050 }, { - "epoch": 10.62, - "learning_rate": 3.6387279151943463e-06, - "loss": 0.2589, + "epoch": 42.5, + "learning_rate": 2.9190140845070422e-05, + "loss": 0.46, "step": 3060 }, { - "epoch": 10.66, - "learning_rate": 3.6373144876325088e-06, - "loss": 0.2792, + "epoch": 42.64, + "learning_rate": 2.9119718309859158e-05, + "loss": 0.4389, "step": 3070 }, { - "epoch": 10.69, - "learning_rate": 3.6359010600706716e-06, - "loss": 0.2706, + "epoch": 42.78, + "learning_rate": 2.904929577464789e-05, + "loss": 0.4554, "step": 3080 }, { - "epoch": 10.73, - "learning_rate": 3.6344876325088336e-06, - "loss": 0.2702, + "epoch": 42.91, + "learning_rate": 2.897887323943662e-05, + "loss": 0.4412, "step": 3090 }, { - "epoch": 10.76, - "learning_rate": 3.6330742049469964e-06, - "loss": 0.2818, - "step": 3100 + "epoch": 43.0, + "eval_loss": 0.47216537594795227, + "eval_runtime": 125.8233, + "eval_samples_per_second": 4.228, + "eval_steps_per_second": 0.532, + "eval_wer": 0.22105804461014333, + "step": 3096 }, { - "epoch": 10.8, - "learning_rate": 3.631660777385159e-06, - "loss": 0.2898, + "epoch": 43.06, + "learning_rate": 2.8908450704225353e-05, + "loss": 0.4685, + "step": 3100 + }, + { + "epoch": 43.19, + "learning_rate": 2.8838028169014085e-05, + "loss": 0.4424, "step": 3110 }, { - "epoch": 10.83, - "learning_rate": 3.6302473498233216e-06, - "loss": 0.2893, + "epoch": 43.33, + "learning_rate": 2.876760563380282e-05, + "loss": 0.4495, "step": 3120 }, { - "epoch": 10.87, - "learning_rate": 3.628833922261484e-06, - "loss": 0.275, + "epoch": 43.47, + "learning_rate": 2.8697183098591552e-05, + "loss": 0.4576, "step": 3130 }, { - "epoch": 10.9, - "learning_rate": 3.6274204946996465e-06, - "loss": 0.283, + "epoch": 43.61, + "learning_rate": 2.8626760563380284e-05, + "loss": 0.4564, "step": 3140 }, { - "epoch": 10.94, - "learning_rate": 3.626007067137809e-06, - "loss": 0.2606, + "epoch": 43.75, + "learning_rate": 2.8556338028169016e-05, + "loss": 0.4458, "step": 3150 }, { - "epoch": 10.97, - "learning_rate": 3.6245936395759717e-06, - "loss": 0.2922, + "epoch": 43.89, + "learning_rate": 2.8485915492957748e-05, + "loss": 0.4459, "step": 3160 }, { - "epoch": 11.0, - "eval_loss": 0.508041262626648, - "eval_runtime": 130.0766, - "eval_samples_per_second": 4.09, - "eval_steps_per_second": 1.022, - "eval_wer": 0.20113132351995885, + "epoch": 44.0, + "eval_loss": 0.4859280586242676, + "eval_runtime": 126.1798, + "eval_samples_per_second": 4.216, + "eval_steps_per_second": 0.531, + "eval_wer": 0.22028668766471685, "step": 3168 }, { - "epoch": 11.01, - "learning_rate": 3.623180212014134e-06, - "loss": 0.3119, + "epoch": 44.03, + "learning_rate": 2.841549295774648e-05, + "loss": 0.4697, "step": 3170 }, { - "epoch": 11.04, - "learning_rate": 3.621766784452297e-06, - "loss": 0.2549, + "epoch": 44.17, + "learning_rate": 2.8345070422535215e-05, + "loss": 0.4495, "step": 3180 }, { - "epoch": 11.08, - "learning_rate": 3.6203533568904594e-06, - "loss": 0.2656, + "epoch": 44.3, + "learning_rate": 2.8274647887323947e-05, + "loss": 0.4617, "step": 3190 }, { - "epoch": 11.11, - "learning_rate": 3.6189399293286218e-06, - "loss": 0.2914, + "epoch": 44.44, + "learning_rate": 2.820422535211268e-05, + "loss": 0.4659, "step": 3200 }, { - "epoch": 11.15, - "learning_rate": 3.617526501766784e-06, - "loss": 0.2861, + "epoch": 44.58, + "learning_rate": 2.813380281690141e-05, + "loss": 0.4591, "step": 3210 }, { - "epoch": 11.18, - "learning_rate": 3.616113074204947e-06, - "loss": 0.2998, + "epoch": 44.72, + "learning_rate": 2.8063380281690143e-05, + "loss": 0.4446, "step": 3220 }, { - "epoch": 11.21, - "learning_rate": 3.6146996466431094e-06, - "loss": 0.2821, + "epoch": 44.86, + "learning_rate": 2.7992957746478874e-05, + "loss": 0.4468, "step": 3230 }, { - "epoch": 11.25, - "learning_rate": 3.6132862190812723e-06, - "loss": 0.3008, + "epoch": 45.0, + "learning_rate": 2.792253521126761e-05, + "loss": 0.4541, "step": 3240 }, { - "epoch": 11.28, - "learning_rate": 3.6118727915194342e-06, - "loss": 0.26, + "epoch": 45.0, + "eval_loss": 0.48502814769744873, + "eval_runtime": 126.9478, + "eval_samples_per_second": 4.191, + "eval_steps_per_second": 0.528, + "eval_wer": 0.21893681301022047, + "step": 3240 + }, + { + "epoch": 45.14, + "learning_rate": 2.785211267605634e-05, + "loss": 0.4567, "step": 3250 }, { - "epoch": 11.32, - "learning_rate": 3.610459363957597e-06, - "loss": 0.2877, + "epoch": 45.28, + "learning_rate": 2.7781690140845073e-05, + "loss": 0.4562, "step": 3260 }, { - "epoch": 11.35, - "learning_rate": 3.6090459363957595e-06, - "loss": 0.3065, + "epoch": 45.42, + "learning_rate": 2.7711267605633805e-05, + "loss": 0.4478, "step": 3270 }, { - "epoch": 11.39, - "learning_rate": 3.6076325088339223e-06, - "loss": 0.2815, + "epoch": 45.55, + "learning_rate": 2.7640845070422537e-05, + "loss": 0.4544, "step": 3280 }, { - "epoch": 11.42, - "learning_rate": 3.6062190812720847e-06, - "loss": 0.2649, + "epoch": 45.69, + "learning_rate": 2.7570422535211272e-05, + "loss": 0.452, "step": 3290 }, { - "epoch": 11.46, - "learning_rate": 3.6048056537102476e-06, - "loss": 0.2859, + "epoch": 45.83, + "learning_rate": 2.7500000000000004e-05, + "loss": 0.4447, "step": 3300 }, { - "epoch": 11.49, - "learning_rate": 3.6033922261484095e-06, - "loss": 0.2826, + "epoch": 45.97, + "learning_rate": 2.7429577464788736e-05, + "loss": 0.4509, "step": 3310 }, { - "epoch": 11.53, - "learning_rate": 3.601978798586572e-06, - "loss": 0.2882, + "epoch": 46.0, + "eval_loss": 0.4837965965270996, + "eval_runtime": 126.0838, + "eval_samples_per_second": 4.219, + "eval_steps_per_second": 0.531, + "eval_wer": 0.21623706370122775, + "step": 3312 + }, + { + "epoch": 46.11, + "learning_rate": 2.7359154929577468e-05, + "loss": 0.4564, "step": 3320 }, { - "epoch": 11.56, - "learning_rate": 3.600565371024735e-06, - "loss": 0.2772, + "epoch": 46.25, + "learning_rate": 2.72887323943662e-05, + "loss": 0.4427, "step": 3330 }, { - "epoch": 11.6, - "learning_rate": 3.5991519434628976e-06, - "loss": 0.2678, + "epoch": 46.39, + "learning_rate": 2.7218309859154932e-05, + "loss": 0.4461, "step": 3340 }, { - "epoch": 11.63, - "learning_rate": 3.59773851590106e-06, - "loss": 0.2841, + "epoch": 46.53, + "learning_rate": 2.7147887323943667e-05, + "loss": 0.4434, "step": 3350 }, { - "epoch": 11.66, - "learning_rate": 3.596325088339223e-06, - "loss": 0.2982, + "epoch": 46.66, + "learning_rate": 2.7077464788732392e-05, + "loss": 0.4477, "step": 3360 }, { - "epoch": 11.7, - "learning_rate": 3.594911660777385e-06, - "loss": 0.2904, + "epoch": 46.8, + "learning_rate": 2.7007042253521124e-05, + "loss": 0.4417, "step": 3370 }, { - "epoch": 11.73, - "learning_rate": 3.5934982332155473e-06, - "loss": 0.2908, + "epoch": 46.94, + "learning_rate": 2.693661971830986e-05, + "loss": 0.4472, "step": 3380 }, { - "epoch": 11.77, - "learning_rate": 3.59208480565371e-06, - "loss": 0.2629, + "epoch": 47.0, + "eval_loss": 0.48925644159317017, + "eval_runtime": 126.2561, + "eval_samples_per_second": 4.214, + "eval_steps_per_second": 0.531, + "eval_wer": 0.2310856849006878, + "step": 3384 + }, + { + "epoch": 47.08, + "learning_rate": 2.686619718309859e-05, + "loss": 0.4608, "step": 3390 }, { - "epoch": 11.8, - "learning_rate": 3.5906713780918725e-06, - "loss": 0.2953, + "epoch": 47.22, + "learning_rate": 2.6795774647887323e-05, + "loss": 0.4448, "step": 3400 }, { - "epoch": 11.84, - "learning_rate": 3.5892579505300353e-06, - "loss": 0.2857, + "epoch": 47.36, + "learning_rate": 2.6725352112676055e-05, + "loss": 0.4368, "step": 3410 }, { - "epoch": 11.87, - "learning_rate": 3.5878445229681973e-06, - "loss": 0.2671, + "epoch": 47.5, + "learning_rate": 2.6654929577464787e-05, + "loss": 0.4388, "step": 3420 }, { - "epoch": 11.91, - "learning_rate": 3.58643109540636e-06, - "loss": 0.2685, + "epoch": 47.64, + "learning_rate": 2.658450704225352e-05, + "loss": 0.4271, "step": 3430 }, { - "epoch": 11.94, - "learning_rate": 3.5850176678445226e-06, - "loss": 0.287, + "epoch": 47.78, + "learning_rate": 2.6514084507042254e-05, + "loss": 0.4443, "step": 3440 }, { - "epoch": 11.98, - "learning_rate": 3.5836042402826854e-06, - "loss": 0.2869, + "epoch": 47.91, + "learning_rate": 2.6443661971830986e-05, + "loss": 0.4341, "step": 3450 }, { - "epoch": 12.0, - "eval_loss": 0.4973689019680023, - "eval_runtime": 129.1272, - "eval_samples_per_second": 4.12, - "eval_steps_per_second": 1.03, - "eval_wer": 0.20267403741081186, + "epoch": 48.0, + "eval_loss": 0.4899713695049286, + "eval_runtime": 127.6794, + "eval_samples_per_second": 4.167, + "eval_steps_per_second": 0.525, + "eval_wer": 0.2198367294465514, "step": 3456 }, { - "epoch": 12.01, - "learning_rate": 3.582190812720848e-06, - "loss": 0.2896, + "epoch": 48.06, + "learning_rate": 2.6373239436619718e-05, + "loss": 0.4632, "step": 3460 }, { - "epoch": 12.05, - "learning_rate": 3.5807773851590106e-06, - "loss": 0.2994, + "epoch": 48.19, + "learning_rate": 2.630281690140845e-05, + "loss": 0.4492, "step": 3470 }, { - "epoch": 12.08, - "learning_rate": 3.5793639575971726e-06, - "loss": 0.2556, + "epoch": 48.33, + "learning_rate": 2.623239436619718e-05, + "loss": 0.4472, "step": 3480 }, { - "epoch": 12.12, - "learning_rate": 3.5779505300353355e-06, - "loss": 0.2681, + "epoch": 48.47, + "learning_rate": 2.6161971830985917e-05, + "loss": 0.4323, "step": 3490 }, { - "epoch": 12.15, - "learning_rate": 3.576537102473498e-06, - "loss": 0.2913, + "epoch": 48.61, + "learning_rate": 2.609154929577465e-05, + "loss": 0.4455, "step": 3500 }, { - "epoch": 12.19, - "learning_rate": 3.5751236749116607e-06, - "loss": 0.2544, + "epoch": 48.75, + "learning_rate": 2.602112676056338e-05, + "loss": 0.4441, "step": 3510 }, { - "epoch": 12.22, - "learning_rate": 3.573710247349823e-06, - "loss": 0.2785, + "epoch": 48.89, + "learning_rate": 2.5950704225352112e-05, + "loss": 0.4306, "step": 3520 }, { - "epoch": 12.26, - "learning_rate": 3.572296819787986e-06, - "loss": 0.2865, + "epoch": 49.0, + "eval_loss": 0.5051801800727844, + "eval_runtime": 126.7896, + "eval_samples_per_second": 4.196, + "eval_steps_per_second": 0.528, + "eval_wer": 0.21662274217394098, + "step": 3528 + }, + { + "epoch": 49.03, + "learning_rate": 2.5880281690140844e-05, + "loss": 0.4485, "step": 3530 }, { - "epoch": 12.29, - "learning_rate": 3.570883392226148e-06, - "loss": 0.3012, + "epoch": 49.17, + "learning_rate": 2.5809859154929576e-05, + "loss": 0.4317, "step": 3540 }, { - "epoch": 12.33, - "learning_rate": 3.5694699646643108e-06, - "loss": 0.2854, + "epoch": 49.3, + "learning_rate": 2.573943661971831e-05, + "loss": 0.4475, "step": 3550 }, { - "epoch": 12.36, - "learning_rate": 3.568056537102473e-06, - "loss": 0.3029, + "epoch": 49.44, + "learning_rate": 2.5669014084507043e-05, + "loss": 0.4293, "step": 3560 }, { - "epoch": 12.39, - "learning_rate": 3.566643109540636e-06, - "loss": 0.2927, + "epoch": 49.58, + "learning_rate": 2.5598591549295775e-05, + "loss": 0.4437, "step": 3570 }, { - "epoch": 12.43, - "learning_rate": 3.5652296819787984e-06, - "loss": 0.2681, + "epoch": 49.72, + "learning_rate": 2.5528169014084507e-05, + "loss": 0.4452, "step": 3580 }, { - "epoch": 12.46, - "learning_rate": 3.563816254416961e-06, - "loss": 0.2767, + "epoch": 49.86, + "learning_rate": 2.545774647887324e-05, + "loss": 0.4429, "step": 3590 }, { - "epoch": 12.5, - "learning_rate": 3.5624028268551232e-06, - "loss": 0.2824, + "epoch": 50.0, + "learning_rate": 2.5387323943661974e-05, + "loss": 0.44, + "step": 3600 + }, + { + "epoch": 50.0, + "eval_loss": 0.508723795413971, + "eval_runtime": 126.2458, + "eval_samples_per_second": 4.214, + "eval_steps_per_second": 0.531, + "eval_wer": 0.2229864369737096, "step": 3600 }, { - "epoch": 12.53, - "learning_rate": 3.5611307420494697e-06, - "loss": 0.2764, + "epoch": 50.14, + "learning_rate": 2.5316901408450706e-05, + "loss": 0.4377, "step": 3610 }, { - "epoch": 12.57, - "learning_rate": 3.559717314487632e-06, - "loss": 0.2487, + "epoch": 50.28, + "learning_rate": 2.5246478873239438e-05, + "loss": 0.4285, "step": 3620 }, { - "epoch": 12.6, - "learning_rate": 3.558303886925795e-06, - "loss": 0.2881, + "epoch": 50.42, + "learning_rate": 2.517605633802817e-05, + "loss": 0.4413, "step": 3630 }, { - "epoch": 12.64, - "learning_rate": 3.5568904593639574e-06, - "loss": 0.2865, + "epoch": 50.55, + "learning_rate": 2.51056338028169e-05, + "loss": 0.4518, "step": 3640 }, { - "epoch": 12.67, - "learning_rate": 3.55547703180212e-06, - "loss": 0.2817, + "epoch": 50.69, + "learning_rate": 2.5035211267605634e-05, + "loss": 0.4334, "step": 3650 }, { - "epoch": 12.71, - "learning_rate": 3.5540636042402826e-06, - "loss": 0.2677, + "epoch": 50.83, + "learning_rate": 2.496478873239437e-05, + "loss": 0.4406, "step": 3660 }, { - "epoch": 12.74, - "learning_rate": 3.552650176678445e-06, - "loss": 0.3031, + "epoch": 50.97, + "learning_rate": 2.48943661971831e-05, + "loss": 0.4425, "step": 3670 }, { - "epoch": 12.78, - "learning_rate": 3.5512367491166074e-06, - "loss": 0.2787, + "epoch": 51.0, + "eval_loss": 0.484998494386673, + "eval_runtime": 125.9671, + "eval_samples_per_second": 4.223, + "eval_steps_per_second": 0.532, + "eval_wer": 0.22002956868290802, + "step": 3672 + }, + { + "epoch": 51.11, + "learning_rate": 2.4823943661971833e-05, + "loss": 0.442, "step": 3680 }, { - "epoch": 12.81, - "learning_rate": 3.5498233215547702e-06, - "loss": 0.2761, + "epoch": 51.25, + "learning_rate": 2.4753521126760564e-05, + "loss": 0.435, "step": 3690 }, { - "epoch": 12.85, - "learning_rate": 3.5484098939929327e-06, - "loss": 0.2749, + "epoch": 51.39, + "learning_rate": 2.4683098591549296e-05, + "loss": 0.4345, "step": 3700 }, { - "epoch": 12.88, - "learning_rate": 3.5469964664310955e-06, - "loss": 0.2977, + "epoch": 51.53, + "learning_rate": 2.4612676056338028e-05, + "loss": 0.445, "step": 3710 }, { - "epoch": 12.91, - "learning_rate": 3.5455830388692575e-06, - "loss": 0.2686, + "epoch": 51.66, + "learning_rate": 2.4542253521126763e-05, + "loss": 0.4239, "step": 3720 }, { - "epoch": 12.95, - "learning_rate": 3.5441696113074203e-06, - "loss": 0.2724, + "epoch": 51.8, + "learning_rate": 2.4471830985915495e-05, + "loss": 0.427, "step": 3730 }, { - "epoch": 12.98, - "learning_rate": 3.5427561837455827e-06, - "loss": 0.284, + "epoch": 51.94, + "learning_rate": 2.4401408450704227e-05, + "loss": 0.4329, "step": 3740 }, { - "epoch": 13.0, - "eval_loss": 0.5104484558105469, - "eval_runtime": 128.6455, - "eval_samples_per_second": 4.135, - "eval_steps_per_second": 1.034, - "eval_wer": 0.200552805810889, + "epoch": 52.0, + "eval_loss": 0.4712650775909424, + "eval_runtime": 126.6273, + "eval_samples_per_second": 4.201, + "eval_steps_per_second": 0.529, + "eval_wer": 0.21887253326476827, "step": 3744 }, { - "epoch": 13.02, - "learning_rate": 3.5413427561837456e-06, - "loss": 0.2975, + "epoch": 52.08, + "learning_rate": 2.433098591549296e-05, + "loss": 0.4487, "step": 3750 }, { - "epoch": 13.06, - "learning_rate": 3.539929328621908e-06, - "loss": 0.2805, + "epoch": 52.22, + "learning_rate": 2.426056338028169e-05, + "loss": 0.4431, "step": 3760 }, { - "epoch": 13.09, - "learning_rate": 3.538515901060071e-06, - "loss": 0.2694, + "epoch": 52.36, + "learning_rate": 2.4190140845070426e-05, + "loss": 0.438, "step": 3770 }, { - "epoch": 13.12, - "learning_rate": 3.5371024734982328e-06, - "loss": 0.2523, + "epoch": 52.5, + "learning_rate": 2.4119718309859158e-05, + "loss": 0.4351, "step": 3780 }, { - "epoch": 13.16, - "learning_rate": 3.5356890459363956e-06, - "loss": 0.2933, + "epoch": 52.64, + "learning_rate": 2.404929577464789e-05, + "loss": 0.4231, "step": 3790 }, { - "epoch": 13.19, - "learning_rate": 3.534275618374558e-06, - "loss": 0.2829, + "epoch": 52.78, + "learning_rate": 2.3978873239436622e-05, + "loss": 0.4367, "step": 3800 }, { - "epoch": 13.23, - "learning_rate": 3.532862190812721e-06, - "loss": 0.261, + "epoch": 52.91, + "learning_rate": 2.390845070422535e-05, + "loss": 0.4335, "step": 3810 }, { - "epoch": 13.26, - "learning_rate": 3.5314487632508833e-06, - "loss": 0.2829, + "epoch": 53.0, + "eval_loss": 0.4828576147556305, + "eval_runtime": 126.5803, + "eval_samples_per_second": 4.203, + "eval_steps_per_second": 0.529, + "eval_wer": 0.21379443337404383, + "step": 3816 + }, + { + "epoch": 53.06, + "learning_rate": 2.3838028169014086e-05, + "loss": 0.4454, "step": 3820 }, { - "epoch": 13.3, - "learning_rate": 3.530035335689046e-06, - "loss": 0.2911, + "epoch": 53.19, + "learning_rate": 2.3767605633802817e-05, + "loss": 0.4323, "step": 3830 }, { - "epoch": 13.33, - "learning_rate": 3.528621908127208e-06, - "loss": 0.2769, + "epoch": 53.33, + "learning_rate": 2.369718309859155e-05, + "loss": 0.4371, "step": 3840 }, { - "epoch": 13.37, - "learning_rate": 3.527208480565371e-06, - "loss": 0.2595, + "epoch": 53.47, + "learning_rate": 2.362676056338028e-05, + "loss": 0.4435, "step": 3850 }, { - "epoch": 13.4, - "learning_rate": 3.5257950530035333e-06, - "loss": 0.2858, + "epoch": 53.61, + "learning_rate": 2.3556338028169013e-05, + "loss": 0.4307, "step": 3860 }, { - "epoch": 13.44, - "learning_rate": 3.524381625441696e-06, - "loss": 0.2498, + "epoch": 53.75, + "learning_rate": 2.348591549295775e-05, + "loss": 0.424, "step": 3870 }, { - "epoch": 13.47, - "learning_rate": 3.5229681978798586e-06, - "loss": 0.2919, + "epoch": 53.89, + "learning_rate": 2.341549295774648e-05, + "loss": 0.4184, "step": 3880 }, { - "epoch": 13.51, - "learning_rate": 3.521554770318021e-06, - "loss": 0.3099, + "epoch": 54.0, + "eval_loss": 0.5033903121948242, + "eval_runtime": 126.2852, + "eval_samples_per_second": 4.213, + "eval_steps_per_second": 0.531, + "eval_wer": 0.2127659574468085, + "step": 3888 + }, + { + "epoch": 54.03, + "learning_rate": 2.3345070422535212e-05, + "loss": 0.4599, "step": 3890 }, { - "epoch": 13.54, - "learning_rate": 3.5201413427561834e-06, - "loss": 0.2785, + "epoch": 54.17, + "learning_rate": 2.3274647887323944e-05, + "loss": 0.4255, "step": 3900 }, { - "epoch": 13.57, - "learning_rate": 3.5187279151943462e-06, - "loss": 0.2562, + "epoch": 54.3, + "learning_rate": 2.3204225352112676e-05, + "loss": 0.4408, "step": 3910 }, { - "epoch": 13.61, - "learning_rate": 3.5173144876325086e-06, - "loss": 0.2876, + "epoch": 54.44, + "learning_rate": 2.3133802816901408e-05, + "loss": 0.4261, "step": 3920 }, { - "epoch": 13.64, - "learning_rate": 3.5159010600706715e-06, - "loss": 0.2982, + "epoch": 54.58, + "learning_rate": 2.3063380281690143e-05, + "loss": 0.4391, "step": 3930 }, { - "epoch": 13.68, - "learning_rate": 3.514487632508834e-06, - "loss": 0.2774, + "epoch": 54.72, + "learning_rate": 2.2992957746478875e-05, + "loss": 0.44, "step": 3940 }, { - "epoch": 13.71, - "learning_rate": 3.5130742049469963e-06, - "loss": 0.2651, + "epoch": 54.86, + "learning_rate": 2.2922535211267607e-05, + "loss": 0.4379, "step": 3950 }, { - "epoch": 13.75, - "learning_rate": 3.5116607773851587e-06, - "loss": 0.2769, + "epoch": 55.0, + "learning_rate": 2.285211267605634e-05, + "loss": 0.4303, "step": 3960 }, { - "epoch": 13.78, - "learning_rate": 3.5102473498233215e-06, - "loss": 0.2744, + "epoch": 55.0, + "eval_loss": 0.4944688677787781, + "eval_runtime": 127.0851, + "eval_samples_per_second": 4.186, + "eval_steps_per_second": 0.527, + "eval_wer": 0.21662274217394098, + "step": 3960 + }, + { + "epoch": 55.14, + "learning_rate": 2.278169014084507e-05, + "loss": 0.4272, "step": 3970 }, { - "epoch": 13.82, - "learning_rate": 3.508833922261484e-06, - "loss": 0.2922, + "epoch": 55.28, + "learning_rate": 2.2711267605633806e-05, + "loss": 0.4379, "step": 3980 }, { - "epoch": 13.85, - "learning_rate": 3.5074204946996468e-06, - "loss": 0.2784, + "epoch": 55.42, + "learning_rate": 2.2640845070422538e-05, + "loss": 0.4422, "step": 3990 }, { - "epoch": 13.89, - "learning_rate": 3.506007067137809e-06, - "loss": 0.2871, + "epoch": 55.55, + "learning_rate": 2.257042253521127e-05, + "loss": 0.4369, "step": 4000 }, { - "epoch": 13.92, - "learning_rate": 3.5045936395759716e-06, - "loss": 0.2628, + "epoch": 55.69, + "learning_rate": 2.25e-05, + "loss": 0.4451, "step": 4010 }, { - "epoch": 13.96, - "learning_rate": 3.503180212014134e-06, - "loss": 0.2794, + "epoch": 55.83, + "learning_rate": 2.2429577464788733e-05, + "loss": 0.4423, "step": 4020 }, { - "epoch": 13.99, - "learning_rate": 3.501766784452297e-06, - "loss": 0.2911, + "epoch": 55.97, + "learning_rate": 2.2359154929577465e-05, + "loss": 0.4519, "step": 4030 }, { - "epoch": 14.0, - "eval_loss": 0.5025652050971985, - "eval_runtime": 129.3001, - "eval_samples_per_second": 4.114, - "eval_steps_per_second": 1.029, - "eval_wer": 0.20170984122902874, + "epoch": 56.0, + "eval_loss": 0.5088710784912109, + "eval_runtime": 127.0232, + "eval_samples_per_second": 4.188, + "eval_steps_per_second": 0.527, + "eval_wer": 0.21058044610143345, "step": 4032 }, { - "epoch": 14.03, - "learning_rate": 3.5003533568904592e-06, - "loss": 0.2873, + "epoch": 56.11, + "learning_rate": 2.22887323943662e-05, + "loss": 0.4343, "step": 4040 }, { - "epoch": 14.06, - "learning_rate": 3.498939929328622e-06, - "loss": 0.2802, + "epoch": 56.25, + "learning_rate": 2.2218309859154932e-05, + "loss": 0.4311, "step": 4050 }, { - "epoch": 14.1, - "learning_rate": 3.497526501766784e-06, - "loss": 0.2649, + "epoch": 56.39, + "learning_rate": 2.2147887323943664e-05, + "loss": 0.4214, "step": 4060 }, { - "epoch": 14.13, - "learning_rate": 3.496113074204947e-06, - "loss": 0.2909, + "epoch": 56.53, + "learning_rate": 2.2077464788732396e-05, + "loss": 0.4422, "step": 4070 }, { - "epoch": 14.17, - "learning_rate": 3.4946996466431093e-06, - "loss": 0.2844, + "epoch": 56.66, + "learning_rate": 2.2007042253521128e-05, + "loss": 0.4273, "step": 4080 }, { - "epoch": 14.2, - "learning_rate": 3.493286219081272e-06, - "loss": 0.2669, + "epoch": 56.8, + "learning_rate": 2.1936619718309863e-05, + "loss": 0.4416, "step": 4090 }, { - "epoch": 14.24, - "learning_rate": 3.4918727915194345e-06, - "loss": 0.2757, + "epoch": 56.94, + "learning_rate": 2.186619718309859e-05, + "loss": 0.4336, "step": 4100 }, { - "epoch": 14.27, - "learning_rate": 3.4904593639575974e-06, - "loss": 0.2774, + "epoch": 57.0, + "eval_loss": 0.5325378179550171, + "eval_runtime": 133.5981, + "eval_samples_per_second": 3.982, + "eval_steps_per_second": 0.502, + "eval_wer": 0.21463007006492255, + "step": 4104 + }, + { + "epoch": 57.08, + "learning_rate": 2.1795774647887324e-05, + "loss": 0.4356, "step": 4110 }, { - "epoch": 14.3, - "learning_rate": 3.4890459363957594e-06, - "loss": 0.2773, + "epoch": 57.22, + "learning_rate": 2.1725352112676055e-05, + "loss": 0.4303, "step": 4120 }, { - "epoch": 14.34, - "learning_rate": 3.487632508833922e-06, - "loss": 0.2743, + "epoch": 57.36, + "learning_rate": 2.1654929577464787e-05, + "loss": 0.4352, "step": 4130 }, { - "epoch": 14.37, - "learning_rate": 3.4862190812720846e-06, - "loss": 0.2583, + "epoch": 57.5, + "learning_rate": 2.1584507042253523e-05, + "loss": 0.4417, "step": 4140 }, { - "epoch": 14.41, - "learning_rate": 3.4848056537102474e-06, - "loss": 0.2636, + "epoch": 57.64, + "learning_rate": 2.1514084507042254e-05, + "loss": 0.4322, "step": 4150 }, { - "epoch": 14.44, - "learning_rate": 3.48339222614841e-06, - "loss": 0.2344, + "epoch": 57.78, + "learning_rate": 2.1443661971830986e-05, + "loss": 0.4461, "step": 4160 }, { - "epoch": 14.48, - "learning_rate": 3.4819787985865723e-06, - "loss": 0.2904, + "epoch": 57.91, + "learning_rate": 2.1373239436619718e-05, + "loss": 0.4274, "step": 4170 }, { - "epoch": 14.51, - "learning_rate": 3.4805653710247347e-06, - "loss": 0.2892, + "epoch": 58.0, + "eval_loss": 0.5188899636268616, + "eval_runtime": 126.4883, + "eval_samples_per_second": 4.206, + "eval_steps_per_second": 0.53, + "eval_wer": 0.22202224079192645, + "step": 4176 + }, + { + "epoch": 58.06, + "learning_rate": 2.130281690140845e-05, + "loss": 0.4454, "step": 4180 }, { - "epoch": 14.55, - "learning_rate": 3.4791519434628975e-06, - "loss": 0.2607, + "epoch": 58.19, + "learning_rate": 2.1232394366197182e-05, + "loss": 0.4345, "step": 4190 }, { - "epoch": 14.58, - "learning_rate": 3.47773851590106e-06, - "loss": 0.2952, + "epoch": 58.33, + "learning_rate": 2.1161971830985917e-05, + "loss": 0.4421, "step": 4200 }, { - "epoch": 14.62, - "learning_rate": 3.4763250883392227e-06, - "loss": 0.2731, + "epoch": 58.47, + "learning_rate": 2.109154929577465e-05, + "loss": 0.4358, "step": 4210 }, { - "epoch": 14.65, - "learning_rate": 3.474911660777385e-06, - "loss": 0.2973, + "epoch": 58.61, + "learning_rate": 2.102112676056338e-05, + "loss": 0.4267, "step": 4220 }, { - "epoch": 14.69, - "learning_rate": 3.4734982332155476e-06, - "loss": 0.2897, + "epoch": 58.75, + "learning_rate": 2.0950704225352113e-05, + "loss": 0.4531, "step": 4230 }, { - "epoch": 14.72, - "learning_rate": 3.47208480565371e-06, - "loss": 0.2761, + "epoch": 58.89, + "learning_rate": 2.0880281690140845e-05, + "loss": 0.4217, "step": 4240 }, { - "epoch": 14.75, - "learning_rate": 3.470671378091873e-06, - "loss": 0.2716, + "epoch": 59.0, + "eval_loss": 0.5071147084236145, + "eval_runtime": 126.2477, + "eval_samples_per_second": 4.214, + "eval_steps_per_second": 0.531, + "eval_wer": 0.2119303207559298, + "step": 4248 + }, + { + "epoch": 59.03, + "learning_rate": 2.080985915492958e-05, + "loss": 0.4357, "step": 4250 }, { - "epoch": 14.79, - "learning_rate": 3.4692579505300352e-06, - "loss": 0.2473, + "epoch": 59.17, + "learning_rate": 2.0739436619718312e-05, + "loss": 0.4185, "step": 4260 }, { - "epoch": 14.82, - "learning_rate": 3.467844522968198e-06, - "loss": 0.3024, + "epoch": 59.3, + "learning_rate": 2.0669014084507044e-05, + "loss": 0.4357, "step": 4270 }, { - "epoch": 14.86, - "learning_rate": 3.4664310954063605e-06, - "loss": 0.2873, + "epoch": 59.44, + "learning_rate": 2.0598591549295776e-05, + "loss": 0.433, "step": 4280 }, { - "epoch": 14.89, - "learning_rate": 3.4650176678445224e-06, - "loss": 0.278, + "epoch": 59.58, + "learning_rate": 2.0528169014084507e-05, + "loss": 0.4387, "step": 4290 }, { - "epoch": 14.93, - "learning_rate": 3.4636042402826853e-06, - "loss": 0.2486, + "epoch": 59.72, + "learning_rate": 2.045774647887324e-05, + "loss": 0.4357, "step": 4300 }, { - "epoch": 14.96, - "learning_rate": 3.462190812720848e-06, - "loss": 0.2668, + "epoch": 59.86, + "learning_rate": 2.0387323943661975e-05, + "loss": 0.3986, "step": 4310 }, { - "epoch": 15.0, - "learning_rate": 3.4607773851590105e-06, - "loss": 0.2864, + "epoch": 60.0, + "learning_rate": 2.0316901408450707e-05, + "loss": 0.4173, "step": 4320 }, { - "epoch": 15.0, - "eval_loss": 0.5064656138420105, - "eval_runtime": 129.204, - "eval_samples_per_second": 4.118, - "eval_steps_per_second": 1.029, - "eval_wer": 0.20023140708362794, + "epoch": 60.0, + "eval_loss": 0.5162719488143921, + "eval_runtime": 126.1056, + "eval_samples_per_second": 4.219, + "eval_steps_per_second": 0.531, + "eval_wer": 0.218486854792055, "step": 4320 }, { - "epoch": 15.03, - "learning_rate": 3.4593639575971734e-06, - "loss": 0.2883, + "epoch": 60.14, + "learning_rate": 2.024647887323944e-05, + "loss": 0.4373, "step": 4330 }, { - "epoch": 15.07, - "learning_rate": 3.4579505300353353e-06, - "loss": 0.2741, + "epoch": 60.28, + "learning_rate": 2.017605633802817e-05, + "loss": 0.4161, "step": 4340 }, { - "epoch": 15.1, - "learning_rate": 3.4565371024734977e-06, - "loss": 0.2775, + "epoch": 60.42, + "learning_rate": 2.0105633802816902e-05, + "loss": 0.4227, "step": 4350 }, { - "epoch": 15.14, - "learning_rate": 3.4551236749116606e-06, - "loss": 0.287, + "epoch": 60.55, + "learning_rate": 2.0035211267605637e-05, + "loss": 0.417, "step": 4360 }, { - "epoch": 15.17, - "learning_rate": 3.453710247349823e-06, - "loss": 0.2964, + "epoch": 60.69, + "learning_rate": 1.996478873239437e-05, + "loss": 0.4254, "step": 4370 }, { - "epoch": 15.21, - "learning_rate": 3.452296819787986e-06, - "loss": 0.2907, + "epoch": 60.83, + "learning_rate": 1.98943661971831e-05, + "loss": 0.4221, "step": 4380 }, { - "epoch": 15.24, - "learning_rate": 3.4508833922261482e-06, - "loss": 0.282, + "epoch": 60.97, + "learning_rate": 1.9823943661971833e-05, + "loss": 0.4221, "step": 4390 }, { - "epoch": 15.28, - "learning_rate": 3.4494699646643106e-06, - "loss": 0.2511, + "epoch": 61.0, + "eval_loss": 0.48502665758132935, + "eval_runtime": 125.8546, + "eval_samples_per_second": 4.227, + "eval_steps_per_second": 0.532, + "eval_wer": 0.21893681301022047, + "step": 4392 + }, + { + "epoch": 61.11, + "learning_rate": 1.975352112676056e-05, + "loss": 0.4402, "step": 4400 }, { - "epoch": 15.31, - "learning_rate": 3.448056537102473e-06, - "loss": 0.284, + "epoch": 61.25, + "learning_rate": 1.9683098591549297e-05, + "loss": 0.4362, "step": 4410 }, { - "epoch": 15.35, - "learning_rate": 3.446643109540636e-06, - "loss": 0.2856, + "epoch": 61.39, + "learning_rate": 1.961267605633803e-05, + "loss": 0.42, "step": 4420 }, { - "epoch": 15.38, - "learning_rate": 3.4452296819787983e-06, - "loss": 0.2694, + "epoch": 61.53, + "learning_rate": 1.954225352112676e-05, + "loss": 0.4152, "step": 4430 }, { - "epoch": 15.42, - "learning_rate": 3.443816254416961e-06, - "loss": 0.2572, + "epoch": 61.66, + "learning_rate": 1.9471830985915492e-05, + "loss": 0.4042, "step": 4440 }, { - "epoch": 15.45, - "learning_rate": 3.4424028268551235e-06, - "loss": 0.2929, + "epoch": 61.8, + "learning_rate": 1.9401408450704224e-05, + "loss": 0.4293, "step": 4450 }, { - "epoch": 15.48, - "learning_rate": 3.440989399293286e-06, - "loss": 0.2973, + "epoch": 61.94, + "learning_rate": 1.933098591549296e-05, + "loss": 0.4244, "step": 4460 }, { - "epoch": 15.52, - "learning_rate": 3.4395759717314484e-06, - "loss": 0.2767, + "epoch": 62.0, + "eval_loss": 0.4899979829788208, + "eval_runtime": 125.4884, + "eval_samples_per_second": 4.239, + "eval_steps_per_second": 0.534, + "eval_wer": 0.21533714726489683, + "step": 4464 + }, + { + "epoch": 62.08, + "learning_rate": 1.926056338028169e-05, + "loss": 0.4405, "step": 4470 }, { - "epoch": 15.55, - "learning_rate": 3.438162544169611e-06, - "loss": 0.26, + "epoch": 62.22, + "learning_rate": 1.9190140845070423e-05, + "loss": 0.4257, "step": 4480 }, { - "epoch": 15.59, - "learning_rate": 3.4367491166077736e-06, - "loss": 0.2813, + "epoch": 62.36, + "learning_rate": 1.9119718309859155e-05, + "loss": 0.4237, "step": 4490 }, { - "epoch": 15.62, - "learning_rate": 3.4353356890459364e-06, - "loss": 0.2703, + "epoch": 62.5, + "learning_rate": 1.9049295774647887e-05, + "loss": 0.4236, "step": 4500 }, { - "epoch": 15.66, - "learning_rate": 3.4339222614840984e-06, - "loss": 0.2875, + "epoch": 62.64, + "learning_rate": 1.897887323943662e-05, + "loss": 0.414, "step": 4510 }, { - "epoch": 15.69, - "learning_rate": 3.4325088339222613e-06, - "loss": 0.2561, + "epoch": 62.78, + "learning_rate": 1.8908450704225354e-05, + "loss": 0.426, "step": 4520 }, { - "epoch": 15.73, - "learning_rate": 3.4310954063604237e-06, - "loss": 0.271, + "epoch": 62.91, + "learning_rate": 1.8838028169014086e-05, + "loss": 0.4147, "step": 4530 }, { - "epoch": 15.76, - "learning_rate": 3.4296819787985865e-06, - "loss": 0.2934, + "epoch": 63.0, + "eval_loss": 0.4965975284576416, + "eval_runtime": 126.8176, + "eval_samples_per_second": 4.195, + "eval_steps_per_second": 0.528, + "eval_wer": 0.2077521373015363, + "step": 4536 + }, + { + "epoch": 63.06, + "learning_rate": 1.8767605633802818e-05, + "loss": 0.4279, "step": 4540 }, { - "epoch": 15.8, - "learning_rate": 3.428268551236749e-06, - "loss": 0.2791, + "epoch": 63.19, + "learning_rate": 1.869718309859155e-05, + "loss": 0.4237, "step": 4550 }, { - "epoch": 15.83, - "learning_rate": 3.4268551236749117e-06, - "loss": 0.2896, + "epoch": 63.33, + "learning_rate": 1.862676056338028e-05, + "loss": 0.4317, "step": 4560 }, { - "epoch": 15.87, - "learning_rate": 3.4254416961130737e-06, - "loss": 0.3179, + "epoch": 63.47, + "learning_rate": 1.8556338028169014e-05, + "loss": 0.4234, "step": 4570 }, { - "epoch": 15.9, - "learning_rate": 3.4240282685512366e-06, - "loss": 0.2716, + "epoch": 63.61, + "learning_rate": 1.848591549295775e-05, + "loss": 0.424, "step": 4580 }, { - "epoch": 15.94, - "learning_rate": 3.422614840989399e-06, - "loss": 0.3019, + "epoch": 63.75, + "learning_rate": 1.841549295774648e-05, + "loss": 0.4191, "step": 4590 }, { - "epoch": 15.97, - "learning_rate": 3.421201413427562e-06, - "loss": 0.2779, + "epoch": 63.89, + "learning_rate": 1.8345070422535213e-05, + "loss": 0.4135, "step": 4600 }, { - "epoch": 16.0, - "eval_loss": 0.5024499297142029, - "eval_runtime": 129.1181, - "eval_samples_per_second": 4.12, - "eval_steps_per_second": 1.03, - "eval_wer": 0.20100276402905445, + "epoch": 64.0, + "eval_loss": 0.5242801308631897, + "eval_runtime": 126.406, + "eval_samples_per_second": 4.209, + "eval_steps_per_second": 0.53, + "eval_wer": 0.21662274217394098, "step": 4608 }, { - "epoch": 16.01, - "learning_rate": 3.419787985865724e-06, - "loss": 0.3, + "epoch": 64.03, + "learning_rate": 1.8274647887323944e-05, + "loss": 0.4383, "step": 4610 }, { - "epoch": 16.04, - "learning_rate": 3.418374558303887e-06, - "loss": 0.2691, + "epoch": 64.17, + "learning_rate": 1.8204225352112676e-05, + "loss": 0.4271, "step": 4620 }, { - "epoch": 16.08, - "learning_rate": 3.416961130742049e-06, - "loss": 0.2599, + "epoch": 64.3, + "learning_rate": 1.813380281690141e-05, + "loss": 0.4191, "step": 4630 }, { - "epoch": 16.11, - "learning_rate": 3.415547703180212e-06, - "loss": 0.2636, + "epoch": 64.44, + "learning_rate": 1.8063380281690143e-05, + "loss": 0.4142, "step": 4640 }, { - "epoch": 16.15, - "learning_rate": 3.4141342756183743e-06, - "loss": 0.2902, + "epoch": 64.58, + "learning_rate": 1.7992957746478875e-05, + "loss": 0.4244, "step": 4650 }, { - "epoch": 16.18, - "learning_rate": 3.412720848056537e-06, - "loss": 0.2577, + "epoch": 64.72, + "learning_rate": 1.7922535211267607e-05, + "loss": 0.4209, "step": 4660 }, { - "epoch": 16.21, - "learning_rate": 3.4113074204946995e-06, - "loss": 0.2813, + "epoch": 64.86, + "learning_rate": 1.785211267605634e-05, + "loss": 0.4215, "step": 4670 }, { - "epoch": 16.25, - "learning_rate": 3.409893992932862e-06, - "loss": 0.2619, + "epoch": 65.0, + "learning_rate": 1.778169014084507e-05, + "loss": 0.4127, + "step": 4680 + }, + { + "epoch": 65.0, + "eval_loss": 0.4889000952243805, + "eval_runtime": 125.6271, + "eval_samples_per_second": 4.235, + "eval_steps_per_second": 0.533, + "eval_wer": 0.21642990293758438, "step": 4680 }, { - "epoch": 16.28, - "learning_rate": 3.4084805653710243e-06, - "loss": 0.2685, + "epoch": 65.14, + "learning_rate": 1.7711267605633806e-05, + "loss": 0.4334, "step": 4690 }, { - "epoch": 16.32, - "learning_rate": 3.407067137809187e-06, - "loss": 0.2886, + "epoch": 65.28, + "learning_rate": 1.7640845070422535e-05, + "loss": 0.4268, "step": 4700 }, { - "epoch": 16.35, - "learning_rate": 3.4056537102473496e-06, - "loss": 0.2828, + "epoch": 65.42, + "learning_rate": 1.7570422535211267e-05, + "loss": 0.4253, "step": 4710 }, { - "epoch": 16.39, - "learning_rate": 3.4042402826855124e-06, - "loss": 0.2643, + "epoch": 65.55, + "learning_rate": 1.75e-05, + "loss": 0.4091, "step": 4720 }, { - "epoch": 16.42, - "learning_rate": 3.402826855123675e-06, - "loss": 0.2722, + "epoch": 65.69, + "learning_rate": 1.7429577464788734e-05, + "loss": 0.4193, "step": 4730 }, { - "epoch": 16.46, - "learning_rate": 3.4014134275618372e-06, - "loss": 0.2868, + "epoch": 65.83, + "learning_rate": 1.7359154929577466e-05, + "loss": 0.4216, "step": 4740 }, { - "epoch": 16.49, - "learning_rate": 3.3999999999999996e-06, - "loss": 0.2736, + "epoch": 65.97, + "learning_rate": 1.7288732394366197e-05, + "loss": 0.3979, "step": 4750 }, { - "epoch": 16.53, - "learning_rate": 3.3985865724381625e-06, - "loss": 0.2888, + "epoch": 66.0, + "eval_loss": 0.49280083179473877, + "eval_runtime": 127.1568, + "eval_samples_per_second": 4.184, + "eval_steps_per_second": 0.527, + "eval_wer": 0.21732981937391527, + "step": 4752 + }, + { + "epoch": 66.11, + "learning_rate": 1.721830985915493e-05, + "loss": 0.4282, "step": 4760 }, { - "epoch": 16.56, - "learning_rate": 3.397173144876325e-06, - "loss": 0.2616, + "epoch": 66.25, + "learning_rate": 1.714788732394366e-05, + "loss": 0.4229, "step": 4770 }, { - "epoch": 16.6, - "learning_rate": 3.3957597173144877e-06, - "loss": 0.2736, + "epoch": 66.39, + "learning_rate": 1.7077464788732393e-05, + "loss": 0.4173, "step": 4780 }, { - "epoch": 16.63, - "learning_rate": 3.3943462897526497e-06, - "loss": 0.2678, + "epoch": 66.53, + "learning_rate": 1.700704225352113e-05, + "loss": 0.4271, "step": 4790 }, { - "epoch": 16.66, - "learning_rate": 3.3929328621908125e-06, - "loss": 0.2739, + "epoch": 66.66, + "learning_rate": 1.693661971830986e-05, + "loss": 0.4215, "step": 4800 }, { - "epoch": 16.7, - "learning_rate": 3.391519434628975e-06, - "loss": 0.252, + "epoch": 66.8, + "learning_rate": 1.6866197183098592e-05, + "loss": 0.4183, "step": 4810 }, { - "epoch": 16.73, - "learning_rate": 3.3901060070671378e-06, - "loss": 0.2913, + "epoch": 66.94, + "learning_rate": 1.6795774647887324e-05, + "loss": 0.4151, "step": 4820 }, { - "epoch": 16.77, - "learning_rate": 3.3886925795053e-06, - "loss": 0.2935, + "epoch": 67.0, + "eval_loss": 0.4978279173374176, + "eval_runtime": 127.0381, + "eval_samples_per_second": 4.188, + "eval_steps_per_second": 0.527, + "eval_wer": 0.21315163591952177, + "step": 4824 + }, + { + "epoch": 67.08, + "learning_rate": 1.6725352112676056e-05, + "loss": 0.4173, "step": 4830 }, { - "epoch": 16.8, - "learning_rate": 3.387279151943463e-06, - "loss": 0.2672, + "epoch": 67.22, + "learning_rate": 1.665492957746479e-05, + "loss": 0.4197, "step": 4840 }, { - "epoch": 16.84, - "learning_rate": 3.385865724381625e-06, - "loss": 0.2693, + "epoch": 67.36, + "learning_rate": 1.6584507042253523e-05, + "loss": 0.401, "step": 4850 }, { - "epoch": 16.87, - "learning_rate": 3.384452296819788e-06, - "loss": 0.2723, + "epoch": 67.5, + "learning_rate": 1.6514084507042255e-05, + "loss": 0.4155, "step": 4860 }, { - "epoch": 16.91, - "learning_rate": 3.3830388692579502e-06, - "loss": 0.2571, + "epoch": 67.64, + "learning_rate": 1.6443661971830987e-05, + "loss": 0.4174, "step": 4870 }, { - "epoch": 16.94, - "learning_rate": 3.381625441696113e-06, - "loss": 0.2511, + "epoch": 67.78, + "learning_rate": 1.637323943661972e-05, + "loss": 0.416, "step": 4880 }, { - "epoch": 16.98, - "learning_rate": 3.3802120141342755e-06, - "loss": 0.2766, + "epoch": 67.91, + "learning_rate": 1.630281690140845e-05, + "loss": 0.4157, "step": 4890 }, { - "epoch": 17.0, - "eval_loss": 0.5078305006027222, - "eval_runtime": 129.3828, - "eval_samples_per_second": 4.112, - "eval_steps_per_second": 1.028, - "eval_wer": 0.1998457286109147, + "epoch": 68.0, + "eval_loss": 0.5226835012435913, + "eval_runtime": 126.8668, + "eval_samples_per_second": 4.193, + "eval_steps_per_second": 0.528, + "eval_wer": 0.21687986115574984, "step": 4896 }, { - "epoch": 17.01, - "learning_rate": 3.3787985865724383e-06, - "loss": 0.2968, + "epoch": 68.06, + "learning_rate": 1.6232394366197186e-05, + "loss": 0.4272, "step": 4900 }, { - "epoch": 17.05, - "learning_rate": 3.3773851590106003e-06, - "loss": 0.2869, + "epoch": 68.19, + "learning_rate": 1.6161971830985918e-05, + "loss": 0.4193, "step": 4910 }, { - "epoch": 17.08, - "learning_rate": 3.375971731448763e-06, - "loss": 0.2671, + "epoch": 68.33, + "learning_rate": 1.609154929577465e-05, + "loss": 0.4207, "step": 4920 }, { - "epoch": 17.12, - "learning_rate": 3.3745583038869255e-06, - "loss": 0.2651, + "epoch": 68.47, + "learning_rate": 1.602112676056338e-05, + "loss": 0.4255, "step": 4930 }, { - "epoch": 17.15, - "learning_rate": 3.3731448763250884e-06, - "loss": 0.262, + "epoch": 68.61, + "learning_rate": 1.5950704225352113e-05, + "loss": 0.4123, "step": 4940 }, { - "epoch": 17.19, - "learning_rate": 3.371731448763251e-06, - "loss": 0.2579, + "epoch": 68.75, + "learning_rate": 1.588028169014085e-05, + "loss": 0.4082, "step": 4950 }, { - "epoch": 17.22, - "learning_rate": 3.370318021201413e-06, - "loss": 0.2801, + "epoch": 68.89, + "learning_rate": 1.580985915492958e-05, + "loss": 0.4135, "step": 4960 }, { - "epoch": 17.26, - "learning_rate": 3.3689045936395756e-06, - "loss": 0.2667, + "epoch": 69.0, + "eval_loss": 0.48659974336624146, + "eval_runtime": 127.0425, + "eval_samples_per_second": 4.188, + "eval_steps_per_second": 0.527, + "eval_wer": 0.21295879668316514, + "step": 4968 + }, + { + "epoch": 69.03, + "learning_rate": 1.5739436619718312e-05, + "loss": 0.4276, "step": 4970 }, { - "epoch": 17.29, - "learning_rate": 3.3674911660777384e-06, - "loss": 0.2852, + "epoch": 69.17, + "learning_rate": 1.5669014084507044e-05, + "loss": 0.4104, "step": 4980 }, { - "epoch": 17.33, - "learning_rate": 3.366077738515901e-06, - "loss": 0.2515, + "epoch": 69.3, + "learning_rate": 1.5598591549295773e-05, + "loss": 0.4186, "step": 4990 }, { - "epoch": 17.36, - "learning_rate": 3.3646643109540637e-06, - "loss": 0.2632, + "epoch": 69.44, + "learning_rate": 1.5528169014084508e-05, + "loss": 0.4111, "step": 5000 }, { - "epoch": 17.39, - "learning_rate": 3.363250883392226e-06, - "loss": 0.2756, + "epoch": 69.58, + "learning_rate": 1.545774647887324e-05, + "loss": 0.4146, "step": 5010 }, { - "epoch": 17.43, - "learning_rate": 3.3618374558303885e-06, - "loss": 0.2703, + "epoch": 69.72, + "learning_rate": 1.538732394366197e-05, + "loss": 0.4143, "step": 5020 }, { - "epoch": 17.46, - "learning_rate": 3.360424028268551e-06, - "loss": 0.2706, + "epoch": 69.86, + "learning_rate": 1.5316901408450704e-05, + "loss": 0.4029, "step": 5030 }, { - "epoch": 17.5, - "learning_rate": 3.3590106007067137e-06, - "loss": 0.3145, + "epoch": 70.0, + "learning_rate": 1.5246478873239437e-05, + "loss": 0.4109, + "step": 5040 + }, + { + "epoch": 70.0, + "eval_loss": 0.484768807888031, + "eval_runtime": 127.258, + "eval_samples_per_second": 4.18, + "eval_steps_per_second": 0.526, + "eval_wer": 0.20935913093784148, "step": 5040 }, { - "epoch": 17.53, - "learning_rate": 3.357597173144876e-06, - "loss": 0.2588, + "epoch": 70.14, + "learning_rate": 1.5176056338028169e-05, + "loss": 0.4176, "step": 5050 }, { - "epoch": 17.57, - "learning_rate": 3.356183745583039e-06, - "loss": 0.278, + "epoch": 70.28, + "learning_rate": 1.5105633802816901e-05, + "loss": 0.4091, "step": 5060 }, { - "epoch": 17.6, - "learning_rate": 3.3547703180212014e-06, - "loss": 0.2612, + "epoch": 70.42, + "learning_rate": 1.5035211267605634e-05, + "loss": 0.4115, "step": 5070 }, { - "epoch": 17.64, - "learning_rate": 3.353356890459364e-06, - "loss": 0.2747, + "epoch": 70.55, + "learning_rate": 1.4964788732394366e-05, + "loss": 0.4036, "step": 5080 }, { - "epoch": 17.67, - "learning_rate": 3.3519434628975262e-06, - "loss": 0.2839, + "epoch": 70.69, + "learning_rate": 1.4894366197183098e-05, + "loss": 0.4078, "step": 5090 }, { - "epoch": 17.71, - "learning_rate": 3.350530035335689e-06, - "loss": 0.3041, + "epoch": 70.83, + "learning_rate": 1.4823943661971832e-05, + "loss": 0.4158, "step": 5100 }, { - "epoch": 17.74, - "learning_rate": 3.3491166077738515e-06, - "loss": 0.28, + "epoch": 70.97, + "learning_rate": 1.4753521126760564e-05, + "loss": 0.4084, "step": 5110 }, { - "epoch": 17.78, - "learning_rate": 3.3477031802120143e-06, - "loss": 0.2479, + "epoch": 71.0, + "eval_loss": 0.5011652112007141, + "eval_runtime": 126.6418, + "eval_samples_per_second": 4.201, + "eval_steps_per_second": 0.529, + "eval_wer": 0.2168155814102976, + "step": 5112 + }, + { + "epoch": 71.11, + "learning_rate": 1.4683098591549296e-05, + "loss": 0.4189, "step": 5120 }, { - "epoch": 17.81, - "learning_rate": 3.3462897526501763e-06, - "loss": 0.2859, + "epoch": 71.25, + "learning_rate": 1.4612676056338029e-05, + "loss": 0.4007, "step": 5130 }, { - "epoch": 17.85, - "learning_rate": 3.344876325088339e-06, - "loss": 0.2879, + "epoch": 71.39, + "learning_rate": 1.4542253521126761e-05, + "loss": 0.4055, "step": 5140 }, { - "epoch": 17.88, - "learning_rate": 3.3434628975265015e-06, - "loss": 0.2668, + "epoch": 71.53, + "learning_rate": 1.4471830985915495e-05, + "loss": 0.4133, "step": 5150 }, { - "epoch": 17.91, - "learning_rate": 3.3420494699646644e-06, - "loss": 0.2703, + "epoch": 71.66, + "learning_rate": 1.4401408450704226e-05, + "loss": 0.4116, "step": 5160 }, { - "epoch": 17.95, - "learning_rate": 3.3406360424028268e-06, - "loss": 0.2949, + "epoch": 71.8, + "learning_rate": 1.4330985915492958e-05, + "loss": 0.4091, "step": 5170 }, { - "epoch": 17.98, - "learning_rate": 3.3392226148409896e-06, - "loss": 0.2872, + "epoch": 71.94, + "learning_rate": 1.4260563380281692e-05, + "loss": 0.4078, "step": 5180 }, { - "epoch": 18.0, - "eval_loss": 0.5114011764526367, - "eval_runtime": 129.1607, - "eval_samples_per_second": 4.119, - "eval_steps_per_second": 1.03, - "eval_wer": 0.19811017548370508, + "epoch": 72.0, + "eval_loss": 0.4835646152496338, + "eval_runtime": 126.9914, + "eval_samples_per_second": 4.189, + "eval_steps_per_second": 0.528, + "eval_wer": 0.21855113453750724, "step": 5184 }, { - "epoch": 18.02, - "learning_rate": 3.3378091872791516e-06, - "loss": 0.2889, + "epoch": 72.08, + "learning_rate": 1.4190140845070424e-05, + "loss": 0.4281, "step": 5190 }, { - "epoch": 18.06, - "learning_rate": 3.3363957597173144e-06, - "loss": 0.2601, + "epoch": 72.22, + "learning_rate": 1.4119718309859156e-05, + "loss": 0.4153, "step": 5200 }, { - "epoch": 18.09, - "learning_rate": 3.334982332155477e-06, - "loss": 0.2864, + "epoch": 72.36, + "learning_rate": 1.404929577464789e-05, + "loss": 0.3969, "step": 5210 }, { - "epoch": 18.12, - "learning_rate": 3.3335689045936397e-06, - "loss": 0.2753, + "epoch": 72.5, + "learning_rate": 1.3978873239436621e-05, + "loss": 0.4048, "step": 5220 }, { - "epoch": 18.16, - "learning_rate": 3.332155477031802e-06, - "loss": 0.298, + "epoch": 72.64, + "learning_rate": 1.3908450704225353e-05, + "loss": 0.4015, "step": 5230 }, { - "epoch": 18.19, - "learning_rate": 3.330742049469965e-06, - "loss": 0.2637, + "epoch": 72.78, + "learning_rate": 1.3838028169014086e-05, + "loss": 0.4018, "step": 5240 }, { - "epoch": 18.23, - "learning_rate": 3.329328621908127e-06, - "loss": 0.2674, + "epoch": 72.91, + "learning_rate": 1.3767605633802818e-05, + "loss": 0.4106, "step": 5250 }, { - "epoch": 18.26, - "learning_rate": 3.3279151943462897e-06, - "loss": 0.2606, + "epoch": 73.0, + "eval_loss": 0.48354992270469666, + "eval_runtime": 126.0348, + "eval_samples_per_second": 4.221, + "eval_steps_per_second": 0.532, + "eval_wer": 0.21315163591952177, + "step": 5256 + }, + { + "epoch": 73.06, + "learning_rate": 1.3697183098591552e-05, + "loss": 0.4178, "step": 5260 }, { - "epoch": 18.3, - "learning_rate": 3.326501766784452e-06, - "loss": 0.2987, + "epoch": 73.19, + "learning_rate": 1.3626760563380284e-05, + "loss": 0.4125, "step": 5270 }, { - "epoch": 18.33, - "learning_rate": 3.325088339222615e-06, - "loss": 0.2924, + "epoch": 73.33, + "learning_rate": 1.3556338028169016e-05, + "loss": 0.4111, "step": 5280 }, { - "epoch": 18.37, - "learning_rate": 3.3236749116607774e-06, - "loss": 0.3043, + "epoch": 73.47, + "learning_rate": 1.3485915492957746e-05, + "loss": 0.4044, "step": 5290 }, { - "epoch": 18.4, - "learning_rate": 3.3222614840989398e-06, - "loss": 0.2727, + "epoch": 73.61, + "learning_rate": 1.3415492957746478e-05, + "loss": 0.4043, "step": 5300 }, { - "epoch": 18.44, - "learning_rate": 3.320848056537102e-06, - "loss": 0.2463, + "epoch": 73.75, + "learning_rate": 1.3345070422535211e-05, + "loss": 0.4028, "step": 5310 }, { - "epoch": 18.47, - "learning_rate": 3.319434628975265e-06, - "loss": 0.3037, + "epoch": 73.89, + "learning_rate": 1.3274647887323943e-05, + "loss": 0.3977, "step": 5320 }, { - "epoch": 18.51, - "learning_rate": 3.3180212014134274e-06, - "loss": 0.2611, + "epoch": 74.0, + "eval_loss": 0.5025292634963989, + "eval_runtime": 127.807, + "eval_samples_per_second": 4.163, + "eval_steps_per_second": 0.524, + "eval_wer": 0.215080028283088, + "step": 5328 + }, + { + "epoch": 74.03, + "learning_rate": 1.3204225352112675e-05, + "loss": 0.4266, "step": 5330 }, { - "epoch": 18.54, - "learning_rate": 3.3166077738515903e-06, - "loss": 0.2597, + "epoch": 74.17, + "learning_rate": 1.3133802816901409e-05, + "loss": 0.394, "step": 5340 }, { - "epoch": 18.57, - "learning_rate": 3.3151943462897527e-06, - "loss": 0.2875, + "epoch": 74.3, + "learning_rate": 1.306338028169014e-05, + "loss": 0.406, "step": 5350 }, { - "epoch": 18.61, - "learning_rate": 3.313780918727915e-06, - "loss": 0.2847, + "epoch": 74.44, + "learning_rate": 1.2992957746478872e-05, + "loss": 0.4028, "step": 5360 }, { - "epoch": 18.64, - "learning_rate": 3.3123674911660775e-06, - "loss": 0.2741, + "epoch": 74.58, + "learning_rate": 1.2922535211267606e-05, + "loss": 0.4033, "step": 5370 }, { - "epoch": 18.68, - "learning_rate": 3.3109540636042403e-06, - "loss": 0.2683, + "epoch": 74.72, + "learning_rate": 1.2852112676056338e-05, + "loss": 0.4069, "step": 5380 }, { - "epoch": 18.71, - "learning_rate": 3.3095406360424027e-06, - "loss": 0.2637, + "epoch": 74.86, + "learning_rate": 1.2781690140845071e-05, + "loss": 0.4146, "step": 5390 }, { - "epoch": 18.75, - "learning_rate": 3.3081272084805656e-06, - "loss": 0.2755, + "epoch": 75.0, + "learning_rate": 1.2711267605633803e-05, + "loss": 0.4056, + "step": 5400 + }, + { + "epoch": 75.0, + "eval_loss": 0.4893050789833069, + "eval_runtime": 126.5689, + "eval_samples_per_second": 4.203, + "eval_steps_per_second": 0.529, + "eval_wer": 0.2190653725011249, "step": 5400 }, { - "epoch": 18.78, - "learning_rate": 3.3067137809187276e-06, - "loss": 0.2604, + "epoch": 75.14, + "learning_rate": 1.2640845070422535e-05, + "loss": 0.4257, "step": 5410 }, { - "epoch": 18.82, - "learning_rate": 3.30530035335689e-06, - "loss": 0.3166, + "epoch": 75.28, + "learning_rate": 1.2570422535211269e-05, + "loss": 0.4147, "step": 5420 }, { - "epoch": 18.85, - "learning_rate": 3.303886925795053e-06, - "loss": 0.2882, + "epoch": 75.42, + "learning_rate": 1.25e-05, + "loss": 0.4026, "step": 5430 }, { - "epoch": 18.89, - "learning_rate": 3.302473498233215e-06, - "loss": 0.2685, + "epoch": 75.55, + "learning_rate": 1.2429577464788732e-05, + "loss": 0.408, "step": 5440 }, { - "epoch": 18.92, - "learning_rate": 3.301060070671378e-06, - "loss": 0.2697, + "epoch": 75.69, + "learning_rate": 1.2359154929577466e-05, + "loss": 0.3983, "step": 5450 }, { - "epoch": 18.96, - "learning_rate": 3.2996466431095405e-06, - "loss": 0.2673, + "epoch": 75.83, + "learning_rate": 1.2288732394366198e-05, + "loss": 0.4046, "step": 5460 }, { - "epoch": 18.99, - "learning_rate": 3.298233215547703e-06, - "loss": 0.268, + "epoch": 75.97, + "learning_rate": 1.221830985915493e-05, + "loss": 0.4019, "step": 5470 }, { - "epoch": 19.0, - "eval_loss": 0.5078134536743164, - "eval_runtime": 128.8142, - "eval_samples_per_second": 4.13, - "eval_steps_per_second": 1.032, - "eval_wer": 0.19798161599280067, + "epoch": 76.0, + "eval_loss": 0.48530757427215576, + "eval_runtime": 127.0771, + "eval_samples_per_second": 4.186, + "eval_steps_per_second": 0.527, + "eval_wer": 0.21083756508324228, "step": 5472 }, { - "epoch": 19.03, - "learning_rate": 3.2968197879858653e-06, - "loss": 0.2845, + "epoch": 76.11, + "learning_rate": 1.2147887323943663e-05, + "loss": 0.4, "step": 5480 }, { - "epoch": 19.06, - "learning_rate": 3.295406360424028e-06, - "loss": 0.2673, + "epoch": 76.25, + "learning_rate": 1.2077464788732395e-05, + "loss": 0.412, "step": 5490 }, { - "epoch": 19.1, - "learning_rate": 3.2939929328621905e-06, - "loss": 0.2458, + "epoch": 76.39, + "learning_rate": 1.2007042253521129e-05, + "loss": 0.413, "step": 5500 }, { - "epoch": 19.13, - "learning_rate": 3.2925795053003533e-06, - "loss": 0.288, + "epoch": 76.53, + "learning_rate": 1.1936619718309859e-05, + "loss": 0.4135, "step": 5510 }, { - "epoch": 19.17, - "learning_rate": 3.2911660777385158e-06, - "loss": 0.2833, + "epoch": 76.66, + "learning_rate": 1.1866197183098591e-05, + "loss": 0.4109, "step": 5520 }, { - "epoch": 19.2, - "learning_rate": 3.289752650176678e-06, - "loss": 0.264, + "epoch": 76.8, + "learning_rate": 1.1795774647887324e-05, + "loss": 0.4061, "step": 5530 }, { - "epoch": 19.24, - "learning_rate": 3.2883392226148406e-06, - "loss": 0.2782, + "epoch": 76.94, + "learning_rate": 1.1725352112676056e-05, + "loss": 0.4147, "step": 5540 }, { - "epoch": 19.27, - "learning_rate": 3.2869257950530034e-06, - "loss": 0.2702, + "epoch": 77.0, + "eval_loss": 0.48485973477363586, + "eval_runtime": 125.8319, + "eval_samples_per_second": 4.228, + "eval_steps_per_second": 0.532, + "eval_wer": 0.21308735617406954, + "step": 5544 + }, + { + "epoch": 77.08, + "learning_rate": 1.1654929577464788e-05, + "loss": 0.4043, "step": 5550 }, { - "epoch": 19.3, - "learning_rate": 3.285512367491166e-06, - "loss": 0.2908, + "epoch": 77.22, + "learning_rate": 1.1584507042253522e-05, + "loss": 0.4025, "step": 5560 }, { - "epoch": 19.34, - "learning_rate": 3.2840989399293287e-06, - "loss": 0.2852, + "epoch": 77.36, + "learning_rate": 1.1514084507042254e-05, + "loss": 0.4097, "step": 5570 }, { - "epoch": 19.37, - "learning_rate": 3.2826855123674906e-06, - "loss": 0.2657, + "epoch": 77.5, + "learning_rate": 1.1443661971830987e-05, + "loss": 0.4132, "step": 5580 }, { - "epoch": 19.41, - "learning_rate": 3.2812720848056535e-06, - "loss": 0.2553, + "epoch": 77.64, + "learning_rate": 1.1373239436619719e-05, + "loss": 0.3952, "step": 5590 }, { - "epoch": 19.44, - "learning_rate": 3.279858657243816e-06, - "loss": 0.2556, + "epoch": 77.78, + "learning_rate": 1.1302816901408451e-05, + "loss": 0.4721, "step": 5600 }, { - "epoch": 19.48, - "learning_rate": 3.2784452296819787e-06, - "loss": 0.2677, + "epoch": 77.91, + "learning_rate": 1.1232394366197185e-05, + "loss": 0.4075, "step": 5610 }, { - "epoch": 19.51, - "learning_rate": 3.277031802120141e-06, - "loss": 0.276, + "epoch": 78.0, + "eval_loss": 0.5035993456840515, + "eval_runtime": 127.1426, + "eval_samples_per_second": 4.184, + "eval_steps_per_second": 0.527, + "eval_wer": 0.2117374815195732, + "step": 5616 + }, + { + "epoch": 78.06, + "learning_rate": 1.1161971830985916e-05, + "loss": 0.4084, "step": 5620 }, { - "epoch": 19.55, - "learning_rate": 3.275618374558304e-06, - "loss": 0.2622, + "epoch": 78.19, + "learning_rate": 1.1091549295774648e-05, + "loss": 0.3951, "step": 5630 }, { - "epoch": 19.58, - "learning_rate": 3.274204946996466e-06, - "loss": 0.2778, + "epoch": 78.33, + "learning_rate": 1.1021126760563382e-05, + "loss": 0.402, "step": 5640 }, { - "epoch": 19.62, - "learning_rate": 3.2727915194346288e-06, - "loss": 0.2744, + "epoch": 78.47, + "learning_rate": 1.0950704225352114e-05, + "loss": 0.3994, "step": 5650 }, { - "epoch": 19.65, - "learning_rate": 3.271378091872791e-06, - "loss": 0.287, + "epoch": 78.61, + "learning_rate": 1.0880281690140846e-05, + "loss": 0.398, "step": 5660 }, { - "epoch": 19.69, - "learning_rate": 3.269964664310954e-06, - "loss": 0.2831, + "epoch": 78.75, + "learning_rate": 1.0809859154929577e-05, + "loss": 0.4013, "step": 5670 }, { - "epoch": 19.72, - "learning_rate": 3.2685512367491164e-06, - "loss": 0.256, + "epoch": 78.89, + "learning_rate": 1.073943661971831e-05, + "loss": 0.4064, "step": 5680 }, { - "epoch": 19.75, - "learning_rate": 3.2671378091872793e-06, - "loss": 0.2609, + "epoch": 79.0, + "eval_loss": 0.47934702038764954, + "eval_runtime": 126.7605, + "eval_samples_per_second": 4.197, + "eval_steps_per_second": 0.529, + "eval_wer": 0.21328019541042617, + "step": 5688 + }, + { + "epoch": 79.03, + "learning_rate": 1.0669014084507043e-05, + "loss": 0.42, "step": 5690 }, { - "epoch": 19.79, - "learning_rate": 3.2657243816254412e-06, - "loss": 0.2601, + "epoch": 79.17, + "learning_rate": 1.0598591549295775e-05, + "loss": 0.402, "step": 5700 }, { - "epoch": 19.82, - "learning_rate": 3.264310954063604e-06, - "loss": 0.2834, + "epoch": 79.3, + "learning_rate": 1.0528169014084507e-05, + "loss": 0.4035, "step": 5710 }, { - "epoch": 19.86, - "learning_rate": 3.2628975265017665e-06, - "loss": 0.2889, + "epoch": 79.44, + "learning_rate": 1.045774647887324e-05, + "loss": 0.3983, "step": 5720 }, { - "epoch": 19.89, - "learning_rate": 3.2614840989399293e-06, - "loss": 0.2617, + "epoch": 79.58, + "learning_rate": 1.0387323943661972e-05, + "loss": 0.4034, "step": 5730 }, { - "epoch": 19.93, - "learning_rate": 3.2600706713780917e-06, - "loss": 0.2747, + "epoch": 79.72, + "learning_rate": 1.0316901408450706e-05, + "loss": 0.409, "step": 5740 }, { - "epoch": 19.96, - "learning_rate": 3.258657243816254e-06, - "loss": 0.2867, + "epoch": 79.86, + "learning_rate": 1.0246478873239438e-05, + "loss": 0.4005, "step": 5750 }, { - "epoch": 20.0, - "learning_rate": 3.2572438162544166e-06, - "loss": 0.2631, + "epoch": 80.0, + "learning_rate": 1.017605633802817e-05, + "loss": 0.4035, "step": 5760 }, { - "epoch": 20.0, - "eval_loss": 0.5262243747711182, - "eval_runtime": 129.2103, - "eval_samples_per_second": 4.117, - "eval_steps_per_second": 1.029, - "eval_wer": 0.20209551970174197, + "epoch": 80.0, + "eval_loss": 0.4917033612728119, + "eval_runtime": 126.9746, + "eval_samples_per_second": 4.19, + "eval_steps_per_second": 0.528, + "eval_wer": 0.20826637526515396, "step": 5760 }, { - "epoch": 20.03, - "learning_rate": 3.2558303886925794e-06, - "loss": 0.2689, + "epoch": 80.14, + "learning_rate": 1.0105633802816903e-05, + "loss": 0.4008, "step": 5770 }, { - "epoch": 20.07, - "learning_rate": 3.254416961130742e-06, - "loss": 0.2906, + "epoch": 80.28, + "learning_rate": 1.0035211267605635e-05, + "loss": 0.4, "step": 5780 }, { - "epoch": 20.1, - "learning_rate": 3.2530035335689046e-06, - "loss": 0.2586, + "epoch": 80.42, + "learning_rate": 9.964788732394367e-06, + "loss": 0.3955, "step": 5790 }, { - "epoch": 20.14, - "learning_rate": 3.251590106007067e-06, - "loss": 0.2732, + "epoch": 80.55, + "learning_rate": 9.894366197183099e-06, + "loss": 0.3864, "step": 5800 }, { - "epoch": 20.17, - "learning_rate": 3.2501766784452294e-06, - "loss": 0.2528, + "epoch": 80.69, + "learning_rate": 9.82394366197183e-06, + "loss": 0.398, "step": 5810 }, { - "epoch": 20.21, - "learning_rate": 3.248763250883392e-06, - "loss": 0.26, + "epoch": 80.83, + "learning_rate": 9.753521126760564e-06, + "loss": 0.4061, "step": 5820 }, { - "epoch": 20.24, - "learning_rate": 3.2473498233215547e-06, - "loss": 0.279, + "epoch": 80.97, + "learning_rate": 9.683098591549296e-06, + "loss": 0.4083, "step": 5830 }, { - "epoch": 20.28, - "learning_rate": 3.245936395759717e-06, - "loss": 0.2506, + "epoch": 81.0, + "eval_loss": 0.4724813997745514, + "eval_runtime": 126.4508, + "eval_samples_per_second": 4.207, + "eval_steps_per_second": 0.53, + "eval_wer": 0.21160892202866877, + "step": 5832 + }, + { + "epoch": 81.11, + "learning_rate": 9.612676056338028e-06, + "loss": 0.4011, "step": 5840 }, { - "epoch": 20.31, - "learning_rate": 3.24452296819788e-06, - "loss": 0.2886, + "epoch": 81.25, + "learning_rate": 9.542253521126761e-06, + "loss": 0.4006, "step": 5850 }, { - "epoch": 20.35, - "learning_rate": 3.2431095406360423e-06, - "loss": 0.2779, + "epoch": 81.39, + "learning_rate": 9.471830985915493e-06, + "loss": 0.3875, "step": 5860 }, { - "epoch": 20.38, - "learning_rate": 3.2416961130742048e-06, - "loss": 0.2731, + "epoch": 81.53, + "learning_rate": 9.401408450704225e-06, + "loss": 0.4037, "step": 5870 }, { - "epoch": 20.42, - "learning_rate": 3.240282685512367e-06, - "loss": 0.2575, + "epoch": 81.66, + "learning_rate": 9.330985915492959e-06, + "loss": 0.4018, "step": 5880 }, { - "epoch": 20.45, - "learning_rate": 3.23886925795053e-06, - "loss": 0.2671, + "epoch": 81.8, + "learning_rate": 9.26056338028169e-06, + "loss": 0.3989, "step": 5890 }, { - "epoch": 20.48, - "learning_rate": 3.2374558303886924e-06, - "loss": 0.2901, + "epoch": 81.94, + "learning_rate": 9.190140845070422e-06, + "loss": 0.3954, "step": 5900 }, { - "epoch": 20.52, - "learning_rate": 3.2360424028268552e-06, - "loss": 0.2778, + "epoch": 82.0, + "eval_loss": 0.4957520365715027, + "eval_runtime": 126.407, + "eval_samples_per_second": 4.209, + "eval_steps_per_second": 0.53, + "eval_wer": 0.2119303207559298, + "step": 5904 + }, + { + "epoch": 82.08, + "learning_rate": 9.119718309859156e-06, + "loss": 0.4178, "step": 5910 }, { - "epoch": 20.55, - "learning_rate": 3.2346289752650172e-06, - "loss": 0.2629, + "epoch": 82.22, + "learning_rate": 9.049295774647888e-06, + "loss": 0.4004, "step": 5920 }, { - "epoch": 20.59, - "learning_rate": 3.23321554770318e-06, - "loss": 0.2539, + "epoch": 82.36, + "learning_rate": 8.978873239436621e-06, + "loss": 0.3828, "step": 5930 }, { - "epoch": 20.62, - "learning_rate": 3.2318021201413425e-06, - "loss": 0.2697, + "epoch": 82.5, + "learning_rate": 8.908450704225353e-06, + "loss": 0.403, "step": 5940 }, { - "epoch": 20.66, - "learning_rate": 3.2303886925795053e-06, - "loss": 0.279, + "epoch": 82.64, + "learning_rate": 8.838028169014084e-06, + "loss": 0.3932, "step": 5950 }, { - "epoch": 20.69, - "learning_rate": 3.2289752650176677e-06, - "loss": 0.2869, + "epoch": 82.78, + "learning_rate": 8.767605633802817e-06, + "loss": 0.3964, "step": 5960 }, { - "epoch": 20.73, - "learning_rate": 3.2275618374558305e-06, - "loss": 0.2761, + "epoch": 82.91, + "learning_rate": 8.697183098591549e-06, + "loss": 0.395, "step": 5970 }, { - "epoch": 20.76, - "learning_rate": 3.2261484098939925e-06, - "loss": 0.2775, + "epoch": 83.0, + "eval_loss": 0.4897911846637726, + "eval_runtime": 126.9226, + "eval_samples_per_second": 4.192, + "eval_steps_per_second": 0.528, + "eval_wer": 0.2134730346467828, + "step": 5976 + }, + { + "epoch": 83.06, + "learning_rate": 8.626760563380283e-06, + "loss": 0.4032, "step": 5980 }, { - "epoch": 20.8, - "learning_rate": 3.2247349823321554e-06, - "loss": 0.2639, + "epoch": 83.19, + "learning_rate": 8.556338028169014e-06, + "loss": 0.409, "step": 5990 }, { - "epoch": 20.83, - "learning_rate": 3.2233215547703178e-06, - "loss": 0.2925, + "epoch": 83.33, + "learning_rate": 8.485915492957746e-06, + "loss": 0.3947, "step": 6000 }, { - "epoch": 20.87, - "learning_rate": 3.2219081272084806e-06, - "loss": 0.2851, + "epoch": 83.47, + "learning_rate": 8.41549295774648e-06, + "loss": 0.4052, "step": 6010 }, { - "epoch": 20.9, - "learning_rate": 3.220494699646643e-06, - "loss": 0.2682, + "epoch": 83.61, + "learning_rate": 8.345070422535212e-06, + "loss": 0.3859, "step": 6020 }, { - "epoch": 20.94, - "learning_rate": 3.2190812720848054e-06, - "loss": 0.2541, + "epoch": 83.75, + "learning_rate": 8.274647887323944e-06, + "loss": 0.3938, "step": 6030 }, { - "epoch": 20.97, - "learning_rate": 3.217667844522968e-06, - "loss": 0.2753, + "epoch": 83.89, + "learning_rate": 8.204225352112677e-06, + "loss": 0.391, "step": 6040 }, { - "epoch": 21.0, - "eval_loss": 0.5161154866218567, - "eval_runtime": 128.857, - "eval_samples_per_second": 4.129, - "eval_steps_per_second": 1.032, - "eval_wer": 0.19913865141094042, + "epoch": 84.0, + "eval_loss": 0.4821723997592926, + "eval_runtime": 126.3131, + "eval_samples_per_second": 4.212, + "eval_steps_per_second": 0.53, + "eval_wer": 0.2151443080285402, "step": 6048 }, { - "epoch": 21.01, - "learning_rate": 3.2162544169611307e-06, - "loss": 0.296, + "epoch": 84.03, + "learning_rate": 8.133802816901409e-06, + "loss": 0.4098, "step": 6050 }, { - "epoch": 21.04, - "learning_rate": 3.214840989399293e-06, - "loss": 0.2774, + "epoch": 84.17, + "learning_rate": 8.063380281690141e-06, + "loss": 0.3925, "step": 6060 }, { - "epoch": 21.08, - "learning_rate": 3.213427561837456e-06, - "loss": 0.2601, + "epoch": 84.3, + "learning_rate": 7.992957746478875e-06, + "loss": 0.3969, "step": 6070 }, { - "epoch": 21.11, - "learning_rate": 3.2120141342756183e-06, - "loss": 0.2738, + "epoch": 84.44, + "learning_rate": 7.922535211267606e-06, + "loss": 0.4094, "step": 6080 }, { - "epoch": 21.15, - "learning_rate": 3.2106007067137807e-06, - "loss": 0.2756, + "epoch": 84.58, + "learning_rate": 7.852112676056338e-06, + "loss": 0.392, "step": 6090 }, { - "epoch": 21.18, - "learning_rate": 3.209187279151943e-06, - "loss": 0.2851, + "epoch": 84.72, + "learning_rate": 7.78169014084507e-06, + "loss": 0.3862, "step": 6100 }, { - "epoch": 21.21, - "learning_rate": 3.207773851590106e-06, - "loss": 0.2786, + "epoch": 84.86, + "learning_rate": 7.711267605633802e-06, + "loss": 0.4002, "step": 6110 }, { - "epoch": 21.25, - "learning_rate": 3.2063604240282684e-06, - "loss": 0.2685, + "epoch": 85.0, + "learning_rate": 7.640845070422536e-06, + "loss": 0.3983, + "step": 6120 + }, + { + "epoch": 85.0, + "eval_loss": 0.48090094327926636, + "eval_runtime": 125.8708, + "eval_samples_per_second": 4.227, + "eval_steps_per_second": 0.532, + "eval_wer": 0.21096612457414668, "step": 6120 }, { - "epoch": 21.28, - "learning_rate": 3.204946996466431e-06, - "loss": 0.2652, + "epoch": 85.14, + "learning_rate": 7.5704225352112675e-06, + "loss": 0.3878, "step": 6130 }, { - "epoch": 21.32, - "learning_rate": 3.2035335689045936e-06, - "loss": 0.278, + "epoch": 85.28, + "learning_rate": 7.5e-06, + "loss": 0.3909, "step": 6140 }, { - "epoch": 21.35, - "learning_rate": 3.202120141342756e-06, - "loss": 0.2855, + "epoch": 85.42, + "learning_rate": 7.429577464788733e-06, + "loss": 0.4052, "step": 6150 }, { - "epoch": 21.39, - "learning_rate": 3.2007067137809184e-06, - "loss": 0.2757, + "epoch": 85.55, + "learning_rate": 7.359154929577465e-06, + "loss": 0.3954, "step": 6160 }, { - "epoch": 21.42, - "learning_rate": 3.1992932862190813e-06, - "loss": 0.2702, + "epoch": 85.69, + "learning_rate": 7.2887323943661975e-06, + "loss": 0.4011, "step": 6170 }, { - "epoch": 21.46, - "learning_rate": 3.1978798586572437e-06, - "loss": 0.2765, + "epoch": 85.83, + "learning_rate": 7.21830985915493e-06, + "loss": 0.3947, "step": 6180 }, { - "epoch": 21.49, - "learning_rate": 3.1964664310954065e-06, - "loss": 0.2616, + "epoch": 85.97, + "learning_rate": 7.147887323943662e-06, + "loss": 0.3883, "step": 6190 }, { - "epoch": 21.53, - "learning_rate": 3.1950530035335685e-06, - "loss": 0.2795, + "epoch": 86.0, + "eval_loss": 0.4980515241622925, + "eval_runtime": 126.7334, + "eval_samples_per_second": 4.198, + "eval_steps_per_second": 0.529, + "eval_wer": 0.21077328533779005, + "step": 6192 + }, + { + "epoch": 86.11, + "learning_rate": 7.077464788732395e-06, + "loss": 0.4021, "step": 6200 }, { - "epoch": 21.56, - "learning_rate": 3.1936395759717313e-06, - "loss": 0.2716, + "epoch": 86.25, + "learning_rate": 7.0070422535211276e-06, + "loss": 0.398, "step": 6210 }, { - "epoch": 21.6, - "learning_rate": 3.1922261484098937e-06, - "loss": 0.2697, + "epoch": 86.39, + "learning_rate": 6.93661971830986e-06, + "loss": 0.3908, "step": 6220 }, { - "epoch": 21.63, - "learning_rate": 3.1908127208480566e-06, - "loss": 0.2416, + "epoch": 86.53, + "learning_rate": 6.866197183098592e-06, + "loss": 0.388, "step": 6230 }, { - "epoch": 21.66, - "learning_rate": 3.189399293286219e-06, - "loss": 0.2782, + "epoch": 86.66, + "learning_rate": 6.795774647887325e-06, + "loss": 0.3938, "step": 6240 }, { - "epoch": 21.7, - "learning_rate": 3.187985865724382e-06, - "loss": 0.2617, + "epoch": 86.8, + "learning_rate": 6.725352112676056e-06, + "loss": 0.3923, "step": 6250 }, { - "epoch": 21.73, - "learning_rate": 3.186572438162544e-06, - "loss": 0.2701, + "epoch": 86.94, + "learning_rate": 6.654929577464789e-06, + "loss": 0.3955, "step": 6260 }, { - "epoch": 21.77, - "learning_rate": 3.1851590106007066e-06, - "loss": 0.2894, + "epoch": 87.0, + "eval_loss": 0.4876667559146881, + "eval_runtime": 126.7989, + "eval_samples_per_second": 4.196, + "eval_steps_per_second": 0.528, + "eval_wer": 0.2110946840650511, + "step": 6264 + }, + { + "epoch": 87.08, + "learning_rate": 6.584507042253521e-06, + "loss": 0.4023, "step": 6270 }, { - "epoch": 21.8, - "learning_rate": 3.183745583038869e-06, - "loss": 0.2634, + "epoch": 87.22, + "learning_rate": 6.514084507042253e-06, + "loss": 0.4015, "step": 6280 }, { - "epoch": 21.84, - "learning_rate": 3.182332155477032e-06, - "loss": 0.2928, + "epoch": 87.36, + "learning_rate": 6.443661971830986e-06, + "loss": 0.3818, "step": 6290 }, { - "epoch": 21.87, - "learning_rate": 3.1809187279151943e-06, - "loss": 0.2425, + "epoch": 87.5, + "learning_rate": 6.373239436619719e-06, + "loss": 0.3921, "step": 6300 }, { - "epoch": 21.91, - "learning_rate": 3.179505300353357e-06, - "loss": 0.272, + "epoch": 87.64, + "learning_rate": 6.3028169014084505e-06, + "loss": 0.3817, "step": 6310 }, { - "epoch": 21.94, - "learning_rate": 3.178091872791519e-06, - "loss": 0.2818, + "epoch": 87.78, + "learning_rate": 6.232394366197183e-06, + "loss": 0.384, "step": 6320 }, { - "epoch": 21.98, - "learning_rate": 3.176678445229682e-06, - "loss": 0.2797, + "epoch": 87.91, + "learning_rate": 6.161971830985916e-06, + "loss": 0.3983, "step": 6330 }, { - "epoch": 22.0, - "eval_loss": 0.5096527338027954, - "eval_runtime": 129.6264, - "eval_samples_per_second": 4.104, - "eval_steps_per_second": 1.026, - "eval_wer": 0.20093848428360223, + "epoch": 88.0, + "eval_loss": 0.48789334297180176, + "eval_runtime": 126.1213, + "eval_samples_per_second": 4.218, + "eval_steps_per_second": 0.531, + "eval_wer": 0.213537314392235, "step": 6336 }, { - "epoch": 22.01, - "learning_rate": 3.1752650176678444e-06, - "loss": 0.3083, + "epoch": 88.06, + "learning_rate": 6.091549295774649e-06, + "loss": 0.4158, "step": 6340 }, { - "epoch": 22.05, - "learning_rate": 3.173851590106007e-06, - "loss": 0.2683, + "epoch": 88.19, + "learning_rate": 6.021126760563381e-06, + "loss": 0.3983, "step": 6350 }, { - "epoch": 22.08, - "learning_rate": 3.1724381625441696e-06, - "loss": 0.2614, + "epoch": 88.33, + "learning_rate": 5.9507042253521125e-06, + "loss": 0.3945, "step": 6360 }, { - "epoch": 22.12, - "learning_rate": 3.171024734982332e-06, - "loss": 0.2664, + "epoch": 88.47, + "learning_rate": 5.880281690140845e-06, + "loss": 0.3896, "step": 6370 }, { - "epoch": 22.15, - "learning_rate": 3.1696113074204944e-06, - "loss": 0.2813, + "epoch": 88.61, + "learning_rate": 5.809859154929578e-06, + "loss": 0.3819, "step": 6380 }, { - "epoch": 22.19, - "learning_rate": 3.1681978798586572e-06, - "loss": 0.2609, + "epoch": 88.75, + "learning_rate": 5.73943661971831e-06, + "loss": 0.3939, "step": 6390 }, { - "epoch": 22.22, - "learning_rate": 3.1667844522968197e-06, - "loss": 0.2811, + "epoch": 88.89, + "learning_rate": 5.6690140845070425e-06, + "loss": 0.3877, "step": 6400 }, { - "epoch": 22.26, - "learning_rate": 3.1653710247349825e-06, - "loss": 0.2664, + "epoch": 89.0, + "eval_loss": 0.5021692514419556, + "eval_runtime": 126.1298, + "eval_samples_per_second": 4.218, + "eval_steps_per_second": 0.531, + "eval_wer": 0.21495146879218358, + "step": 6408 + }, + { + "epoch": 89.03, + "learning_rate": 5.598591549295775e-06, + "loss": 0.4044, "step": 6410 }, { - "epoch": 22.29, - "learning_rate": 3.163957597173145e-06, - "loss": 0.3003, + "epoch": 89.17, + "learning_rate": 5.528169014084508e-06, + "loss": 0.3919, "step": 6420 }, { - "epoch": 22.33, - "learning_rate": 3.1625441696113073e-06, - "loss": 0.2665, + "epoch": 89.3, + "learning_rate": 5.457746478873239e-06, + "loss": 0.3851, "step": 6430 }, { - "epoch": 22.36, - "learning_rate": 3.1611307420494697e-06, - "loss": 0.2603, + "epoch": 89.44, + "learning_rate": 5.387323943661972e-06, + "loss": 0.3872, "step": 6440 }, { - "epoch": 22.39, - "learning_rate": 3.1597173144876326e-06, - "loss": 0.2702, + "epoch": 89.58, + "learning_rate": 5.3169014084507044e-06, + "loss": 0.3845, "step": 6450 }, { - "epoch": 22.43, - "learning_rate": 3.158303886925795e-06, - "loss": 0.2403, + "epoch": 89.72, + "learning_rate": 5.246478873239437e-06, + "loss": 0.3998, "step": 6460 }, { - "epoch": 22.46, - "learning_rate": 3.156890459363958e-06, - "loss": 0.272, + "epoch": 89.86, + "learning_rate": 5.176056338028169e-06, + "loss": 0.3925, "step": 6470 }, { - "epoch": 22.5, - "learning_rate": 3.15547703180212e-06, - "loss": 0.308, + "epoch": 90.0, + "learning_rate": 5.105633802816902e-06, + "loss": 0.3992, "step": 6480 }, { - "epoch": 22.53, - "learning_rate": 3.154063604240282e-06, - "loss": 0.275, + "epoch": 90.0, + "eval_loss": 0.5071265697479248, + "eval_runtime": 126.7801, + "eval_samples_per_second": 4.196, + "eval_steps_per_second": 0.528, + "eval_wer": 0.21167320177412097, + "step": 6480 + }, + { + "epoch": 90.14, + "learning_rate": 5.0352112676056345e-06, + "loss": 0.395, "step": 6490 }, { - "epoch": 22.57, - "learning_rate": 3.152650176678445e-06, - "loss": 0.2824, + "epoch": 90.28, + "learning_rate": 4.964788732394366e-06, + "loss": 0.4013, "step": 6500 }, { - "epoch": 22.6, - "learning_rate": 3.1512367491166074e-06, - "loss": 0.2734, + "epoch": 90.42, + "learning_rate": 4.894366197183098e-06, + "loss": 0.3944, "step": 6510 }, { - "epoch": 22.64, - "learning_rate": 3.1498233215547703e-06, - "loss": 0.2686, + "epoch": 90.55, + "learning_rate": 4.823943661971831e-06, + "loss": 0.389, "step": 6520 }, { - "epoch": 22.67, - "learning_rate": 3.148409893992933e-06, - "loss": 0.2826, + "epoch": 90.69, + "learning_rate": 4.753521126760564e-06, + "loss": 0.3898, "step": 6530 }, { - "epoch": 22.71, - "learning_rate": 3.146996466431095e-06, - "loss": 0.2878, + "epoch": 90.83, + "learning_rate": 4.683098591549296e-06, + "loss": 0.3917, "step": 6540 }, { - "epoch": 22.74, - "learning_rate": 3.1455830388692575e-06, - "loss": 0.2793, + "epoch": 90.97, + "learning_rate": 4.612676056338028e-06, + "loss": 0.393, "step": 6550 }, { - "epoch": 22.78, - "learning_rate": 3.1441696113074203e-06, - "loss": 0.2574, + "epoch": 91.0, + "eval_loss": 0.4833681583404541, + "eval_runtime": 131.3542, + "eval_samples_per_second": 4.05, + "eval_steps_per_second": 0.51, + "eval_wer": 0.21083756508324228, + "step": 6552 + }, + { + "epoch": 91.11, + "learning_rate": 4.542253521126761e-06, + "loss": 0.3948, "step": 6560 }, { - "epoch": 22.81, - "learning_rate": 3.1427561837455827e-06, - "loss": 0.2733, + "epoch": 91.25, + "learning_rate": 4.471830985915494e-06, + "loss": 0.3899, "step": 6570 }, { - "epoch": 22.85, - "learning_rate": 3.1413427561837456e-06, - "loss": 0.2887, + "epoch": 91.39, + "learning_rate": 4.401408450704226e-06, + "loss": 0.3798, "step": 6580 }, { - "epoch": 22.88, - "learning_rate": 3.139929328621908e-06, - "loss": 0.2801, + "epoch": 91.53, + "learning_rate": 4.3309859154929575e-06, + "loss": 0.3839, "step": 6590 }, { - "epoch": 22.91, - "learning_rate": 3.1385159010600704e-06, - "loss": 0.2739, + "epoch": 91.66, + "learning_rate": 4.26056338028169e-06, + "loss": 0.3819, "step": 6600 }, { - "epoch": 22.95, - "learning_rate": 3.137102473498233e-06, - "loss": 0.2622, + "epoch": 91.8, + "learning_rate": 4.190140845070423e-06, + "loss": 0.3805, "step": 6610 }, { - "epoch": 22.98, - "learning_rate": 3.1356890459363956e-06, - "loss": 0.2667, + "epoch": 91.94, + "learning_rate": 4.119718309859155e-06, + "loss": 0.3941, "step": 6620 }, { - "epoch": 23.0, - "eval_loss": 0.5130947828292847, - "eval_runtime": 130.2324, - "eval_samples_per_second": 4.085, - "eval_steps_per_second": 1.021, - "eval_wer": 0.19952432988365365, + "epoch": 92.0, + "eval_loss": 0.4961974024772644, + "eval_runtime": 131.7625, + "eval_samples_per_second": 4.038, + "eval_steps_per_second": 0.508, + "eval_wer": 0.2119303207559298, "step": 6624 }, { - "epoch": 23.02, - "learning_rate": 3.134275618374558e-06, - "loss": 0.2649, + "epoch": 92.08, + "learning_rate": 4.0492957746478875e-06, + "loss": 0.408, "step": 6630 }, { - "epoch": 23.06, - "learning_rate": 3.132862190812721e-06, - "loss": 0.2847, + "epoch": 92.22, + "learning_rate": 3.97887323943662e-06, + "loss": 0.3884, "step": 6640 }, { - "epoch": 23.09, - "learning_rate": 3.131448763250883e-06, - "loss": 0.2679, + "epoch": 92.36, + "learning_rate": 3.908450704225353e-06, + "loss": 0.3812, "step": 6650 }, { - "epoch": 23.12, - "learning_rate": 3.1300353356890457e-06, - "loss": 0.284, + "epoch": 92.5, + "learning_rate": 3.838028169014085e-06, + "loss": 0.3852, "step": 6660 }, { - "epoch": 23.16, - "learning_rate": 3.128621908127208e-06, - "loss": 0.2729, + "epoch": 92.64, + "learning_rate": 3.767605633802817e-06, + "loss": 0.3827, "step": 6670 }, { - "epoch": 23.19, - "learning_rate": 3.127208480565371e-06, - "loss": 0.2708, + "epoch": 92.78, + "learning_rate": 3.6971830985915494e-06, + "loss": 0.3944, "step": 6680 }, { - "epoch": 23.23, - "learning_rate": 3.1257950530035333e-06, - "loss": 0.2851, + "epoch": 92.91, + "learning_rate": 3.6267605633802817e-06, + "loss": 0.3877, "step": 6690 }, { - "epoch": 23.26, - "learning_rate": 3.124381625441696e-06, - "loss": 0.262, + "epoch": 93.0, + "eval_loss": 0.4878864586353302, + "eval_runtime": 127.8576, + "eval_samples_per_second": 4.161, + "eval_steps_per_second": 0.524, + "eval_wer": 0.20762357781063187, + "step": 6696 + }, + { + "epoch": 93.06, + "learning_rate": 3.5563380281690144e-06, + "loss": 0.4055, "step": 6700 }, { - "epoch": 23.3, - "learning_rate": 3.122968197879858e-06, - "loss": 0.2997, + "epoch": 93.19, + "learning_rate": 3.4859154929577467e-06, + "loss": 0.3828, "step": 6710 }, { - "epoch": 23.33, - "learning_rate": 3.121554770318021e-06, - "loss": 0.2653, + "epoch": 93.33, + "learning_rate": 3.4154929577464795e-06, + "loss": 0.3835, "step": 6720 }, { - "epoch": 23.37, - "learning_rate": 3.1201413427561834e-06, - "loss": 0.2544, + "epoch": 93.47, + "learning_rate": 3.3450704225352113e-06, + "loss": 0.3891, "step": 6730 }, { - "epoch": 23.4, - "learning_rate": 3.1187279151943462e-06, - "loss": 0.2888, + "epoch": 93.61, + "learning_rate": 3.2746478873239436e-06, + "loss": 0.394, "step": 6740 }, { - "epoch": 23.44, - "learning_rate": 3.1173144876325086e-06, - "loss": 0.2837, + "epoch": 93.75, + "learning_rate": 3.204225352112676e-06, + "loss": 0.3938, "step": 6750 }, { - "epoch": 23.47, - "learning_rate": 3.1159010600706715e-06, - "loss": 0.2824, + "epoch": 93.89, + "learning_rate": 3.1338028169014087e-06, + "loss": 0.3709, "step": 6760 }, { - "epoch": 23.51, - "learning_rate": 3.1144876325088335e-06, - "loss": 0.3101, + "epoch": 94.0, + "eval_loss": 0.48774513602256775, + "eval_runtime": 126.6111, + "eval_samples_per_second": 4.202, + "eval_steps_per_second": 0.529, + "eval_wer": 0.20897345246512825, + "step": 6768 + }, + { + "epoch": 94.03, + "learning_rate": 3.063380281690141e-06, + "loss": 0.3925, "step": 6770 }, { - "epoch": 23.54, - "learning_rate": 3.1130742049469963e-06, - "loss": 0.2965, + "epoch": 94.17, + "learning_rate": 2.9929577464788733e-06, + "loss": 0.3871, "step": 6780 }, { - "epoch": 23.57, - "learning_rate": 3.1116607773851587e-06, - "loss": 0.2739, + "epoch": 94.3, + "learning_rate": 2.9225352112676056e-06, + "loss": 0.3915, "step": 6790 }, { - "epoch": 23.61, - "learning_rate": 3.1102473498233215e-06, - "loss": 0.2697, + "epoch": 94.44, + "learning_rate": 2.8521126760563383e-06, + "loss": 0.3777, "step": 6800 }, { - "epoch": 23.64, - "learning_rate": 3.108833922261484e-06, - "loss": 0.2837, + "epoch": 94.58, + "learning_rate": 2.7816901408450706e-06, + "loss": 0.3821, "step": 6810 }, { - "epoch": 23.68, - "learning_rate": 3.1074204946996464e-06, - "loss": 0.277, + "epoch": 94.72, + "learning_rate": 2.711267605633803e-06, + "loss": 0.3909, "step": 6820 }, { - "epoch": 23.71, - "learning_rate": 3.1060070671378088e-06, - "loss": 0.2887, + "epoch": 94.86, + "learning_rate": 2.640845070422535e-06, + "loss": 0.3907, "step": 6830 }, { - "epoch": 23.75, - "learning_rate": 3.1045936395759716e-06, - "loss": 0.2765, + "epoch": 95.0, + "learning_rate": 2.570422535211268e-06, + "loss": 0.3905, + "step": 6840 + }, + { + "epoch": 95.0, + "eval_loss": 0.49698197841644287, + "eval_runtime": 126.8507, + "eval_samples_per_second": 4.194, + "eval_steps_per_second": 0.528, + "eval_wer": 0.21295879668316514, "step": 6840 }, { - "epoch": 23.78, - "learning_rate": 3.103180212014134e-06, - "loss": 0.2468, + "epoch": 95.14, + "learning_rate": 2.5e-06, + "loss": 0.3814, "step": 6850 }, { - "epoch": 23.82, - "learning_rate": 3.101766784452297e-06, - "loss": 0.2786, + "epoch": 95.28, + "learning_rate": 2.4295774647887325e-06, + "loss": 0.3908, "step": 6860 }, { - "epoch": 23.85, - "learning_rate": 3.1003533568904593e-06, - "loss": 0.2561, + "epoch": 95.42, + "learning_rate": 2.359154929577465e-06, + "loss": 0.387, "step": 6870 }, { - "epoch": 23.89, - "learning_rate": 3.0989399293286217e-06, - "loss": 0.2494, + "epoch": 95.55, + "learning_rate": 2.2887323943661975e-06, + "loss": 0.3889, "step": 6880 }, { - "epoch": 23.92, - "learning_rate": 3.097526501766784e-06, - "loss": 0.2619, + "epoch": 95.69, + "learning_rate": 2.21830985915493e-06, + "loss": 0.3781, "step": 6890 }, { - "epoch": 23.96, - "learning_rate": 3.096113074204947e-06, - "loss": 0.2629, + "epoch": 95.83, + "learning_rate": 2.147887323943662e-06, + "loss": 0.3948, "step": 6900 }, { - "epoch": 23.99, - "learning_rate": 3.0946996466431093e-06, - "loss": 0.2722, + "epoch": 95.97, + "learning_rate": 2.0774647887323944e-06, + "loss": 0.3918, "step": 6910 }, { - "epoch": 24.0, - "eval_loss": 0.5097522735595703, - "eval_runtime": 129.544, - "eval_samples_per_second": 4.107, - "eval_steps_per_second": 1.027, - "eval_wer": 0.199010091920036, + "epoch": 96.0, + "eval_loss": 0.48947659134864807, + "eval_runtime": 127.7315, + "eval_samples_per_second": 4.165, + "eval_steps_per_second": 0.525, + "eval_wer": 0.21064472584688565, "step": 6912 }, { - "epoch": 24.03, - "learning_rate": 3.093286219081272e-06, - "loss": 0.2714, + "epoch": 96.11, + "learning_rate": 2.007042253521127e-06, + "loss": 0.3879, "step": 6920 }, { - "epoch": 24.06, - "learning_rate": 3.0918727915194346e-06, - "loss": 0.2682, + "epoch": 96.25, + "learning_rate": 1.936619718309859e-06, + "loss": 0.3809, "step": 6930 }, { - "epoch": 24.1, - "learning_rate": 3.090459363957597e-06, - "loss": 0.2623, + "epoch": 96.39, + "learning_rate": 1.8661971830985915e-06, + "loss": 0.3702, "step": 6940 }, { - "epoch": 24.13, - "learning_rate": 3.0890459363957594e-06, - "loss": 0.279, + "epoch": 96.53, + "learning_rate": 1.795774647887324e-06, + "loss": 0.3975, "step": 6950 }, { - "epoch": 24.17, - "learning_rate": 3.0876325088339222e-06, - "loss": 0.2612, + "epoch": 96.66, + "learning_rate": 1.7253521126760566e-06, + "loss": 0.3847, "step": 6960 }, { - "epoch": 24.2, - "learning_rate": 3.0862190812720846e-06, - "loss": 0.2505, + "epoch": 96.8, + "learning_rate": 1.6549295774647886e-06, + "loss": 0.389, "step": 6970 }, { - "epoch": 24.24, - "learning_rate": 3.0848056537102475e-06, - "loss": 0.281, + "epoch": 96.94, + "learning_rate": 1.5845070422535212e-06, + "loss": 0.3954, "step": 6980 }, { - "epoch": 24.27, - "learning_rate": 3.0833922261484094e-06, - "loss": 0.2653, + "epoch": 97.0, + "eval_loss": 0.48836567997932434, + "eval_runtime": 128.4968, + "eval_samples_per_second": 4.14, + "eval_steps_per_second": 0.521, + "eval_wer": 0.2079449765378929, + "step": 6984 + }, + { + "epoch": 97.08, + "learning_rate": 1.5140845070422537e-06, + "loss": 0.3846, "step": 6990 }, { - "epoch": 24.3, - "learning_rate": 3.0819787985865723e-06, - "loss": 0.2881, + "epoch": 97.22, + "learning_rate": 1.443661971830986e-06, + "loss": 0.384, "step": 7000 }, { - "epoch": 24.34, - "learning_rate": 3.0805653710247347e-06, - "loss": 0.2596, + "epoch": 97.36, + "learning_rate": 1.3732394366197185e-06, + "loss": 0.3841, "step": 7010 }, { - "epoch": 24.37, - "learning_rate": 3.0791519434628975e-06, - "loss": 0.2459, + "epoch": 97.5, + "learning_rate": 1.3028169014084508e-06, + "loss": 0.3786, "step": 7020 }, { - "epoch": 24.41, - "learning_rate": 3.07773851590106e-06, - "loss": 0.2838, + "epoch": 97.64, + "learning_rate": 1.232394366197183e-06, + "loss": 0.3702, "step": 7030 }, { - "epoch": 24.44, - "learning_rate": 3.0763250883392228e-06, - "loss": 0.2497, + "epoch": 97.78, + "learning_rate": 1.1619718309859156e-06, + "loss": 0.3828, "step": 7040 }, { - "epoch": 24.48, - "learning_rate": 3.0749116607773847e-06, - "loss": 0.2907, + "epoch": 97.91, + "learning_rate": 1.0915492957746479e-06, + "loss": 0.3979, "step": 7050 }, { - "epoch": 24.51, - "learning_rate": 3.0734982332155476e-06, - "loss": 0.2954, + "epoch": 98.0, + "eval_loss": 0.48947107791900635, + "eval_runtime": 130.633, + "eval_samples_per_second": 4.072, + "eval_steps_per_second": 0.513, + "eval_wer": 0.20974480941055473, + "step": 7056 + }, + { + "epoch": 98.06, + "learning_rate": 1.0211267605633804e-06, + "loss": 0.3893, "step": 7060 }, { - "epoch": 24.55, - "learning_rate": 3.07208480565371e-06, - "loss": 0.2536, + "epoch": 98.19, + "learning_rate": 9.507042253521127e-07, + "loss": 0.378, "step": 7070 }, { - "epoch": 24.58, - "learning_rate": 3.070671378091873e-06, - "loss": 0.2554, + "epoch": 98.33, + "learning_rate": 8.802816901408452e-07, + "loss": 0.3816, "step": 7080 }, { - "epoch": 24.62, - "learning_rate": 3.0692579505300352e-06, - "loss": 0.2779, + "epoch": 98.47, + "learning_rate": 8.098591549295775e-07, + "loss": 0.3932, "step": 7090 }, { - "epoch": 24.65, - "learning_rate": 3.067844522968198e-06, - "loss": 0.2681, + "epoch": 98.61, + "learning_rate": 7.394366197183099e-07, + "loss": 0.3814, "step": 7100 }, { - "epoch": 24.69, - "learning_rate": 3.06643109540636e-06, - "loss": 0.2715, + "epoch": 98.75, + "learning_rate": 6.690140845070423e-07, + "loss": 0.3789, "step": 7110 }, { - "epoch": 24.72, - "learning_rate": 3.065017667844523e-06, - "loss": 0.2692, + "epoch": 98.89, + "learning_rate": 5.985915492957746e-07, + "loss": 0.373, "step": 7120 }, { - "epoch": 24.75, - "learning_rate": 3.0636042402826853e-06, - "loss": 0.2646, + "epoch": 99.0, + "eval_loss": 0.4874747097492218, + "eval_runtime": 126.7367, + "eval_samples_per_second": 4.198, + "eval_steps_per_second": 0.529, + "eval_wer": 0.20762357781063187, + "step": 7128 + }, + { + "epoch": 99.03, + "learning_rate": 5.28169014084507e-07, + "loss": 0.4034, "step": 7130 }, { - "epoch": 24.79, - "learning_rate": 3.062190812720848e-06, - "loss": 0.2585, + "epoch": 99.17, + "learning_rate": 4.5774647887323947e-07, + "loss": 0.3873, "step": 7140 }, { - "epoch": 24.82, - "learning_rate": 3.0607773851590105e-06, - "loss": 0.2706, + "epoch": 99.3, + "learning_rate": 3.873239436619719e-07, + "loss": 0.3784, "step": 7150 }, { - "epoch": 24.86, - "learning_rate": 3.059363957597173e-06, - "loss": 0.2796, + "epoch": 99.44, + "learning_rate": 3.1690140845070423e-07, + "loss": 0.3909, "step": 7160 }, { - "epoch": 24.89, - "learning_rate": 3.0579505300353354e-06, - "loss": 0.2645, + "epoch": 99.58, + "learning_rate": 2.4647887323943664e-07, + "loss": 0.3863, "step": 7170 }, { - "epoch": 24.93, - "learning_rate": 3.056537102473498e-06, - "loss": 0.2374, + "epoch": 99.72, + "learning_rate": 1.7605633802816901e-07, + "loss": 0.3796, "step": 7180 }, { - "epoch": 24.96, - "learning_rate": 3.0551236749116606e-06, - "loss": 0.285, + "epoch": 99.86, + "learning_rate": 1.056338028169014e-07, + "loss": 0.3699, "step": 7190 }, { - "epoch": 25.0, - "learning_rate": 3.0537102473498234e-06, - "loss": 0.3026, + "epoch": 100.0, + "learning_rate": 3.5211267605633804e-08, + "loss": 0.3769, "step": 7200 }, { - "epoch": 25.0, - "eval_loss": 0.5193008780479431, - "eval_runtime": 129.4939, - "eval_samples_per_second": 4.108, - "eval_steps_per_second": 1.027, - "eval_wer": 0.200552805810889, + "epoch": 100.0, + "eval_loss": 0.490430623292923, + "eval_runtime": 126.8664, + "eval_samples_per_second": 4.193, + "eval_steps_per_second": 0.528, + "eval_wer": 0.20871633348331942, "step": 7200 }, - { - "epoch": 25.03, - "learning_rate": 3.052296819787986e-06, - "loss": 0.3016, - "step": 7210 - }, - { - "epoch": 25.07, - "learning_rate": 3.0508833922261483e-06, - "loss": 0.2787, - "step": 7220 - }, - { - "epoch": 25.1, - "learning_rate": 3.0494699646643107e-06, - "loss": 0.2695, - "step": 7230 - }, - { - "epoch": 25.14, - "learning_rate": 3.048197879858657e-06, - "loss": 0.2666, - "step": 7240 - }, - { - "epoch": 25.17, - "learning_rate": 3.0467844522968195e-06, - "loss": 0.2892, - "step": 7250 - }, - { - "epoch": 25.21, - "learning_rate": 3.0453710247349824e-06, - "loss": 0.262, - "step": 7260 - }, - { - "epoch": 25.24, - "learning_rate": 3.0439575971731448e-06, - "loss": 0.2557, - "step": 7270 - }, - { - "epoch": 25.28, - "learning_rate": 3.0425441696113076e-06, - "loss": 0.255, - "step": 7280 - }, - { - "epoch": 25.31, - "learning_rate": 3.0411307420494696e-06, - "loss": 0.2848, - "step": 7290 - }, - { - "epoch": 25.35, - "learning_rate": 3.0397173144876324e-06, - "loss": 0.2734, - "step": 7300 - }, - { - "epoch": 25.38, - "learning_rate": 3.038303886925795e-06, - "loss": 0.2719, - "step": 7310 - }, - { - "epoch": 25.42, - "learning_rate": 3.0368904593639577e-06, - "loss": 0.2672, - "step": 7320 - }, - { - "epoch": 25.45, - "learning_rate": 3.03547703180212e-06, - "loss": 0.266, - "step": 7330 - }, - { - "epoch": 25.48, - "learning_rate": 3.034063604240283e-06, - "loss": 0.3005, - "step": 7340 - }, - { - "epoch": 25.52, - "learning_rate": 3.032650176678445e-06, - "loss": 0.2512, - "step": 7350 - }, - { - "epoch": 25.55, - "learning_rate": 3.0312367491166077e-06, - "loss": 0.2525, - "step": 7360 - }, - { - "epoch": 25.59, - "learning_rate": 3.02982332155477e-06, - "loss": 0.2543, - "step": 7370 - }, - { - "epoch": 25.62, - "learning_rate": 3.028409893992933e-06, - "loss": 0.2881, - "step": 7380 - }, - { - "epoch": 25.66, - "learning_rate": 3.0269964664310954e-06, - "loss": 0.2569, - "step": 7390 - }, - { - "epoch": 25.69, - "learning_rate": 3.0255830388692582e-06, - "loss": 0.2721, - "step": 7400 - }, - { - "epoch": 25.73, - "learning_rate": 3.02416961130742e-06, - "loss": 0.2717, - "step": 7410 - }, - { - "epoch": 25.76, - "learning_rate": 3.022756183745583e-06, - "loss": 0.2897, - "step": 7420 - }, - { - "epoch": 25.8, - "learning_rate": 3.0213427561837454e-06, - "loss": 0.2652, - "step": 7430 - }, - { - "epoch": 25.83, - "learning_rate": 3.0199293286219083e-06, - "loss": 0.2545, - "step": 7440 - }, - { - "epoch": 25.87, - "learning_rate": 3.0185159010600707e-06, - "loss": 0.2826, - "step": 7450 - }, - { - "epoch": 25.9, - "learning_rate": 3.0171024734982327e-06, - "loss": 0.2638, - "step": 7460 - }, - { - "epoch": 25.94, - "learning_rate": 3.0156890459363955e-06, - "loss": 0.2592, - "step": 7470 - }, - { - "epoch": 25.97, - "learning_rate": 3.014275618374558e-06, - "loss": 0.2888, - "step": 7480 - }, - { - "epoch": 26.0, - "eval_loss": 0.49870219826698303, - "eval_runtime": 130.4803, - "eval_samples_per_second": 4.077, - "eval_steps_per_second": 1.019, - "eval_wer": 0.19856013370187053, - "step": 7488 - }, - { - "epoch": 26.01, - "learning_rate": 3.0128621908127208e-06, - "loss": 0.2858, - "step": 7490 - }, - { - "epoch": 26.04, - "learning_rate": 3.011448763250883e-06, - "loss": 0.28, - "step": 7500 - }, - { - "epoch": 26.08, - "learning_rate": 3.010035335689046e-06, - "loss": 0.2725, - "step": 7510 - }, - { - "epoch": 26.11, - "learning_rate": 3.008621908127208e-06, - "loss": 0.271, - "step": 7520 - }, - { - "epoch": 26.15, - "learning_rate": 3.007208480565371e-06, - "loss": 0.2829, - "step": 7530 - }, - { - "epoch": 26.18, - "learning_rate": 3.0057950530035332e-06, - "loss": 0.2639, - "step": 7540 - }, - { - "epoch": 26.21, - "learning_rate": 3.004381625441696e-06, - "loss": 0.256, - "step": 7550 - }, - { - "epoch": 26.25, - "learning_rate": 3.0029681978798585e-06, - "loss": 0.2738, - "step": 7560 - }, - { - "epoch": 26.28, - "learning_rate": 3.001554770318021e-06, - "loss": 0.2642, - "step": 7570 - }, - { - "epoch": 26.32, - "learning_rate": 3.0001413427561833e-06, - "loss": 0.2953, - "step": 7580 - }, - { - "epoch": 26.35, - "learning_rate": 2.998727915194346e-06, - "loss": 0.2696, - "step": 7590 - }, - { - "epoch": 26.39, - "learning_rate": 2.9973144876325085e-06, - "loss": 0.2801, - "step": 7600 - }, - { - "epoch": 26.42, - "learning_rate": 2.9959010600706714e-06, - "loss": 0.2846, - "step": 7610 - }, - { - "epoch": 26.46, - "learning_rate": 2.9944876325088338e-06, - "loss": 0.2726, - "step": 7620 - }, - { - "epoch": 26.49, - "learning_rate": 2.993074204946996e-06, - "loss": 0.2773, - "step": 7630 - }, - { - "epoch": 26.53, - "learning_rate": 2.9916607773851586e-06, - "loss": 0.2555, - "step": 7640 - }, - { - "epoch": 26.56, - "learning_rate": 2.9902473498233214e-06, - "loss": 0.2797, - "step": 7650 - }, - { - "epoch": 26.6, - "learning_rate": 2.988833922261484e-06, - "loss": 0.2519, - "step": 7660 - }, - { - "epoch": 26.63, - "learning_rate": 2.9874204946996467e-06, - "loss": 0.2665, - "step": 7670 - }, - { - "epoch": 26.66, - "learning_rate": 2.986007067137809e-06, - "loss": 0.2618, - "step": 7680 - }, - { - "epoch": 26.7, - "learning_rate": 2.9845936395759715e-06, - "loss": 0.2807, - "step": 7690 - }, - { - "epoch": 26.73, - "learning_rate": 2.983180212014134e-06, - "loss": 0.2786, - "step": 7700 - }, - { - "epoch": 26.77, - "learning_rate": 2.9817667844522967e-06, - "loss": 0.2579, - "step": 7710 - }, - { - "epoch": 26.8, - "learning_rate": 2.980353356890459e-06, - "loss": 0.2748, - "step": 7720 - }, - { - "epoch": 26.84, - "learning_rate": 2.978939929328622e-06, - "loss": 0.2755, - "step": 7730 - }, - { - "epoch": 26.87, - "learning_rate": 2.977526501766784e-06, - "loss": 0.2483, - "step": 7740 - }, - { - "epoch": 26.91, - "learning_rate": 2.9761130742049468e-06, - "loss": 0.2753, - "step": 7750 - }, - { - "epoch": 26.94, - "learning_rate": 2.974699646643109e-06, - "loss": 0.2455, - "step": 7760 - }, - { - "epoch": 26.98, - "learning_rate": 2.973286219081272e-06, - "loss": 0.2732, - "step": 7770 - }, - { - "epoch": 27.0, - "eval_loss": 0.5063392519950867, - "eval_runtime": 129.9156, - "eval_samples_per_second": 4.095, - "eval_steps_per_second": 1.024, - "eval_wer": 0.20074564504724562, - "step": 7776 - }, - { - "epoch": 27.01, - "learning_rate": 2.9718727915194344e-06, - "loss": 0.2939, - "step": 7780 - }, - { - "epoch": 27.05, - "learning_rate": 2.9704593639575973e-06, - "loss": 0.2713, - "step": 7790 - }, - { - "epoch": 27.08, - "learning_rate": 2.9690459363957593e-06, - "loss": 0.2683, - "step": 7800 - }, - { - "epoch": 27.12, - "learning_rate": 2.967632508833922e-06, - "loss": 0.2905, - "step": 7810 - }, - { - "epoch": 27.15, - "learning_rate": 2.9662190812720845e-06, - "loss": 0.2755, - "step": 7820 - }, - { - "epoch": 27.19, - "learning_rate": 2.9648056537102473e-06, - "loss": 0.2745, - "step": 7830 - }, - { - "epoch": 27.22, - "learning_rate": 2.9633922261484097e-06, - "loss": 0.2813, - "step": 7840 - }, - { - "epoch": 27.26, - "learning_rate": 2.9619787985865726e-06, - "loss": 0.2405, - "step": 7850 - }, - { - "epoch": 27.29, - "learning_rate": 2.9605653710247346e-06, - "loss": 0.2778, - "step": 7860 - }, - { - "epoch": 27.33, - "learning_rate": 2.9591519434628974e-06, - "loss": 0.2785, - "step": 7870 - }, - { - "epoch": 27.36, - "learning_rate": 2.95773851590106e-06, - "loss": 0.2665, - "step": 7880 - }, - { - "epoch": 27.39, - "learning_rate": 2.9563250883392226e-06, - "loss": 0.2905, - "step": 7890 - }, - { - "epoch": 27.43, - "learning_rate": 2.954911660777385e-06, - "loss": 0.2611, - "step": 7900 - }, - { - "epoch": 27.46, - "learning_rate": 2.9534982332155475e-06, - "loss": 0.2633, - "step": 7910 - }, - { - "epoch": 27.5, - "learning_rate": 2.95208480565371e-06, - "loss": 0.2525, - "step": 7920 - }, - { - "epoch": 27.53, - "learning_rate": 2.9506713780918727e-06, - "loss": 0.2627, - "step": 7930 - }, - { - "epoch": 27.57, - "learning_rate": 2.949257950530035e-06, - "loss": 0.2834, - "step": 7940 - }, - { - "epoch": 27.6, - "learning_rate": 2.947844522968198e-06, - "loss": 0.2709, - "step": 7950 - }, - { - "epoch": 27.64, - "learning_rate": 2.9464310954063604e-06, - "loss": 0.2637, - "step": 7960 - }, - { - "epoch": 27.67, - "learning_rate": 2.9450176678445228e-06, - "loss": 0.304, - "step": 7970 - }, - { - "epoch": 27.71, - "learning_rate": 2.943604240282685e-06, - "loss": 0.2664, - "step": 7980 - }, - { - "epoch": 27.74, - "learning_rate": 2.942190812720848e-06, - "loss": 0.2684, - "step": 7990 - }, - { - "epoch": 27.78, - "learning_rate": 2.9407773851590104e-06, - "loss": 0.2641, - "step": 8000 - }, - { - "epoch": 27.81, - "learning_rate": 2.9393639575971732e-06, - "loss": 0.2767, - "step": 8010 - }, - { - "epoch": 27.85, - "learning_rate": 2.9379505300353357e-06, - "loss": 0.2825, - "step": 8020 - }, - { - "epoch": 27.88, - "learning_rate": 2.936537102473498e-06, - "loss": 0.2747, - "step": 8030 - }, - { - "epoch": 27.91, - "learning_rate": 2.9351236749116605e-06, - "loss": 0.2877, - "step": 8040 - }, - { - "epoch": 27.95, - "learning_rate": 2.9337102473498233e-06, - "loss": 0.2703, - "step": 8050 - }, - { - "epoch": 27.98, - "learning_rate": 2.9322968197879857e-06, - "loss": 0.2567, - "step": 8060 - }, - { - "epoch": 28.0, - "eval_loss": 0.5102671980857849, - "eval_runtime": 130.0784, - "eval_samples_per_second": 4.09, - "eval_steps_per_second": 1.022, - "eval_wer": 0.2015170019926721, - "step": 8064 - }, - { - "epoch": 28.02, - "learning_rate": 2.9308833922261486e-06, - "loss": 0.2758, - "step": 8070 - }, - { - "epoch": 28.06, - "learning_rate": 2.9294699646643105e-06, - "loss": 0.2866, - "step": 8080 - }, - { - "epoch": 28.09, - "learning_rate": 2.9280565371024734e-06, - "loss": 0.2397, - "step": 8090 - }, - { - "epoch": 28.12, - "learning_rate": 2.9266431095406358e-06, - "loss": 0.2718, - "step": 8100 - }, - { - "epoch": 28.16, - "learning_rate": 2.9252296819787986e-06, - "loss": 0.2795, - "step": 8110 - }, - { - "epoch": 28.19, - "learning_rate": 2.923816254416961e-06, - "loss": 0.258, - "step": 8120 - }, - { - "epoch": 28.23, - "learning_rate": 2.922402826855124e-06, - "loss": 0.2651, - "step": 8130 - }, - { - "epoch": 28.26, - "learning_rate": 2.920989399293286e-06, - "loss": 0.2741, - "step": 8140 - }, - { - "epoch": 28.3, - "learning_rate": 2.9195759717314487e-06, - "loss": 0.286, - "step": 8150 - }, - { - "epoch": 28.33, - "learning_rate": 2.918162544169611e-06, - "loss": 0.2716, - "step": 8160 - }, - { - "epoch": 28.37, - "learning_rate": 2.916749116607774e-06, - "loss": 0.2594, - "step": 8170 - }, - { - "epoch": 28.4, - "learning_rate": 2.9153356890459363e-06, - "loss": 0.2958, - "step": 8180 - }, - { - "epoch": 28.44, - "learning_rate": 2.9139222614840987e-06, - "loss": 0.2742, - "step": 8190 - }, - { - "epoch": 28.47, - "learning_rate": 2.912508833922261e-06, - "loss": 0.2678, - "step": 8200 - }, - { - "epoch": 28.51, - "learning_rate": 2.911095406360424e-06, - "loss": 0.2961, - "step": 8210 - }, - { - "epoch": 28.54, - "learning_rate": 2.9096819787985864e-06, - "loss": 0.2675, - "step": 8220 - }, - { - "epoch": 28.57, - "learning_rate": 2.9082685512367492e-06, - "loss": 0.2722, - "step": 8230 - }, - { - "epoch": 28.61, - "learning_rate": 2.9068551236749116e-06, - "loss": 0.257, - "step": 8240 - }, - { - "epoch": 28.64, - "learning_rate": 2.905441696113074e-06, - "loss": 0.3073, - "step": 8250 - }, - { - "epoch": 28.68, - "learning_rate": 2.9040282685512365e-06, - "loss": 0.2852, - "step": 8260 - }, - { - "epoch": 28.71, - "learning_rate": 2.9026148409893993e-06, - "loss": 0.275, - "step": 8270 - }, - { - "epoch": 28.75, - "learning_rate": 2.9012014134275617e-06, - "loss": 0.272, - "step": 8280 - }, - { - "epoch": 28.78, - "learning_rate": 2.8997879858657245e-06, - "loss": 0.2732, - "step": 8290 - }, - { - "epoch": 28.82, - "learning_rate": 2.898374558303887e-06, - "loss": 0.2734, - "step": 8300 - }, - { - "epoch": 28.85, - "learning_rate": 2.8969611307420493e-06, - "loss": 0.2581, - "step": 8310 - }, - { - "epoch": 28.89, - "learning_rate": 2.8955477031802118e-06, - "loss": 0.2689, - "step": 8320 - }, - { - "epoch": 28.92, - "learning_rate": 2.8941342756183746e-06, - "loss": 0.2592, - "step": 8330 - }, - { - "epoch": 28.96, - "learning_rate": 2.892720848056537e-06, - "loss": 0.261, - "step": 8340 - }, - { - "epoch": 28.99, - "learning_rate": 2.8913074204947e-06, - "loss": 0.2845, - "step": 8350 - }, - { - "epoch": 29.0, - "eval_loss": 0.5084418058395386, - "eval_runtime": 129.7694, - "eval_samples_per_second": 4.1, - "eval_steps_per_second": 1.025, - "eval_wer": 0.20203123995628977, - "step": 8352 - }, - { - "epoch": 29.03, - "learning_rate": 2.889893992932862e-06, - "loss": 0.2541, - "step": 8360 - }, - { - "epoch": 29.06, - "learning_rate": 2.8884805653710247e-06, - "loss": 0.2822, - "step": 8370 - }, - { - "epoch": 29.1, - "learning_rate": 2.887067137809187e-06, - "loss": 0.2498, - "step": 8380 - }, - { - "epoch": 29.13, - "learning_rate": 2.88565371024735e-06, - "loss": 0.2908, - "step": 8390 - }, - { - "epoch": 29.17, - "learning_rate": 2.8842402826855123e-06, - "loss": 0.2679, - "step": 8400 - }, - { - "epoch": 29.2, - "learning_rate": 2.882826855123675e-06, - "loss": 0.2352, - "step": 8410 - }, - { - "epoch": 29.24, - "learning_rate": 2.881413427561837e-06, - "loss": 0.2733, - "step": 8420 - }, - { - "epoch": 29.27, - "learning_rate": 2.88e-06, - "loss": 0.2427, - "step": 8430 - }, - { - "epoch": 29.3, - "learning_rate": 2.8785865724381624e-06, - "loss": 0.2692, - "step": 8440 - }, - { - "epoch": 29.34, - "learning_rate": 2.877173144876325e-06, - "loss": 0.27, - "step": 8450 - }, - { - "epoch": 29.37, - "learning_rate": 2.8757597173144876e-06, - "loss": 0.2465, - "step": 8460 - }, - { - "epoch": 29.41, - "learning_rate": 2.8743462897526504e-06, - "loss": 0.2853, - "step": 8470 - }, - { - "epoch": 29.44, - "learning_rate": 2.8729328621908124e-06, - "loss": 0.2536, - "step": 8480 - }, - { - "epoch": 29.48, - "learning_rate": 2.8715194346289753e-06, - "loss": 0.2824, - "step": 8490 - }, - { - "epoch": 29.51, - "learning_rate": 2.8701060070671377e-06, - "loss": 0.2749, - "step": 8500 - }, - { - "epoch": 29.55, - "learning_rate": 2.8686925795053005e-06, - "loss": 0.2399, - "step": 8510 - }, - { - "epoch": 29.58, - "learning_rate": 2.867279151943463e-06, - "loss": 0.2557, - "step": 8520 - }, - { - "epoch": 29.62, - "learning_rate": 2.865865724381625e-06, - "loss": 0.2561, - "step": 8530 - }, - { - "epoch": 29.65, - "learning_rate": 2.8644522968197877e-06, - "loss": 0.2758, - "step": 8540 - }, - { - "epoch": 29.69, - "learning_rate": 2.86303886925795e-06, - "loss": 0.2755, - "step": 8550 - }, - { - "epoch": 29.72, - "learning_rate": 2.861625441696113e-06, - "loss": 0.2732, - "step": 8560 - }, - { - "epoch": 29.75, - "learning_rate": 2.860212014134276e-06, - "loss": 0.282, - "step": 8570 - }, - { - "epoch": 29.79, - "learning_rate": 2.8587985865724382e-06, - "loss": 0.2516, - "step": 8580 - }, - { - "epoch": 29.82, - "learning_rate": 2.8573851590106e-06, - "loss": 0.2953, - "step": 8590 - }, - { - "epoch": 29.86, - "learning_rate": 2.855971731448763e-06, - "loss": 0.3114, - "step": 8600 - }, - { - "epoch": 29.89, - "learning_rate": 2.8545583038869254e-06, - "loss": 0.2853, - "step": 8610 - }, - { - "epoch": 29.93, - "learning_rate": 2.8531448763250883e-06, - "loss": 0.2648, - "step": 8620 - }, - { - "epoch": 29.96, - "learning_rate": 2.8517314487632507e-06, - "loss": 0.2812, - "step": 8630 - }, - { - "epoch": 30.0, - "learning_rate": 2.8503180212014135e-06, - "loss": 0.2591, - "step": 8640 - }, - { - "epoch": 30.0, - "eval_loss": 0.5109365582466125, - "eval_runtime": 129.6483, - "eval_samples_per_second": 4.103, - "eval_steps_per_second": 1.026, - "eval_wer": 0.1989458121745838, - "step": 8640 - }, - { - "epoch": 30.03, - "learning_rate": 2.8489045936395755e-06, - "loss": 0.272, - "step": 8650 - }, - { - "epoch": 30.07, - "learning_rate": 2.8474911660777383e-06, - "loss": 0.2787, - "step": 8660 - }, - { - "epoch": 30.1, - "learning_rate": 2.8460777385159007e-06, - "loss": 0.2711, - "step": 8670 - }, - { - "epoch": 30.14, - "learning_rate": 2.8446643109540636e-06, - "loss": 0.2828, - "step": 8680 - }, - { - "epoch": 30.17, - "learning_rate": 2.843250883392226e-06, - "loss": 0.2688, - "step": 8690 - }, - { - "epoch": 30.21, - "learning_rate": 2.8418374558303884e-06, - "loss": 0.2588, - "step": 8700 - }, - { - "epoch": 30.24, - "learning_rate": 2.840424028268551e-06, - "loss": 0.2539, - "step": 8710 - }, - { - "epoch": 30.28, - "learning_rate": 2.8390106007067136e-06, - "loss": 0.2443, - "step": 8720 - }, - { - "epoch": 30.31, - "learning_rate": 2.837597173144876e-06, - "loss": 0.2713, - "step": 8730 - }, - { - "epoch": 30.35, - "learning_rate": 2.836183745583039e-06, - "loss": 0.2811, - "step": 8740 - }, - { - "epoch": 30.38, - "learning_rate": 2.8347703180212013e-06, - "loss": 0.2653, - "step": 8750 - }, - { - "epoch": 30.42, - "learning_rate": 2.8333568904593637e-06, - "loss": 0.276, - "step": 8760 - }, - { - "epoch": 30.45, - "learning_rate": 2.831943462897526e-06, - "loss": 0.2519, - "step": 8770 - }, - { - "epoch": 30.48, - "learning_rate": 2.830530035335689e-06, - "loss": 0.2805, - "step": 8780 - }, - { - "epoch": 30.52, - "learning_rate": 2.8291166077738514e-06, - "loss": 0.2823, - "step": 8790 - }, - { - "epoch": 30.55, - "learning_rate": 2.827703180212014e-06, - "loss": 0.2714, - "step": 8800 - }, - { - "epoch": 30.59, - "learning_rate": 2.826289752650176e-06, - "loss": 0.2786, - "step": 8810 - }, - { - "epoch": 30.62, - "learning_rate": 2.824876325088339e-06, - "loss": 0.2636, - "step": 8820 - }, - { - "epoch": 30.66, - "learning_rate": 2.8234628975265014e-06, - "loss": 0.2723, - "step": 8830 - }, - { - "epoch": 30.69, - "learning_rate": 2.8220494699646643e-06, - "loss": 0.2795, - "step": 8840 - }, - { - "epoch": 30.73, - "learning_rate": 2.8206360424028267e-06, - "loss": 0.2547, - "step": 8850 - }, - { - "epoch": 30.76, - "learning_rate": 2.8192226148409895e-06, - "loss": 0.256, - "step": 8860 - }, - { - "epoch": 30.8, - "learning_rate": 2.8178091872791515e-06, - "loss": 0.2494, - "step": 8870 - }, - { - "epoch": 30.83, - "learning_rate": 2.8163957597173143e-06, - "loss": 0.2634, - "step": 8880 - }, - { - "epoch": 30.87, - "learning_rate": 2.8149823321554767e-06, - "loss": 0.2868, - "step": 8890 - }, - { - "epoch": 30.9, - "learning_rate": 2.8135689045936396e-06, - "loss": 0.247, - "step": 8900 - }, - { - "epoch": 30.94, - "learning_rate": 2.812155477031802e-06, - "loss": 0.2527, - "step": 8910 - }, - { - "epoch": 30.97, - "learning_rate": 2.810742049469965e-06, - "loss": 0.2777, - "step": 8920 - }, - { - "epoch": 31.0, - "eval_loss": 0.5179172158241272, - "eval_runtime": 129.9918, - "eval_samples_per_second": 4.093, - "eval_steps_per_second": 1.023, - "eval_wer": 0.19939577039274925, - "step": 8928 - }, - { - "epoch": 31.01, - "learning_rate": 2.8093286219081268e-06, - "loss": 0.2692, - "step": 8930 - }, - { - "epoch": 31.04, - "learning_rate": 2.8079151943462896e-06, - "loss": 0.2848, - "step": 8940 - }, - { - "epoch": 31.08, - "learning_rate": 2.806501766784452e-06, - "loss": 0.2704, - "step": 8950 - }, - { - "epoch": 31.11, - "learning_rate": 2.805088339222615e-06, - "loss": 0.253, - "step": 8960 - }, - { - "epoch": 31.15, - "learning_rate": 2.8036749116607773e-06, - "loss": 0.3008, - "step": 8970 - }, - { - "epoch": 31.18, - "learning_rate": 2.8022614840989397e-06, - "loss": 0.2674, - "step": 8980 - }, - { - "epoch": 31.21, - "learning_rate": 2.800848056537102e-06, - "loss": 0.2581, - "step": 8990 - }, - { - "epoch": 31.25, - "learning_rate": 2.799434628975265e-06, - "loss": 0.2539, - "step": 9000 - }, - { - "epoch": 31.28, - "learning_rate": 2.7980212014134273e-06, - "loss": 0.2625, - "step": 9010 - }, - { - "epoch": 31.32, - "learning_rate": 2.79660777385159e-06, - "loss": 0.2533, - "step": 9020 - }, - { - "epoch": 31.35, - "learning_rate": 2.7951943462897526e-06, - "loss": 0.2822, - "step": 9030 - }, - { - "epoch": 31.39, - "learning_rate": 2.793780918727915e-06, - "loss": 0.2678, - "step": 9040 - }, - { - "epoch": 31.42, - "learning_rate": 2.7923674911660774e-06, - "loss": 0.26, - "step": 9050 - }, - { - "epoch": 31.46, - "learning_rate": 2.7909540636042402e-06, - "loss": 0.2568, - "step": 9060 - }, - { - "epoch": 31.49, - "learning_rate": 2.7895406360424026e-06, - "loss": 0.2713, - "step": 9070 - }, - { - "epoch": 31.53, - "learning_rate": 2.7881272084805655e-06, - "loss": 0.2664, - "step": 9080 - }, - { - "epoch": 31.56, - "learning_rate": 2.786713780918728e-06, - "loss": 0.2682, - "step": 9090 - }, - { - "epoch": 31.6, - "learning_rate": 2.7853003533568903e-06, - "loss": 0.2739, - "step": 9100 - }, - { - "epoch": 31.63, - "learning_rate": 2.7838869257950527e-06, - "loss": 0.2553, - "step": 9110 - }, - { - "epoch": 31.66, - "learning_rate": 2.7824734982332155e-06, - "loss": 0.2882, - "step": 9120 - }, - { - "epoch": 31.7, - "learning_rate": 2.781060070671378e-06, - "loss": 0.252, - "step": 9130 - }, - { - "epoch": 31.73, - "learning_rate": 2.7796466431095408e-06, - "loss": 0.257, - "step": 9140 - }, - { - "epoch": 31.77, - "learning_rate": 2.7782332155477028e-06, - "loss": 0.271, - "step": 9150 - }, - { - "epoch": 31.8, - "learning_rate": 2.7768197879858656e-06, - "loss": 0.263, - "step": 9160 - }, - { - "epoch": 31.84, - "learning_rate": 2.775406360424028e-06, - "loss": 0.2663, - "step": 9170 - }, - { - "epoch": 31.87, - "learning_rate": 2.773992932862191e-06, - "loss": 0.274, - "step": 9180 - }, - { - "epoch": 31.91, - "learning_rate": 2.7725795053003532e-06, - "loss": 0.2567, - "step": 9190 - }, - { - "epoch": 31.94, - "learning_rate": 2.771166077738516e-06, - "loss": 0.2676, - "step": 9200 - }, - { - "epoch": 31.98, - "learning_rate": 2.769752650176678e-06, - "loss": 0.2784, - "step": 9210 - }, - { - "epoch": 32.0, - "eval_loss": 0.518265962600708, - "eval_runtime": 129.4613, - "eval_samples_per_second": 4.109, - "eval_steps_per_second": 1.027, - "eval_wer": 0.1989458121745838, - "step": 9216 - }, - { - "epoch": 32.01, - "learning_rate": 2.768339222614841e-06, - "loss": 0.2617, - "step": 9220 - }, - { - "epoch": 32.05, - "learning_rate": 2.7669257950530033e-06, - "loss": 0.2787, - "step": 9230 - }, - { - "epoch": 32.08, - "learning_rate": 2.765512367491166e-06, - "loss": 0.2495, - "step": 9240 - }, - { - "epoch": 32.12, - "learning_rate": 2.7640989399293285e-06, - "loss": 0.249, - "step": 9250 - }, - { - "epoch": 32.15, - "learning_rate": 2.7626855123674914e-06, - "loss": 0.2824, - "step": 9260 - }, - { - "epoch": 32.19, - "learning_rate": 2.7612720848056534e-06, - "loss": 0.2872, - "step": 9270 - }, - { - "epoch": 32.22, - "learning_rate": 2.759858657243816e-06, - "loss": 0.2743, - "step": 9280 - }, - { - "epoch": 32.26, - "learning_rate": 2.7585865724381622e-06, - "loss": 0.2752, - "step": 9290 - }, - { - "epoch": 32.29, - "learning_rate": 2.757173144876325e-06, - "loss": 0.2671, - "step": 9300 - }, - { - "epoch": 32.33, - "learning_rate": 2.7557597173144875e-06, - "loss": 0.2559, - "step": 9310 - }, - { - "epoch": 32.36, - "learning_rate": 2.7543462897526503e-06, - "loss": 0.2762, - "step": 9320 - }, - { - "epoch": 32.39, - "learning_rate": 2.7529328621908127e-06, - "loss": 0.2633, - "step": 9330 - }, - { - "epoch": 32.43, - "learning_rate": 2.751519434628975e-06, - "loss": 0.2554, - "step": 9340 - }, - { - "epoch": 32.46, - "learning_rate": 2.7501060070671375e-06, - "loss": 0.2922, - "step": 9350 - }, - { - "epoch": 32.5, - "learning_rate": 2.7486925795053004e-06, - "loss": 0.2827, - "step": 9360 - }, - { - "epoch": 32.53, - "learning_rate": 2.747279151943463e-06, - "loss": 0.2491, - "step": 9370 - }, - { - "epoch": 32.57, - "learning_rate": 2.7458657243816256e-06, - "loss": 0.2386, - "step": 9380 - }, - { - "epoch": 32.6, - "learning_rate": 2.744452296819788e-06, - "loss": 0.2375, - "step": 9390 - }, - { - "epoch": 32.64, - "learning_rate": 2.7430388692579504e-06, - "loss": 0.2663, - "step": 9400 - }, - { - "epoch": 32.67, - "learning_rate": 2.741625441696113e-06, - "loss": 0.2674, - "step": 9410 - }, - { - "epoch": 32.71, - "learning_rate": 2.7402120141342757e-06, - "loss": 0.2609, - "step": 9420 - }, - { - "epoch": 32.74, - "learning_rate": 2.738798586572438e-06, - "loss": 0.2538, - "step": 9430 - }, - { - "epoch": 32.78, - "learning_rate": 2.737385159010601e-06, - "loss": 0.268, - "step": 9440 - }, - { - "epoch": 32.81, - "learning_rate": 2.735971731448763e-06, - "loss": 0.2698, - "step": 9450 - }, - { - "epoch": 32.85, - "learning_rate": 2.7345583038869257e-06, - "loss": 0.2826, - "step": 9460 - }, - { - "epoch": 32.88, - "learning_rate": 2.733144876325088e-06, - "loss": 0.249, - "step": 9470 - }, - { - "epoch": 32.91, - "learning_rate": 2.731731448763251e-06, - "loss": 0.2555, - "step": 9480 - }, - { - "epoch": 32.95, - "learning_rate": 2.7303180212014134e-06, - "loss": 0.243, - "step": 9490 - }, - { - "epoch": 32.98, - "learning_rate": 2.7289045936395762e-06, - "loss": 0.2801, - "step": 9500 - }, - { - "epoch": 33.0, - "eval_loss": 0.5222018957138062, - "eval_runtime": 129.2645, - "eval_samples_per_second": 4.116, - "eval_steps_per_second": 1.029, - "eval_wer": 0.20029568682908017, - "step": 9504 - }, - { - "epoch": 33.02, - "learning_rate": 2.7274911660777382e-06, - "loss": 0.2721, - "step": 9510 - }, - { - "epoch": 33.06, - "learning_rate": 2.7260777385159006e-06, - "loss": 0.2799, - "step": 9520 - }, - { - "epoch": 33.09, - "learning_rate": 2.7246643109540635e-06, - "loss": 0.2719, - "step": 9530 - }, - { - "epoch": 33.12, - "learning_rate": 2.7232508833922263e-06, - "loss": 0.2716, - "step": 9540 - }, - { - "epoch": 33.16, - "learning_rate": 2.7218374558303887e-06, - "loss": 0.2768, - "step": 9550 - }, - { - "epoch": 33.19, - "learning_rate": 2.7204240282685515e-06, - "loss": 0.2619, - "step": 9560 - }, - { - "epoch": 33.23, - "learning_rate": 2.7190106007067135e-06, - "loss": 0.2864, - "step": 9570 - }, - { - "epoch": 33.26, - "learning_rate": 2.717597173144876e-06, - "loss": 0.2651, - "step": 9580 - }, - { - "epoch": 33.3, - "learning_rate": 2.7161837455830388e-06, - "loss": 0.2799, - "step": 9590 - }, - { - "epoch": 33.33, - "learning_rate": 2.714770318021201e-06, - "loss": 0.2821, - "step": 9600 - }, - { - "epoch": 33.37, - "learning_rate": 2.713356890459364e-06, - "loss": 0.2742, - "step": 9610 - }, - { - "epoch": 33.4, - "learning_rate": 2.711943462897526e-06, - "loss": 0.267, - "step": 9620 - }, - { - "epoch": 33.44, - "learning_rate": 2.710530035335689e-06, - "loss": 0.2676, - "step": 9630 - }, - { - "epoch": 33.47, - "learning_rate": 2.7091166077738512e-06, - "loss": 0.2992, - "step": 9640 - }, - { - "epoch": 33.51, - "learning_rate": 2.707703180212014e-06, - "loss": 0.3028, - "step": 9650 - }, - { - "epoch": 33.54, - "learning_rate": 2.7062897526501765e-06, - "loss": 0.2624, - "step": 9660 - }, - { - "epoch": 33.57, - "learning_rate": 2.7048763250883393e-06, - "loss": 0.2673, - "step": 9670 - }, - { - "epoch": 33.61, - "learning_rate": 2.7034628975265013e-06, - "loss": 0.2599, - "step": 9680 - }, - { - "epoch": 33.64, - "learning_rate": 2.702049469964664e-06, - "loss": 0.2548, - "step": 9690 - }, - { - "epoch": 33.68, - "learning_rate": 2.7006360424028265e-06, - "loss": 0.2647, - "step": 9700 - }, - { - "epoch": 33.71, - "learning_rate": 2.6992226148409894e-06, - "loss": 0.264, - "step": 9710 - }, - { - "epoch": 33.75, - "learning_rate": 2.6978091872791518e-06, - "loss": 0.2615, - "step": 9720 - }, - { - "epoch": 33.78, - "learning_rate": 2.696395759717314e-06, - "loss": 0.2579, - "step": 9730 - }, - { - "epoch": 33.82, - "learning_rate": 2.6949823321554766e-06, - "loss": 0.2806, - "step": 9740 - }, - { - "epoch": 33.85, - "learning_rate": 2.6935689045936394e-06, - "loss": 0.2679, - "step": 9750 - }, - { - "epoch": 33.89, - "learning_rate": 2.692155477031802e-06, - "loss": 0.2415, - "step": 9760 - }, - { - "epoch": 33.92, - "learning_rate": 2.6907420494699647e-06, - "loss": 0.2645, - "step": 9770 - }, - { - "epoch": 33.96, - "learning_rate": 2.689328621908127e-06, - "loss": 0.2602, - "step": 9780 - }, - { - "epoch": 33.99, - "learning_rate": 2.6879151943462895e-06, - "loss": 0.2554, - "step": 9790 - }, - { - "epoch": 34.0, - "eval_loss": 0.5137259364128113, - "eval_runtime": 129.6969, - "eval_samples_per_second": 4.102, - "eval_steps_per_second": 1.025, - "eval_wer": 0.199010091920036, - "step": 9792 - }, - { - "epoch": 34.03, - "learning_rate": 2.686501766784452e-06, - "loss": 0.2962, - "step": 9800 - }, - { - "epoch": 34.06, - "learning_rate": 2.6850883392226147e-06, - "loss": 0.2692, - "step": 9810 - }, - { - "epoch": 34.1, - "learning_rate": 2.683674911660777e-06, - "loss": 0.2522, - "step": 9820 - }, - { - "epoch": 34.13, - "learning_rate": 2.68226148409894e-06, - "loss": 0.2894, - "step": 9830 - }, - { - "epoch": 34.17, - "learning_rate": 2.6808480565371024e-06, - "loss": 0.2864, - "step": 9840 - }, - { - "epoch": 34.2, - "learning_rate": 2.679434628975265e-06, - "loss": 0.2564, - "step": 9850 - }, - { - "epoch": 34.24, - "learning_rate": 2.678021201413427e-06, - "loss": 0.2632, - "step": 9860 - }, - { - "epoch": 34.27, - "learning_rate": 2.67660777385159e-06, - "loss": 0.2442, - "step": 9870 - }, - { - "epoch": 34.3, - "learning_rate": 2.6751943462897525e-06, - "loss": 0.2923, - "step": 9880 - }, - { - "epoch": 34.34, - "learning_rate": 2.6737809187279153e-06, - "loss": 0.2789, - "step": 9890 - }, - { - "epoch": 34.37, - "learning_rate": 2.6723674911660773e-06, - "loss": 0.2835, - "step": 9900 - }, - { - "epoch": 34.41, - "learning_rate": 2.67095406360424e-06, - "loss": 0.2634, - "step": 9910 - }, - { - "epoch": 34.44, - "learning_rate": 2.6695406360424025e-06, - "loss": 0.2771, - "step": 9920 - }, - { - "epoch": 34.48, - "learning_rate": 2.6681272084805653e-06, - "loss": 0.2659, - "step": 9930 - }, - { - "epoch": 34.51, - "learning_rate": 2.6667137809187278e-06, - "loss": 0.2556, - "step": 9940 - }, - { - "epoch": 34.55, - "learning_rate": 2.6653003533568906e-06, - "loss": 0.2524, - "step": 9950 - }, - { - "epoch": 34.58, - "learning_rate": 2.6638869257950526e-06, - "loss": 0.2783, - "step": 9960 - }, - { - "epoch": 34.62, - "learning_rate": 2.6624734982332154e-06, - "loss": 0.245, - "step": 9970 - }, - { - "epoch": 34.65, - "learning_rate": 2.661060070671378e-06, - "loss": 0.2642, - "step": 9980 - }, - { - "epoch": 34.69, - "learning_rate": 2.6596466431095407e-06, - "loss": 0.2945, - "step": 9990 - }, - { - "epoch": 34.72, - "learning_rate": 2.658233215547703e-06, - "loss": 0.25, - "step": 10000 - }, - { - "epoch": 34.75, - "learning_rate": 2.656819787985866e-06, - "loss": 0.2635, - "step": 10010 - }, - { - "epoch": 34.79, - "learning_rate": 2.655406360424028e-06, - "loss": 0.2492, - "step": 10020 - }, - { - "epoch": 34.82, - "learning_rate": 2.6539929328621907e-06, - "loss": 0.2789, - "step": 10030 - }, - { - "epoch": 34.86, - "learning_rate": 2.652579505300353e-06, - "loss": 0.2797, - "step": 10040 - }, - { - "epoch": 34.89, - "learning_rate": 2.651166077738516e-06, - "loss": 0.2378, - "step": 10050 - }, - { - "epoch": 34.93, - "learning_rate": 2.6497526501766784e-06, - "loss": 0.2545, - "step": 10060 - }, - { - "epoch": 34.96, - "learning_rate": 2.6483392226148408e-06, - "loss": 0.2677, - "step": 10070 - }, - { - "epoch": 35.0, - "learning_rate": 2.646925795053003e-06, - "loss": 0.2708, - "step": 10080 - }, - { - "epoch": 35.0, - "eval_loss": 0.5093948841094971, - "eval_runtime": 129.527, - "eval_samples_per_second": 4.107, - "eval_steps_per_second": 1.027, - "eval_wer": 0.19643890210194767, - "step": 10080 - }, - { - "epoch": 35.03, - "learning_rate": 2.645512367491166e-06, - "loss": 0.2628, - "step": 10090 - }, - { - "epoch": 35.07, - "learning_rate": 2.6440989399293284e-06, - "loss": 0.263, - "step": 10100 - }, - { - "epoch": 35.1, - "learning_rate": 2.6426855123674913e-06, - "loss": 0.241, - "step": 10110 - }, - { - "epoch": 35.14, - "learning_rate": 2.6412720848056537e-06, - "loss": 0.2802, - "step": 10120 - }, - { - "epoch": 35.17, - "learning_rate": 2.639858657243816e-06, - "loss": 0.2675, - "step": 10130 - }, - { - "epoch": 35.21, - "learning_rate": 2.6384452296819785e-06, - "loss": 0.2626, - "step": 10140 - }, - { - "epoch": 35.24, - "learning_rate": 2.6370318021201413e-06, - "loss": 0.2853, - "step": 10150 - }, - { - "epoch": 35.28, - "learning_rate": 2.6356183745583037e-06, - "loss": 0.2683, - "step": 10160 - }, - { - "epoch": 35.31, - "learning_rate": 2.6342049469964666e-06, - "loss": 0.269, - "step": 10170 - }, - { - "epoch": 35.35, - "learning_rate": 2.632791519434629e-06, - "loss": 0.2872, - "step": 10180 - }, - { - "epoch": 35.38, - "learning_rate": 2.6313780918727914e-06, - "loss": 0.2519, - "step": 10190 - }, - { - "epoch": 35.42, - "learning_rate": 2.629964664310954e-06, - "loss": 0.2554, - "step": 10200 - }, - { - "epoch": 35.45, - "learning_rate": 2.6285512367491166e-06, - "loss": 0.2548, - "step": 10210 - }, - { - "epoch": 35.48, - "learning_rate": 2.627137809187279e-06, - "loss": 0.291, - "step": 10220 - }, - { - "epoch": 35.52, - "learning_rate": 2.625724381625442e-06, - "loss": 0.2507, - "step": 10230 - }, - { - "epoch": 35.55, - "learning_rate": 2.624310954063604e-06, - "loss": 0.2681, - "step": 10240 - }, - { - "epoch": 35.59, - "learning_rate": 2.6228975265017667e-06, - "loss": 0.2637, - "step": 10250 - }, - { - "epoch": 35.62, - "learning_rate": 2.621484098939929e-06, - "loss": 0.2707, - "step": 10260 - }, - { - "epoch": 35.66, - "learning_rate": 2.620070671378092e-06, - "loss": 0.2784, - "step": 10270 - }, - { - "epoch": 35.69, - "learning_rate": 2.6186572438162543e-06, - "loss": 0.28, - "step": 10280 - }, - { - "epoch": 35.73, - "learning_rate": 2.617243816254417e-06, - "loss": 0.2459, - "step": 10290 - }, - { - "epoch": 35.76, - "learning_rate": 2.615830388692579e-06, - "loss": 0.2663, - "step": 10300 - }, - { - "epoch": 35.8, - "learning_rate": 2.614416961130742e-06, - "loss": 0.2546, - "step": 10310 - }, - { - "epoch": 35.83, - "learning_rate": 2.6130035335689044e-06, - "loss": 0.2632, - "step": 10320 - }, - { - "epoch": 35.87, - "learning_rate": 2.6115901060070672e-06, - "loss": 0.2692, - "step": 10330 - }, - { - "epoch": 35.9, - "learning_rate": 2.6101766784452296e-06, - "loss": 0.292, - "step": 10340 - }, - { - "epoch": 35.94, - "learning_rate": 2.608763250883392e-06, - "loss": 0.2487, - "step": 10350 - }, - { - "epoch": 35.97, - "learning_rate": 2.6073498233215545e-06, - "loss": 0.27, - "step": 10360 - }, - { - "epoch": 36.0, - "eval_loss": 0.5076168775558472, - "eval_runtime": 129.8583, - "eval_samples_per_second": 4.097, - "eval_steps_per_second": 1.024, - "eval_wer": 0.19798161599280067, - "step": 10368 - }, - { - "epoch": 36.01, - "learning_rate": 2.6059363957597173e-06, - "loss": 0.2559, - "step": 10370 - }, - { - "epoch": 36.04, - "learning_rate": 2.6045229681978797e-06, - "loss": 0.2505, - "step": 10380 - }, - { - "epoch": 36.08, - "learning_rate": 2.6031095406360425e-06, - "loss": 0.279, - "step": 10390 - }, - { - "epoch": 36.11, - "learning_rate": 2.601696113074205e-06, - "loss": 0.2585, - "step": 10400 - }, - { - "epoch": 36.15, - "learning_rate": 2.6002826855123674e-06, - "loss": 0.2484, - "step": 10410 - }, - { - "epoch": 36.18, - "learning_rate": 2.5988692579505298e-06, - "loss": 0.2734, - "step": 10420 - }, - { - "epoch": 36.21, - "learning_rate": 2.5974558303886926e-06, - "loss": 0.2707, - "step": 10430 - }, - { - "epoch": 36.25, - "learning_rate": 2.596042402826855e-06, - "loss": 0.2594, - "step": 10440 - }, - { - "epoch": 36.28, - "learning_rate": 2.594628975265018e-06, - "loss": 0.248, - "step": 10450 - }, - { - "epoch": 36.32, - "learning_rate": 2.5932155477031803e-06, - "loss": 0.2647, - "step": 10460 - }, - { - "epoch": 36.35, - "learning_rate": 2.5918021201413427e-06, - "loss": 0.2599, - "step": 10470 - }, - { - "epoch": 36.39, - "learning_rate": 2.590388692579505e-06, - "loss": 0.267, - "step": 10480 - }, - { - "epoch": 36.42, - "learning_rate": 2.588975265017668e-06, - "loss": 0.2639, - "step": 10490 - }, - { - "epoch": 36.46, - "learning_rate": 2.5875618374558303e-06, - "loss": 0.2715, - "step": 10500 - }, - { - "epoch": 36.49, - "learning_rate": 2.586148409893993e-06, - "loss": 0.3031, - "step": 10510 - }, - { - "epoch": 36.53, - "learning_rate": 2.584734982332155e-06, - "loss": 0.2996, - "step": 10520 - }, - { - "epoch": 36.56, - "learning_rate": 2.583321554770318e-06, - "loss": 0.2586, - "step": 10530 - }, - { - "epoch": 36.6, - "learning_rate": 2.5819081272084804e-06, - "loss": 0.2514, - "step": 10540 - }, - { - "epoch": 36.63, - "learning_rate": 2.580494699646643e-06, - "loss": 0.255, - "step": 10550 - }, - { - "epoch": 36.66, - "learning_rate": 2.5790812720848056e-06, - "loss": 0.2765, - "step": 10560 - }, - { - "epoch": 36.7, - "learning_rate": 2.5776678445229685e-06, - "loss": 0.2721, - "step": 10570 - }, - { - "epoch": 36.73, - "learning_rate": 2.5762544169611304e-06, - "loss": 0.2704, - "step": 10580 - }, - { - "epoch": 36.77, - "learning_rate": 2.5748409893992933e-06, - "loss": 0.2613, - "step": 10590 - }, - { - "epoch": 36.8, - "learning_rate": 2.5734275618374557e-06, - "loss": 0.2711, - "step": 10600 - }, - { - "epoch": 36.84, - "learning_rate": 2.5720141342756185e-06, - "loss": 0.2769, - "step": 10610 - }, - { - "epoch": 36.87, - "learning_rate": 2.570600706713781e-06, - "loss": 0.2635, - "step": 10620 - }, - { - "epoch": 36.91, - "learning_rate": 2.5691872791519438e-06, - "loss": 0.2655, - "step": 10630 - }, - { - "epoch": 36.94, - "learning_rate": 2.5677738515901057e-06, - "loss": 0.2689, - "step": 10640 - }, - { - "epoch": 36.98, - "learning_rate": 2.566360424028268e-06, - "loss": 0.2706, - "step": 10650 - }, - { - "epoch": 37.0, - "eval_loss": 0.5178768038749695, - "eval_runtime": 130.9202, - "eval_samples_per_second": 4.064, - "eval_steps_per_second": 1.016, - "eval_wer": 0.1983030147200617, - "step": 10656 - }, - { - "epoch": 37.01, - "learning_rate": 2.564946996466431e-06, - "loss": 0.2868, - "step": 10660 - }, - { - "epoch": 37.05, - "learning_rate": 2.5635335689045934e-06, - "loss": 0.2749, - "step": 10670 - }, - { - "epoch": 37.08, - "learning_rate": 2.5621201413427562e-06, - "loss": 0.2454, - "step": 10680 - }, - { - "epoch": 37.12, - "learning_rate": 2.5607067137809182e-06, - "loss": 0.283, - "step": 10690 - }, - { - "epoch": 37.15, - "learning_rate": 2.559293286219081e-06, - "loss": 0.2709, - "step": 10700 - }, - { - "epoch": 37.19, - "learning_rate": 2.5578798586572435e-06, - "loss": 0.2623, - "step": 10710 - }, - { - "epoch": 37.22, - "learning_rate": 2.5564664310954063e-06, - "loss": 0.2742, - "step": 10720 - }, - { - "epoch": 37.26, - "learning_rate": 2.5550530035335687e-06, - "loss": 0.2683, - "step": 10730 - }, - { - "epoch": 37.29, - "learning_rate": 2.5536395759717315e-06, - "loss": 0.251, - "step": 10740 - }, - { - "epoch": 37.33, - "learning_rate": 2.5522261484098935e-06, - "loss": 0.2613, - "step": 10750 - }, - { - "epoch": 37.36, - "learning_rate": 2.5508127208480564e-06, - "loss": 0.2655, - "step": 10760 - }, - { - "epoch": 37.39, - "learning_rate": 2.5493992932862188e-06, - "loss": 0.2723, - "step": 10770 - }, - { - "epoch": 37.43, - "learning_rate": 2.5479858657243816e-06, - "loss": 0.2675, - "step": 10780 - }, - { - "epoch": 37.46, - "learning_rate": 2.546572438162544e-06, - "loss": 0.2732, - "step": 10790 - }, - { - "epoch": 37.5, - "learning_rate": 2.545159010600707e-06, - "loss": 0.2773, - "step": 10800 - }, - { - "epoch": 37.53, - "learning_rate": 2.543745583038869e-06, - "loss": 0.2536, - "step": 10810 - }, - { - "epoch": 37.57, - "learning_rate": 2.5423321554770317e-06, - "loss": 0.2693, - "step": 10820 - }, - { - "epoch": 37.6, - "learning_rate": 2.540918727915194e-06, - "loss": 0.2498, - "step": 10830 - }, - { - "epoch": 37.64, - "learning_rate": 2.539505300353357e-06, - "loss": 0.2603, - "step": 10840 - }, - { - "epoch": 37.67, - "learning_rate": 2.5380918727915193e-06, - "loss": 0.2798, - "step": 10850 - }, - { - "epoch": 37.71, - "learning_rate": 2.5366784452296817e-06, - "loss": 0.2911, - "step": 10860 - }, - { - "epoch": 37.74, - "learning_rate": 2.535265017667844e-06, - "loss": 0.2625, - "step": 10870 - }, - { - "epoch": 37.78, - "learning_rate": 2.533851590106007e-06, - "loss": 0.2744, - "step": 10880 - }, - { - "epoch": 37.81, - "learning_rate": 2.5324381625441694e-06, - "loss": 0.2753, - "step": 10890 - }, - { - "epoch": 37.85, - "learning_rate": 2.531024734982332e-06, - "loss": 0.267, - "step": 10900 - }, - { - "epoch": 37.88, - "learning_rate": 2.5296113074204946e-06, - "loss": 0.2572, - "step": 10910 - }, - { - "epoch": 37.91, - "learning_rate": 2.528197879858657e-06, - "loss": 0.2551, - "step": 10920 - }, - { - "epoch": 37.95, - "learning_rate": 2.5267844522968194e-06, - "loss": 0.2469, - "step": 10930 - }, - { - "epoch": 37.98, - "learning_rate": 2.5253710247349823e-06, - "loss": 0.2791, - "step": 10940 - }, - { - "epoch": 38.0, - "eval_loss": 0.515429675579071, - "eval_runtime": 130.0554, - "eval_samples_per_second": 4.091, - "eval_steps_per_second": 1.023, - "eval_wer": 0.19759593752008742, - "step": 10944 - }, - { - "epoch": 38.02, - "learning_rate": 2.5239575971731447e-06, - "loss": 0.2944, - "step": 10950 - }, - { - "epoch": 38.06, - "learning_rate": 2.5225441696113075e-06, - "loss": 0.264, - "step": 10960 - }, - { - "epoch": 38.09, - "learning_rate": 2.52113074204947e-06, - "loss": 0.2722, - "step": 10970 - }, - { - "epoch": 38.12, - "learning_rate": 2.5197173144876323e-06, - "loss": 0.2692, - "step": 10980 - }, - { - "epoch": 38.16, - "learning_rate": 2.5183038869257947e-06, - "loss": 0.2607, - "step": 10990 - }, - { - "epoch": 38.19, - "learning_rate": 2.5168904593639576e-06, - "loss": 0.2412, - "step": 11000 - }, - { - "epoch": 38.23, - "learning_rate": 2.51547703180212e-06, - "loss": 0.2621, - "step": 11010 - }, - { - "epoch": 38.26, - "learning_rate": 2.514063604240283e-06, - "loss": 0.2383, - "step": 11020 - }, - { - "epoch": 38.3, - "learning_rate": 2.512650176678445e-06, - "loss": 0.2608, - "step": 11030 - }, - { - "epoch": 38.33, - "learning_rate": 2.5112367491166076e-06, - "loss": 0.2865, - "step": 11040 - }, - { - "epoch": 38.37, - "learning_rate": 2.50982332155477e-06, - "loss": 0.2529, - "step": 11050 - }, - { - "epoch": 38.4, - "learning_rate": 2.508409893992933e-06, - "loss": 0.2468, - "step": 11060 - }, - { - "epoch": 38.44, - "learning_rate": 2.5069964664310953e-06, - "loss": 0.2767, - "step": 11070 - }, - { - "epoch": 38.47, - "learning_rate": 2.505583038869258e-06, - "loss": 0.2832, - "step": 11080 - }, - { - "epoch": 38.51, - "learning_rate": 2.50416961130742e-06, - "loss": 0.2732, - "step": 11090 - }, - { - "epoch": 38.54, - "learning_rate": 2.502756183745583e-06, - "loss": 0.2604, - "step": 11100 - }, - { - "epoch": 38.57, - "learning_rate": 2.5013427561837453e-06, - "loss": 0.2797, - "step": 11110 - }, - { - "epoch": 38.61, - "learning_rate": 2.499929328621908e-06, - "loss": 0.2548, - "step": 11120 - }, - { - "epoch": 38.64, - "learning_rate": 2.4985159010600706e-06, - "loss": 0.2735, - "step": 11130 - }, - { - "epoch": 38.68, - "learning_rate": 2.497102473498233e-06, - "loss": 0.2544, - "step": 11140 - }, - { - "epoch": 38.71, - "learning_rate": 2.4956890459363954e-06, - "loss": 0.2744, - "step": 11150 - }, - { - "epoch": 38.75, - "learning_rate": 2.4942756183745582e-06, - "loss": 0.2696, - "step": 11160 - }, - { - "epoch": 38.78, - "learning_rate": 2.4928621908127206e-06, - "loss": 0.2339, - "step": 11170 - }, - { - "epoch": 38.82, - "learning_rate": 2.4914487632508835e-06, - "loss": 0.2658, - "step": 11180 - }, - { - "epoch": 38.85, - "learning_rate": 2.490035335689046e-06, - "loss": 0.2626, - "step": 11190 - }, - { - "epoch": 38.89, - "learning_rate": 2.4886219081272083e-06, - "loss": 0.2592, - "step": 11200 - }, - { - "epoch": 38.92, - "learning_rate": 2.4872084805653707e-06, - "loss": 0.2644, - "step": 11210 - }, - { - "epoch": 38.96, - "learning_rate": 2.4857950530035335e-06, - "loss": 0.2661, - "step": 11220 - }, - { - "epoch": 38.99, - "learning_rate": 2.484381625441696e-06, - "loss": 0.3148, - "step": 11230 - }, - { - "epoch": 39.0, - "eval_loss": 0.5082433223724365, - "eval_runtime": 132.6404, - "eval_samples_per_second": 4.011, - "eval_steps_per_second": 1.003, - "eval_wer": 0.199010091920036, - "step": 11232 - }, - { - "epoch": 39.03, - "learning_rate": 2.4829681978798588e-06, - "loss": 0.261, - "step": 11240 - }, - { - "epoch": 39.06, - "learning_rate": 2.481554770318021e-06, - "loss": 0.2706, - "step": 11250 - }, - { - "epoch": 39.1, - "learning_rate": 2.4801413427561836e-06, - "loss": 0.2532, - "step": 11260 - }, - { - "epoch": 39.13, - "learning_rate": 2.478727915194346e-06, - "loss": 0.2841, - "step": 11270 - }, - { - "epoch": 39.17, - "learning_rate": 2.477314487632509e-06, - "loss": 0.2502, - "step": 11280 - }, - { - "epoch": 39.2, - "learning_rate": 2.4759010600706713e-06, - "loss": 0.2579, - "step": 11290 - }, - { - "epoch": 39.24, - "learning_rate": 2.474487632508834e-06, - "loss": 0.2768, - "step": 11300 - }, - { - "epoch": 39.27, - "learning_rate": 2.473074204946996e-06, - "loss": 0.2351, - "step": 11310 - }, - { - "epoch": 39.3, - "learning_rate": 2.471660777385159e-06, - "loss": 0.2888, - "step": 11320 - }, - { - "epoch": 39.34, - "learning_rate": 2.4702473498233213e-06, - "loss": 0.2852, - "step": 11330 - }, - { - "epoch": 39.37, - "learning_rate": 2.468833922261484e-06, - "loss": 0.2604, - "step": 11340 - }, - { - "epoch": 39.41, - "learning_rate": 2.4674204946996466e-06, - "loss": 0.2629, - "step": 11350 - }, - { - "epoch": 39.44, - "learning_rate": 2.4660070671378094e-06, - "loss": 0.2291, - "step": 11360 - }, - { - "epoch": 39.48, - "learning_rate": 2.4645936395759714e-06, - "loss": 0.2684, - "step": 11370 - }, - { - "epoch": 39.51, - "learning_rate": 2.4631802120141342e-06, - "loss": 0.2635, - "step": 11380 - }, - { - "epoch": 39.55, - "learning_rate": 2.4617667844522966e-06, - "loss": 0.2524, - "step": 11390 - }, - { - "epoch": 39.58, - "learning_rate": 2.4603533568904595e-06, - "loss": 0.2813, - "step": 11400 - }, - { - "epoch": 39.62, - "learning_rate": 2.458939929328622e-06, - "loss": 0.2778, - "step": 11410 - }, - { - "epoch": 39.65, - "learning_rate": 2.4575265017667847e-06, - "loss": 0.2845, - "step": 11420 - }, - { - "epoch": 39.69, - "learning_rate": 2.4561130742049467e-06, - "loss": 0.2779, - "step": 11430 - }, - { - "epoch": 39.72, - "learning_rate": 2.4546996466431095e-06, - "loss": 0.2418, - "step": 11440 - }, - { - "epoch": 39.75, - "learning_rate": 2.453286219081272e-06, - "loss": 0.2493, - "step": 11450 - }, - { - "epoch": 39.79, - "learning_rate": 2.4518727915194348e-06, - "loss": 0.2677, - "step": 11460 - }, - { - "epoch": 39.82, - "learning_rate": 2.450459363957597e-06, - "loss": 0.2747, - "step": 11470 - }, - { - "epoch": 39.86, - "learning_rate": 2.4490459363957596e-06, - "loss": 0.2768, - "step": 11480 - }, - { - "epoch": 39.89, - "learning_rate": 2.447632508833922e-06, - "loss": 0.2705, - "step": 11490 - }, - { - "epoch": 39.93, - "learning_rate": 2.446219081272085e-06, - "loss": 0.2486, - "step": 11500 - }, - { - "epoch": 39.96, - "learning_rate": 2.4448056537102472e-06, - "loss": 0.2852, - "step": 11510 - }, - { - "epoch": 40.0, - "learning_rate": 2.44339222614841e-06, - "loss": 0.2834, - "step": 11520 - }, - { - "epoch": 40.0, - "eval_loss": 0.5106706023216248, - "eval_runtime": 132.6333, - "eval_samples_per_second": 4.011, - "eval_steps_per_second": 1.003, - "eval_wer": 0.19804589573825288, - "step": 11520 - }, - { - "epoch": 40.03, - "learning_rate": 2.4419787985865725e-06, - "loss": 0.2684, - "step": 11530 - }, - { - "epoch": 40.07, - "learning_rate": 2.440565371024735e-06, - "loss": 0.2851, - "step": 11540 - }, - { - "epoch": 40.1, - "learning_rate": 2.4391519434628973e-06, - "loss": 0.2619, - "step": 11550 - }, - { - "epoch": 40.14, - "learning_rate": 2.43773851590106e-06, - "loss": 0.2778, - "step": 11560 - }, - { - "epoch": 40.17, - "learning_rate": 2.4363250883392225e-06, - "loss": 0.2822, - "step": 11570 - }, - { - "epoch": 40.21, - "learning_rate": 2.4349116607773854e-06, - "loss": 0.2447, - "step": 11580 - }, - { - "epoch": 40.24, - "learning_rate": 2.4334982332155478e-06, - "loss": 0.2741, - "step": 11590 - }, - { - "epoch": 40.28, - "learning_rate": 2.43208480565371e-06, - "loss": 0.2678, - "step": 11600 - }, - { - "epoch": 40.31, - "learning_rate": 2.4306713780918726e-06, - "loss": 0.2677, - "step": 11610 - }, - { - "epoch": 40.35, - "learning_rate": 2.4292579505300354e-06, - "loss": 0.2553, - "step": 11620 - }, - { - "epoch": 40.38, - "learning_rate": 2.427844522968198e-06, - "loss": 0.262, - "step": 11630 - }, - { - "epoch": 40.42, - "learning_rate": 2.4264310954063607e-06, - "loss": 0.2346, - "step": 11640 - }, - { - "epoch": 40.45, - "learning_rate": 2.4250176678445227e-06, - "loss": 0.2454, - "step": 11650 - }, - { - "epoch": 40.48, - "learning_rate": 2.4236042402826855e-06, - "loss": 0.2916, - "step": 11660 - }, - { - "epoch": 40.52, - "learning_rate": 2.422190812720848e-06, - "loss": 0.2796, - "step": 11670 - }, - { - "epoch": 40.55, - "learning_rate": 2.4207773851590107e-06, - "loss": 0.2665, - "step": 11680 - }, - { - "epoch": 40.59, - "learning_rate": 2.419363957597173e-06, - "loss": 0.2589, - "step": 11690 - }, - { - "epoch": 40.62, - "learning_rate": 2.417950530035336e-06, - "loss": 0.2391, - "step": 11700 - }, - { - "epoch": 40.66, - "learning_rate": 2.416537102473498e-06, - "loss": 0.2641, - "step": 11710 - }, - { - "epoch": 40.69, - "learning_rate": 2.4151236749116604e-06, - "loss": 0.2821, - "step": 11720 - }, - { - "epoch": 40.73, - "learning_rate": 2.413710247349823e-06, - "loss": 0.2595, - "step": 11730 - }, - { - "epoch": 40.76, - "learning_rate": 2.4122968197879856e-06, - "loss": 0.2632, - "step": 11740 - }, - { - "epoch": 40.8, - "learning_rate": 2.4108833922261484e-06, - "loss": 0.2707, - "step": 11750 - }, - { - "epoch": 40.83, - "learning_rate": 2.4094699646643104e-06, - "loss": 0.2821, - "step": 11760 - }, - { - "epoch": 40.87, - "learning_rate": 2.4080565371024733e-06, - "loss": 0.27, - "step": 11770 - }, - { - "epoch": 40.9, - "learning_rate": 2.4066431095406357e-06, - "loss": 0.2556, - "step": 11780 - }, - { - "epoch": 40.94, - "learning_rate": 2.4052296819787985e-06, - "loss": 0.2552, - "step": 11790 - }, - { - "epoch": 40.97, - "learning_rate": 2.403816254416961e-06, - "loss": 0.2739, - "step": 11800 - }, - { - "epoch": 41.0, - "eval_loss": 0.5009294152259827, - "eval_runtime": 134.0218, - "eval_samples_per_second": 3.97, - "eval_steps_per_second": 0.992, - "eval_wer": 0.199010091920036, - "step": 11808 - }, - { - "epoch": 41.01, - "learning_rate": 2.4024028268551238e-06, - "loss": 0.2686, - "step": 11810 - }, - { - "epoch": 41.04, - "learning_rate": 2.4009893992932857e-06, - "loss": 0.2519, - "step": 11820 - }, - { - "epoch": 41.08, - "learning_rate": 2.3995759717314486e-06, - "loss": 0.2594, - "step": 11830 - }, - { - "epoch": 41.11, - "learning_rate": 2.398162544169611e-06, - "loss": 0.2581, - "step": 11840 - }, - { - "epoch": 41.15, - "learning_rate": 2.396749116607774e-06, - "loss": 0.2805, - "step": 11850 - }, - { - "epoch": 41.18, - "learning_rate": 2.3953356890459362e-06, - "loss": 0.2676, - "step": 11860 - }, - { - "epoch": 41.21, - "learning_rate": 2.393922261484099e-06, - "loss": 0.266, - "step": 11870 - }, - { - "epoch": 41.25, - "learning_rate": 2.392508833922261e-06, - "loss": 0.2659, - "step": 11880 - }, - { - "epoch": 41.28, - "learning_rate": 2.391095406360424e-06, - "loss": 0.2744, - "step": 11890 - }, - { - "epoch": 41.32, - "learning_rate": 2.3896819787985863e-06, - "loss": 0.2645, - "step": 11900 - }, - { - "epoch": 41.35, - "learning_rate": 2.388268551236749e-06, - "loss": 0.2566, - "step": 11910 - }, - { - "epoch": 41.39, - "learning_rate": 2.3868551236749115e-06, - "loss": 0.2739, - "step": 11920 - }, - { - "epoch": 41.42, - "learning_rate": 2.385441696113074e-06, - "loss": 0.2716, - "step": 11930 - }, - { - "epoch": 41.46, - "learning_rate": 2.3840282685512363e-06, - "loss": 0.2489, - "step": 11940 - }, - { - "epoch": 41.49, - "learning_rate": 2.382614840989399e-06, - "loss": 0.2852, - "step": 11950 - }, - { - "epoch": 41.53, - "learning_rate": 2.3812014134275616e-06, - "loss": 0.2709, - "step": 11960 - }, - { - "epoch": 41.56, - "learning_rate": 2.3797879858657244e-06, - "loss": 0.274, - "step": 11970 - }, - { - "epoch": 41.6, - "learning_rate": 2.378374558303887e-06, - "loss": 0.2656, - "step": 11980 - }, - { - "epoch": 41.63, - "learning_rate": 2.3769611307420492e-06, - "loss": 0.2745, - "step": 11990 - }, - { - "epoch": 41.66, - "learning_rate": 2.3755477031802117e-06, - "loss": 0.2757, - "step": 12000 - }, - { - "epoch": 41.7, - "learning_rate": 2.3741342756183745e-06, - "loss": 0.2799, - "step": 12010 - }, - { - "epoch": 41.73, - "learning_rate": 2.372720848056537e-06, - "loss": 0.2521, - "step": 12020 - }, - { - "epoch": 41.77, - "learning_rate": 2.3713074204946997e-06, - "loss": 0.2568, - "step": 12030 - }, - { - "epoch": 41.8, - "learning_rate": 2.369893992932862e-06, - "loss": 0.2557, - "step": 12040 - }, - { - "epoch": 41.84, - "learning_rate": 2.3684805653710245e-06, - "loss": 0.2617, - "step": 12050 - }, - { - "epoch": 41.87, - "learning_rate": 2.367067137809187e-06, - "loss": 0.2595, - "step": 12060 - }, - { - "epoch": 41.91, - "learning_rate": 2.36565371024735e-06, - "loss": 0.2647, - "step": 12070 - }, - { - "epoch": 41.94, - "learning_rate": 2.364240282685512e-06, - "loss": 0.2544, - "step": 12080 - }, - { - "epoch": 41.98, - "learning_rate": 2.362826855123675e-06, - "loss": 0.2687, - "step": 12090 - }, - { - "epoch": 42.0, - "eval_loss": 0.5231707692146301, - "eval_runtime": 133.0554, - "eval_samples_per_second": 3.998, - "eval_steps_per_second": 1.0, - "eval_wer": 0.20113132351995885, - "step": 12096 - }, - { - "epoch": 42.01, - "learning_rate": 2.361413427561837e-06, - "loss": 0.288, - "step": 12100 - }, - { - "epoch": 42.05, - "learning_rate": 2.36e-06, - "loss": 0.2828, - "step": 12110 - }, - { - "epoch": 42.08, - "learning_rate": 2.3585865724381623e-06, - "loss": 0.267, - "step": 12120 - }, - { - "epoch": 42.12, - "learning_rate": 2.357173144876325e-06, - "loss": 0.2614, - "step": 12130 - }, - { - "epoch": 42.15, - "learning_rate": 2.3557597173144875e-06, - "loss": 0.2614, - "step": 12140 - }, - { - "epoch": 42.19, - "learning_rate": 2.3543462897526503e-06, - "loss": 0.2936, - "step": 12150 - }, - { - "epoch": 42.22, - "learning_rate": 2.3529328621908123e-06, - "loss": 0.2661, - "step": 12160 - }, - { - "epoch": 42.26, - "learning_rate": 2.351519434628975e-06, - "loss": 0.2655, - "step": 12170 - }, - { - "epoch": 42.29, - "learning_rate": 2.3501060070671376e-06, - "loss": 0.2874, - "step": 12180 - }, - { - "epoch": 42.33, - "learning_rate": 2.3486925795053004e-06, - "loss": 0.2629, - "step": 12190 - }, - { - "epoch": 42.36, - "learning_rate": 2.347279151943463e-06, - "loss": 0.2498, - "step": 12200 - }, - { - "epoch": 42.39, - "learning_rate": 2.3458657243816256e-06, - "loss": 0.2821, - "step": 12210 - }, - { - "epoch": 42.43, - "learning_rate": 2.3444522968197876e-06, - "loss": 0.2461, - "step": 12220 - }, - { - "epoch": 42.46, - "learning_rate": 2.3430388692579505e-06, - "loss": 0.2809, - "step": 12230 - }, - { - "epoch": 42.5, - "learning_rate": 2.341625441696113e-06, - "loss": 0.2653, - "step": 12240 - }, - { - "epoch": 42.53, - "learning_rate": 2.3402120141342757e-06, - "loss": 0.2616, - "step": 12250 - }, - { - "epoch": 42.57, - "learning_rate": 2.338798586572438e-06, - "loss": 0.261, - "step": 12260 - }, - { - "epoch": 42.6, - "learning_rate": 2.3373851590106005e-06, - "loss": 0.2511, - "step": 12270 - }, - { - "epoch": 42.64, - "learning_rate": 2.335971731448763e-06, - "loss": 0.2572, - "step": 12280 - }, - { - "epoch": 42.67, - "learning_rate": 2.3345583038869258e-06, - "loss": 0.2928, - "step": 12290 - }, - { - "epoch": 42.71, - "learning_rate": 2.333144876325088e-06, - "loss": 0.2539, - "step": 12300 - }, - { - "epoch": 42.74, - "learning_rate": 2.331731448763251e-06, - "loss": 0.2707, - "step": 12310 - }, - { - "epoch": 42.78, - "learning_rate": 2.3303180212014134e-06, - "loss": 0.2607, - "step": 12320 - }, - { - "epoch": 42.81, - "learning_rate": 2.328904593639576e-06, - "loss": 0.2695, - "step": 12330 - }, - { - "epoch": 42.85, - "learning_rate": 2.3274911660777382e-06, - "loss": 0.2836, - "step": 12340 - }, - { - "epoch": 42.88, - "learning_rate": 2.326077738515901e-06, - "loss": 0.2677, - "step": 12350 - }, - { - "epoch": 42.91, - "learning_rate": 2.3246643109540635e-06, - "loss": 0.2583, - "step": 12360 - }, - { - "epoch": 42.95, - "learning_rate": 2.3232508833922263e-06, - "loss": 0.2554, - "step": 12370 - }, - { - "epoch": 42.98, - "learning_rate": 2.3218374558303883e-06, - "loss": 0.2696, - "step": 12380 - }, - { - "epoch": 43.0, - "eval_loss": 0.5108169913291931, - "eval_runtime": 133.4619, - "eval_samples_per_second": 3.986, - "eval_steps_per_second": 0.997, - "eval_wer": 0.19862441344732276, - "step": 12384 - }, - { - "epoch": 43.02, - "learning_rate": 2.320424028268551e-06, - "loss": 0.2739, - "step": 12390 - }, - { - "epoch": 43.06, - "learning_rate": 2.3190106007067135e-06, - "loss": 0.2612, - "step": 12400 - }, - { - "epoch": 43.09, - "learning_rate": 2.3175971731448764e-06, - "loss": 0.2596, - "step": 12410 - }, - { - "epoch": 43.12, - "learning_rate": 2.3161837455830388e-06, - "loss": 0.2777, - "step": 12420 - }, - { - "epoch": 43.16, - "learning_rate": 2.3147703180212016e-06, - "loss": 0.2487, - "step": 12430 - }, - { - "epoch": 43.19, - "learning_rate": 2.3133568904593636e-06, - "loss": 0.2452, - "step": 12440 - }, - { - "epoch": 43.23, - "learning_rate": 2.3119434628975264e-06, - "loss": 0.2495, - "step": 12450 - }, - { - "epoch": 43.26, - "learning_rate": 2.310530035335689e-06, - "loss": 0.2412, - "step": 12460 - }, - { - "epoch": 43.3, - "learning_rate": 2.3091166077738517e-06, - "loss": 0.2515, - "step": 12470 - }, - { - "epoch": 43.33, - "learning_rate": 2.307703180212014e-06, - "loss": 0.2955, - "step": 12480 - }, - { - "epoch": 43.37, - "learning_rate": 2.306289752650177e-06, - "loss": 0.2725, - "step": 12490 - }, - { - "epoch": 43.4, - "learning_rate": 2.304876325088339e-06, - "loss": 0.2414, - "step": 12500 - }, - { - "epoch": 43.44, - "learning_rate": 2.3034628975265017e-06, - "loss": 0.251, - "step": 12510 - }, - { - "epoch": 43.47, - "learning_rate": 2.302049469964664e-06, - "loss": 0.2579, - "step": 12520 - }, - { - "epoch": 43.51, - "learning_rate": 2.300636042402827e-06, - "loss": 0.2531, - "step": 12530 - }, - { - "epoch": 43.54, - "learning_rate": 2.2992226148409894e-06, - "loss": 0.247, - "step": 12540 - }, - { - "epoch": 43.57, - "learning_rate": 2.297809187279152e-06, - "loss": 0.278, - "step": 12550 - }, - { - "epoch": 43.61, - "learning_rate": 2.296395759717314e-06, - "loss": 0.2435, - "step": 12560 - }, - { - "epoch": 43.64, - "learning_rate": 2.294982332155477e-06, - "loss": 0.258, - "step": 12570 - }, - { - "epoch": 43.68, - "learning_rate": 2.2935689045936395e-06, - "loss": 0.2659, - "step": 12580 - }, - { - "epoch": 43.71, - "learning_rate": 2.2921554770318023e-06, - "loss": 0.2554, - "step": 12590 - }, - { - "epoch": 43.75, - "learning_rate": 2.2907420494699647e-06, - "loss": 0.2671, - "step": 12600 - }, - { - "epoch": 43.78, - "learning_rate": 2.289328621908127e-06, - "loss": 0.26, - "step": 12610 - }, - { - "epoch": 43.82, - "learning_rate": 2.2879151943462895e-06, - "loss": 0.2791, - "step": 12620 - }, - { - "epoch": 43.85, - "learning_rate": 2.2865017667844523e-06, - "loss": 0.2532, - "step": 12630 - }, - { - "epoch": 43.89, - "learning_rate": 2.2850883392226148e-06, - "loss": 0.2759, - "step": 12640 - }, - { - "epoch": 43.92, - "learning_rate": 2.2836749116607776e-06, - "loss": 0.2659, - "step": 12650 - }, - { - "epoch": 43.96, - "learning_rate": 2.28226148409894e-06, - "loss": 0.2672, - "step": 12660 - }, - { - "epoch": 43.99, - "learning_rate": 2.2808480565371024e-06, - "loss": 0.2729, - "step": 12670 - }, - { - "epoch": 44.0, - "eval_loss": 0.5158911943435669, - "eval_runtime": 133.2183, - "eval_samples_per_second": 3.993, - "eval_steps_per_second": 0.998, - "eval_wer": 0.1990743716654882, - "step": 12672 - }, - { - "epoch": 44.03, - "learning_rate": 2.279434628975265e-06, - "loss": 0.2755, - "step": 12680 - }, - { - "epoch": 44.06, - "learning_rate": 2.2780212014134277e-06, - "loss": 0.2787, - "step": 12690 - }, - { - "epoch": 44.1, - "learning_rate": 2.27660777385159e-06, - "loss": 0.2539, - "step": 12700 - }, - { - "epoch": 44.13, - "learning_rate": 2.275194346289753e-06, - "loss": 0.2686, - "step": 12710 - }, - { - "epoch": 44.17, - "learning_rate": 2.273780918727915e-06, - "loss": 0.2883, - "step": 12720 - }, - { - "epoch": 44.2, - "learning_rate": 2.2723674911660777e-06, - "loss": 0.2573, - "step": 12730 - }, - { - "epoch": 44.24, - "learning_rate": 2.27095406360424e-06, - "loss": 0.2739, - "step": 12740 - }, - { - "epoch": 44.27, - "learning_rate": 2.269540636042403e-06, - "loss": 0.2749, - "step": 12750 - }, - { - "epoch": 44.3, - "learning_rate": 2.2681272084805654e-06, - "loss": 0.275, - "step": 12760 - }, - { - "epoch": 44.34, - "learning_rate": 2.266713780918728e-06, - "loss": 0.2766, - "step": 12770 - }, - { - "epoch": 44.37, - "learning_rate": 2.26530035335689e-06, - "loss": 0.2475, - "step": 12780 - }, - { - "epoch": 44.41, - "learning_rate": 2.2638869257950526e-06, - "loss": 0.2739, - "step": 12790 - }, - { - "epoch": 44.44, - "learning_rate": 2.2624734982332154e-06, - "loss": 0.2448, - "step": 12800 - }, - { - "epoch": 44.48, - "learning_rate": 2.2610600706713783e-06, - "loss": 0.2801, - "step": 12810 - }, - { - "epoch": 44.51, - "learning_rate": 2.2596466431095407e-06, - "loss": 0.2575, - "step": 12820 - }, - { - "epoch": 44.55, - "learning_rate": 2.2582332155477035e-06, - "loss": 0.249, - "step": 12830 - }, - { - "epoch": 44.58, - "learning_rate": 2.2568197879858655e-06, - "loss": 0.2546, - "step": 12840 - }, - { - "epoch": 44.62, - "learning_rate": 2.255406360424028e-06, - "loss": 0.2462, - "step": 12850 - }, - { - "epoch": 44.65, - "learning_rate": 2.2539929328621907e-06, - "loss": 0.2588, - "step": 12860 - }, - { - "epoch": 44.69, - "learning_rate": 2.252579505300353e-06, - "loss": 0.2569, - "step": 12870 - }, - { - "epoch": 44.72, - "learning_rate": 2.251166077738516e-06, - "loss": 0.2515, - "step": 12880 - }, - { - "epoch": 44.75, - "learning_rate": 2.249752650176678e-06, - "loss": 0.2564, - "step": 12890 - }, - { - "epoch": 44.79, - "learning_rate": 2.248339222614841e-06, - "loss": 0.2579, - "step": 12900 - }, - { - "epoch": 44.82, - "learning_rate": 2.246925795053003e-06, - "loss": 0.2831, - "step": 12910 - }, - { - "epoch": 44.86, - "learning_rate": 2.245512367491166e-06, - "loss": 0.2546, - "step": 12920 - }, - { - "epoch": 44.89, - "learning_rate": 2.2440989399293284e-06, - "loss": 0.2653, - "step": 12930 - }, - { - "epoch": 44.93, - "learning_rate": 2.2426855123674913e-06, - "loss": 0.2527, - "step": 12940 - }, - { - "epoch": 44.96, - "learning_rate": 2.2412720848056533e-06, - "loss": 0.2692, - "step": 12950 - }, - { - "epoch": 45.0, - "learning_rate": 2.239858657243816e-06, - "loss": 0.2579, - "step": 12960 - }, - { - "epoch": 45.0, - "eval_loss": 0.516213059425354, - "eval_runtime": 133.2787, - "eval_samples_per_second": 3.992, - "eval_steps_per_second": 0.998, - "eval_wer": 0.19913865141094042, - "step": 12960 - }, - { - "epoch": 45.03, - "learning_rate": 2.2384452296819785e-06, - "loss": 0.273, - "step": 12970 - }, - { - "epoch": 45.07, - "learning_rate": 2.2370318021201413e-06, - "loss": 0.2757, - "step": 12980 - }, - { - "epoch": 45.1, - "learning_rate": 2.2356183745583037e-06, - "loss": 0.2461, - "step": 12990 - }, - { - "epoch": 45.14, - "learning_rate": 2.234204946996466e-06, - "loss": 0.2693, - "step": 13000 - }, - { - "epoch": 45.17, - "learning_rate": 2.2327915194346286e-06, - "loss": 0.2596, - "step": 13010 - }, - { - "epoch": 45.21, - "learning_rate": 2.2313780918727914e-06, - "loss": 0.2436, - "step": 13020 - }, - { - "epoch": 45.24, - "learning_rate": 2.229964664310954e-06, - "loss": 0.2484, - "step": 13030 - }, - { - "epoch": 45.28, - "learning_rate": 2.2285512367491166e-06, - "loss": 0.2378, - "step": 13040 - }, - { - "epoch": 45.31, - "learning_rate": 2.227137809187279e-06, - "loss": 0.2688, - "step": 13050 - }, - { - "epoch": 45.35, - "learning_rate": 2.2257243816254415e-06, - "loss": 0.2768, - "step": 13060 - }, - { - "epoch": 45.38, - "learning_rate": 2.224310954063604e-06, - "loss": 0.2626, - "step": 13070 - }, - { - "epoch": 45.42, - "learning_rate": 2.2228975265017667e-06, - "loss": 0.2602, - "step": 13080 - }, - { - "epoch": 45.45, - "learning_rate": 2.221484098939929e-06, - "loss": 0.2623, - "step": 13090 - }, - { - "epoch": 45.48, - "learning_rate": 2.220070671378092e-06, - "loss": 0.2782, - "step": 13100 - }, - { - "epoch": 45.52, - "learning_rate": 2.2186572438162544e-06, - "loss": 0.2689, - "step": 13110 - }, - { - "epoch": 45.55, - "learning_rate": 2.2172438162544168e-06, - "loss": 0.2642, - "step": 13120 - }, - { - "epoch": 45.59, - "learning_rate": 2.215830388692579e-06, - "loss": 0.2557, - "step": 13130 - }, - { - "epoch": 45.62, - "learning_rate": 2.214416961130742e-06, - "loss": 0.2737, - "step": 13140 - }, - { - "epoch": 45.66, - "learning_rate": 2.2130035335689044e-06, - "loss": 0.2703, - "step": 13150 - }, - { - "epoch": 45.69, - "learning_rate": 2.2115901060070673e-06, - "loss": 0.2737, - "step": 13160 - }, - { - "epoch": 45.73, - "learning_rate": 2.2101766784452292e-06, - "loss": 0.264, - "step": 13170 - }, - { - "epoch": 45.76, - "learning_rate": 2.208763250883392e-06, - "loss": 0.2595, - "step": 13180 - }, - { - "epoch": 45.8, - "learning_rate": 2.2073498233215545e-06, - "loss": 0.2488, - "step": 13190 - }, - { - "epoch": 45.83, - "learning_rate": 2.2059363957597173e-06, - "loss": 0.2766, - "step": 13200 - }, - { - "epoch": 45.87, - "learning_rate": 2.2045229681978797e-06, - "loss": 0.253, - "step": 13210 - }, - { - "epoch": 45.9, - "learning_rate": 2.2031095406360426e-06, - "loss": 0.2589, - "step": 13220 - }, - { - "epoch": 45.94, - "learning_rate": 2.2016961130742045e-06, - "loss": 0.2794, - "step": 13230 - }, - { - "epoch": 45.97, - "learning_rate": 2.2002826855123674e-06, - "loss": 0.283, - "step": 13240 - }, - { - "epoch": 46.0, - "eval_loss": 0.5031996369361877, - "eval_runtime": 133.0395, - "eval_samples_per_second": 3.999, - "eval_steps_per_second": 1.0, - "eval_wer": 0.1981744552291573, - "step": 13248 - }, - { - "epoch": 46.01, - "learning_rate": 2.1988692579505298e-06, - "loss": 0.2882, - "step": 13250 - }, - { - "epoch": 46.04, - "learning_rate": 2.1974558303886926e-06, - "loss": 0.2563, - "step": 13260 - }, - { - "epoch": 46.08, - "learning_rate": 2.196042402826855e-06, - "loss": 0.2821, - "step": 13270 - }, - { - "epoch": 46.11, - "learning_rate": 2.194628975265018e-06, - "loss": 0.2555, - "step": 13280 - }, - { - "epoch": 46.15, - "learning_rate": 2.19321554770318e-06, - "loss": 0.2765, - "step": 13290 - }, - { - "epoch": 46.18, - "learning_rate": 2.1918021201413427e-06, - "loss": 0.2745, - "step": 13300 - }, - { - "epoch": 46.21, - "learning_rate": 2.190388692579505e-06, - "loss": 0.2667, - "step": 13310 - }, - { - "epoch": 46.25, - "learning_rate": 2.188975265017668e-06, - "loss": 0.2759, - "step": 13320 - }, - { - "epoch": 46.28, - "learning_rate": 2.1875618374558303e-06, - "loss": 0.2642, - "step": 13330 - }, - { - "epoch": 46.32, - "learning_rate": 2.1861484098939927e-06, - "loss": 0.2702, - "step": 13340 - }, - { - "epoch": 46.35, - "learning_rate": 2.184734982332155e-06, - "loss": 0.2689, - "step": 13350 - }, - { - "epoch": 46.39, - "learning_rate": 2.183321554770318e-06, - "loss": 0.2657, - "step": 13360 - }, - { - "epoch": 46.42, - "learning_rate": 2.1819081272084804e-06, - "loss": 0.2431, - "step": 13370 - }, - { - "epoch": 46.46, - "learning_rate": 2.1804946996466432e-06, - "loss": 0.2472, - "step": 13380 - }, - { - "epoch": 46.49, - "learning_rate": 2.1790812720848056e-06, - "loss": 0.2774, - "step": 13390 - }, - { - "epoch": 46.53, - "learning_rate": 2.177667844522968e-06, - "loss": 0.2459, - "step": 13400 - }, - { - "epoch": 46.56, - "learning_rate": 2.1762544169611305e-06, - "loss": 0.269, - "step": 13410 - }, - { - "epoch": 46.6, - "learning_rate": 2.1748409893992933e-06, - "loss": 0.2489, - "step": 13420 - }, - { - "epoch": 46.63, - "learning_rate": 2.1734275618374557e-06, - "loss": 0.2567, - "step": 13430 - }, - { - "epoch": 46.66, - "learning_rate": 2.1720141342756185e-06, - "loss": 0.2636, - "step": 13440 - }, - { - "epoch": 46.7, - "learning_rate": 2.170600706713781e-06, - "loss": 0.2421, - "step": 13450 - }, - { - "epoch": 46.73, - "learning_rate": 2.1691872791519434e-06, - "loss": 0.2446, - "step": 13460 - }, - { - "epoch": 46.77, - "learning_rate": 2.1677738515901058e-06, - "loss": 0.2593, - "step": 13470 - }, - { - "epoch": 46.8, - "learning_rate": 2.1663604240282686e-06, - "loss": 0.2525, - "step": 13480 - }, - { - "epoch": 46.84, - "learning_rate": 2.164946996466431e-06, - "loss": 0.2719, - "step": 13490 - }, - { - "epoch": 46.87, - "learning_rate": 2.163533568904594e-06, - "loss": 0.2601, - "step": 13500 - }, - { - "epoch": 46.91, - "learning_rate": 2.162120141342756e-06, - "loss": 0.2798, - "step": 13510 - }, - { - "epoch": 46.94, - "learning_rate": 2.1608480565371027e-06, - "loss": 0.2435, - "step": 13520 - }, - { - "epoch": 46.98, - "learning_rate": 2.1594346289752647e-06, - "loss": 0.282, - "step": 13530 - }, - { - "epoch": 47.0, - "eval_loss": 0.5107125639915466, - "eval_runtime": 133.7168, - "eval_samples_per_second": 3.979, - "eval_steps_per_second": 0.995, - "eval_wer": 0.19804589573825288, - "step": 13536 - }, - { - "epoch": 47.01, - "learning_rate": 2.1580212014134275e-06, - "loss": 0.2783, - "step": 13540 - }, - { - "epoch": 47.05, - "learning_rate": 2.15660777385159e-06, - "loss": 0.2695, - "step": 13550 - }, - { - "epoch": 47.08, - "learning_rate": 2.1551943462897528e-06, - "loss": 0.2469, - "step": 13560 - }, - { - "epoch": 47.12, - "learning_rate": 2.153780918727915e-06, - "loss": 0.2757, - "step": 13570 - }, - { - "epoch": 47.15, - "learning_rate": 2.152367491166078e-06, - "loss": 0.2721, - "step": 13580 - }, - { - "epoch": 47.19, - "learning_rate": 2.15095406360424e-06, - "loss": 0.2529, - "step": 13590 - }, - { - "epoch": 47.22, - "learning_rate": 2.149540636042403e-06, - "loss": 0.2562, - "step": 13600 - }, - { - "epoch": 47.26, - "learning_rate": 2.1481272084805652e-06, - "loss": 0.2712, - "step": 13610 - }, - { - "epoch": 47.29, - "learning_rate": 2.146713780918728e-06, - "loss": 0.2696, - "step": 13620 - }, - { - "epoch": 47.33, - "learning_rate": 2.1453003533568905e-06, - "loss": 0.2698, - "step": 13630 - }, - { - "epoch": 47.36, - "learning_rate": 2.143886925795053e-06, - "loss": 0.2528, - "step": 13640 - }, - { - "epoch": 47.39, - "learning_rate": 2.1424734982332153e-06, - "loss": 0.2671, - "step": 13650 - }, - { - "epoch": 47.43, - "learning_rate": 2.141060070671378e-06, - "loss": 0.2542, - "step": 13660 - }, - { - "epoch": 47.46, - "learning_rate": 2.1396466431095405e-06, - "loss": 0.2696, - "step": 13670 - }, - { - "epoch": 47.5, - "learning_rate": 2.1382332155477034e-06, - "loss": 0.2652, - "step": 13680 - }, - { - "epoch": 47.53, - "learning_rate": 2.136819787985866e-06, - "loss": 0.2518, - "step": 13690 - }, - { - "epoch": 47.57, - "learning_rate": 2.135406360424028e-06, - "loss": 0.2353, - "step": 13700 - }, - { - "epoch": 47.6, - "learning_rate": 2.1339929328621906e-06, - "loss": 0.2568, - "step": 13710 - }, - { - "epoch": 47.64, - "learning_rate": 2.1325795053003534e-06, - "loss": 0.2935, - "step": 13720 - }, - { - "epoch": 47.67, - "learning_rate": 2.131166077738516e-06, - "loss": 0.2511, - "step": 13730 - }, - { - "epoch": 47.71, - "learning_rate": 2.1297526501766787e-06, - "loss": 0.2768, - "step": 13740 - }, - { - "epoch": 47.74, - "learning_rate": 2.128339222614841e-06, - "loss": 0.2525, - "step": 13750 - }, - { - "epoch": 47.78, - "learning_rate": 2.126925795053003e-06, - "loss": 0.2236, - "step": 13760 - }, - { - "epoch": 47.81, - "learning_rate": 2.125512367491166e-06, - "loss": 0.2719, - "step": 13770 - }, - { - "epoch": 47.85, - "learning_rate": 2.1240989399293287e-06, - "loss": 0.2772, - "step": 13780 - }, - { - "epoch": 47.88, - "learning_rate": 2.122685512367491e-06, - "loss": 0.2682, - "step": 13790 - }, - { - "epoch": 47.91, - "learning_rate": 2.121272084805654e-06, - "loss": 0.2631, - "step": 13800 - }, - { - "epoch": 47.95, - "learning_rate": 2.119858657243816e-06, - "loss": 0.2571, - "step": 13810 - }, - { - "epoch": 47.98, - "learning_rate": 2.1184452296819784e-06, - "loss": 0.2708, - "step": 13820 - }, - { - "epoch": 48.0, - "eval_loss": 0.5127933025360107, - "eval_runtime": 133.2709, - "eval_samples_per_second": 3.992, - "eval_steps_per_second": 0.998, - "eval_wer": 0.1982387349746095, - "step": 13824 - }, - { - "epoch": 48.02, - "learning_rate": 2.1170318021201412e-06, - "loss": 0.2812, - "step": 13830 - }, - { - "epoch": 48.06, - "learning_rate": 2.1156183745583036e-06, - "loss": 0.2673, - "step": 13840 - }, - { - "epoch": 48.09, - "learning_rate": 2.1142049469964665e-06, - "loss": 0.2529, - "step": 13850 - }, - { - "epoch": 48.12, - "learning_rate": 2.112791519434629e-06, - "loss": 0.2602, - "step": 13860 - }, - { - "epoch": 48.16, - "learning_rate": 2.1113780918727913e-06, - "loss": 0.2634, - "step": 13870 - }, - { - "epoch": 48.19, - "learning_rate": 2.1099646643109537e-06, - "loss": 0.2439, - "step": 13880 - }, - { - "epoch": 48.23, - "learning_rate": 2.1085512367491165e-06, - "loss": 0.2744, - "step": 13890 - }, - { - "epoch": 48.26, - "learning_rate": 2.107137809187279e-06, - "loss": 0.2572, - "step": 13900 - }, - { - "epoch": 48.3, - "learning_rate": 2.1057243816254418e-06, - "loss": 0.2838, - "step": 13910 - }, - { - "epoch": 48.33, - "learning_rate": 2.1043109540636038e-06, - "loss": 0.2746, - "step": 13920 - }, - { - "epoch": 48.37, - "learning_rate": 2.1028975265017666e-06, - "loss": 0.2663, - "step": 13930 - }, - { - "epoch": 48.4, - "learning_rate": 2.101484098939929e-06, - "loss": 0.2817, - "step": 13940 - }, - { - "epoch": 48.44, - "learning_rate": 2.100070671378092e-06, - "loss": 0.2583, - "step": 13950 - }, - { - "epoch": 48.47, - "learning_rate": 2.0986572438162542e-06, - "loss": 0.2796, - "step": 13960 - }, - { - "epoch": 48.51, - "learning_rate": 2.097243816254417e-06, - "loss": 0.266, - "step": 13970 - }, - { - "epoch": 48.54, - "learning_rate": 2.095830388692579e-06, - "loss": 0.2757, - "step": 13980 - }, - { - "epoch": 48.57, - "learning_rate": 2.094416961130742e-06, - "loss": 0.262, - "step": 13990 - }, - { - "epoch": 48.61, - "learning_rate": 2.0930035335689043e-06, - "loss": 0.2463, - "step": 14000 - }, - { - "epoch": 48.64, - "learning_rate": 2.091590106007067e-06, - "loss": 0.2763, - "step": 14010 - }, - { - "epoch": 48.68, - "learning_rate": 2.0901766784452295e-06, - "loss": 0.2746, - "step": 14020 - }, - { - "epoch": 48.71, - "learning_rate": 2.0887632508833924e-06, - "loss": 0.2459, - "step": 14030 - }, - { - "epoch": 48.75, - "learning_rate": 2.0873498233215544e-06, - "loss": 0.2657, - "step": 14040 - }, - { - "epoch": 48.78, - "learning_rate": 2.085936395759717e-06, - "loss": 0.2599, - "step": 14050 - }, - { - "epoch": 48.82, - "learning_rate": 2.0845229681978796e-06, - "loss": 0.2634, - "step": 14060 - }, - { - "epoch": 48.85, - "learning_rate": 2.0831095406360424e-06, - "loss": 0.2551, - "step": 14070 - }, - { - "epoch": 48.89, - "learning_rate": 2.081696113074205e-06, - "loss": 0.2322, - "step": 14080 - }, - { - "epoch": 48.92, - "learning_rate": 2.0802826855123673e-06, - "loss": 0.2524, - "step": 14090 - }, - { - "epoch": 48.96, - "learning_rate": 2.0788692579505297e-06, - "loss": 0.2667, - "step": 14100 - }, - { - "epoch": 48.99, - "learning_rate": 2.0774558303886925e-06, - "loss": 0.2562, - "step": 14110 - }, - { - "epoch": 49.0, - "eval_loss": 0.5162803530693054, - "eval_runtime": 133.3898, - "eval_samples_per_second": 3.988, - "eval_steps_per_second": 0.997, - "eval_wer": 0.1990743716654882, - "step": 14112 - }, - { - "epoch": 49.03, - "learning_rate": 2.076042402826855e-06, - "loss": 0.2776, - "step": 14120 - }, - { - "epoch": 49.06, - "learning_rate": 2.0746289752650177e-06, - "loss": 0.2473, - "step": 14130 - }, - { - "epoch": 49.1, - "learning_rate": 2.07321554770318e-06, - "loss": 0.2626, - "step": 14140 - }, - { - "epoch": 49.13, - "learning_rate": 2.0718021201413426e-06, - "loss": 0.2602, - "step": 14150 - }, - { - "epoch": 49.17, - "learning_rate": 2.070388692579505e-06, - "loss": 0.2707, - "step": 14160 - }, - { - "epoch": 49.2, - "learning_rate": 2.068975265017668e-06, - "loss": 0.2423, - "step": 14170 - }, - { - "epoch": 49.24, - "learning_rate": 2.06756183745583e-06, - "loss": 0.2965, - "step": 14180 - }, - { - "epoch": 49.27, - "learning_rate": 2.066148409893993e-06, - "loss": 0.2602, - "step": 14190 - }, - { - "epoch": 49.3, - "learning_rate": 2.0647349823321555e-06, - "loss": 0.2547, - "step": 14200 - }, - { - "epoch": 49.34, - "learning_rate": 2.063321554770318e-06, - "loss": 0.2702, - "step": 14210 - }, - { - "epoch": 49.37, - "learning_rate": 2.0619081272084803e-06, - "loss": 0.2806, - "step": 14220 - }, - { - "epoch": 49.41, - "learning_rate": 2.060494699646643e-06, - "loss": 0.2648, - "step": 14230 - }, - { - "epoch": 49.44, - "learning_rate": 2.0590812720848055e-06, - "loss": 0.2396, - "step": 14240 - }, - { - "epoch": 49.48, - "learning_rate": 2.0576678445229683e-06, - "loss": 0.2837, - "step": 14250 - }, - { - "epoch": 49.51, - "learning_rate": 2.0562544169611303e-06, - "loss": 0.281, - "step": 14260 - }, - { - "epoch": 49.55, - "learning_rate": 2.054840989399293e-06, - "loss": 0.235, - "step": 14270 - }, - { - "epoch": 49.58, - "learning_rate": 2.0534275618374556e-06, - "loss": 0.2556, - "step": 14280 - }, - { - "epoch": 49.62, - "learning_rate": 2.0520141342756184e-06, - "loss": 0.2675, - "step": 14290 - }, - { - "epoch": 49.65, - "learning_rate": 2.050600706713781e-06, - "loss": 0.2774, - "step": 14300 - }, - { - "epoch": 49.69, - "learning_rate": 2.0491872791519437e-06, - "loss": 0.2742, - "step": 14310 - }, - { - "epoch": 49.72, - "learning_rate": 2.0477738515901056e-06, - "loss": 0.2665, - "step": 14320 - }, - { - "epoch": 49.75, - "learning_rate": 2.0463604240282685e-06, - "loss": 0.2664, - "step": 14330 - }, - { - "epoch": 49.79, - "learning_rate": 2.044946996466431e-06, - "loss": 0.2496, - "step": 14340 - }, - { - "epoch": 49.82, - "learning_rate": 2.0435335689045937e-06, - "loss": 0.2725, - "step": 14350 - }, - { - "epoch": 49.86, - "learning_rate": 2.042120141342756e-06, - "loss": 0.2581, - "step": 14360 - }, - { - "epoch": 49.89, - "learning_rate": 2.040706713780919e-06, - "loss": 0.2582, - "step": 14370 - }, - { - "epoch": 49.93, - "learning_rate": 2.039293286219081e-06, - "loss": 0.2514, - "step": 14380 - }, - { - "epoch": 49.96, - "learning_rate": 2.0378798586572438e-06, - "loss": 0.2765, - "step": 14390 - }, - { - "epoch": 50.0, - "learning_rate": 2.036466431095406e-06, - "loss": 0.2675, - "step": 14400 - }, - { - "epoch": 50.0, - "eval_loss": 0.5062453150749207, - "eval_runtime": 133.1193, - "eval_samples_per_second": 3.996, - "eval_steps_per_second": 0.999, - "eval_wer": 0.19939577039274925, - "step": 14400 - }, - { - "epoch": 50.03, - "learning_rate": 2.035053003533569e-06, - "loss": 0.2766, - "step": 14410 - }, - { - "epoch": 50.07, - "learning_rate": 2.0336395759717314e-06, - "loss": 0.2511, - "step": 14420 - }, - { - "epoch": 50.1, - "learning_rate": 2.032226148409894e-06, - "loss": 0.2459, - "step": 14430 - }, - { - "epoch": 50.14, - "learning_rate": 2.0308127208480562e-06, - "loss": 0.2715, - "step": 14440 - }, - { - "epoch": 50.17, - "learning_rate": 2.029399293286219e-06, - "loss": 0.2912, - "step": 14450 - }, - { - "epoch": 50.21, - "learning_rate": 2.0279858657243815e-06, - "loss": 0.2606, - "step": 14460 - }, - { - "epoch": 50.24, - "learning_rate": 2.0265724381625443e-06, - "loss": 0.2685, - "step": 14470 - }, - { - "epoch": 50.28, - "learning_rate": 2.0251590106007067e-06, - "loss": 0.2354, - "step": 14480 - }, - { - "epoch": 50.31, - "learning_rate": 2.023745583038869e-06, - "loss": 0.2725, - "step": 14490 - }, - { - "epoch": 50.35, - "learning_rate": 2.0223321554770316e-06, - "loss": 0.2681, - "step": 14500 - }, - { - "epoch": 50.38, - "learning_rate": 2.0209187279151944e-06, - "loss": 0.242, - "step": 14510 - }, - { - "epoch": 50.42, - "learning_rate": 2.019505300353357e-06, - "loss": 0.2646, - "step": 14520 - }, - { - "epoch": 50.45, - "learning_rate": 2.0180918727915196e-06, - "loss": 0.2415, - "step": 14530 - }, - { - "epoch": 50.48, - "learning_rate": 2.0166784452296816e-06, - "loss": 0.2905, - "step": 14540 - }, - { - "epoch": 50.52, - "learning_rate": 2.0152650176678444e-06, - "loss": 0.2674, - "step": 14550 - }, - { - "epoch": 50.55, - "learning_rate": 2.013851590106007e-06, - "loss": 0.2427, - "step": 14560 - }, - { - "epoch": 50.59, - "learning_rate": 2.0124381625441697e-06, - "loss": 0.2535, - "step": 14570 - }, - { - "epoch": 50.62, - "learning_rate": 2.011024734982332e-06, - "loss": 0.252, - "step": 14580 - }, - { - "epoch": 50.66, - "learning_rate": 2.009611307420495e-06, - "loss": 0.2764, - "step": 14590 - }, - { - "epoch": 50.69, - "learning_rate": 2.008197879858657e-06, - "loss": 0.2632, - "step": 14600 - }, - { - "epoch": 50.73, - "learning_rate": 2.0067844522968198e-06, - "loss": 0.2551, - "step": 14610 - }, - { - "epoch": 50.76, - "learning_rate": 2.005371024734982e-06, - "loss": 0.2657, - "step": 14620 - }, - { - "epoch": 50.8, - "learning_rate": 2.003957597173145e-06, - "loss": 0.2655, - "step": 14630 - }, - { - "epoch": 50.83, - "learning_rate": 2.0025441696113074e-06, - "loss": 0.2512, - "step": 14640 - }, - { - "epoch": 50.87, - "learning_rate": 2.0011307420494702e-06, - "loss": 0.2607, - "step": 14650 - }, - { - "epoch": 50.9, - "learning_rate": 1.9997173144876326e-06, - "loss": 0.2681, - "step": 14660 - }, - { - "epoch": 50.94, - "learning_rate": 1.998303886925795e-06, - "loss": 0.2625, - "step": 14670 - }, - { - "epoch": 50.97, - "learning_rate": 1.9968904593639575e-06, - "loss": 0.285, - "step": 14680 - }, - { - "epoch": 51.0, - "eval_loss": 0.4999462068080902, - "eval_runtime": 133.4245, - "eval_samples_per_second": 3.987, - "eval_steps_per_second": 0.997, - "eval_wer": 0.19875297293822716, - "step": 14688 - }, - { - "epoch": 51.01, - "learning_rate": 1.9954770318021203e-06, - "loss": 0.2801, - "step": 14690 - }, - { - "epoch": 51.04, - "learning_rate": 1.9940636042402827e-06, - "loss": 0.2528, - "step": 14700 - }, - { - "epoch": 51.08, - "learning_rate": 1.992650176678445e-06, - "loss": 0.2613, - "step": 14710 - }, - { - "epoch": 51.11, - "learning_rate": 1.991236749116608e-06, - "loss": 0.2647, - "step": 14720 - }, - { - "epoch": 51.15, - "learning_rate": 1.9898233215547704e-06, - "loss": 0.2629, - "step": 14730 - }, - { - "epoch": 51.18, - "learning_rate": 1.9884098939929328e-06, - "loss": 0.2848, - "step": 14740 - }, - { - "epoch": 51.21, - "learning_rate": 1.9869964664310956e-06, - "loss": 0.25, - "step": 14750 - }, - { - "epoch": 51.25, - "learning_rate": 1.985583038869258e-06, - "loss": 0.2707, - "step": 14760 - }, - { - "epoch": 51.28, - "learning_rate": 1.9841696113074204e-06, - "loss": 0.2287, - "step": 14770 - }, - { - "epoch": 51.32, - "learning_rate": 1.982756183745583e-06, - "loss": 0.2822, - "step": 14780 - }, - { - "epoch": 51.35, - "learning_rate": 1.9813427561837457e-06, - "loss": 0.2816, - "step": 14790 - }, - { - "epoch": 51.39, - "learning_rate": 1.979929328621908e-06, - "loss": 0.2655, - "step": 14800 - }, - { - "epoch": 51.42, - "learning_rate": 1.9785159010600705e-06, - "loss": 0.2573, - "step": 14810 - }, - { - "epoch": 51.46, - "learning_rate": 1.9771024734982333e-06, - "loss": 0.2674, - "step": 14820 - }, - { - "epoch": 51.49, - "learning_rate": 1.9756890459363957e-06, - "loss": 0.2745, - "step": 14830 - }, - { - "epoch": 51.53, - "learning_rate": 1.974275618374558e-06, - "loss": 0.2586, - "step": 14840 - }, - { - "epoch": 51.56, - "learning_rate": 1.972862190812721e-06, - "loss": 0.2439, - "step": 14850 - }, - { - "epoch": 51.6, - "learning_rate": 1.9714487632508834e-06, - "loss": 0.2376, - "step": 14860 - }, - { - "epoch": 51.63, - "learning_rate": 1.9700353356890458e-06, - "loss": 0.248, - "step": 14870 - }, - { - "epoch": 51.66, - "learning_rate": 1.968621908127208e-06, - "loss": 0.2522, - "step": 14880 - }, - { - "epoch": 51.7, - "learning_rate": 1.967208480565371e-06, - "loss": 0.2599, - "step": 14890 - }, - { - "epoch": 51.73, - "learning_rate": 1.9657950530035334e-06, - "loss": 0.2678, - "step": 14900 - }, - { - "epoch": 51.77, - "learning_rate": 1.964381625441696e-06, - "loss": 0.2662, - "step": 14910 - }, - { - "epoch": 51.8, - "learning_rate": 1.9629681978798587e-06, - "loss": 0.2576, - "step": 14920 - }, - { - "epoch": 51.84, - "learning_rate": 1.961554770318021e-06, - "loss": 0.2788, - "step": 14930 - }, - { - "epoch": 51.87, - "learning_rate": 1.9601413427561835e-06, - "loss": 0.2517, - "step": 14940 - }, - { - "epoch": 51.91, - "learning_rate": 1.958727915194346e-06, - "loss": 0.2728, - "step": 14950 - }, - { - "epoch": 51.94, - "learning_rate": 1.9573144876325087e-06, - "loss": 0.2538, - "step": 14960 - }, - { - "epoch": 51.98, - "learning_rate": 1.955901060070671e-06, - "loss": 0.2756, - "step": 14970 - }, - { - "epoch": 52.0, - "eval_loss": 0.5029511451721191, - "eval_runtime": 133.7467, - "eval_samples_per_second": 3.978, - "eval_steps_per_second": 0.994, - "eval_wer": 0.19862441344732276, - "step": 14976 - }, - { - "epoch": 52.01, - "learning_rate": 1.9544876325088336e-06, - "loss": 0.2558, - "step": 14980 - }, - { - "epoch": 52.05, - "learning_rate": 1.9530742049469964e-06, - "loss": 0.2658, - "step": 14990 - }, - { - "epoch": 52.08, - "learning_rate": 1.951660777385159e-06, - "loss": 0.255, - "step": 15000 - }, - { - "epoch": 52.12, - "learning_rate": 1.9503886925795053e-06, - "loss": 0.2528, - "step": 15010 - }, - { - "epoch": 52.15, - "learning_rate": 1.9489752650176677e-06, - "loss": 0.2853, - "step": 15020 - }, - { - "epoch": 52.19, - "learning_rate": 1.94756183745583e-06, - "loss": 0.2631, - "step": 15030 - }, - { - "epoch": 52.22, - "learning_rate": 1.946148409893993e-06, - "loss": 0.2424, - "step": 15040 - }, - { - "epoch": 52.26, - "learning_rate": 1.9447349823321553e-06, - "loss": 0.2537, - "step": 15050 - }, - { - "epoch": 52.29, - "learning_rate": 1.9433215547703177e-06, - "loss": 0.2686, - "step": 15060 - }, - { - "epoch": 52.33, - "learning_rate": 1.9419081272084806e-06, - "loss": 0.259, - "step": 15070 - }, - { - "epoch": 52.36, - "learning_rate": 1.940494699646643e-06, - "loss": 0.2609, - "step": 15080 - }, - { - "epoch": 52.39, - "learning_rate": 1.9390812720848054e-06, - "loss": 0.2807, - "step": 15090 - }, - { - "epoch": 52.43, - "learning_rate": 1.9376678445229682e-06, - "loss": 0.2633, - "step": 15100 - }, - { - "epoch": 52.46, - "learning_rate": 1.9362544169611306e-06, - "loss": 0.2583, - "step": 15110 - }, - { - "epoch": 52.5, - "learning_rate": 1.934840989399293e-06, - "loss": 0.2656, - "step": 15120 - }, - { - "epoch": 52.53, - "learning_rate": 1.933427561837456e-06, - "loss": 0.2534, - "step": 15130 - }, - { - "epoch": 52.57, - "learning_rate": 1.9320141342756183e-06, - "loss": 0.2639, - "step": 15140 - }, - { - "epoch": 52.6, - "learning_rate": 1.9306007067137807e-06, - "loss": 0.2408, - "step": 15150 - }, - { - "epoch": 52.64, - "learning_rate": 1.9291872791519435e-06, - "loss": 0.2493, - "step": 15160 - }, - { - "epoch": 52.67, - "learning_rate": 1.927773851590106e-06, - "loss": 0.2729, - "step": 15170 - }, - { - "epoch": 52.71, - "learning_rate": 1.9263604240282684e-06, - "loss": 0.2708, - "step": 15180 - }, - { - "epoch": 52.74, - "learning_rate": 1.924946996466431e-06, - "loss": 0.2759, - "step": 15190 - }, - { - "epoch": 52.78, - "learning_rate": 1.9235335689045936e-06, - "loss": 0.254, - "step": 15200 - }, - { - "epoch": 52.81, - "learning_rate": 1.922120141342756e-06, - "loss": 0.2598, - "step": 15210 - }, - { - "epoch": 52.85, - "learning_rate": 1.9207067137809184e-06, - "loss": 0.2672, - "step": 15220 - }, - { - "epoch": 52.88, - "learning_rate": 1.9192932862190812e-06, - "loss": 0.2436, - "step": 15230 - }, - { - "epoch": 52.91, - "learning_rate": 1.9178798586572437e-06, - "loss": 0.2741, - "step": 15240 - }, - { - "epoch": 52.95, - "learning_rate": 1.916466431095406e-06, - "loss": 0.2601, - "step": 15250 - }, - { - "epoch": 52.98, - "learning_rate": 1.915053003533569e-06, - "loss": 0.2888, - "step": 15260 - }, - { - "epoch": 53.0, - "eval_loss": 0.5042588114738464, - "eval_runtime": 133.2498, - "eval_samples_per_second": 3.993, - "eval_steps_per_second": 0.998, - "eval_wer": 0.19746737802918302, - "step": 15264 - }, - { - "epoch": 53.02, - "learning_rate": 1.9136395759717313e-06, - "loss": 0.2853, - "step": 15270 - }, - { - "epoch": 53.06, - "learning_rate": 1.9122261484098937e-06, - "loss": 0.2504, - "step": 15280 - }, - { - "epoch": 53.09, - "learning_rate": 1.9108127208480565e-06, - "loss": 0.2608, - "step": 15290 - }, - { - "epoch": 53.12, - "learning_rate": 1.909399293286219e-06, - "loss": 0.2486, - "step": 15300 - }, - { - "epoch": 53.16, - "learning_rate": 1.9079858657243814e-06, - "loss": 0.2576, - "step": 15310 - }, - { - "epoch": 53.19, - "learning_rate": 1.906572438162544e-06, - "loss": 0.2678, - "step": 15320 - }, - { - "epoch": 53.23, - "learning_rate": 1.9051590106007068e-06, - "loss": 0.271, - "step": 15330 - }, - { - "epoch": 53.26, - "learning_rate": 1.903745583038869e-06, - "loss": 0.2528, - "step": 15340 - }, - { - "epoch": 53.3, - "learning_rate": 1.9023321554770316e-06, - "loss": 0.2786, - "step": 15350 - }, - { - "epoch": 53.33, - "learning_rate": 1.9009187279151943e-06, - "loss": 0.2634, - "step": 15360 - }, - { - "epoch": 53.37, - "learning_rate": 1.8995053003533567e-06, - "loss": 0.2764, - "step": 15370 - }, - { - "epoch": 53.4, - "learning_rate": 1.8980918727915193e-06, - "loss": 0.2592, - "step": 15380 - }, - { - "epoch": 53.44, - "learning_rate": 1.8966784452296817e-06, - "loss": 0.2503, - "step": 15390 - }, - { - "epoch": 53.47, - "learning_rate": 1.8952650176678443e-06, - "loss": 0.2712, - "step": 15400 - }, - { - "epoch": 53.51, - "learning_rate": 1.893851590106007e-06, - "loss": 0.2914, - "step": 15410 - }, - { - "epoch": 53.54, - "learning_rate": 1.8924381625441694e-06, - "loss": 0.2474, - "step": 15420 - }, - { - "epoch": 53.57, - "learning_rate": 1.891024734982332e-06, - "loss": 0.2733, - "step": 15430 - }, - { - "epoch": 53.61, - "learning_rate": 1.8896113074204946e-06, - "loss": 0.2511, - "step": 15440 - }, - { - "epoch": 53.64, - "learning_rate": 1.888197879858657e-06, - "loss": 0.2564, - "step": 15450 - }, - { - "epoch": 53.68, - "learning_rate": 1.8867844522968196e-06, - "loss": 0.2475, - "step": 15460 - }, - { - "epoch": 53.71, - "learning_rate": 1.8853710247349823e-06, - "loss": 0.2616, - "step": 15470 - }, - { - "epoch": 53.75, - "learning_rate": 1.8839575971731447e-06, - "loss": 0.2788, - "step": 15480 - }, - { - "epoch": 53.78, - "learning_rate": 1.8825441696113073e-06, - "loss": 0.2476, - "step": 15490 - }, - { - "epoch": 53.82, - "learning_rate": 1.88113074204947e-06, - "loss": 0.2713, - "step": 15500 - }, - { - "epoch": 53.85, - "learning_rate": 1.8797173144876323e-06, - "loss": 0.2638, - "step": 15510 - }, - { - "epoch": 53.89, - "learning_rate": 1.878303886925795e-06, - "loss": 0.2478, - "step": 15520 - }, - { - "epoch": 53.92, - "learning_rate": 1.8768904593639573e-06, - "loss": 0.2535, - "step": 15530 - }, - { - "epoch": 53.96, - "learning_rate": 1.87547703180212e-06, - "loss": 0.2804, - "step": 15540 - }, - { - "epoch": 53.99, - "learning_rate": 1.8740636042402826e-06, - "loss": 0.2778, - "step": 15550 - }, - { - "epoch": 54.0, - "eval_loss": 0.5110978484153748, - "eval_runtime": 133.5788, - "eval_samples_per_second": 3.983, - "eval_steps_per_second": 0.996, - "eval_wer": 0.19804589573825288, - "step": 15552 - }, - { - "epoch": 54.03, - "learning_rate": 1.872650176678445e-06, - "loss": 0.2538, - "step": 15560 - }, - { - "epoch": 54.06, - "learning_rate": 1.8712367491166076e-06, - "loss": 0.2607, - "step": 15570 - }, - { - "epoch": 54.1, - "learning_rate": 1.8698233215547702e-06, - "loss": 0.2557, - "step": 15580 - }, - { - "epoch": 54.13, - "learning_rate": 1.8684098939929326e-06, - "loss": 0.2918, - "step": 15590 - }, - { - "epoch": 54.17, - "learning_rate": 1.8669964664310953e-06, - "loss": 0.3063, - "step": 15600 - }, - { - "epoch": 54.2, - "learning_rate": 1.8655830388692579e-06, - "loss": 0.2604, - "step": 15610 - }, - { - "epoch": 54.24, - "learning_rate": 1.8641696113074203e-06, - "loss": 0.263, - "step": 15620 - }, - { - "epoch": 54.27, - "learning_rate": 1.862756183745583e-06, - "loss": 0.2506, - "step": 15630 - }, - { - "epoch": 54.3, - "learning_rate": 1.8613427561837455e-06, - "loss": 0.271, - "step": 15640 - }, - { - "epoch": 54.34, - "learning_rate": 1.859929328621908e-06, - "loss": 0.2591, - "step": 15650 - }, - { - "epoch": 54.37, - "learning_rate": 1.8585159010600706e-06, - "loss": 0.2762, - "step": 15660 - }, - { - "epoch": 54.41, - "learning_rate": 1.8571024734982332e-06, - "loss": 0.2877, - "step": 15670 - }, - { - "epoch": 54.44, - "learning_rate": 1.8556890459363956e-06, - "loss": 0.2491, - "step": 15680 - }, - { - "epoch": 54.48, - "learning_rate": 1.8542756183745582e-06, - "loss": 0.2738, - "step": 15690 - }, - { - "epoch": 54.51, - "learning_rate": 1.8528621908127206e-06, - "loss": 0.2679, - "step": 15700 - }, - { - "epoch": 54.55, - "learning_rate": 1.8514487632508833e-06, - "loss": 0.2627, - "step": 15710 - }, - { - "epoch": 54.58, - "learning_rate": 1.8500353356890459e-06, - "loss": 0.2609, - "step": 15720 - }, - { - "epoch": 54.62, - "learning_rate": 1.8486219081272083e-06, - "loss": 0.2451, - "step": 15730 - }, - { - "epoch": 54.65, - "learning_rate": 1.847208480565371e-06, - "loss": 0.2622, - "step": 15740 - }, - { - "epoch": 54.69, - "learning_rate": 1.8457950530035335e-06, - "loss": 0.2716, - "step": 15750 - }, - { - "epoch": 54.72, - "learning_rate": 1.844381625441696e-06, - "loss": 0.2604, - "step": 15760 - }, - { - "epoch": 54.75, - "learning_rate": 1.8429681978798586e-06, - "loss": 0.2488, - "step": 15770 - }, - { - "epoch": 54.79, - "learning_rate": 1.8415547703180212e-06, - "loss": 0.2716, - "step": 15780 - }, - { - "epoch": 54.82, - "learning_rate": 1.8401413427561836e-06, - "loss": 0.2795, - "step": 15790 - }, - { - "epoch": 54.86, - "learning_rate": 1.8387279151943462e-06, - "loss": 0.2662, - "step": 15800 - }, - { - "epoch": 54.89, - "learning_rate": 1.8373144876325088e-06, - "loss": 0.2475, - "step": 15810 - }, - { - "epoch": 54.93, - "learning_rate": 1.8359010600706712e-06, - "loss": 0.2695, - "step": 15820 - }, - { - "epoch": 54.96, - "learning_rate": 1.8344876325088339e-06, - "loss": 0.2605, - "step": 15830 - }, - { - "epoch": 55.0, - "learning_rate": 1.8330742049469965e-06, - "loss": 0.2707, - "step": 15840 - }, - { - "epoch": 55.0, - "eval_loss": 0.5116538405418396, - "eval_runtime": 133.5286, - "eval_samples_per_second": 3.984, - "eval_steps_per_second": 0.996, - "eval_wer": 0.19946005013820145, - "step": 15840 - }, - { - "epoch": 55.03, - "learning_rate": 1.831660777385159e-06, - "loss": 0.2439, - "step": 15850 - }, - { - "epoch": 55.07, - "learning_rate": 1.8302473498233215e-06, - "loss": 0.2534, - "step": 15860 - }, - { - "epoch": 55.1, - "learning_rate": 1.828833922261484e-06, - "loss": 0.2465, - "step": 15870 - }, - { - "epoch": 55.14, - "learning_rate": 1.8274204946996465e-06, - "loss": 0.2705, - "step": 15880 - }, - { - "epoch": 55.17, - "learning_rate": 1.8260070671378092e-06, - "loss": 0.2686, - "step": 15890 - }, - { - "epoch": 55.21, - "learning_rate": 1.8245936395759716e-06, - "loss": 0.2646, - "step": 15900 - }, - { - "epoch": 55.24, - "learning_rate": 1.8231802120141342e-06, - "loss": 0.2688, - "step": 15910 - }, - { - "epoch": 55.28, - "learning_rate": 1.8217667844522968e-06, - "loss": 0.2504, - "step": 15920 - }, - { - "epoch": 55.31, - "learning_rate": 1.8203533568904592e-06, - "loss": 0.2696, - "step": 15930 - }, - { - "epoch": 55.35, - "learning_rate": 1.8189399293286219e-06, - "loss": 0.2634, - "step": 15940 - }, - { - "epoch": 55.38, - "learning_rate": 1.8175265017667845e-06, - "loss": 0.281, - "step": 15950 - }, - { - "epoch": 55.42, - "learning_rate": 1.8161130742049469e-06, - "loss": 0.2617, - "step": 15960 - }, - { - "epoch": 55.45, - "learning_rate": 1.8146996466431095e-06, - "loss": 0.2631, - "step": 15970 - }, - { - "epoch": 55.48, - "learning_rate": 1.8132862190812721e-06, - "loss": 0.2646, - "step": 15980 - }, - { - "epoch": 55.52, - "learning_rate": 1.8118727915194345e-06, - "loss": 0.2597, - "step": 15990 - }, - { - "epoch": 55.55, - "learning_rate": 1.8104593639575972e-06, - "loss": 0.2723, - "step": 16000 - }, - { - "epoch": 55.59, - "learning_rate": 1.8090459363957596e-06, - "loss": 0.2507, - "step": 16010 - }, - { - "epoch": 55.62, - "learning_rate": 1.8076325088339222e-06, - "loss": 0.2457, - "step": 16020 - }, - { - "epoch": 55.66, - "learning_rate": 1.8062190812720848e-06, - "loss": 0.2963, - "step": 16030 - }, - { - "epoch": 55.69, - "learning_rate": 1.8048056537102472e-06, - "loss": 0.2469, - "step": 16040 - }, - { - "epoch": 55.73, - "learning_rate": 1.8033922261484098e-06, - "loss": 0.2333, - "step": 16050 - }, - { - "epoch": 55.76, - "learning_rate": 1.8019787985865725e-06, - "loss": 0.2694, - "step": 16060 - }, - { - "epoch": 55.8, - "learning_rate": 1.8005653710247349e-06, - "loss": 0.2568, - "step": 16070 - }, - { - "epoch": 55.83, - "learning_rate": 1.7991519434628975e-06, - "loss": 0.277, - "step": 16080 - }, - { - "epoch": 55.87, - "learning_rate": 1.7977385159010601e-06, - "loss": 0.2871, - "step": 16090 - }, - { - "epoch": 55.9, - "learning_rate": 1.7963250883392225e-06, - "loss": 0.2669, - "step": 16100 - }, - { - "epoch": 55.94, - "learning_rate": 1.7949116607773851e-06, - "loss": 0.2684, - "step": 16110 - }, - { - "epoch": 55.97, - "learning_rate": 1.7934982332155478e-06, - "loss": 0.2566, - "step": 16120 - }, - { - "epoch": 56.0, - "eval_loss": 0.5196597576141357, - "eval_runtime": 133.3522, - "eval_samples_per_second": 3.989, - "eval_steps_per_second": 0.997, - "eval_wer": 0.20023140708362794, - "step": 16128 - }, - { - "epoch": 56.01, - "learning_rate": 1.7920848056537102e-06, - "loss": 0.2742, - "step": 16130 - }, - { - "epoch": 56.04, - "learning_rate": 1.7906713780918728e-06, - "loss": 0.2635, - "step": 16140 - }, - { - "epoch": 56.08, - "learning_rate": 1.7892579505300354e-06, - "loss": 0.263, - "step": 16150 - }, - { - "epoch": 56.11, - "learning_rate": 1.7878445229681978e-06, - "loss": 0.2578, - "step": 16160 - }, - { - "epoch": 56.15, - "learning_rate": 1.7864310954063604e-06, - "loss": 0.26, - "step": 16170 - }, - { - "epoch": 56.18, - "learning_rate": 1.7850176678445229e-06, - "loss": 0.2523, - "step": 16180 - }, - { - "epoch": 56.21, - "learning_rate": 1.7836042402826855e-06, - "loss": 0.2663, - "step": 16190 - }, - { - "epoch": 56.25, - "learning_rate": 1.782190812720848e-06, - "loss": 0.2493, - "step": 16200 - }, - { - "epoch": 56.28, - "learning_rate": 1.7807773851590105e-06, - "loss": 0.2407, - "step": 16210 - }, - { - "epoch": 56.32, - "learning_rate": 1.7793639575971731e-06, - "loss": 0.2565, - "step": 16220 - }, - { - "epoch": 56.35, - "learning_rate": 1.7779505300353358e-06, - "loss": 0.2673, - "step": 16230 - }, - { - "epoch": 56.39, - "learning_rate": 1.7765371024734982e-06, - "loss": 0.2487, - "step": 16240 - }, - { - "epoch": 56.42, - "learning_rate": 1.7751236749116608e-06, - "loss": 0.2539, - "step": 16250 - }, - { - "epoch": 56.46, - "learning_rate": 1.7737102473498234e-06, - "loss": 0.267, - "step": 16260 - }, - { - "epoch": 56.49, - "learning_rate": 1.7722968197879858e-06, - "loss": 0.2649, - "step": 16270 - }, - { - "epoch": 56.53, - "learning_rate": 1.7708833922261484e-06, - "loss": 0.2514, - "step": 16280 - }, - { - "epoch": 56.56, - "learning_rate": 1.769469964664311e-06, - "loss": 0.2652, - "step": 16290 - }, - { - "epoch": 56.6, - "learning_rate": 1.7680565371024735e-06, - "loss": 0.2702, - "step": 16300 - }, - { - "epoch": 56.63, - "learning_rate": 1.766643109540636e-06, - "loss": 0.2674, - "step": 16310 - }, - { - "epoch": 56.66, - "learning_rate": 1.7652296819787985e-06, - "loss": 0.3018, - "step": 16320 - }, - { - "epoch": 56.7, - "learning_rate": 1.7638162544169611e-06, - "loss": 0.2583, - "step": 16330 - }, - { - "epoch": 56.73, - "learning_rate": 1.7624028268551237e-06, - "loss": 0.262, - "step": 16340 - }, - { - "epoch": 56.77, - "learning_rate": 1.7609893992932861e-06, - "loss": 0.2863, - "step": 16350 - }, - { - "epoch": 56.8, - "learning_rate": 1.7595759717314488e-06, - "loss": 0.2632, - "step": 16360 - }, - { - "epoch": 56.84, - "learning_rate": 1.7581625441696114e-06, - "loss": 0.2861, - "step": 16370 - }, - { - "epoch": 56.87, - "learning_rate": 1.7567491166077738e-06, - "loss": 0.2588, - "step": 16380 - }, - { - "epoch": 56.91, - "learning_rate": 1.7553356890459364e-06, - "loss": 0.2594, - "step": 16390 - }, - { - "epoch": 56.94, - "learning_rate": 1.753922261484099e-06, - "loss": 0.2593, - "step": 16400 - }, - { - "epoch": 56.98, - "learning_rate": 1.7525088339222612e-06, - "loss": 0.2517, - "step": 16410 - }, - { - "epoch": 57.0, - "eval_loss": 0.5210915803909302, - "eval_runtime": 133.6955, - "eval_samples_per_second": 3.979, - "eval_steps_per_second": 0.995, - "eval_wer": 0.19766021726553962, - "step": 16416 - }, - { - "epoch": 57.01, - "learning_rate": 1.7510954063604239e-06, - "loss": 0.2697, - "step": 16420 - }, - { - "epoch": 57.05, - "learning_rate": 1.7496819787985865e-06, - "loss": 0.2594, - "step": 16430 - }, - { - "epoch": 57.08, - "learning_rate": 1.7482685512367489e-06, - "loss": 0.255, - "step": 16440 - }, - { - "epoch": 57.12, - "learning_rate": 1.7468551236749115e-06, - "loss": 0.2831, - "step": 16450 - }, - { - "epoch": 57.15, - "learning_rate": 1.7454416961130741e-06, - "loss": 0.2727, - "step": 16460 - }, - { - "epoch": 57.19, - "learning_rate": 1.7440282685512365e-06, - "loss": 0.2516, - "step": 16470 - }, - { - "epoch": 57.22, - "learning_rate": 1.7426148409893992e-06, - "loss": 0.2602, - "step": 16480 - }, - { - "epoch": 57.26, - "learning_rate": 1.7412014134275616e-06, - "loss": 0.2567, - "step": 16490 - }, - { - "epoch": 57.29, - "learning_rate": 1.7397879858657242e-06, - "loss": 0.2625, - "step": 16500 - }, - { - "epoch": 57.33, - "learning_rate": 1.7383745583038868e-06, - "loss": 0.2711, - "step": 16510 - }, - { - "epoch": 57.36, - "learning_rate": 1.7369611307420492e-06, - "loss": 0.2688, - "step": 16520 - }, - { - "epoch": 57.39, - "learning_rate": 1.7355477031802119e-06, - "loss": 0.2677, - "step": 16530 - }, - { - "epoch": 57.43, - "learning_rate": 1.7341342756183745e-06, - "loss": 0.2636, - "step": 16540 - }, - { - "epoch": 57.46, - "learning_rate": 1.7327208480565369e-06, - "loss": 0.2531, - "step": 16550 - }, - { - "epoch": 57.5, - "learning_rate": 1.7313074204946995e-06, - "loss": 0.2769, - "step": 16560 - }, - { - "epoch": 57.53, - "learning_rate": 1.7298939929328621e-06, - "loss": 0.2666, - "step": 16570 - }, - { - "epoch": 57.57, - "learning_rate": 1.7284805653710245e-06, - "loss": 0.2544, - "step": 16580 - }, - { - "epoch": 57.6, - "learning_rate": 1.7270671378091872e-06, - "loss": 0.2544, - "step": 16590 - }, - { - "epoch": 57.64, - "learning_rate": 1.7256537102473498e-06, - "loss": 0.2738, - "step": 16600 - }, - { - "epoch": 57.67, - "learning_rate": 1.7242402826855122e-06, - "loss": 0.274, - "step": 16610 - }, - { - "epoch": 57.71, - "learning_rate": 1.7228268551236748e-06, - "loss": 0.2501, - "step": 16620 - }, - { - "epoch": 57.74, - "learning_rate": 1.7214134275618372e-06, - "loss": 0.2516, - "step": 16630 - }, - { - "epoch": 57.78, - "learning_rate": 1.7199999999999998e-06, - "loss": 0.2444, - "step": 16640 - }, - { - "epoch": 57.81, - "learning_rate": 1.7185865724381625e-06, - "loss": 0.2728, - "step": 16650 - }, - { - "epoch": 57.85, - "learning_rate": 1.7171731448763249e-06, - "loss": 0.2628, - "step": 16660 - }, - { - "epoch": 57.88, - "learning_rate": 1.7157597173144875e-06, - "loss": 0.2577, - "step": 16670 - }, - { - "epoch": 57.91, - "learning_rate": 1.7143462897526501e-06, - "loss": 0.2769, - "step": 16680 - }, - { - "epoch": 57.95, - "learning_rate": 1.7129328621908125e-06, - "loss": 0.2379, - "step": 16690 - }, - { - "epoch": 57.98, - "learning_rate": 1.7115194346289751e-06, - "loss": 0.2629, - "step": 16700 - }, - { - "epoch": 58.0, - "eval_loss": 0.5079585313796997, - "eval_runtime": 133.0035, - "eval_samples_per_second": 4.0, - "eval_steps_per_second": 1.0, - "eval_wer": 0.19856013370187053, - "step": 16704 - }, - { - "epoch": 58.02, - "learning_rate": 1.7101060070671378e-06, - "loss": 0.2771, - "step": 16710 - }, - { - "epoch": 58.06, - "learning_rate": 1.7086925795053002e-06, - "loss": 0.2628, - "step": 16720 - }, - { - "epoch": 58.09, - "learning_rate": 1.7072791519434628e-06, - "loss": 0.278, - "step": 16730 - }, - { - "epoch": 58.12, - "learning_rate": 1.7058657243816254e-06, - "loss": 0.2515, - "step": 16740 - }, - { - "epoch": 58.16, - "learning_rate": 1.7044522968197878e-06, - "loss": 0.2736, - "step": 16750 - }, - { - "epoch": 58.19, - "learning_rate": 1.7030388692579504e-06, - "loss": 0.263, - "step": 16760 - }, - { - "epoch": 58.23, - "learning_rate": 1.701625441696113e-06, - "loss": 0.2649, - "step": 16770 - }, - { - "epoch": 58.26, - "learning_rate": 1.7002120141342755e-06, - "loss": 0.2387, - "step": 16780 - }, - { - "epoch": 58.3, - "learning_rate": 1.698798586572438e-06, - "loss": 0.2654, - "step": 16790 - }, - { - "epoch": 58.33, - "learning_rate": 1.6973851590106005e-06, - "loss": 0.2658, - "step": 16800 - }, - { - "epoch": 58.37, - "learning_rate": 1.6959717314487631e-06, - "loss": 0.2685, - "step": 16810 - }, - { - "epoch": 58.4, - "learning_rate": 1.6945583038869258e-06, - "loss": 0.2531, - "step": 16820 - }, - { - "epoch": 58.44, - "learning_rate": 1.6931448763250882e-06, - "loss": 0.2577, - "step": 16830 - }, - { - "epoch": 58.47, - "learning_rate": 1.6917314487632508e-06, - "loss": 0.2636, - "step": 16840 - }, - { - "epoch": 58.51, - "learning_rate": 1.6903180212014134e-06, - "loss": 0.2856, - "step": 16850 - }, - { - "epoch": 58.54, - "learning_rate": 1.6889045936395758e-06, - "loss": 0.2475, - "step": 16860 - }, - { - "epoch": 58.57, - "learning_rate": 1.6874911660777384e-06, - "loss": 0.2671, - "step": 16870 - }, - { - "epoch": 58.61, - "learning_rate": 1.686077738515901e-06, - "loss": 0.2512, - "step": 16880 - }, - { - "epoch": 58.64, - "learning_rate": 1.6846643109540635e-06, - "loss": 0.2786, - "step": 16890 - }, - { - "epoch": 58.68, - "learning_rate": 1.683250883392226e-06, - "loss": 0.2816, - "step": 16900 - }, - { - "epoch": 58.71, - "learning_rate": 1.6818374558303887e-06, - "loss": 0.2577, - "step": 16910 - }, - { - "epoch": 58.75, - "learning_rate": 1.6804240282685511e-06, - "loss": 0.2604, - "step": 16920 - }, - { - "epoch": 58.78, - "learning_rate": 1.6790106007067137e-06, - "loss": 0.2746, - "step": 16930 - }, - { - "epoch": 58.82, - "learning_rate": 1.6775971731448761e-06, - "loss": 0.269, - "step": 16940 - }, - { - "epoch": 58.85, - "learning_rate": 1.6761837455830388e-06, - "loss": 0.2399, - "step": 16950 - }, - { - "epoch": 58.89, - "learning_rate": 1.6747703180212014e-06, - "loss": 0.275, - "step": 16960 - }, - { - "epoch": 58.92, - "learning_rate": 1.6733568904593638e-06, - "loss": 0.2616, - "step": 16970 - }, - { - "epoch": 58.96, - "learning_rate": 1.6719434628975264e-06, - "loss": 0.2533, - "step": 16980 - }, - { - "epoch": 58.99, - "learning_rate": 1.670530035335689e-06, - "loss": 0.2787, - "step": 16990 - }, - { - "epoch": 59.0, - "eval_loss": 0.5133015513420105, - "eval_runtime": 133.197, - "eval_samples_per_second": 3.994, - "eval_steps_per_second": 0.999, - "eval_wer": 0.19798161599280067, - "step": 16992 - }, - { - "epoch": 59.03, - "learning_rate": 1.6691166077738515e-06, - "loss": 0.2536, - "step": 17000 - }, - { - "epoch": 59.06, - "learning_rate": 1.667703180212014e-06, - "loss": 0.2524, - "step": 17010 - }, - { - "epoch": 59.1, - "learning_rate": 1.6662897526501767e-06, - "loss": 0.2374, - "step": 17020 - }, - { - "epoch": 59.13, - "learning_rate": 1.664876325088339e-06, - "loss": 0.2744, - "step": 17030 - }, - { - "epoch": 59.17, - "learning_rate": 1.6634628975265017e-06, - "loss": 0.2803, - "step": 17040 - }, - { - "epoch": 59.2, - "learning_rate": 1.6620494699646643e-06, - "loss": 0.2857, - "step": 17050 - }, - { - "epoch": 59.24, - "learning_rate": 1.6606360424028268e-06, - "loss": 0.2656, - "step": 17060 - }, - { - "epoch": 59.27, - "learning_rate": 1.6592226148409894e-06, - "loss": 0.2608, - "step": 17070 - }, - { - "epoch": 59.3, - "learning_rate": 1.657809187279152e-06, - "loss": 0.2826, - "step": 17080 - }, - { - "epoch": 59.34, - "learning_rate": 1.6563957597173144e-06, - "loss": 0.2972, - "step": 17090 - }, - { - "epoch": 59.37, - "learning_rate": 1.654982332155477e-06, - "loss": 0.2681, - "step": 17100 - }, - { - "epoch": 59.41, - "learning_rate": 1.6535689045936394e-06, - "loss": 0.2643, - "step": 17110 - }, - { - "epoch": 59.44, - "learning_rate": 1.652155477031802e-06, - "loss": 0.255, - "step": 17120 - }, - { - "epoch": 59.48, - "learning_rate": 1.6507420494699647e-06, - "loss": 0.2737, - "step": 17130 - }, - { - "epoch": 59.51, - "learning_rate": 1.649328621908127e-06, - "loss": 0.2642, - "step": 17140 - }, - { - "epoch": 59.55, - "learning_rate": 1.6479151943462897e-06, - "loss": 0.2459, - "step": 17150 - }, - { - "epoch": 59.58, - "learning_rate": 1.6465017667844523e-06, - "loss": 0.2693, - "step": 17160 - }, - { - "epoch": 59.62, - "learning_rate": 1.6450883392226147e-06, - "loss": 0.2648, - "step": 17170 - }, - { - "epoch": 59.65, - "learning_rate": 1.6436749116607774e-06, - "loss": 0.2467, - "step": 17180 - }, - { - "epoch": 59.69, - "learning_rate": 1.64226148409894e-06, - "loss": 0.2732, - "step": 17190 - }, - { - "epoch": 59.72, - "learning_rate": 1.6408480565371024e-06, - "loss": 0.2362, - "step": 17200 - }, - { - "epoch": 59.75, - "learning_rate": 1.639434628975265e-06, - "loss": 0.2591, - "step": 17210 - }, - { - "epoch": 59.79, - "learning_rate": 1.6380212014134276e-06, - "loss": 0.2481, - "step": 17220 - }, - { - "epoch": 59.82, - "learning_rate": 1.63660777385159e-06, - "loss": 0.2918, - "step": 17230 - }, - { - "epoch": 59.86, - "learning_rate": 1.6351943462897527e-06, - "loss": 0.2633, - "step": 17240 - }, - { - "epoch": 59.89, - "learning_rate": 1.633780918727915e-06, - "loss": 0.2691, - "step": 17250 - }, - { - "epoch": 59.93, - "learning_rate": 1.6323674911660777e-06, - "loss": 0.2457, - "step": 17260 - }, - { - "epoch": 59.96, - "learning_rate": 1.6309540636042403e-06, - "loss": 0.2563, - "step": 17270 - }, - { - "epoch": 60.0, - "learning_rate": 1.6295406360424027e-06, - "loss": 0.269, - "step": 17280 - }, - { - "epoch": 60.0, - "eval_loss": 0.5155569314956665, - "eval_runtime": 133.7176, - "eval_samples_per_second": 3.979, - "eval_steps_per_second": 0.995, - "eval_wer": 0.1972745387928264, - "step": 17280 - }, - { - "epoch": 60.03, - "learning_rate": 1.6281272084805654e-06, - "loss": 0.2982, - "step": 17290 - }, - { - "epoch": 60.07, - "learning_rate": 1.626713780918728e-06, - "loss": 0.2651, - "step": 17300 - }, - { - "epoch": 60.1, - "learning_rate": 1.6253003533568904e-06, - "loss": 0.2533, - "step": 17310 - }, - { - "epoch": 60.14, - "learning_rate": 1.623886925795053e-06, - "loss": 0.2531, - "step": 17320 - }, - { - "epoch": 60.17, - "learning_rate": 1.6224734982332156e-06, - "loss": 0.2584, - "step": 17330 - }, - { - "epoch": 60.21, - "learning_rate": 1.621060070671378e-06, - "loss": 0.2649, - "step": 17340 - }, - { - "epoch": 60.24, - "learning_rate": 1.6196466431095407e-06, - "loss": 0.2601, - "step": 17350 - }, - { - "epoch": 60.28, - "learning_rate": 1.6182332155477033e-06, - "loss": 0.2509, - "step": 17360 - }, - { - "epoch": 60.31, - "learning_rate": 1.6168197879858657e-06, - "loss": 0.2647, - "step": 17370 - }, - { - "epoch": 60.35, - "learning_rate": 1.6154063604240283e-06, - "loss": 0.259, - "step": 17380 - }, - { - "epoch": 60.38, - "learning_rate": 1.613992932862191e-06, - "loss": 0.2466, - "step": 17390 - }, - { - "epoch": 60.42, - "learning_rate": 1.6125795053003533e-06, - "loss": 0.2568, - "step": 17400 - }, - { - "epoch": 60.45, - "learning_rate": 1.611166077738516e-06, - "loss": 0.2427, - "step": 17410 - }, - { - "epoch": 60.48, - "learning_rate": 1.6097526501766784e-06, - "loss": 0.265, - "step": 17420 - }, - { - "epoch": 60.52, - "learning_rate": 1.608339222614841e-06, - "loss": 0.2602, - "step": 17430 - }, - { - "epoch": 60.55, - "learning_rate": 1.6069257950530036e-06, - "loss": 0.2419, - "step": 17440 - }, - { - "epoch": 60.59, - "learning_rate": 1.605512367491166e-06, - "loss": 0.2363, - "step": 17450 - }, - { - "epoch": 60.62, - "learning_rate": 1.6040989399293286e-06, - "loss": 0.2614, - "step": 17460 - }, - { - "epoch": 60.66, - "learning_rate": 1.6026855123674913e-06, - "loss": 0.288, - "step": 17470 - }, - { - "epoch": 60.69, - "learning_rate": 1.6012720848056535e-06, - "loss": 0.2746, - "step": 17480 - }, - { - "epoch": 60.73, - "learning_rate": 1.5998586572438163e-06, - "loss": 0.2442, - "step": 17490 - }, - { - "epoch": 60.76, - "learning_rate": 1.598445229681979e-06, - "loss": 0.2789, - "step": 17500 - }, - { - "epoch": 60.8, - "learning_rate": 1.5970318021201411e-06, - "loss": 0.2478, - "step": 17510 - }, - { - "epoch": 60.83, - "learning_rate": 1.5956183745583037e-06, - "loss": 0.2833, - "step": 17520 - }, - { - "epoch": 60.87, - "learning_rate": 1.5942049469964664e-06, - "loss": 0.2829, - "step": 17530 - }, - { - "epoch": 60.9, - "learning_rate": 1.5927915194346288e-06, - "loss": 0.2482, - "step": 17540 - }, - { - "epoch": 60.94, - "learning_rate": 1.5913780918727914e-06, - "loss": 0.2772, - "step": 17550 - }, - { - "epoch": 60.97, - "learning_rate": 1.5899646643109538e-06, - "loss": 0.2664, - "step": 17560 - }, - { - "epoch": 61.0, - "eval_loss": 0.5191646814346313, - "eval_runtime": 133.5584, - "eval_samples_per_second": 3.983, - "eval_steps_per_second": 0.996, - "eval_wer": 0.1948961882110947, - "step": 17568 - }, - { - "epoch": 61.01, - "learning_rate": 1.5885512367491164e-06, - "loss": 0.2819, - "step": 17570 - }, - { - "epoch": 61.04, - "learning_rate": 1.587137809187279e-06, - "loss": 0.2615, - "step": 17580 - }, - { - "epoch": 61.08, - "learning_rate": 1.5857243816254414e-06, - "loss": 0.2556, - "step": 17590 - }, - { - "epoch": 61.11, - "learning_rate": 1.584310954063604e-06, - "loss": 0.2771, - "step": 17600 - }, - { - "epoch": 61.15, - "learning_rate": 1.5828975265017667e-06, - "loss": 0.2854, - "step": 17610 - }, - { - "epoch": 61.18, - "learning_rate": 1.581484098939929e-06, - "loss": 0.2554, - "step": 17620 - }, - { - "epoch": 61.21, - "learning_rate": 1.5800706713780917e-06, - "loss": 0.2597, - "step": 17630 - }, - { - "epoch": 61.25, - "learning_rate": 1.5786572438162543e-06, - "loss": 0.2422, - "step": 17640 - }, - { - "epoch": 61.28, - "learning_rate": 1.5772438162544168e-06, - "loss": 0.268, - "step": 17650 - }, - { - "epoch": 61.32, - "learning_rate": 1.5758303886925794e-06, - "loss": 0.2665, - "step": 17660 - }, - { - "epoch": 61.35, - "learning_rate": 1.574416961130742e-06, - "loss": 0.2504, - "step": 17670 - }, - { - "epoch": 61.39, - "learning_rate": 1.5730035335689044e-06, - "loss": 0.256, - "step": 17680 - }, - { - "epoch": 61.42, - "learning_rate": 1.571590106007067e-06, - "loss": 0.2634, - "step": 17690 - }, - { - "epoch": 61.46, - "learning_rate": 1.5701766784452296e-06, - "loss": 0.2538, - "step": 17700 - }, - { - "epoch": 61.49, - "learning_rate": 1.568763250883392e-06, - "loss": 0.2518, - "step": 17710 - }, - { - "epoch": 61.53, - "learning_rate": 1.5673498233215547e-06, - "loss": 0.2623, - "step": 17720 - }, - { - "epoch": 61.56, - "learning_rate": 1.565936395759717e-06, - "loss": 0.2741, - "step": 17730 - }, - { - "epoch": 61.6, - "learning_rate": 1.5645229681978797e-06, - "loss": 0.2519, - "step": 17740 - }, - { - "epoch": 61.63, - "learning_rate": 1.5631095406360423e-06, - "loss": 0.2381, - "step": 17750 - }, - { - "epoch": 61.66, - "learning_rate": 1.5616961130742047e-06, - "loss": 0.26, - "step": 17760 - }, - { - "epoch": 61.7, - "learning_rate": 1.5602826855123674e-06, - "loss": 0.2751, - "step": 17770 - }, - { - "epoch": 61.73, - "learning_rate": 1.55886925795053e-06, - "loss": 0.2536, - "step": 17780 - }, - { - "epoch": 61.77, - "learning_rate": 1.5574558303886924e-06, - "loss": 0.2614, - "step": 17790 - }, - { - "epoch": 61.8, - "learning_rate": 1.556042402826855e-06, - "loss": 0.2669, - "step": 17800 - }, - { - "epoch": 61.84, - "learning_rate": 1.5546289752650176e-06, - "loss": 0.2653, - "step": 17810 - }, - { - "epoch": 61.87, - "learning_rate": 1.55321554770318e-06, - "loss": 0.2641, - "step": 17820 - }, - { - "epoch": 61.91, - "learning_rate": 1.5518021201413427e-06, - "loss": 0.267, - "step": 17830 - }, - { - "epoch": 61.94, - "learning_rate": 1.5503886925795053e-06, - "loss": 0.2447, - "step": 17840 - }, - { - "epoch": 61.98, - "learning_rate": 1.5489752650176677e-06, - "loss": 0.2605, - "step": 17850 - }, - { - "epoch": 62.0, - "eval_loss": 0.5094706416130066, - "eval_runtime": 133.5482, - "eval_samples_per_second": 3.984, - "eval_steps_per_second": 0.996, - "eval_wer": 0.19701741981101756, - "step": 17856 - }, - { - "epoch": 62.01, - "learning_rate": 1.5475618374558303e-06, - "loss": 0.2882, - "step": 17860 - }, - { - "epoch": 62.05, - "learning_rate": 1.5461484098939927e-06, - "loss": 0.2536, - "step": 17870 - }, - { - "epoch": 62.08, - "learning_rate": 1.5447349823321554e-06, - "loss": 0.2642, - "step": 17880 - }, - { - "epoch": 62.12, - "learning_rate": 1.543321554770318e-06, - "loss": 0.2723, - "step": 17890 - }, - { - "epoch": 62.15, - "learning_rate": 1.5419081272084804e-06, - "loss": 0.2688, - "step": 17900 - }, - { - "epoch": 62.19, - "learning_rate": 1.540494699646643e-06, - "loss": 0.2406, - "step": 17910 - }, - { - "epoch": 62.22, - "learning_rate": 1.5390812720848056e-06, - "loss": 0.2617, - "step": 17920 - }, - { - "epoch": 62.26, - "learning_rate": 1.537667844522968e-06, - "loss": 0.259, - "step": 17930 - }, - { - "epoch": 62.29, - "learning_rate": 1.5362544169611307e-06, - "loss": 0.25, - "step": 17940 - }, - { - "epoch": 62.33, - "learning_rate": 1.5348409893992933e-06, - "loss": 0.2976, - "step": 17950 - }, - { - "epoch": 62.36, - "learning_rate": 1.5334275618374557e-06, - "loss": 0.2654, - "step": 17960 - }, - { - "epoch": 62.39, - "learning_rate": 1.5320141342756183e-06, - "loss": 0.2781, - "step": 17970 - }, - { - "epoch": 62.43, - "learning_rate": 1.530600706713781e-06, - "loss": 0.2588, - "step": 17980 - }, - { - "epoch": 62.46, - "learning_rate": 1.5291872791519433e-06, - "loss": 0.2336, - "step": 17990 - }, - { - "epoch": 62.5, - "learning_rate": 1.527773851590106e-06, - "loss": 0.2496, - "step": 18000 - }, - { - "epoch": 62.53, - "learning_rate": 1.5263604240282686e-06, - "loss": 0.2469, - "step": 18010 - }, - { - "epoch": 62.57, - "learning_rate": 1.524946996466431e-06, - "loss": 0.2624, - "step": 18020 - }, - { - "epoch": 62.6, - "learning_rate": 1.5235335689045936e-06, - "loss": 0.2382, - "step": 18030 - }, - { - "epoch": 62.64, - "learning_rate": 1.522120141342756e-06, - "loss": 0.2812, - "step": 18040 - }, - { - "epoch": 62.67, - "learning_rate": 1.5207067137809186e-06, - "loss": 0.2653, - "step": 18050 - }, - { - "epoch": 62.71, - "learning_rate": 1.519434628975265e-06, - "loss": 0.2644, - "step": 18060 - }, - { - "epoch": 62.74, - "learning_rate": 1.5180212014134275e-06, - "loss": 0.2725, - "step": 18070 - }, - { - "epoch": 62.78, - "learning_rate": 1.5166077738515901e-06, - "loss": 0.2444, - "step": 18080 - }, - { - "epoch": 62.81, - "learning_rate": 1.5151943462897525e-06, - "loss": 0.276, - "step": 18090 - }, - { - "epoch": 62.85, - "learning_rate": 1.5137809187279152e-06, - "loss": 0.2724, - "step": 18100 - }, - { - "epoch": 62.88, - "learning_rate": 1.5123674911660778e-06, - "loss": 0.2495, - "step": 18110 - }, - { - "epoch": 62.91, - "learning_rate": 1.5109540636042402e-06, - "loss": 0.2311, - "step": 18120 - }, - { - "epoch": 62.95, - "learning_rate": 1.5095406360424028e-06, - "loss": 0.2443, - "step": 18130 - }, - { - "epoch": 62.98, - "learning_rate": 1.5081272084805654e-06, - "loss": 0.2649, - "step": 18140 - }, - { - "epoch": 63.0, - "eval_loss": 0.5149233937263489, - "eval_runtime": 133.9576, - "eval_samples_per_second": 3.971, - "eval_steps_per_second": 0.993, - "eval_wer": 0.19695314006556533, - "step": 18144 - }, - { - "epoch": 63.02, - "learning_rate": 1.5067137809187279e-06, - "loss": 0.2642, - "step": 18150 - }, - { - "epoch": 63.06, - "learning_rate": 1.5053003533568905e-06, - "loss": 0.2526, - "step": 18160 - }, - { - "epoch": 63.09, - "learning_rate": 1.5038869257950529e-06, - "loss": 0.2483, - "step": 18170 - }, - { - "epoch": 63.12, - "learning_rate": 1.5024734982332155e-06, - "loss": 0.2617, - "step": 18180 - }, - { - "epoch": 63.16, - "learning_rate": 1.5010600706713781e-06, - "loss": 0.2942, - "step": 18190 - }, - { - "epoch": 63.19, - "learning_rate": 1.4996466431095405e-06, - "loss": 0.2672, - "step": 18200 - }, - { - "epoch": 63.23, - "learning_rate": 1.4982332155477032e-06, - "loss": 0.2541, - "step": 18210 - }, - { - "epoch": 63.26, - "learning_rate": 1.4968197879858658e-06, - "loss": 0.2403, - "step": 18220 - }, - { - "epoch": 63.3, - "learning_rate": 1.4954063604240282e-06, - "loss": 0.2749, - "step": 18230 - }, - { - "epoch": 63.33, - "learning_rate": 1.4939929328621908e-06, - "loss": 0.2812, - "step": 18240 - }, - { - "epoch": 63.37, - "learning_rate": 1.4925795053003534e-06, - "loss": 0.2279, - "step": 18250 - }, - { - "epoch": 63.4, - "learning_rate": 1.4911660777385158e-06, - "loss": 0.2552, - "step": 18260 - }, - { - "epoch": 63.44, - "learning_rate": 1.4897526501766785e-06, - "loss": 0.2594, - "step": 18270 - }, - { - "epoch": 63.47, - "learning_rate": 1.488339222614841e-06, - "loss": 0.2593, - "step": 18280 - }, - { - "epoch": 63.51, - "learning_rate": 1.4869257950530035e-06, - "loss": 0.2681, - "step": 18290 - }, - { - "epoch": 63.54, - "learning_rate": 1.4855123674911661e-06, - "loss": 0.239, - "step": 18300 - }, - { - "epoch": 63.57, - "learning_rate": 1.4840989399293287e-06, - "loss": 0.2505, - "step": 18310 - }, - { - "epoch": 63.61, - "learning_rate": 1.4826855123674911e-06, - "loss": 0.2526, - "step": 18320 - }, - { - "epoch": 63.64, - "learning_rate": 1.4812720848056538e-06, - "loss": 0.2672, - "step": 18330 - }, - { - "epoch": 63.68, - "learning_rate": 1.4798586572438162e-06, - "loss": 0.2715, - "step": 18340 - }, - { - "epoch": 63.71, - "learning_rate": 1.4784452296819788e-06, - "loss": 0.2519, - "step": 18350 - }, - { - "epoch": 63.75, - "learning_rate": 1.4770318021201414e-06, - "loss": 0.2712, - "step": 18360 - }, - { - "epoch": 63.78, - "learning_rate": 1.4756183745583038e-06, - "loss": 0.2385, - "step": 18370 - }, - { - "epoch": 63.82, - "learning_rate": 1.4742049469964664e-06, - "loss": 0.2732, - "step": 18380 - }, - { - "epoch": 63.85, - "learning_rate": 1.472791519434629e-06, - "loss": 0.2835, - "step": 18390 - }, - { - "epoch": 63.89, - "learning_rate": 1.4713780918727915e-06, - "loss": 0.2812, - "step": 18400 - }, - { - "epoch": 63.92, - "learning_rate": 1.469964664310954e-06, - "loss": 0.2488, - "step": 18410 - }, - { - "epoch": 63.96, - "learning_rate": 1.4685512367491167e-06, - "loss": 0.2607, - "step": 18420 - }, - { - "epoch": 63.99, - "learning_rate": 1.4671378091872791e-06, - "loss": 0.246, - "step": 18430 - }, - { - "epoch": 64.0, - "eval_loss": 0.5164635181427002, - "eval_runtime": 134.1849, - "eval_samples_per_second": 3.965, - "eval_steps_per_second": 0.991, - "eval_wer": 0.19753165777463522, - "step": 18432 - }, - { - "epoch": 64.03, - "learning_rate": 1.4657243816254418e-06, - "loss": 0.2641, - "step": 18440 - }, - { - "epoch": 64.06, - "learning_rate": 1.4643109540636044e-06, - "loss": 0.268, - "step": 18450 - }, - { - "epoch": 64.1, - "learning_rate": 1.4628975265017666e-06, - "loss": 0.2544, - "step": 18460 - }, - { - "epoch": 64.13, - "learning_rate": 1.4614840989399294e-06, - "loss": 0.299, - "step": 18470 - }, - { - "epoch": 64.17, - "learning_rate": 1.4600706713780916e-06, - "loss": 0.27, - "step": 18480 - }, - { - "epoch": 64.2, - "learning_rate": 1.4586572438162542e-06, - "loss": 0.2475, - "step": 18490 - }, - { - "epoch": 64.24, - "learning_rate": 1.4572438162544168e-06, - "loss": 0.262, - "step": 18500 - }, - { - "epoch": 64.27, - "learning_rate": 1.4558303886925793e-06, - "loss": 0.2591, - "step": 18510 - }, - { - "epoch": 64.3, - "learning_rate": 1.4544169611307419e-06, - "loss": 0.2448, - "step": 18520 - }, - { - "epoch": 64.34, - "learning_rate": 1.4530035335689045e-06, - "loss": 0.263, - "step": 18530 - }, - { - "epoch": 64.37, - "learning_rate": 1.451590106007067e-06, - "loss": 0.2527, - "step": 18540 - }, - { - "epoch": 64.41, - "learning_rate": 1.4501766784452295e-06, - "loss": 0.2668, - "step": 18550 - }, - { - "epoch": 64.44, - "learning_rate": 1.4487632508833921e-06, - "loss": 0.2316, - "step": 18560 - }, - { - "epoch": 64.48, - "learning_rate": 1.4473498233215546e-06, - "loss": 0.2757, - "step": 18570 - }, - { - "epoch": 64.51, - "learning_rate": 1.4459363957597172e-06, - "loss": 0.2749, - "step": 18580 - }, - { - "epoch": 64.55, - "learning_rate": 1.4445229681978798e-06, - "loss": 0.2537, - "step": 18590 - }, - { - "epoch": 64.58, - "learning_rate": 1.4431095406360422e-06, - "loss": 0.2663, - "step": 18600 - }, - { - "epoch": 64.62, - "learning_rate": 1.4416961130742048e-06, - "loss": 0.2525, - "step": 18610 - }, - { - "epoch": 64.65, - "learning_rate": 1.4402826855123675e-06, - "loss": 0.2669, - "step": 18620 - }, - { - "epoch": 64.69, - "learning_rate": 1.4388692579505299e-06, - "loss": 0.2724, - "step": 18630 - }, - { - "epoch": 64.72, - "learning_rate": 1.4374558303886925e-06, - "loss": 0.2506, - "step": 18640 - }, - { - "epoch": 64.75, - "learning_rate": 1.4360424028268549e-06, - "loss": 0.2458, - "step": 18650 - }, - { - "epoch": 64.79, - "learning_rate": 1.4346289752650175e-06, - "loss": 0.2545, - "step": 18660 - }, - { - "epoch": 64.82, - "learning_rate": 1.4332155477031801e-06, - "loss": 0.2623, - "step": 18670 - }, - { - "epoch": 64.86, - "learning_rate": 1.4318021201413425e-06, - "loss": 0.2512, - "step": 18680 - }, - { - "epoch": 64.89, - "learning_rate": 1.4303886925795052e-06, - "loss": 0.2394, - "step": 18690 - }, - { - "epoch": 64.93, - "learning_rate": 1.4289752650176678e-06, - "loss": 0.2602, - "step": 18700 - }, - { - "epoch": 64.96, - "learning_rate": 1.4275618374558302e-06, - "loss": 0.2483, - "step": 18710 - }, - { - "epoch": 65.0, - "learning_rate": 1.4261484098939928e-06, - "loss": 0.2567, - "step": 18720 - }, - { - "epoch": 65.0, - "eval_loss": 0.5072118043899536, - "eval_runtime": 134.0915, - "eval_samples_per_second": 3.967, - "eval_steps_per_second": 0.992, - "eval_wer": 0.19811017548370508, - "step": 18720 - }, - { - "epoch": 65.03, - "learning_rate": 1.4247349823321554e-06, - "loss": 0.2677, - "step": 18730 - }, - { - "epoch": 65.07, - "learning_rate": 1.4233215547703178e-06, - "loss": 0.2524, - "step": 18740 - }, - { - "epoch": 65.1, - "learning_rate": 1.4219081272084805e-06, - "loss": 0.2628, - "step": 18750 - }, - { - "epoch": 65.14, - "learning_rate": 1.420494699646643e-06, - "loss": 0.2743, - "step": 18760 - }, - { - "epoch": 65.17, - "learning_rate": 1.4190812720848055e-06, - "loss": 0.2692, - "step": 18770 - }, - { - "epoch": 65.21, - "learning_rate": 1.4176678445229681e-06, - "loss": 0.2551, - "step": 18780 - }, - { - "epoch": 65.24, - "learning_rate": 1.4162544169611305e-06, - "loss": 0.2416, - "step": 18790 - }, - { - "epoch": 65.28, - "learning_rate": 1.4148409893992932e-06, - "loss": 0.2516, - "step": 18800 - }, - { - "epoch": 65.31, - "learning_rate": 1.4134275618374558e-06, - "loss": 0.2842, - "step": 18810 - }, - { - "epoch": 65.35, - "learning_rate": 1.4120141342756182e-06, - "loss": 0.263, - "step": 18820 - }, - { - "epoch": 65.38, - "learning_rate": 1.4106007067137808e-06, - "loss": 0.2531, - "step": 18830 - }, - { - "epoch": 65.42, - "learning_rate": 1.4091872791519434e-06, - "loss": 0.2536, - "step": 18840 - }, - { - "epoch": 65.45, - "learning_rate": 1.4077738515901058e-06, - "loss": 0.2741, - "step": 18850 - }, - { - "epoch": 65.48, - "learning_rate": 1.4063604240282685e-06, - "loss": 0.2675, - "step": 18860 - }, - { - "epoch": 65.52, - "learning_rate": 1.404946996466431e-06, - "loss": 0.2597, - "step": 18870 - }, - { - "epoch": 65.55, - "learning_rate": 1.4035335689045935e-06, - "loss": 0.259, - "step": 18880 - }, - { - "epoch": 65.59, - "learning_rate": 1.4021201413427561e-06, - "loss": 0.2586, - "step": 18890 - }, - { - "epoch": 65.62, - "learning_rate": 1.4007067137809187e-06, - "loss": 0.2473, - "step": 18900 - }, - { - "epoch": 65.66, - "learning_rate": 1.3992932862190811e-06, - "loss": 0.2679, - "step": 18910 - }, - { - "epoch": 65.69, - "learning_rate": 1.3978798586572438e-06, - "loss": 0.2429, - "step": 18920 - }, - { - "epoch": 65.73, - "learning_rate": 1.3964664310954064e-06, - "loss": 0.2521, - "step": 18930 - }, - { - "epoch": 65.76, - "learning_rate": 1.3950530035335688e-06, - "loss": 0.2651, - "step": 18940 - }, - { - "epoch": 65.8, - "learning_rate": 1.3936395759717314e-06, - "loss": 0.243, - "step": 18950 - }, - { - "epoch": 65.83, - "learning_rate": 1.3922261484098938e-06, - "loss": 0.26, - "step": 18960 - }, - { - "epoch": 65.87, - "learning_rate": 1.3908127208480564e-06, - "loss": 0.2509, - "step": 18970 - }, - { - "epoch": 65.9, - "learning_rate": 1.389399293286219e-06, - "loss": 0.2528, - "step": 18980 - }, - { - "epoch": 65.94, - "learning_rate": 1.3879858657243815e-06, - "loss": 0.2602, - "step": 18990 - }, - { - "epoch": 65.97, - "learning_rate": 1.386572438162544e-06, - "loss": 0.2509, - "step": 19000 - }, - { - "epoch": 66.0, - "eval_loss": 0.5061087012290955, - "eval_runtime": 133.4932, - "eval_samples_per_second": 3.985, - "eval_steps_per_second": 0.996, - "eval_wer": 0.19778877675644405, - "step": 19008 - }, - { - "epoch": 66.01, - "learning_rate": 1.3851590106007067e-06, - "loss": 0.2801, - "step": 19010 - }, - { - "epoch": 66.04, - "learning_rate": 1.3837455830388691e-06, - "loss": 0.256, - "step": 19020 - }, - { - "epoch": 66.08, - "learning_rate": 1.3823321554770318e-06, - "loss": 0.2356, - "step": 19030 - }, - { - "epoch": 66.11, - "learning_rate": 1.3809187279151944e-06, - "loss": 0.2594, - "step": 19040 - }, - { - "epoch": 66.15, - "learning_rate": 1.3795053003533568e-06, - "loss": 0.2468, - "step": 19050 - }, - { - "epoch": 66.18, - "learning_rate": 1.3780918727915194e-06, - "loss": 0.2661, - "step": 19060 - }, - { - "epoch": 66.21, - "learning_rate": 1.376678445229682e-06, - "loss": 0.2664, - "step": 19070 - }, - { - "epoch": 66.25, - "learning_rate": 1.3752650176678444e-06, - "loss": 0.266, - "step": 19080 - }, - { - "epoch": 66.28, - "learning_rate": 1.373851590106007e-06, - "loss": 0.2531, - "step": 19090 - }, - { - "epoch": 66.32, - "learning_rate": 1.3724381625441695e-06, - "loss": 0.2631, - "step": 19100 - }, - { - "epoch": 66.35, - "learning_rate": 1.371024734982332e-06, - "loss": 0.2732, - "step": 19110 - }, - { - "epoch": 66.39, - "learning_rate": 1.3696113074204947e-06, - "loss": 0.2584, - "step": 19120 - }, - { - "epoch": 66.42, - "learning_rate": 1.3681978798586571e-06, - "loss": 0.2374, - "step": 19130 - }, - { - "epoch": 66.46, - "learning_rate": 1.3667844522968197e-06, - "loss": 0.2653, - "step": 19140 - }, - { - "epoch": 66.49, - "learning_rate": 1.3653710247349824e-06, - "loss": 0.2614, - "step": 19150 - }, - { - "epoch": 66.53, - "learning_rate": 1.3639575971731448e-06, - "loss": 0.2625, - "step": 19160 - }, - { - "epoch": 66.56, - "learning_rate": 1.3625441696113074e-06, - "loss": 0.2558, - "step": 19170 - }, - { - "epoch": 66.6, - "learning_rate": 1.36113074204947e-06, - "loss": 0.2759, - "step": 19180 - }, - { - "epoch": 66.63, - "learning_rate": 1.3597173144876324e-06, - "loss": 0.238, - "step": 19190 - }, - { - "epoch": 66.66, - "learning_rate": 1.358303886925795e-06, - "loss": 0.2661, - "step": 19200 - }, - { - "epoch": 66.7, - "learning_rate": 1.3568904593639577e-06, - "loss": 0.2439, - "step": 19210 - }, - { - "epoch": 66.73, - "learning_rate": 1.35547703180212e-06, - "loss": 0.251, - "step": 19220 - }, - { - "epoch": 66.77, - "learning_rate": 1.3540636042402827e-06, - "loss": 0.2693, - "step": 19230 - }, - { - "epoch": 66.8, - "learning_rate": 1.3526501766784453e-06, - "loss": 0.2361, - "step": 19240 - }, - { - "epoch": 66.84, - "learning_rate": 1.3512367491166077e-06, - "loss": 0.2761, - "step": 19250 - }, - { - "epoch": 66.87, - "learning_rate": 1.3498233215547703e-06, - "loss": 0.2546, - "step": 19260 - }, - { - "epoch": 66.91, - "learning_rate": 1.3484098939929328e-06, - "loss": 0.251, - "step": 19270 - }, - { - "epoch": 66.94, - "learning_rate": 1.3469964664310954e-06, - "loss": 0.2381, - "step": 19280 - }, - { - "epoch": 66.98, - "learning_rate": 1.345583038869258e-06, - "loss": 0.289, - "step": 19290 - }, - { - "epoch": 67.0, - "eval_loss": 0.5087379217147827, - "eval_runtime": 134.753, - "eval_samples_per_second": 3.948, - "eval_steps_per_second": 0.987, - "eval_wer": 0.19573182490197338, - "step": 19296 - }, - { - "epoch": 67.01, - "learning_rate": 1.3441696113074204e-06, - "loss": 0.255, - "step": 19300 - }, - { - "epoch": 67.05, - "learning_rate": 1.342756183745583e-06, - "loss": 0.2501, - "step": 19310 - }, - { - "epoch": 67.08, - "learning_rate": 1.3413427561837457e-06, - "loss": 0.2529, - "step": 19320 - }, - { - "epoch": 67.12, - "learning_rate": 1.339929328621908e-06, - "loss": 0.2559, - "step": 19330 - }, - { - "epoch": 67.15, - "learning_rate": 1.3385159010600707e-06, - "loss": 0.2783, - "step": 19340 - }, - { - "epoch": 67.19, - "learning_rate": 1.3371024734982333e-06, - "loss": 0.2495, - "step": 19350 - }, - { - "epoch": 67.22, - "learning_rate": 1.3356890459363957e-06, - "loss": 0.2414, - "step": 19360 - }, - { - "epoch": 67.26, - "learning_rate": 1.3342756183745583e-06, - "loss": 0.2584, - "step": 19370 - }, - { - "epoch": 67.29, - "learning_rate": 1.332862190812721e-06, - "loss": 0.2553, - "step": 19380 - }, - { - "epoch": 67.33, - "learning_rate": 1.3314487632508834e-06, - "loss": 0.2712, - "step": 19390 - }, - { - "epoch": 67.36, - "learning_rate": 1.330035335689046e-06, - "loss": 0.2593, - "step": 19400 - }, - { - "epoch": 67.39, - "learning_rate": 1.3286219081272084e-06, - "loss": 0.2656, - "step": 19410 - }, - { - "epoch": 67.43, - "learning_rate": 1.327208480565371e-06, - "loss": 0.237, - "step": 19420 - }, - { - "epoch": 67.46, - "learning_rate": 1.3257950530035336e-06, - "loss": 0.262, - "step": 19430 - }, - { - "epoch": 67.5, - "learning_rate": 1.324381625441696e-06, - "loss": 0.2545, - "step": 19440 - }, - { - "epoch": 67.53, - "learning_rate": 1.3229681978798587e-06, - "loss": 0.2582, - "step": 19450 - }, - { - "epoch": 67.57, - "learning_rate": 1.3215547703180213e-06, - "loss": 0.2508, - "step": 19460 - }, - { - "epoch": 67.6, - "learning_rate": 1.3201413427561837e-06, - "loss": 0.2401, - "step": 19470 - }, - { - "epoch": 67.64, - "learning_rate": 1.3187279151943463e-06, - "loss": 0.2543, - "step": 19480 - }, - { - "epoch": 67.67, - "learning_rate": 1.317314487632509e-06, - "loss": 0.2467, - "step": 19490 - }, - { - "epoch": 67.71, - "learning_rate": 1.3159010600706714e-06, - "loss": 0.2675, - "step": 19500 - }, - { - "epoch": 67.74, - "learning_rate": 1.314487632508834e-06, - "loss": 0.2792, - "step": 19510 - }, - { - "epoch": 67.78, - "learning_rate": 1.3130742049469966e-06, - "loss": 0.2734, - "step": 19520 - }, - { - "epoch": 67.81, - "learning_rate": 1.311660777385159e-06, - "loss": 0.2645, - "step": 19530 - }, - { - "epoch": 67.85, - "learning_rate": 1.3102473498233216e-06, - "loss": 0.284, - "step": 19540 - }, - { - "epoch": 67.88, - "learning_rate": 1.3088339222614842e-06, - "loss": 0.2687, - "step": 19550 - }, - { - "epoch": 67.91, - "learning_rate": 1.3074204946996464e-06, - "loss": 0.2661, - "step": 19560 - }, - { - "epoch": 67.95, - "learning_rate": 1.306007067137809e-06, - "loss": 0.2568, - "step": 19570 - }, - { - "epoch": 67.98, - "learning_rate": 1.3045936395759715e-06, - "loss": 0.2511, - "step": 19580 - }, - { - "epoch": 68.0, - "eval_loss": 0.516753077507019, - "eval_runtime": 134.5773, - "eval_samples_per_second": 3.953, - "eval_steps_per_second": 0.988, - "eval_wer": 0.1981744552291573, - "step": 19584 - }, - { - "epoch": 68.02, - "learning_rate": 1.303180212014134e-06, - "loss": 0.2656, - "step": 19590 - }, - { - "epoch": 68.06, - "learning_rate": 1.3017667844522967e-06, - "loss": 0.2578, - "step": 19600 - }, - { - "epoch": 68.09, - "learning_rate": 1.3003533568904591e-06, - "loss": 0.2424, - "step": 19610 - }, - { - "epoch": 68.12, - "learning_rate": 1.2989399293286217e-06, - "loss": 0.264, - "step": 19620 - }, - { - "epoch": 68.16, - "learning_rate": 1.2975265017667844e-06, - "loss": 0.2589, - "step": 19630 - }, - { - "epoch": 68.19, - "learning_rate": 1.2961130742049468e-06, - "loss": 0.2536, - "step": 19640 - }, - { - "epoch": 68.23, - "learning_rate": 1.2946996466431094e-06, - "loss": 0.2713, - "step": 19650 - }, - { - "epoch": 68.26, - "learning_rate": 1.293286219081272e-06, - "loss": 0.2517, - "step": 19660 - }, - { - "epoch": 68.3, - "learning_rate": 1.2918727915194344e-06, - "loss": 0.271, - "step": 19670 - }, - { - "epoch": 68.33, - "learning_rate": 1.290459363957597e-06, - "loss": 0.2754, - "step": 19680 - }, - { - "epoch": 68.37, - "learning_rate": 1.2890459363957597e-06, - "loss": 0.2486, - "step": 19690 - }, - { - "epoch": 68.4, - "learning_rate": 1.287632508833922e-06, - "loss": 0.2627, - "step": 19700 - }, - { - "epoch": 68.44, - "learning_rate": 1.2862190812720847e-06, - "loss": 0.2434, - "step": 19710 - }, - { - "epoch": 68.47, - "learning_rate": 1.2848056537102471e-06, - "loss": 0.2685, - "step": 19720 - }, - { - "epoch": 68.51, - "learning_rate": 1.2833922261484097e-06, - "loss": 0.2677, - "step": 19730 - }, - { - "epoch": 68.54, - "learning_rate": 1.2819787985865724e-06, - "loss": 0.2783, - "step": 19740 - }, - { - "epoch": 68.57, - "learning_rate": 1.2805653710247348e-06, - "loss": 0.2518, - "step": 19750 - }, - { - "epoch": 68.61, - "learning_rate": 1.2791519434628974e-06, - "loss": 0.2521, - "step": 19760 - }, - { - "epoch": 68.64, - "learning_rate": 1.27773851590106e-06, - "loss": 0.2613, - "step": 19770 - }, - { - "epoch": 68.68, - "learning_rate": 1.2763250883392224e-06, - "loss": 0.2718, - "step": 19780 - }, - { - "epoch": 68.71, - "learning_rate": 1.274911660777385e-06, - "loss": 0.2337, - "step": 19790 - }, - { - "epoch": 68.75, - "learning_rate": 1.2734982332155477e-06, - "loss": 0.2617, - "step": 19800 - }, - { - "epoch": 68.78, - "learning_rate": 1.27208480565371e-06, - "loss": 0.2588, - "step": 19810 - }, - { - "epoch": 68.82, - "learning_rate": 1.2706713780918727e-06, - "loss": 0.254, - "step": 19820 - }, - { - "epoch": 68.85, - "learning_rate": 1.2692579505300353e-06, - "loss": 0.2595, - "step": 19830 - }, - { - "epoch": 68.89, - "learning_rate": 1.2678445229681977e-06, - "loss": 0.2418, - "step": 19840 - }, - { - "epoch": 68.92, - "learning_rate": 1.2664310954063603e-06, - "loss": 0.2567, - "step": 19850 - }, - { - "epoch": 68.96, - "learning_rate": 1.265017667844523e-06, - "loss": 0.2671, - "step": 19860 - }, - { - "epoch": 68.99, - "learning_rate": 1.2636042402826854e-06, - "loss": 0.2623, - "step": 19870 - }, - { - "epoch": 69.0, - "eval_loss": 0.5109707117080688, - "eval_runtime": 133.3708, - "eval_samples_per_second": 3.989, - "eval_steps_per_second": 0.997, - "eval_wer": 0.1958603843928778, - "step": 19872 - }, - { - "epoch": 69.03, - "learning_rate": 1.262190812720848e-06, - "loss": 0.2721, - "step": 19880 - }, - { - "epoch": 69.06, - "learning_rate": 1.2607773851590104e-06, - "loss": 0.2508, - "step": 19890 - }, - { - "epoch": 69.1, - "learning_rate": 1.259363957597173e-06, - "loss": 0.2522, - "step": 19900 - }, - { - "epoch": 69.13, - "learning_rate": 1.2579505300353356e-06, - "loss": 0.2842, - "step": 19910 - }, - { - "epoch": 69.17, - "learning_rate": 1.256537102473498e-06, - "loss": 0.2641, - "step": 19920 - }, - { - "epoch": 69.2, - "learning_rate": 1.2551236749116607e-06, - "loss": 0.2427, - "step": 19930 - }, - { - "epoch": 69.24, - "learning_rate": 1.2537102473498233e-06, - "loss": 0.2805, - "step": 19940 - }, - { - "epoch": 69.27, - "learning_rate": 1.2522968197879857e-06, - "loss": 0.254, - "step": 19950 - }, - { - "epoch": 69.3, - "learning_rate": 1.2508833922261483e-06, - "loss": 0.2651, - "step": 19960 - }, - { - "epoch": 69.34, - "learning_rate": 1.249469964664311e-06, - "loss": 0.2748, - "step": 19970 - }, - { - "epoch": 69.37, - "learning_rate": 1.2480565371024734e-06, - "loss": 0.2592, - "step": 19980 - }, - { - "epoch": 69.41, - "learning_rate": 1.246643109540636e-06, - "loss": 0.2652, - "step": 19990 - }, - { - "epoch": 69.44, - "learning_rate": 1.2452296819787986e-06, - "loss": 0.2382, - "step": 20000 - }, - { - "epoch": 69.48, - "learning_rate": 1.243816254416961e-06, - "loss": 0.2769, - "step": 20010 - }, - { - "epoch": 69.51, - "learning_rate": 1.2424028268551236e-06, - "loss": 0.2448, - "step": 20020 - }, - { - "epoch": 69.55, - "learning_rate": 1.240989399293286e-06, - "loss": 0.2392, - "step": 20030 - }, - { - "epoch": 69.58, - "learning_rate": 1.2395759717314487e-06, - "loss": 0.2546, - "step": 20040 - }, - { - "epoch": 69.62, - "learning_rate": 1.2381625441696113e-06, - "loss": 0.2472, - "step": 20050 - }, - { - "epoch": 69.65, - "learning_rate": 1.2367491166077737e-06, - "loss": 0.2772, - "step": 20060 - }, - { - "epoch": 69.69, - "learning_rate": 1.2353356890459363e-06, - "loss": 0.2799, - "step": 20070 - }, - { - "epoch": 69.72, - "learning_rate": 1.233922261484099e-06, - "loss": 0.2458, - "step": 20080 - }, - { - "epoch": 69.75, - "learning_rate": 1.2325088339222613e-06, - "loss": 0.2776, - "step": 20090 - }, - { - "epoch": 69.79, - "learning_rate": 1.231095406360424e-06, - "loss": 0.2571, - "step": 20100 - }, - { - "epoch": 69.82, - "learning_rate": 1.2296819787985866e-06, - "loss": 0.2464, - "step": 20110 - }, - { - "epoch": 69.86, - "learning_rate": 1.228268551236749e-06, - "loss": 0.2765, - "step": 20120 - }, - { - "epoch": 69.89, - "learning_rate": 1.2268551236749116e-06, - "loss": 0.2443, - "step": 20130 - }, - { - "epoch": 69.93, - "learning_rate": 1.2254416961130742e-06, - "loss": 0.2432, - "step": 20140 - }, - { - "epoch": 69.96, - "learning_rate": 1.2240282685512367e-06, - "loss": 0.2482, - "step": 20150 - }, - { - "epoch": 70.0, - "learning_rate": 1.2226148409893993e-06, - "loss": 0.2762, - "step": 20160 - }, - { - "epoch": 70.0, - "eval_loss": 0.5123195648193359, - "eval_runtime": 133.6748, - "eval_samples_per_second": 3.98, - "eval_steps_per_second": 0.995, - "eval_wer": 0.19592466413833, - "step": 20160 - }, - { - "epoch": 70.03, - "learning_rate": 1.221201413427562e-06, - "loss": 0.2698, - "step": 20170 - }, - { - "epoch": 70.07, - "learning_rate": 1.2197879858657243e-06, - "loss": 0.231, - "step": 20180 - }, - { - "epoch": 70.1, - "learning_rate": 1.218374558303887e-06, - "loss": 0.2392, - "step": 20190 - }, - { - "epoch": 70.14, - "learning_rate": 1.2169611307420493e-06, - "loss": 0.2549, - "step": 20200 - }, - { - "epoch": 70.17, - "learning_rate": 1.215547703180212e-06, - "loss": 0.2701, - "step": 20210 - }, - { - "epoch": 70.21, - "learning_rate": 1.2141342756183746e-06, - "loss": 0.2526, - "step": 20220 - }, - { - "epoch": 70.24, - "learning_rate": 1.212720848056537e-06, - "loss": 0.2654, - "step": 20230 - }, - { - "epoch": 70.28, - "learning_rate": 1.2113074204946996e-06, - "loss": 0.2659, - "step": 20240 - }, - { - "epoch": 70.31, - "learning_rate": 1.2098939929328622e-06, - "loss": 0.2583, - "step": 20250 - }, - { - "epoch": 70.35, - "learning_rate": 1.2084805653710246e-06, - "loss": 0.2559, - "step": 20260 - }, - { - "epoch": 70.38, - "learning_rate": 1.2070671378091873e-06, - "loss": 0.2498, - "step": 20270 - }, - { - "epoch": 70.42, - "learning_rate": 1.2056537102473499e-06, - "loss": 0.2515, - "step": 20280 - }, - { - "epoch": 70.45, - "learning_rate": 1.2042402826855123e-06, - "loss": 0.2389, - "step": 20290 - }, - { - "epoch": 70.48, - "learning_rate": 1.202826855123675e-06, - "loss": 0.2793, - "step": 20300 - }, - { - "epoch": 70.52, - "learning_rate": 1.2014134275618375e-06, - "loss": 0.2548, - "step": 20310 - }, - { - "epoch": 70.55, - "learning_rate": 1.2e-06, - "loss": 0.243, - "step": 20320 - }, - { - "epoch": 70.59, - "learning_rate": 1.1985865724381626e-06, - "loss": 0.2314, - "step": 20330 - }, - { - "epoch": 70.62, - "learning_rate": 1.197173144876325e-06, - "loss": 0.2416, - "step": 20340 - }, - { - "epoch": 70.66, - "learning_rate": 1.1957597173144876e-06, - "loss": 0.2705, - "step": 20350 - }, - { - "epoch": 70.69, - "learning_rate": 1.1943462897526502e-06, - "loss": 0.2564, - "step": 20360 - }, - { - "epoch": 70.73, - "learning_rate": 1.1929328621908126e-06, - "loss": 0.2683, - "step": 20370 - }, - { - "epoch": 70.76, - "learning_rate": 1.1915194346289753e-06, - "loss": 0.2626, - "step": 20380 - }, - { - "epoch": 70.8, - "learning_rate": 1.1901060070671379e-06, - "loss": 0.2484, - "step": 20390 - }, - { - "epoch": 70.83, - "learning_rate": 1.1886925795053003e-06, - "loss": 0.2649, - "step": 20400 - }, - { - "epoch": 70.87, - "learning_rate": 1.187279151943463e-06, - "loss": 0.255, - "step": 20410 - }, - { - "epoch": 70.9, - "learning_rate": 1.1858657243816255e-06, - "loss": 0.253, - "step": 20420 - }, - { - "epoch": 70.94, - "learning_rate": 1.184452296819788e-06, - "loss": 0.2373, - "step": 20430 - }, - { - "epoch": 70.97, - "learning_rate": 1.1830388692579506e-06, - "loss": 0.2704, - "step": 20440 - }, - { - "epoch": 71.0, - "eval_loss": 0.5117577314376831, - "eval_runtime": 133.058, - "eval_samples_per_second": 3.998, - "eval_steps_per_second": 1.0, - "eval_wer": 0.1965674615928521, - "step": 20448 - }, - { - "epoch": 71.01, - "learning_rate": 1.1816254416961132e-06, - "loss": 0.2783, - "step": 20450 - }, - { - "epoch": 71.04, - "learning_rate": 1.1802120141342756e-06, - "loss": 0.2665, - "step": 20460 - }, - { - "epoch": 71.08, - "learning_rate": 1.1787985865724382e-06, - "loss": 0.2626, - "step": 20470 - }, - { - "epoch": 71.11, - "learning_rate": 1.1773851590106008e-06, - "loss": 0.2544, - "step": 20480 - }, - { - "epoch": 71.15, - "learning_rate": 1.1759717314487632e-06, - "loss": 0.2526, - "step": 20490 - }, - { - "epoch": 71.18, - "learning_rate": 1.1745583038869259e-06, - "loss": 0.2749, - "step": 20500 - }, - { - "epoch": 71.21, - "learning_rate": 1.1731448763250883e-06, - "loss": 0.2545, - "step": 20510 - }, - { - "epoch": 71.25, - "learning_rate": 1.1717314487632509e-06, - "loss": 0.2475, - "step": 20520 - }, - { - "epoch": 71.28, - "learning_rate": 1.1703180212014135e-06, - "loss": 0.2502, - "step": 20530 - }, - { - "epoch": 71.32, - "learning_rate": 1.168904593639576e-06, - "loss": 0.2452, - "step": 20540 - }, - { - "epoch": 71.35, - "learning_rate": 1.1676325088339224e-06, - "loss": 0.2562, - "step": 20550 - }, - { - "epoch": 71.39, - "learning_rate": 1.1662190812720846e-06, - "loss": 0.2364, - "step": 20560 - }, - { - "epoch": 71.42, - "learning_rate": 1.1648056537102472e-06, - "loss": 0.2529, - "step": 20570 - }, - { - "epoch": 71.46, - "learning_rate": 1.1633922261484098e-06, - "loss": 0.2561, - "step": 20580 - }, - { - "epoch": 71.49, - "learning_rate": 1.1619787985865722e-06, - "loss": 0.2726, - "step": 20590 - }, - { - "epoch": 71.53, - "learning_rate": 1.1605653710247349e-06, - "loss": 0.2774, - "step": 20600 - }, - { - "epoch": 71.56, - "learning_rate": 1.1591519434628975e-06, - "loss": 0.2541, - "step": 20610 - }, - { - "epoch": 71.6, - "learning_rate": 1.1577385159010599e-06, - "loss": 0.2512, - "step": 20620 - }, - { - "epoch": 71.63, - "learning_rate": 1.1563250883392225e-06, - "loss": 0.2532, - "step": 20630 - }, - { - "epoch": 71.66, - "learning_rate": 1.154911660777385e-06, - "loss": 0.2639, - "step": 20640 - }, - { - "epoch": 71.7, - "learning_rate": 1.1534982332155475e-06, - "loss": 0.2573, - "step": 20650 - }, - { - "epoch": 71.73, - "learning_rate": 1.1520848056537102e-06, - "loss": 0.2662, - "step": 20660 - }, - { - "epoch": 71.77, - "learning_rate": 1.1506713780918726e-06, - "loss": 0.2486, - "step": 20670 - }, - { - "epoch": 71.8, - "learning_rate": 1.1492579505300352e-06, - "loss": 0.2563, - "step": 20680 - }, - { - "epoch": 71.84, - "learning_rate": 1.1478445229681978e-06, - "loss": 0.2631, - "step": 20690 - }, - { - "epoch": 71.87, - "learning_rate": 1.1464310954063602e-06, - "loss": 0.2697, - "step": 20700 - }, - { - "epoch": 71.91, - "learning_rate": 1.1450176678445228e-06, - "loss": 0.2478, - "step": 20710 - }, - { - "epoch": 71.94, - "learning_rate": 1.1436042402826855e-06, - "loss": 0.2436, - "step": 20720 - }, - { - "epoch": 71.98, - "learning_rate": 1.1421908127208479e-06, - "loss": 0.2854, - "step": 20730 - }, - { - "epoch": 72.0, - "eval_loss": 0.5127651691436768, - "eval_runtime": 133.8804, - "eval_samples_per_second": 3.974, - "eval_steps_per_second": 0.993, - "eval_wer": 0.1948961882110947, - "step": 20736 - }, - { - "epoch": 72.01, - "learning_rate": 1.1407773851590105e-06, - "loss": 0.2796, - "step": 20740 - }, - { - "epoch": 72.05, - "learning_rate": 1.1393639575971731e-06, - "loss": 0.2772, - "step": 20750 - }, - { - "epoch": 72.08, - "learning_rate": 1.1379505300353355e-06, - "loss": 0.2524, - "step": 20760 - }, - { - "epoch": 72.12, - "learning_rate": 1.1365371024734981e-06, - "loss": 0.2331, - "step": 20770 - }, - { - "epoch": 72.15, - "learning_rate": 1.1351236749116608e-06, - "loss": 0.2678, - "step": 20780 - }, - { - "epoch": 72.19, - "learning_rate": 1.1337102473498232e-06, - "loss": 0.2769, - "step": 20790 - }, - { - "epoch": 72.22, - "learning_rate": 1.1322968197879858e-06, - "loss": 0.2535, - "step": 20800 - }, - { - "epoch": 72.26, - "learning_rate": 1.1308833922261482e-06, - "loss": 0.2478, - "step": 20810 - }, - { - "epoch": 72.29, - "learning_rate": 1.1294699646643108e-06, - "loss": 0.2383, - "step": 20820 - }, - { - "epoch": 72.33, - "learning_rate": 1.1280565371024735e-06, - "loss": 0.2699, - "step": 20830 - }, - { - "epoch": 72.36, - "learning_rate": 1.1266431095406359e-06, - "loss": 0.2635, - "step": 20840 - }, - { - "epoch": 72.39, - "learning_rate": 1.1252296819787985e-06, - "loss": 0.2566, - "step": 20850 - }, - { - "epoch": 72.43, - "learning_rate": 1.123816254416961e-06, - "loss": 0.2414, - "step": 20860 - }, - { - "epoch": 72.46, - "learning_rate": 1.1224028268551235e-06, - "loss": 0.2522, - "step": 20870 - }, - { - "epoch": 72.5, - "learning_rate": 1.1209893992932861e-06, - "loss": 0.2483, - "step": 20880 - }, - { - "epoch": 72.53, - "learning_rate": 1.1195759717314488e-06, - "loss": 0.2597, - "step": 20890 - }, - { - "epoch": 72.57, - "learning_rate": 1.1181625441696112e-06, - "loss": 0.2576, - "step": 20900 - }, - { - "epoch": 72.6, - "learning_rate": 1.1167491166077738e-06, - "loss": 0.2525, - "step": 20910 - }, - { - "epoch": 72.64, - "learning_rate": 1.1153356890459364e-06, - "loss": 0.2679, - "step": 20920 - }, - { - "epoch": 72.67, - "learning_rate": 1.1139222614840988e-06, - "loss": 0.2634, - "step": 20930 - }, - { - "epoch": 72.71, - "learning_rate": 1.1125088339222614e-06, - "loss": 0.2325, - "step": 20940 - }, - { - "epoch": 72.74, - "learning_rate": 1.1110954063604238e-06, - "loss": 0.2625, - "step": 20950 - }, - { - "epoch": 72.78, - "learning_rate": 1.1096819787985865e-06, - "loss": 0.2442, - "step": 20960 - }, - { - "epoch": 72.81, - "learning_rate": 1.108268551236749e-06, - "loss": 0.2651, - "step": 20970 - }, - { - "epoch": 72.85, - "learning_rate": 1.1068551236749115e-06, - "loss": 0.2531, - "step": 20980 - }, - { - "epoch": 72.88, - "learning_rate": 1.1054416961130741e-06, - "loss": 0.2444, - "step": 20990 - }, - { - "epoch": 72.91, - "learning_rate": 1.1040282685512367e-06, - "loss": 0.2735, - "step": 21000 - }, - { - "epoch": 72.95, - "learning_rate": 1.1026148409893992e-06, - "loss": 0.2528, - "step": 21010 - }, - { - "epoch": 72.98, - "learning_rate": 1.1012014134275618e-06, - "loss": 0.2602, - "step": 21020 - }, - { - "epoch": 73.0, - "eval_loss": 0.5094349384307861, - "eval_runtime": 134.0533, - "eval_samples_per_second": 3.969, - "eval_steps_per_second": 0.992, - "eval_wer": 0.1966317413383043, - "step": 21024 - }, - { - "epoch": 73.02, - "learning_rate": 1.0997879858657244e-06, - "loss": 0.2639, - "step": 21030 - }, - { - "epoch": 73.06, - "learning_rate": 1.0983745583038868e-06, - "loss": 0.2614, - "step": 21040 - }, - { - "epoch": 73.09, - "learning_rate": 1.0969611307420494e-06, - "loss": 0.2265, - "step": 21050 - }, - { - "epoch": 73.12, - "learning_rate": 1.095547703180212e-06, - "loss": 0.2721, - "step": 21060 - }, - { - "epoch": 73.16, - "learning_rate": 1.0941342756183745e-06, - "loss": 0.2645, - "step": 21070 - }, - { - "epoch": 73.19, - "learning_rate": 1.092720848056537e-06, - "loss": 0.2381, - "step": 21080 - }, - { - "epoch": 73.23, - "learning_rate": 1.0913074204946997e-06, - "loss": 0.2458, - "step": 21090 - }, - { - "epoch": 73.26, - "learning_rate": 1.0898939929328621e-06, - "loss": 0.2378, - "step": 21100 - }, - { - "epoch": 73.3, - "learning_rate": 1.0884805653710247e-06, - "loss": 0.2567, - "step": 21110 - }, - { - "epoch": 73.33, - "learning_rate": 1.0870671378091871e-06, - "loss": 0.264, - "step": 21120 - }, - { - "epoch": 73.37, - "learning_rate": 1.0856537102473498e-06, - "loss": 0.2563, - "step": 21130 - }, - { - "epoch": 73.4, - "learning_rate": 1.0842402826855124e-06, - "loss": 0.2683, - "step": 21140 - }, - { - "epoch": 73.44, - "learning_rate": 1.0828268551236748e-06, - "loss": 0.2692, - "step": 21150 - }, - { - "epoch": 73.47, - "learning_rate": 1.0814134275618374e-06, - "loss": 0.2751, - "step": 21160 - }, - { - "epoch": 73.51, - "learning_rate": 1.08e-06, - "loss": 0.2638, - "step": 21170 - }, - { - "epoch": 73.54, - "learning_rate": 1.0785865724381624e-06, - "loss": 0.2333, - "step": 21180 - }, - { - "epoch": 73.57, - "learning_rate": 1.077173144876325e-06, - "loss": 0.2784, - "step": 21190 - }, - { - "epoch": 73.61, - "learning_rate": 1.0757597173144877e-06, - "loss": 0.2539, - "step": 21200 - }, - { - "epoch": 73.64, - "learning_rate": 1.07434628975265e-06, - "loss": 0.2442, - "step": 21210 - }, - { - "epoch": 73.68, - "learning_rate": 1.0729328621908127e-06, - "loss": 0.2633, - "step": 21220 - }, - { - "epoch": 73.71, - "learning_rate": 1.0715194346289753e-06, - "loss": 0.2318, - "step": 21230 - }, - { - "epoch": 73.75, - "learning_rate": 1.0701060070671377e-06, - "loss": 0.259, - "step": 21240 - }, - { - "epoch": 73.78, - "learning_rate": 1.0686925795053004e-06, - "loss": 0.2351, - "step": 21250 - }, - { - "epoch": 73.82, - "learning_rate": 1.0672791519434628e-06, - "loss": 0.2904, - "step": 21260 - }, - { - "epoch": 73.85, - "learning_rate": 1.0658657243816254e-06, - "loss": 0.2636, - "step": 21270 - }, - { - "epoch": 73.89, - "learning_rate": 1.064452296819788e-06, - "loss": 0.2746, - "step": 21280 - }, - { - "epoch": 73.92, - "learning_rate": 1.0630388692579504e-06, - "loss": 0.2249, - "step": 21290 - }, - { - "epoch": 73.96, - "learning_rate": 1.061625441696113e-06, - "loss": 0.257, - "step": 21300 - }, - { - "epoch": 73.99, - "learning_rate": 1.0602120141342757e-06, - "loss": 0.2675, - "step": 21310 - }, - { - "epoch": 74.0, - "eval_loss": 0.5058467388153076, - "eval_runtime": 133.957, - "eval_samples_per_second": 3.971, - "eval_steps_per_second": 0.993, - "eval_wer": 0.19605322362923444, - "step": 21312 - }, - { - "epoch": 74.03, - "learning_rate": 1.058798586572438e-06, - "loss": 0.2531, - "step": 21320 - }, - { - "epoch": 74.06, - "learning_rate": 1.0573851590106007e-06, - "loss": 0.241, - "step": 21330 - }, - { - "epoch": 74.1, - "learning_rate": 1.0559717314487633e-06, - "loss": 0.2388, - "step": 21340 - }, - { - "epoch": 74.13, - "learning_rate": 1.0545583038869257e-06, - "loss": 0.2513, - "step": 21350 - }, - { - "epoch": 74.17, - "learning_rate": 1.0531448763250884e-06, - "loss": 0.2672, - "step": 21360 - }, - { - "epoch": 74.2, - "learning_rate": 1.051731448763251e-06, - "loss": 0.2415, - "step": 21370 - }, - { - "epoch": 74.24, - "learning_rate": 1.0503180212014134e-06, - "loss": 0.2492, - "step": 21380 - }, - { - "epoch": 74.27, - "learning_rate": 1.048904593639576e-06, - "loss": 0.2421, - "step": 21390 - }, - { - "epoch": 74.3, - "learning_rate": 1.0474911660777386e-06, - "loss": 0.2926, - "step": 21400 - }, - { - "epoch": 74.34, - "learning_rate": 1.046077738515901e-06, - "loss": 0.2639, - "step": 21410 - }, - { - "epoch": 74.37, - "learning_rate": 1.0446643109540637e-06, - "loss": 0.2357, - "step": 21420 - }, - { - "epoch": 74.41, - "learning_rate": 1.043250883392226e-06, - "loss": 0.2707, - "step": 21430 - }, - { - "epoch": 74.44, - "learning_rate": 1.0418374558303887e-06, - "loss": 0.2426, - "step": 21440 - }, - { - "epoch": 74.48, - "learning_rate": 1.0404240282685513e-06, - "loss": 0.2743, - "step": 21450 - }, - { - "epoch": 74.51, - "learning_rate": 1.0390106007067137e-06, - "loss": 0.2739, - "step": 21460 - }, - { - "epoch": 74.55, - "learning_rate": 1.0375971731448763e-06, - "loss": 0.2391, - "step": 21470 - }, - { - "epoch": 74.58, - "learning_rate": 1.036183745583039e-06, - "loss": 0.2781, - "step": 21480 - }, - { - "epoch": 74.62, - "learning_rate": 1.0347703180212014e-06, - "loss": 0.2666, - "step": 21490 - }, - { - "epoch": 74.65, - "learning_rate": 1.033356890459364e-06, - "loss": 0.2484, - "step": 21500 - }, - { - "epoch": 74.69, - "learning_rate": 1.0319434628975266e-06, - "loss": 0.2529, - "step": 21510 - }, - { - "epoch": 74.72, - "learning_rate": 1.030530035335689e-06, - "loss": 0.2447, - "step": 21520 - }, - { - "epoch": 74.75, - "learning_rate": 1.0291166077738516e-06, - "loss": 0.2399, - "step": 21530 - }, - { - "epoch": 74.79, - "learning_rate": 1.0277031802120143e-06, - "loss": 0.2519, - "step": 21540 - }, - { - "epoch": 74.82, - "learning_rate": 1.0262897526501767e-06, - "loss": 0.2689, - "step": 21550 - }, - { - "epoch": 74.86, - "learning_rate": 1.0248763250883393e-06, - "loss": 0.2558, - "step": 21560 - }, - { - "epoch": 74.89, - "learning_rate": 1.0234628975265017e-06, - "loss": 0.2466, - "step": 21570 - }, - { - "epoch": 74.93, - "learning_rate": 1.0220494699646643e-06, - "loss": 0.2463, - "step": 21580 - }, - { - "epoch": 74.96, - "learning_rate": 1.020636042402827e-06, - "loss": 0.2776, - "step": 21590 - }, - { - "epoch": 75.0, - "learning_rate": 1.0192226148409894e-06, - "loss": 0.2519, - "step": 21600 - }, - { - "epoch": 75.0, - "eval_loss": 0.5216230750083923, - "eval_runtime": 133.9162, - "eval_samples_per_second": 3.973, - "eval_steps_per_second": 0.993, - "eval_wer": 0.19875297293822716, - "step": 21600 - }, - { - "epoch": 75.03, - "learning_rate": 1.017809187279152e-06, - "loss": 0.2963, - "step": 21610 - }, - { - "epoch": 75.07, - "learning_rate": 1.0163957597173146e-06, - "loss": 0.2578, - "step": 21620 - }, - { - "epoch": 75.1, - "learning_rate": 1.0149823321554768e-06, - "loss": 0.2693, - "step": 21630 - }, - { - "epoch": 75.14, - "learning_rate": 1.0135689045936394e-06, - "loss": 0.2924, - "step": 21640 - }, - { - "epoch": 75.17, - "learning_rate": 1.012155477031802e-06, - "loss": 0.2423, - "step": 21650 - }, - { - "epoch": 75.21, - "learning_rate": 1.0107420494699645e-06, - "loss": 0.2563, - "step": 21660 - }, - { - "epoch": 75.24, - "learning_rate": 1.009328621908127e-06, - "loss": 0.267, - "step": 21670 - }, - { - "epoch": 75.28, - "learning_rate": 1.0079151943462897e-06, - "loss": 0.2634, - "step": 21680 - }, - { - "epoch": 75.31, - "learning_rate": 1.0065017667844521e-06, - "loss": 0.2661, - "step": 21690 - }, - { - "epoch": 75.35, - "learning_rate": 1.0050883392226147e-06, - "loss": 0.2425, - "step": 21700 - }, - { - "epoch": 75.38, - "learning_rate": 1.0036749116607774e-06, - "loss": 0.2592, - "step": 21710 - }, - { - "epoch": 75.42, - "learning_rate": 1.0022614840989398e-06, - "loss": 0.236, - "step": 21720 - }, - { - "epoch": 75.45, - "learning_rate": 1.0008480565371024e-06, - "loss": 0.2506, - "step": 21730 - }, - { - "epoch": 75.48, - "learning_rate": 9.99434628975265e-07, - "loss": 0.2746, - "step": 21740 - }, - { - "epoch": 75.52, - "learning_rate": 9.980212014134274e-07, - "loss": 0.2696, - "step": 21750 - }, - { - "epoch": 75.55, - "learning_rate": 9.9660777385159e-07, - "loss": 0.249, - "step": 21760 - }, - { - "epoch": 75.59, - "learning_rate": 9.951943462897527e-07, - "loss": 0.2845, - "step": 21770 - }, - { - "epoch": 75.62, - "learning_rate": 9.93780918727915e-07, - "loss": 0.2298, - "step": 21780 - }, - { - "epoch": 75.66, - "learning_rate": 9.923674911660777e-07, - "loss": 0.2675, - "step": 21790 - }, - { - "epoch": 75.69, - "learning_rate": 9.909540636042403e-07, - "loss": 0.2734, - "step": 21800 - }, - { - "epoch": 75.73, - "learning_rate": 9.895406360424027e-07, - "loss": 0.244, - "step": 21810 - }, - { - "epoch": 75.76, - "learning_rate": 9.881272084805653e-07, - "loss": 0.2333, - "step": 21820 - }, - { - "epoch": 75.8, - "learning_rate": 9.86713780918728e-07, - "loss": 0.226, - "step": 21830 - }, - { - "epoch": 75.83, - "learning_rate": 9.853003533568904e-07, - "loss": 0.2542, - "step": 21840 - }, - { - "epoch": 75.87, - "learning_rate": 9.83886925795053e-07, - "loss": 0.283, - "step": 21850 - }, - { - "epoch": 75.9, - "learning_rate": 9.824734982332154e-07, - "loss": 0.2332, - "step": 21860 - }, - { - "epoch": 75.94, - "learning_rate": 9.81060070671378e-07, - "loss": 0.2518, - "step": 21870 - }, - { - "epoch": 75.97, - "learning_rate": 9.796466431095406e-07, - "loss": 0.2666, - "step": 21880 - }, - { - "epoch": 76.0, - "eval_loss": 0.5116772651672363, - "eval_runtime": 134.0532, - "eval_samples_per_second": 3.969, - "eval_steps_per_second": 0.992, - "eval_wer": 0.1958603843928778, - "step": 21888 - }, - { - "epoch": 76.01, - "learning_rate": 9.78233215547703e-07, - "loss": 0.2766, - "step": 21890 - }, - { - "epoch": 76.04, - "learning_rate": 9.768197879858657e-07, - "loss": 0.2281, - "step": 21900 - }, - { - "epoch": 76.08, - "learning_rate": 9.754063604240283e-07, - "loss": 0.2703, - "step": 21910 - }, - { - "epoch": 76.11, - "learning_rate": 9.739929328621907e-07, - "loss": 0.258, - "step": 21920 - }, - { - "epoch": 76.15, - "learning_rate": 9.725795053003533e-07, - "loss": 0.2614, - "step": 21930 - }, - { - "epoch": 76.18, - "learning_rate": 9.71166077738516e-07, - "loss": 0.2773, - "step": 21940 - }, - { - "epoch": 76.21, - "learning_rate": 9.697526501766784e-07, - "loss": 0.2701, - "step": 21950 - }, - { - "epoch": 76.25, - "learning_rate": 9.68339222614841e-07, - "loss": 0.2416, - "step": 21960 - }, - { - "epoch": 76.28, - "learning_rate": 9.669257950530036e-07, - "loss": 0.2547, - "step": 21970 - }, - { - "epoch": 76.32, - "learning_rate": 9.65512367491166e-07, - "loss": 0.2483, - "step": 21980 - }, - { - "epoch": 76.35, - "learning_rate": 9.640989399293286e-07, - "loss": 0.2473, - "step": 21990 - }, - { - "epoch": 76.39, - "learning_rate": 9.62685512367491e-07, - "loss": 0.2471, - "step": 22000 - }, - { - "epoch": 76.42, - "learning_rate": 9.612720848056537e-07, - "loss": 0.2323, - "step": 22010 - }, - { - "epoch": 76.46, - "learning_rate": 9.598586572438163e-07, - "loss": 0.276, - "step": 22020 - }, - { - "epoch": 76.49, - "learning_rate": 9.584452296819787e-07, - "loss": 0.2644, - "step": 22030 - }, - { - "epoch": 76.53, - "learning_rate": 9.570318021201413e-07, - "loss": 0.2605, - "step": 22040 - }, - { - "epoch": 76.56, - "learning_rate": 9.55618374558304e-07, - "loss": 0.2717, - "step": 22050 - }, - { - "epoch": 76.6, - "learning_rate": 9.542049469964663e-07, - "loss": 0.2534, - "step": 22060 - }, - { - "epoch": 76.63, - "learning_rate": 9.52791519434629e-07, - "loss": 0.2359, - "step": 22070 - }, - { - "epoch": 76.66, - "learning_rate": 9.513780918727915e-07, - "loss": 0.2806, - "step": 22080 - }, - { - "epoch": 76.7, - "learning_rate": 9.49964664310954e-07, - "loss": 0.2575, - "step": 22090 - }, - { - "epoch": 76.73, - "learning_rate": 9.485512367491165e-07, - "loss": 0.2439, - "step": 22100 - }, - { - "epoch": 76.77, - "learning_rate": 9.471378091872791e-07, - "loss": 0.2618, - "step": 22110 - }, - { - "epoch": 76.8, - "learning_rate": 9.457243816254416e-07, - "loss": 0.2445, - "step": 22120 - }, - { - "epoch": 76.84, - "learning_rate": 9.443109540636042e-07, - "loss": 0.2525, - "step": 22130 - }, - { - "epoch": 76.87, - "learning_rate": 9.428975265017668e-07, - "loss": 0.2441, - "step": 22140 - }, - { - "epoch": 76.91, - "learning_rate": 9.414840989399293e-07, - "loss": 0.259, - "step": 22150 - }, - { - "epoch": 76.94, - "learning_rate": 9.400706713780918e-07, - "loss": 0.2506, - "step": 22160 - }, - { - "epoch": 76.98, - "learning_rate": 9.386572438162543e-07, - "loss": 0.2637, - "step": 22170 - }, - { - "epoch": 77.0, - "eval_loss": 0.5057582259178162, - "eval_runtime": 134.4046, - "eval_samples_per_second": 3.958, - "eval_steps_per_second": 0.99, - "eval_wer": 0.19566754515652118, - "step": 22176 - }, - { - "epoch": 77.01, - "learning_rate": 9.37243816254417e-07, - "loss": 0.2561, - "step": 22180 - }, - { - "epoch": 77.05, - "learning_rate": 9.358303886925795e-07, - "loss": 0.2573, - "step": 22190 - }, - { - "epoch": 77.08, - "learning_rate": 9.34416961130742e-07, - "loss": 0.2447, - "step": 22200 - }, - { - "epoch": 77.12, - "learning_rate": 9.330035335689046e-07, - "loss": 0.2532, - "step": 22210 - }, - { - "epoch": 77.15, - "learning_rate": 9.315901060070671e-07, - "loss": 0.2602, - "step": 22220 - }, - { - "epoch": 77.19, - "learning_rate": 9.301766784452296e-07, - "loss": 0.2541, - "step": 22230 - }, - { - "epoch": 77.22, - "learning_rate": 9.287632508833922e-07, - "loss": 0.2406, - "step": 22240 - }, - { - "epoch": 77.26, - "learning_rate": 9.273498233215548e-07, - "loss": 0.2469, - "step": 22250 - }, - { - "epoch": 77.29, - "learning_rate": 9.259363957597173e-07, - "loss": 0.2633, - "step": 22260 - }, - { - "epoch": 77.33, - "learning_rate": 9.245229681978798e-07, - "loss": 0.2607, - "step": 22270 - }, - { - "epoch": 77.36, - "learning_rate": 9.231095406360424e-07, - "loss": 0.2627, - "step": 22280 - }, - { - "epoch": 77.39, - "learning_rate": 9.216961130742049e-07, - "loss": 0.2787, - "step": 22290 - }, - { - "epoch": 77.43, - "learning_rate": 9.202826855123675e-07, - "loss": 0.2381, - "step": 22300 - }, - { - "epoch": 77.46, - "learning_rate": 9.1886925795053e-07, - "loss": 0.2736, - "step": 22310 - }, - { - "epoch": 77.5, - "learning_rate": 9.174558303886926e-07, - "loss": 0.2599, - "step": 22320 - }, - { - "epoch": 77.53, - "learning_rate": 9.160424028268551e-07, - "loss": 0.2563, - "step": 22330 - }, - { - "epoch": 77.57, - "learning_rate": 9.146289752650176e-07, - "loss": 0.2467, - "step": 22340 - }, - { - "epoch": 77.6, - "learning_rate": 9.132155477031802e-07, - "loss": 0.2582, - "step": 22350 - }, - { - "epoch": 77.64, - "learning_rate": 9.118021201413428e-07, - "loss": 0.2677, - "step": 22360 - }, - { - "epoch": 77.67, - "learning_rate": 9.103886925795053e-07, - "loss": 0.2752, - "step": 22370 - }, - { - "epoch": 77.71, - "learning_rate": 9.089752650176679e-07, - "loss": 0.2373, - "step": 22380 - }, - { - "epoch": 77.74, - "learning_rate": 9.075618374558304e-07, - "loss": 0.2476, - "step": 22390 - }, - { - "epoch": 77.78, - "learning_rate": 9.061484098939929e-07, - "loss": 0.2542, - "step": 22400 - }, - { - "epoch": 77.81, - "learning_rate": 9.047349823321554e-07, - "loss": 0.2466, - "step": 22410 - }, - { - "epoch": 77.85, - "learning_rate": 9.033215547703181e-07, - "loss": 0.2581, - "step": 22420 - }, - { - "epoch": 77.88, - "learning_rate": 9.019081272084806e-07, - "loss": 0.2594, - "step": 22430 - }, - { - "epoch": 77.91, - "learning_rate": 9.00494699646643e-07, - "loss": 0.2615, - "step": 22440 - }, - { - "epoch": 77.95, - "learning_rate": 8.990812720848057e-07, - "loss": 0.2566, - "step": 22450 - }, - { - "epoch": 77.98, - "learning_rate": 8.976678445229681e-07, - "loss": 0.273, - "step": 22460 - }, - { - "epoch": 78.0, - "eval_loss": 0.5186824798583984, - "eval_runtime": 133.6981, - "eval_samples_per_second": 3.979, - "eval_steps_per_second": 0.995, - "eval_wer": 0.1966317413383043, - "step": 22464 - }, - { - "epoch": 78.02, - "learning_rate": 8.962544169611306e-07, - "loss": 0.2666, - "step": 22470 - }, - { - "epoch": 78.06, - "learning_rate": 8.948409893992932e-07, - "loss": 0.2591, - "step": 22480 - }, - { - "epoch": 78.09, - "learning_rate": 8.934275618374558e-07, - "loss": 0.2377, - "step": 22490 - }, - { - "epoch": 78.12, - "learning_rate": 8.920141342756183e-07, - "loss": 0.2836, - "step": 22500 - }, - { - "epoch": 78.16, - "learning_rate": 8.906007067137808e-07, - "loss": 0.2657, - "step": 22510 - }, - { - "epoch": 78.19, - "learning_rate": 8.891872791519434e-07, - "loss": 0.2613, - "step": 22520 - }, - { - "epoch": 78.23, - "learning_rate": 8.877738515901059e-07, - "loss": 0.2644, - "step": 22530 - }, - { - "epoch": 78.26, - "learning_rate": 8.863604240282685e-07, - "loss": 0.2435, - "step": 22540 - }, - { - "epoch": 78.3, - "learning_rate": 8.84946996466431e-07, - "loss": 0.2693, - "step": 22550 - }, - { - "epoch": 78.33, - "learning_rate": 8.835335689045936e-07, - "loss": 0.2531, - "step": 22560 - }, - { - "epoch": 78.37, - "learning_rate": 8.821201413427561e-07, - "loss": 0.2535, - "step": 22570 - }, - { - "epoch": 78.4, - "learning_rate": 8.807067137809186e-07, - "loss": 0.2645, - "step": 22580 - }, - { - "epoch": 78.44, - "learning_rate": 8.792932862190812e-07, - "loss": 0.2336, - "step": 22590 - }, - { - "epoch": 78.47, - "learning_rate": 8.778798586572438e-07, - "loss": 0.2474, - "step": 22600 - }, - { - "epoch": 78.51, - "learning_rate": 8.764664310954063e-07, - "loss": 0.2524, - "step": 22610 - }, - { - "epoch": 78.54, - "learning_rate": 8.750530035335688e-07, - "loss": 0.2246, - "step": 22620 - }, - { - "epoch": 78.57, - "learning_rate": 8.736395759717314e-07, - "loss": 0.2573, - "step": 22630 - }, - { - "epoch": 78.61, - "learning_rate": 8.722261484098939e-07, - "loss": 0.2482, - "step": 22640 - }, - { - "epoch": 78.64, - "learning_rate": 8.708127208480564e-07, - "loss": 0.272, - "step": 22650 - }, - { - "epoch": 78.68, - "learning_rate": 8.693992932862191e-07, - "loss": 0.266, - "step": 22660 - }, - { - "epoch": 78.71, - "learning_rate": 8.679858657243816e-07, - "loss": 0.262, - "step": 22670 - }, - { - "epoch": 78.75, - "learning_rate": 8.665724381625441e-07, - "loss": 0.2503, - "step": 22680 - }, - { - "epoch": 78.78, - "learning_rate": 8.651590106007067e-07, - "loss": 0.2554, - "step": 22690 - }, - { - "epoch": 78.82, - "learning_rate": 8.637455830388692e-07, - "loss": 0.263, - "step": 22700 - }, - { - "epoch": 78.85, - "learning_rate": 8.623321554770318e-07, - "loss": 0.269, - "step": 22710 - }, - { - "epoch": 78.89, - "learning_rate": 8.609187279151943e-07, - "loss": 0.262, - "step": 22720 - }, - { - "epoch": 78.92, - "learning_rate": 8.595053003533569e-07, - "loss": 0.2698, - "step": 22730 - }, - { - "epoch": 78.96, - "learning_rate": 8.580918727915194e-07, - "loss": 0.255, - "step": 22740 - }, - { - "epoch": 78.99, - "learning_rate": 8.566784452296819e-07, - "loss": 0.2666, - "step": 22750 - }, - { - "epoch": 79.0, - "eval_loss": 0.5175613760948181, - "eval_runtime": 134.3104, - "eval_samples_per_second": 3.961, - "eval_steps_per_second": 0.99, - "eval_wer": 0.19579610464742558, - "step": 22752 - }, - { - "epoch": 79.03, - "learning_rate": 8.552650176678445e-07, - "loss": 0.2381, - "step": 22760 - }, - { - "epoch": 79.06, - "learning_rate": 8.538515901060071e-07, - "loss": 0.2487, - "step": 22770 - }, - { - "epoch": 79.1, - "learning_rate": 8.524381625441696e-07, - "loss": 0.2621, - "step": 22780 - }, - { - "epoch": 79.13, - "learning_rate": 8.510247349823321e-07, - "loss": 0.271, - "step": 22790 - }, - { - "epoch": 79.17, - "learning_rate": 8.496113074204947e-07, - "loss": 0.2689, - "step": 22800 - }, - { - "epoch": 79.2, - "learning_rate": 8.481978798586572e-07, - "loss": 0.2351, - "step": 22810 - }, - { - "epoch": 79.24, - "learning_rate": 8.467844522968197e-07, - "loss": 0.2733, - "step": 22820 - }, - { - "epoch": 79.27, - "learning_rate": 8.453710247349824e-07, - "loss": 0.2436, - "step": 22830 - }, - { - "epoch": 79.3, - "learning_rate": 8.439575971731449e-07, - "loss": 0.2628, - "step": 22840 - }, - { - "epoch": 79.34, - "learning_rate": 8.425441696113074e-07, - "loss": 0.251, - "step": 22850 - }, - { - "epoch": 79.37, - "learning_rate": 8.411307420494699e-07, - "loss": 0.258, - "step": 22860 - }, - { - "epoch": 79.41, - "learning_rate": 8.397173144876325e-07, - "loss": 0.242, - "step": 22870 - }, - { - "epoch": 79.44, - "learning_rate": 8.38303886925795e-07, - "loss": 0.2446, - "step": 22880 - }, - { - "epoch": 79.48, - "learning_rate": 8.368904593639576e-07, - "loss": 0.2683, - "step": 22890 - }, - { - "epoch": 79.51, - "learning_rate": 8.354770318021202e-07, - "loss": 0.2686, - "step": 22900 - }, - { - "epoch": 79.55, - "learning_rate": 8.340636042402827e-07, - "loss": 0.2717, - "step": 22910 - }, - { - "epoch": 79.58, - "learning_rate": 8.326501766784452e-07, - "loss": 0.2373, - "step": 22920 - }, - { - "epoch": 79.62, - "learning_rate": 8.312367491166077e-07, - "loss": 0.2399, - "step": 22930 - }, - { - "epoch": 79.65, - "learning_rate": 8.298233215547703e-07, - "loss": 0.2867, - "step": 22940 - }, - { - "epoch": 79.69, - "learning_rate": 8.284098939929329e-07, - "loss": 0.277, - "step": 22950 - }, - { - "epoch": 79.72, - "learning_rate": 8.269964664310954e-07, - "loss": 0.2399, - "step": 22960 - }, - { - "epoch": 79.75, - "learning_rate": 8.25583038869258e-07, - "loss": 0.2537, - "step": 22970 - }, - { - "epoch": 79.79, - "learning_rate": 8.241696113074205e-07, - "loss": 0.2491, - "step": 22980 - }, - { - "epoch": 79.82, - "learning_rate": 8.227561837455829e-07, - "loss": 0.2747, - "step": 22990 - }, - { - "epoch": 79.86, - "learning_rate": 8.213427561837457e-07, - "loss": 0.2612, - "step": 23000 - }, - { - "epoch": 79.89, - "learning_rate": 8.199293286219081e-07, - "loss": 0.2455, - "step": 23010 - }, - { - "epoch": 79.93, - "learning_rate": 8.185159010600706e-07, - "loss": 0.2593, - "step": 23020 - }, - { - "epoch": 79.96, - "learning_rate": 8.171024734982331e-07, - "loss": 0.258, - "step": 23030 - }, - { - "epoch": 80.0, - "learning_rate": 8.156890459363957e-07, - "loss": 0.2627, - "step": 23040 - }, - { - "epoch": 80.0, - "eval_loss": 0.5141689777374268, - "eval_runtime": 133.6944, - "eval_samples_per_second": 3.979, - "eval_steps_per_second": 0.995, - "eval_wer": 0.1949604679565469, - "step": 23040 - }, - { - "epoch": 80.03, - "learning_rate": 8.142756183745582e-07, - "loss": 0.2598, - "step": 23050 - }, - { - "epoch": 80.07, - "learning_rate": 8.128621908127207e-07, - "loss": 0.2679, - "step": 23060 - }, - { - "epoch": 80.1, - "learning_rate": 8.114487632508834e-07, - "loss": 0.223, - "step": 23070 - }, - { - "epoch": 80.14, - "learning_rate": 8.100353356890459e-07, - "loss": 0.2692, - "step": 23080 - }, - { - "epoch": 80.17, - "learning_rate": 8.086219081272084e-07, - "loss": 0.2647, - "step": 23090 - }, - { - "epoch": 80.21, - "learning_rate": 8.072084805653709e-07, - "loss": 0.2544, - "step": 23100 - }, - { - "epoch": 80.24, - "learning_rate": 8.057950530035335e-07, - "loss": 0.2579, - "step": 23110 - }, - { - "epoch": 80.28, - "learning_rate": 8.04381625441696e-07, - "loss": 0.246, - "step": 23120 - }, - { - "epoch": 80.31, - "learning_rate": 8.029681978798586e-07, - "loss": 0.2714, - "step": 23130 - }, - { - "epoch": 80.35, - "learning_rate": 8.015547703180212e-07, - "loss": 0.2763, - "step": 23140 - }, - { - "epoch": 80.38, - "learning_rate": 8.001413427561837e-07, - "loss": 0.2489, - "step": 23150 - }, - { - "epoch": 80.42, - "learning_rate": 7.987279151943462e-07, - "loss": 0.2382, - "step": 23160 - }, - { - "epoch": 80.45, - "learning_rate": 7.973144876325087e-07, - "loss": 0.2712, - "step": 23170 - }, - { - "epoch": 80.48, - "learning_rate": 7.959010600706714e-07, - "loss": 0.2612, - "step": 23180 - }, - { - "epoch": 80.52, - "learning_rate": 7.944876325088339e-07, - "loss": 0.2573, - "step": 23190 - }, - { - "epoch": 80.55, - "learning_rate": 7.930742049469964e-07, - "loss": 0.2412, - "step": 23200 - }, - { - "epoch": 80.59, - "learning_rate": 7.91660777385159e-07, - "loss": 0.262, - "step": 23210 - }, - { - "epoch": 80.62, - "learning_rate": 7.902473498233215e-07, - "loss": 0.2555, - "step": 23220 - }, - { - "epoch": 80.66, - "learning_rate": 7.88833922261484e-07, - "loss": 0.2685, - "step": 23230 - }, - { - "epoch": 80.69, - "learning_rate": 7.874204946996466e-07, - "loss": 0.2427, - "step": 23240 - }, - { - "epoch": 80.73, - "learning_rate": 7.860070671378092e-07, - "loss": 0.2629, - "step": 23250 - }, - { - "epoch": 80.76, - "learning_rate": 7.845936395759717e-07, - "loss": 0.248, - "step": 23260 - }, - { - "epoch": 80.8, - "learning_rate": 7.831802120141342e-07, - "loss": 0.2413, - "step": 23270 - }, - { - "epoch": 80.83, - "learning_rate": 7.817667844522968e-07, - "loss": 0.2675, - "step": 23280 - }, - { - "epoch": 80.87, - "learning_rate": 7.803533568904593e-07, - "loss": 0.263, - "step": 23290 - }, - { - "epoch": 80.9, - "learning_rate": 7.789399293286219e-07, - "loss": 0.2674, - "step": 23300 - }, - { - "epoch": 80.94, - "learning_rate": 7.775265017667845e-07, - "loss": 0.2567, - "step": 23310 - }, - { - "epoch": 80.97, - "learning_rate": 7.76113074204947e-07, - "loss": 0.2508, - "step": 23320 - }, - { - "epoch": 81.0, - "eval_loss": 0.5157809853553772, - "eval_runtime": 134.6235, - "eval_samples_per_second": 3.952, - "eval_steps_per_second": 0.988, - "eval_wer": 0.19605322362923444, - "step": 23328 - }, - { - "epoch": 81.01, - "learning_rate": 7.746996466431095e-07, - "loss": 0.289, - "step": 23330 - }, - { - "epoch": 81.04, - "learning_rate": 7.73286219081272e-07, - "loss": 0.2503, - "step": 23340 - }, - { - "epoch": 81.08, - "learning_rate": 7.718727915194346e-07, - "loss": 0.2387, - "step": 23350 - }, - { - "epoch": 81.11, - "learning_rate": 7.704593639575972e-07, - "loss": 0.2675, - "step": 23360 - }, - { - "epoch": 81.15, - "learning_rate": 7.690459363957597e-07, - "loss": 0.2534, - "step": 23370 - }, - { - "epoch": 81.18, - "learning_rate": 7.676325088339223e-07, - "loss": 0.2603, - "step": 23380 - }, - { - "epoch": 81.21, - "learning_rate": 7.662190812720848e-07, - "loss": 0.2545, - "step": 23390 - }, - { - "epoch": 81.25, - "learning_rate": 7.648056537102473e-07, - "loss": 0.2617, - "step": 23400 - }, - { - "epoch": 81.28, - "learning_rate": 7.633922261484098e-07, - "loss": 0.2495, - "step": 23410 - }, - { - "epoch": 81.32, - "learning_rate": 7.619787985865725e-07, - "loss": 0.2608, - "step": 23420 - }, - { - "epoch": 81.35, - "learning_rate": 7.60565371024735e-07, - "loss": 0.2561, - "step": 23430 - }, - { - "epoch": 81.39, - "learning_rate": 7.591519434628975e-07, - "loss": 0.2487, - "step": 23440 - }, - { - "epoch": 81.42, - "learning_rate": 7.577385159010601e-07, - "loss": 0.2522, - "step": 23450 - }, - { - "epoch": 81.46, - "learning_rate": 7.563250883392226e-07, - "loss": 0.2796, - "step": 23460 - }, - { - "epoch": 81.49, - "learning_rate": 7.549116607773851e-07, - "loss": 0.2516, - "step": 23470 - }, - { - "epoch": 81.53, - "learning_rate": 7.534982332155477e-07, - "loss": 0.2653, - "step": 23480 - }, - { - "epoch": 81.56, - "learning_rate": 7.520848056537103e-07, - "loss": 0.2627, - "step": 23490 - }, - { - "epoch": 81.6, - "learning_rate": 7.506713780918728e-07, - "loss": 0.2524, - "step": 23500 - }, - { - "epoch": 81.63, - "learning_rate": 7.492579505300353e-07, - "loss": 0.2545, - "step": 23510 - }, - { - "epoch": 81.66, - "learning_rate": 7.478445229681979e-07, - "loss": 0.2838, - "step": 23520 - }, - { - "epoch": 81.7, - "learning_rate": 7.464310954063605e-07, - "loss": 0.25, - "step": 23530 - }, - { - "epoch": 81.73, - "learning_rate": 7.450176678445229e-07, - "loss": 0.2702, - "step": 23540 - }, - { - "epoch": 81.77, - "learning_rate": 7.436042402826854e-07, - "loss": 0.2521, - "step": 23550 - }, - { - "epoch": 81.8, - "learning_rate": 7.42190812720848e-07, - "loss": 0.2537, - "step": 23560 - }, - { - "epoch": 81.84, - "learning_rate": 7.407773851590105e-07, - "loss": 0.2731, - "step": 23570 - }, - { - "epoch": 81.87, - "learning_rate": 7.39363957597173e-07, - "loss": 0.2441, - "step": 23580 - }, - { - "epoch": 81.91, - "learning_rate": 7.379505300353357e-07, - "loss": 0.2541, - "step": 23590 - }, - { - "epoch": 81.94, - "learning_rate": 7.365371024734982e-07, - "loss": 0.2546, - "step": 23600 - }, - { - "epoch": 81.98, - "learning_rate": 7.351236749116607e-07, - "loss": 0.2499, - "step": 23610 - }, - { - "epoch": 82.0, - "eval_loss": 0.5130564570426941, - "eval_runtime": 134.0023, - "eval_samples_per_second": 3.97, - "eval_steps_per_second": 0.993, - "eval_wer": 0.19695314006556533, - "step": 23616 - }, - { - "epoch": 82.01, - "learning_rate": 7.337102473498233e-07, - "loss": 0.2829, - "step": 23620 - }, - { - "epoch": 82.05, - "learning_rate": 7.322968197879858e-07, - "loss": 0.2725, - "step": 23630 - }, - { - "epoch": 82.08, - "learning_rate": 7.308833922261483e-07, - "loss": 0.2439, - "step": 23640 - }, - { - "epoch": 82.12, - "learning_rate": 7.294699646643108e-07, - "loss": 0.2534, - "step": 23650 - }, - { - "epoch": 82.15, - "learning_rate": 7.280565371024735e-07, - "loss": 0.2644, - "step": 23660 - }, - { - "epoch": 82.19, - "learning_rate": 7.26643109540636e-07, - "loss": 0.2402, - "step": 23670 - }, - { - "epoch": 82.22, - "learning_rate": 7.252296819787985e-07, - "loss": 0.2337, - "step": 23680 - }, - { - "epoch": 82.26, - "learning_rate": 7.238162544169611e-07, - "loss": 0.2612, - "step": 23690 - }, - { - "epoch": 82.29, - "learning_rate": 7.224028268551236e-07, - "loss": 0.276, - "step": 23700 - }, - { - "epoch": 82.33, - "learning_rate": 7.209893992932862e-07, - "loss": 0.275, - "step": 23710 - }, - { - "epoch": 82.36, - "learning_rate": 7.195759717314487e-07, - "loss": 0.2353, - "step": 23720 - }, - { - "epoch": 82.39, - "learning_rate": 7.181625441696113e-07, - "loss": 0.2435, - "step": 23730 - }, - { - "epoch": 82.43, - "learning_rate": 7.167491166077738e-07, - "loss": 0.2574, - "step": 23740 - }, - { - "epoch": 82.46, - "learning_rate": 7.153356890459363e-07, - "loss": 0.2834, - "step": 23750 - }, - { - "epoch": 82.5, - "learning_rate": 7.139222614840989e-07, - "loss": 0.2714, - "step": 23760 - }, - { - "epoch": 82.53, - "learning_rate": 7.125088339222615e-07, - "loss": 0.2523, - "step": 23770 - }, - { - "epoch": 82.57, - "learning_rate": 7.11095406360424e-07, - "loss": 0.2729, - "step": 23780 - }, - { - "epoch": 82.6, - "learning_rate": 7.096819787985865e-07, - "loss": 0.2366, - "step": 23790 - }, - { - "epoch": 82.64, - "learning_rate": 7.082685512367491e-07, - "loss": 0.2644, - "step": 23800 - }, - { - "epoch": 82.67, - "learning_rate": 7.068551236749116e-07, - "loss": 0.2382, - "step": 23810 - }, - { - "epoch": 82.71, - "learning_rate": 7.054416961130741e-07, - "loss": 0.2489, - "step": 23820 - }, - { - "epoch": 82.74, - "learning_rate": 7.040282685512368e-07, - "loss": 0.2933, - "step": 23830 - }, - { - "epoch": 82.78, - "learning_rate": 7.026148409893993e-07, - "loss": 0.2437, - "step": 23840 - }, - { - "epoch": 82.81, - "learning_rate": 7.012014134275618e-07, - "loss": 0.2433, - "step": 23850 - }, - { - "epoch": 82.85, - "learning_rate": 6.997879858657243e-07, - "loss": 0.2602, - "step": 23860 - }, - { - "epoch": 82.88, - "learning_rate": 6.983745583038869e-07, - "loss": 0.2693, - "step": 23870 - }, - { - "epoch": 82.91, - "learning_rate": 6.969611307420494e-07, - "loss": 0.2426, - "step": 23880 - }, - { - "epoch": 82.95, - "learning_rate": 6.95547703180212e-07, - "loss": 0.242, - "step": 23890 - }, - { - "epoch": 82.98, - "learning_rate": 6.941342756183746e-07, - "loss": 0.2583, - "step": 23900 - }, - { - "epoch": 83.0, - "eval_loss": 0.5149600505828857, - "eval_runtime": 134.0167, - "eval_samples_per_second": 3.97, - "eval_steps_per_second": 0.992, - "eval_wer": 0.19746737802918302, - "step": 23904 - }, - { - "epoch": 83.02, - "learning_rate": 6.927208480565371e-07, - "loss": 0.2692, - "step": 23910 - }, - { - "epoch": 83.06, - "learning_rate": 6.913074204946996e-07, - "loss": 0.2688, - "step": 23920 - }, - { - "epoch": 83.09, - "learning_rate": 6.898939929328622e-07, - "loss": 0.2601, - "step": 23930 - }, - { - "epoch": 83.12, - "learning_rate": 6.884805653710247e-07, - "loss": 0.2784, - "step": 23940 - }, - { - "epoch": 83.16, - "learning_rate": 6.870671378091873e-07, - "loss": 0.2408, - "step": 23950 - }, - { - "epoch": 83.19, - "learning_rate": 6.856537102473498e-07, - "loss": 0.2512, - "step": 23960 - }, - { - "epoch": 83.23, - "learning_rate": 6.842402826855124e-07, - "loss": 0.2371, - "step": 23970 - }, - { - "epoch": 83.26, - "learning_rate": 6.828268551236749e-07, - "loss": 0.2627, - "step": 23980 - }, - { - "epoch": 83.3, - "learning_rate": 6.814134275618374e-07, - "loss": 0.2642, - "step": 23990 - }, - { - "epoch": 83.33, - "learning_rate": 6.800000000000001e-07, - "loss": 0.2806, - "step": 24000 - }, - { - "epoch": 83.37, - "learning_rate": 6.785865724381626e-07, - "loss": 0.2409, - "step": 24010 - }, - { - "epoch": 83.4, - "learning_rate": 6.771731448763251e-07, - "loss": 0.256, - "step": 24020 - }, - { - "epoch": 83.44, - "learning_rate": 6.757597173144876e-07, - "loss": 0.2399, - "step": 24030 - }, - { - "epoch": 83.47, - "learning_rate": 6.743462897526502e-07, - "loss": 0.2721, - "step": 24040 - }, - { - "epoch": 83.51, - "learning_rate": 6.729328621908127e-07, - "loss": 0.2702, - "step": 24050 - }, - { - "epoch": 83.54, - "learning_rate": 6.715194346289753e-07, - "loss": 0.2252, - "step": 24060 - }, - { - "epoch": 83.57, - "learning_rate": 6.701060070671379e-07, - "loss": 0.2405, - "step": 24070 - }, - { - "epoch": 83.61, - "learning_rate": 6.686925795053003e-07, - "loss": 0.2409, - "step": 24080 - }, - { - "epoch": 83.64, - "learning_rate": 6.672791519434628e-07, - "loss": 0.257, - "step": 24090 - }, - { - "epoch": 83.68, - "learning_rate": 6.658657243816253e-07, - "loss": 0.2642, - "step": 24100 - }, - { - "epoch": 83.71, - "learning_rate": 6.644522968197879e-07, - "loss": 0.2699, - "step": 24110 - }, - { - "epoch": 83.75, - "learning_rate": 6.630388692579505e-07, - "loss": 0.2487, - "step": 24120 - }, - { - "epoch": 83.78, - "learning_rate": 6.61625441696113e-07, - "loss": 0.2505, - "step": 24130 - }, - { - "epoch": 83.82, - "learning_rate": 6.602120141342756e-07, - "loss": 0.2627, - "step": 24140 - }, - { - "epoch": 83.85, - "learning_rate": 6.587985865724381e-07, - "loss": 0.2579, - "step": 24150 - }, - { - "epoch": 83.89, - "learning_rate": 6.573851590106006e-07, - "loss": 0.2434, - "step": 24160 - }, - { - "epoch": 83.92, - "learning_rate": 6.559717314487631e-07, - "loss": 0.2344, - "step": 24170 - }, - { - "epoch": 83.96, - "learning_rate": 6.545583038869258e-07, - "loss": 0.2468, - "step": 24180 - }, - { - "epoch": 83.99, - "learning_rate": 6.531448763250883e-07, - "loss": 0.246, - "step": 24190 - }, - { - "epoch": 84.0, - "eval_loss": 0.5096983909606934, - "eval_runtime": 133.3449, - "eval_samples_per_second": 3.99, - "eval_steps_per_second": 0.997, - "eval_wer": 0.19618178312013884, - "step": 24192 - }, - { - "epoch": 84.03, - "learning_rate": 6.517314487632508e-07, - "loss": 0.2808, - "step": 24200 - }, - { - "epoch": 84.06, - "learning_rate": 6.503180212014134e-07, - "loss": 0.2582, - "step": 24210 - }, - { - "epoch": 84.1, - "learning_rate": 6.490459363957597e-07, - "loss": 0.2613, - "step": 24220 - }, - { - "epoch": 84.13, - "learning_rate": 6.476325088339223e-07, - "loss": 0.2637, - "step": 24230 - }, - { - "epoch": 84.17, - "learning_rate": 6.462190812720848e-07, - "loss": 0.2765, - "step": 24240 - }, - { - "epoch": 84.2, - "learning_rate": 6.448056537102473e-07, - "loss": 0.2515, - "step": 24250 - }, - { - "epoch": 84.24, - "learning_rate": 6.433922261484098e-07, - "loss": 0.2331, - "step": 24260 - }, - { - "epoch": 84.27, - "learning_rate": 6.419787985865724e-07, - "loss": 0.2408, - "step": 24270 - }, - { - "epoch": 84.3, - "learning_rate": 6.40565371024735e-07, - "loss": 0.2706, - "step": 24280 - }, - { - "epoch": 84.34, - "learning_rate": 6.391519434628975e-07, - "loss": 0.2605, - "step": 24290 - }, - { - "epoch": 84.37, - "learning_rate": 6.377385159010601e-07, - "loss": 0.2403, - "step": 24300 - }, - { - "epoch": 84.41, - "learning_rate": 6.363250883392226e-07, - "loss": 0.2646, - "step": 24310 - }, - { - "epoch": 84.44, - "learning_rate": 6.349116607773851e-07, - "loss": 0.262, - "step": 24320 - }, - { - "epoch": 84.48, - "learning_rate": 6.334982332155476e-07, - "loss": 0.2664, - "step": 24330 - }, - { - "epoch": 84.51, - "learning_rate": 6.320848056537103e-07, - "loss": 0.2633, - "step": 24340 - }, - { - "epoch": 84.55, - "learning_rate": 6.306713780918728e-07, - "loss": 0.2278, - "step": 24350 - }, - { - "epoch": 84.58, - "learning_rate": 6.292579505300353e-07, - "loss": 0.2645, - "step": 24360 - }, - { - "epoch": 84.62, - "learning_rate": 6.278445229681979e-07, - "loss": 0.2249, - "step": 24370 - }, - { - "epoch": 84.65, - "learning_rate": 6.264310954063604e-07, - "loss": 0.2587, - "step": 24380 - }, - { - "epoch": 84.69, - "learning_rate": 6.25017667844523e-07, - "loss": 0.2471, - "step": 24390 - }, - { - "epoch": 84.72, - "learning_rate": 6.236042402826855e-07, - "loss": 0.258, - "step": 24400 - }, - { - "epoch": 84.75, - "learning_rate": 6.221908127208481e-07, - "loss": 0.2394, - "step": 24410 - }, - { - "epoch": 84.79, - "learning_rate": 6.207773851590106e-07, - "loss": 0.252, - "step": 24420 - }, - { - "epoch": 84.82, - "learning_rate": 6.193639575971731e-07, - "loss": 0.2727, - "step": 24430 - }, - { - "epoch": 84.86, - "learning_rate": 6.179505300353357e-07, - "loss": 0.2699, - "step": 24440 - }, - { - "epoch": 84.89, - "learning_rate": 6.165371024734983e-07, - "loss": 0.2309, - "step": 24450 - }, - { - "epoch": 84.93, - "learning_rate": 6.151236749116608e-07, - "loss": 0.2637, - "step": 24460 - }, - { - "epoch": 84.96, - "learning_rate": 6.13851590106007e-07, - "loss": 0.245, - "step": 24470 - }, - { - "epoch": 85.0, - "learning_rate": 6.124381625441695e-07, - "loss": 0.272, - "step": 24480 - }, - { - "epoch": 85.0, - "eval_loss": 0.504280149936676, - "eval_runtime": 134.0604, - "eval_samples_per_second": 3.968, - "eval_steps_per_second": 0.992, - "eval_wer": 0.1949604679565469, - "step": 24480 - }, - { - "epoch": 85.03, - "learning_rate": 6.110247349823321e-07, - "loss": 0.2629, - "step": 24490 - }, - { - "epoch": 85.07, - "learning_rate": 6.096113074204947e-07, - "loss": 0.2312, - "step": 24500 - }, - { - "epoch": 85.1, - "learning_rate": 6.081978798586572e-07, - "loss": 0.265, - "step": 24510 - }, - { - "epoch": 85.14, - "learning_rate": 6.067844522968197e-07, - "loss": 0.258, - "step": 24520 - }, - { - "epoch": 85.17, - "learning_rate": 6.053710247349822e-07, - "loss": 0.244, - "step": 24530 - }, - { - "epoch": 85.21, - "learning_rate": 6.039575971731448e-07, - "loss": 0.2407, - "step": 24540 - }, - { - "epoch": 85.24, - "learning_rate": 6.025441696113074e-07, - "loss": 0.2632, - "step": 24550 - }, - { - "epoch": 85.28, - "learning_rate": 6.011307420494699e-07, - "loss": 0.2678, - "step": 24560 - }, - { - "epoch": 85.31, - "learning_rate": 5.997173144876325e-07, - "loss": 0.2483, - "step": 24570 - }, - { - "epoch": 85.35, - "learning_rate": 5.98303886925795e-07, - "loss": 0.2801, - "step": 24580 - }, - { - "epoch": 85.38, - "learning_rate": 5.968904593639575e-07, - "loss": 0.251, - "step": 24590 - }, - { - "epoch": 85.42, - "learning_rate": 5.954770318021201e-07, - "loss": 0.2588, - "step": 24600 - }, - { - "epoch": 85.45, - "learning_rate": 5.940636042402827e-07, - "loss": 0.2543, - "step": 24610 - }, - { - "epoch": 85.48, - "learning_rate": 5.926501766784452e-07, - "loss": 0.2755, - "step": 24620 - }, - { - "epoch": 85.52, - "learning_rate": 5.912367491166077e-07, - "loss": 0.2388, - "step": 24630 - }, - { - "epoch": 85.55, - "learning_rate": 5.898233215547703e-07, - "loss": 0.2517, - "step": 24640 - }, - { - "epoch": 85.59, - "learning_rate": 5.884098939929328e-07, - "loss": 0.2513, - "step": 24650 - }, - { - "epoch": 85.62, - "learning_rate": 5.869964664310953e-07, - "loss": 0.2467, - "step": 24660 - }, - { - "epoch": 85.66, - "learning_rate": 5.85583038869258e-07, - "loss": 0.2617, - "step": 24670 - }, - { - "epoch": 85.69, - "learning_rate": 5.841696113074205e-07, - "loss": 0.2484, - "step": 24680 - }, - { - "epoch": 85.73, - "learning_rate": 5.82756183745583e-07, - "loss": 0.2481, - "step": 24690 - }, - { - "epoch": 85.76, - "learning_rate": 5.813427561837455e-07, - "loss": 0.2393, - "step": 24700 - }, - { - "epoch": 85.8, - "learning_rate": 5.799293286219081e-07, - "loss": 0.2372, - "step": 24710 - }, - { - "epoch": 85.83, - "learning_rate": 5.785159010600707e-07, - "loss": 0.2828, - "step": 24720 - }, - { - "epoch": 85.87, - "learning_rate": 5.771024734982332e-07, - "loss": 0.2796, - "step": 24730 - }, - { - "epoch": 85.9, - "learning_rate": 5.756890459363958e-07, - "loss": 0.2604, - "step": 24740 - }, - { - "epoch": 85.94, - "learning_rate": 5.742756183745583e-07, - "loss": 0.2143, - "step": 24750 - }, - { - "epoch": 85.97, - "learning_rate": 5.728621908127208e-07, - "loss": 0.2601, - "step": 24760 - }, - { - "epoch": 86.0, - "eval_loss": 0.5090940594673157, - "eval_runtime": 134.139, - "eval_samples_per_second": 3.966, - "eval_steps_per_second": 0.992, - "eval_wer": 0.19605322362923444, - "step": 24768 - }, - { - "epoch": 86.01, - "learning_rate": 5.714487632508833e-07, - "loss": 0.2614, - "step": 24770 - }, - { - "epoch": 86.04, - "learning_rate": 5.70035335689046e-07, - "loss": 0.2556, - "step": 24780 - }, - { - "epoch": 86.08, - "learning_rate": 5.686219081272085e-07, - "loss": 0.2451, - "step": 24790 - }, - { - "epoch": 86.11, - "learning_rate": 5.67208480565371e-07, - "loss": 0.2619, - "step": 24800 - }, - { - "epoch": 86.15, - "learning_rate": 5.657950530035336e-07, - "loss": 0.263, - "step": 24810 - }, - { - "epoch": 86.18, - "learning_rate": 5.643816254416961e-07, - "loss": 0.2718, - "step": 24820 - }, - { - "epoch": 86.21, - "learning_rate": 5.629681978798586e-07, - "loss": 0.2349, - "step": 24830 - }, - { - "epoch": 86.25, - "learning_rate": 5.615547703180213e-07, - "loss": 0.2553, - "step": 24840 - }, - { - "epoch": 86.28, - "learning_rate": 5.601413427561838e-07, - "loss": 0.2492, - "step": 24850 - }, - { - "epoch": 86.32, - "learning_rate": 5.587279151943463e-07, - "loss": 0.2549, - "step": 24860 - }, - { - "epoch": 86.35, - "learning_rate": 5.573144876325088e-07, - "loss": 0.2416, - "step": 24870 - }, - { - "epoch": 86.39, - "learning_rate": 5.559010600706714e-07, - "loss": 0.2552, - "step": 24880 - }, - { - "epoch": 86.42, - "learning_rate": 5.544876325088339e-07, - "loss": 0.2318, - "step": 24890 - }, - { - "epoch": 86.46, - "learning_rate": 5.530742049469965e-07, - "loss": 0.2538, - "step": 24900 - }, - { - "epoch": 86.49, - "learning_rate": 5.516607773851591e-07, - "loss": 0.2483, - "step": 24910 - }, - { - "epoch": 86.53, - "learning_rate": 5.502473498233216e-07, - "loss": 0.2677, - "step": 24920 - }, - { - "epoch": 86.56, - "learning_rate": 5.488339222614841e-07, - "loss": 0.2506, - "step": 24930 - }, - { - "epoch": 86.6, - "learning_rate": 5.474204946996465e-07, - "loss": 0.2563, - "step": 24940 - }, - { - "epoch": 86.63, - "learning_rate": 5.460070671378092e-07, - "loss": 0.2429, - "step": 24950 - }, - { - "epoch": 86.66, - "learning_rate": 5.445936395759717e-07, - "loss": 0.259, - "step": 24960 - }, - { - "epoch": 86.7, - "learning_rate": 5.431802120141342e-07, - "loss": 0.2554, - "step": 24970 - }, - { - "epoch": 86.73, - "learning_rate": 5.417667844522968e-07, - "loss": 0.2534, - "step": 24980 - }, - { - "epoch": 86.77, - "learning_rate": 5.403533568904593e-07, - "loss": 0.2392, - "step": 24990 - }, - { - "epoch": 86.8, - "learning_rate": 5.389399293286218e-07, - "loss": 0.27, - "step": 25000 - }, - { - "epoch": 86.84, - "learning_rate": 5.375265017667843e-07, - "loss": 0.2516, - "step": 25010 - }, - { - "epoch": 86.87, - "learning_rate": 5.36113074204947e-07, - "loss": 0.2701, - "step": 25020 - }, - { - "epoch": 86.91, - "learning_rate": 5.346996466431095e-07, - "loss": 0.2528, - "step": 25030 - }, - { - "epoch": 86.94, - "learning_rate": 5.33286219081272e-07, - "loss": 0.2286, - "step": 25040 - }, - { - "epoch": 86.98, - "learning_rate": 5.318727915194346e-07, - "loss": 0.2719, - "step": 25050 - }, - { - "epoch": 87.0, - "eval_loss": 0.5086585283279419, - "eval_runtime": 134.1212, - "eval_samples_per_second": 3.967, - "eval_steps_per_second": 0.992, - "eval_wer": 0.19753165777463522, - "step": 25056 - }, - { - "epoch": 87.01, - "learning_rate": 5.304593639575971e-07, - "loss": 0.2532, - "step": 25060 - }, - { - "epoch": 87.05, - "learning_rate": 5.290459363957596e-07, - "loss": 0.2514, - "step": 25070 - }, - { - "epoch": 87.08, - "learning_rate": 5.276325088339222e-07, - "loss": 0.2552, - "step": 25080 - }, - { - "epoch": 87.12, - "learning_rate": 5.262190812720848e-07, - "loss": 0.265, - "step": 25090 - }, - { - "epoch": 87.15, - "learning_rate": 5.248056537102473e-07, - "loss": 0.2704, - "step": 25100 - }, - { - "epoch": 87.19, - "learning_rate": 5.233922261484098e-07, - "loss": 0.2557, - "step": 25110 - }, - { - "epoch": 87.22, - "learning_rate": 5.219787985865724e-07, - "loss": 0.2781, - "step": 25120 - }, - { - "epoch": 87.26, - "learning_rate": 5.20565371024735e-07, - "loss": 0.2355, - "step": 25130 - }, - { - "epoch": 87.29, - "learning_rate": 5.191519434628975e-07, - "loss": 0.2728, - "step": 25140 - }, - { - "epoch": 87.33, - "learning_rate": 5.177385159010601e-07, - "loss": 0.2635, - "step": 25150 - }, - { - "epoch": 87.36, - "learning_rate": 5.163250883392226e-07, - "loss": 0.2442, - "step": 25160 - }, - { - "epoch": 87.39, - "learning_rate": 5.149116607773851e-07, - "loss": 0.2409, - "step": 25170 - }, - { - "epoch": 87.43, - "learning_rate": 5.134982332155476e-07, - "loss": 0.2497, - "step": 25180 - }, - { - "epoch": 87.46, - "learning_rate": 5.120848056537103e-07, - "loss": 0.263, - "step": 25190 - }, - { - "epoch": 87.5, - "learning_rate": 5.106713780918728e-07, - "loss": 0.2511, - "step": 25200 - }, - { - "epoch": 87.53, - "learning_rate": 5.092579505300353e-07, - "loss": 0.2522, - "step": 25210 - }, - { - "epoch": 87.57, - "learning_rate": 5.078445229681979e-07, - "loss": 0.2686, - "step": 25220 - }, - { - "epoch": 87.6, - "learning_rate": 5.064310954063604e-07, - "loss": 0.2407, - "step": 25230 - }, - { - "epoch": 87.64, - "learning_rate": 5.050176678445229e-07, - "loss": 0.228, - "step": 25240 - }, - { - "epoch": 87.67, - "learning_rate": 5.036042402826855e-07, - "loss": 0.2763, - "step": 25250 - }, - { - "epoch": 87.71, - "learning_rate": 5.021908127208481e-07, - "loss": 0.2378, - "step": 25260 - }, - { - "epoch": 87.74, - "learning_rate": 5.007773851590106e-07, - "loss": 0.2532, - "step": 25270 - }, - { - "epoch": 87.78, - "learning_rate": 4.993639575971731e-07, - "loss": 0.2431, - "step": 25280 - }, - { - "epoch": 87.81, - "learning_rate": 4.979505300353356e-07, - "loss": 0.2216, - "step": 25290 - }, - { - "epoch": 87.85, - "learning_rate": 4.965371024734982e-07, - "loss": 0.2579, - "step": 25300 - }, - { - "epoch": 87.88, - "learning_rate": 4.951236749116608e-07, - "loss": 0.2501, - "step": 25310 - }, - { - "epoch": 87.91, - "learning_rate": 4.937102473498233e-07, - "loss": 0.2612, - "step": 25320 - }, - { - "epoch": 87.95, - "learning_rate": 4.922968197879858e-07, - "loss": 0.2665, - "step": 25330 - }, - { - "epoch": 87.98, - "learning_rate": 4.908833922261484e-07, - "loss": 0.269, - "step": 25340 - }, - { - "epoch": 88.0, - "eval_loss": 0.5126340389251709, - "eval_runtime": 134.1929, - "eval_samples_per_second": 3.964, - "eval_steps_per_second": 0.991, - "eval_wer": 0.1965674615928521, - "step": 25344 - }, - { - "epoch": 88.02, - "learning_rate": 4.894699646643109e-07, - "loss": 0.2832, - "step": 25350 - }, - { - "epoch": 88.06, - "learning_rate": 4.880565371024734e-07, - "loss": 0.2522, - "step": 25360 - }, - { - "epoch": 88.09, - "learning_rate": 4.866431095406361e-07, - "loss": 0.232, - "step": 25370 - }, - { - "epoch": 88.12, - "learning_rate": 4.852296819787986e-07, - "loss": 0.2669, - "step": 25380 - }, - { - "epoch": 88.16, - "learning_rate": 4.838162544169611e-07, - "loss": 0.2461, - "step": 25390 - }, - { - "epoch": 88.19, - "learning_rate": 4.824028268551237e-07, - "loss": 0.2498, - "step": 25400 - }, - { - "epoch": 88.23, - "learning_rate": 4.809893992932862e-07, - "loss": 0.2525, - "step": 25410 - }, - { - "epoch": 88.26, - "learning_rate": 4.795759717314487e-07, - "loss": 0.2603, - "step": 25420 - }, - { - "epoch": 88.3, - "learning_rate": 4.781625441696113e-07, - "loss": 0.2594, - "step": 25430 - }, - { - "epoch": 88.33, - "learning_rate": 4.7674911660777383e-07, - "loss": 0.2422, - "step": 25440 - }, - { - "epoch": 88.37, - "learning_rate": 4.7533568904593634e-07, - "loss": 0.2493, - "step": 25450 - }, - { - "epoch": 88.4, - "learning_rate": 4.739222614840989e-07, - "loss": 0.2786, - "step": 25460 - }, - { - "epoch": 88.44, - "learning_rate": 4.725088339222615e-07, - "loss": 0.2218, - "step": 25470 - }, - { - "epoch": 88.47, - "learning_rate": 4.71095406360424e-07, - "loss": 0.2634, - "step": 25480 - }, - { - "epoch": 88.51, - "learning_rate": 4.6968197879858656e-07, - "loss": 0.2572, - "step": 25490 - }, - { - "epoch": 88.54, - "learning_rate": 4.682685512367491e-07, - "loss": 0.249, - "step": 25500 - }, - { - "epoch": 88.57, - "learning_rate": 4.6685512367491165e-07, - "loss": 0.2547, - "step": 25510 - }, - { - "epoch": 88.61, - "learning_rate": 4.654416961130742e-07, - "loss": 0.2611, - "step": 25520 - }, - { - "epoch": 88.64, - "learning_rate": 4.6402826855123673e-07, - "loss": 0.2664, - "step": 25530 - }, - { - "epoch": 88.68, - "learning_rate": 4.626148409893993e-07, - "loss": 0.2758, - "step": 25540 - }, - { - "epoch": 88.71, - "learning_rate": 4.612014134275618e-07, - "loss": 0.2488, - "step": 25550 - }, - { - "epoch": 88.75, - "learning_rate": 4.597879858657244e-07, - "loss": 0.253, - "step": 25560 - }, - { - "epoch": 88.78, - "learning_rate": 4.583745583038869e-07, - "loss": 0.2381, - "step": 25570 - }, - { - "epoch": 88.82, - "learning_rate": 4.5696113074204947e-07, - "loss": 0.2643, - "step": 25580 - }, - { - "epoch": 88.85, - "learning_rate": 4.5554770318021204e-07, - "loss": 0.2523, - "step": 25590 - }, - { - "epoch": 88.89, - "learning_rate": 4.5413427561837455e-07, - "loss": 0.2507, - "step": 25600 - }, - { - "epoch": 88.92, - "learning_rate": 4.527208480565371e-07, - "loss": 0.2359, - "step": 25610 - }, - { - "epoch": 88.96, - "learning_rate": 4.5130742049469963e-07, - "loss": 0.2561, - "step": 25620 - }, - { - "epoch": 88.99, - "learning_rate": 4.498939929328622e-07, - "loss": 0.2863, - "step": 25630 - }, - { - "epoch": 89.0, - "eval_loss": 0.5174065232276917, - "eval_runtime": 135.3515, - "eval_samples_per_second": 3.931, - "eval_steps_per_second": 0.983, - "eval_wer": 0.1965674615928521, - "step": 25632 - }, - { - "epoch": 89.03, - "learning_rate": 4.4848056537102467e-07, - "loss": 0.2527, - "step": 25640 - }, - { - "epoch": 89.06, - "learning_rate": 4.4706713780918723e-07, - "loss": 0.2613, - "step": 25650 - }, - { - "epoch": 89.1, - "learning_rate": 4.456537102473498e-07, - "loss": 0.2368, - "step": 25660 - }, - { - "epoch": 89.13, - "learning_rate": 4.442402826855123e-07, - "loss": 0.2653, - "step": 25670 - }, - { - "epoch": 89.17, - "learning_rate": 4.428268551236749e-07, - "loss": 0.2636, - "step": 25680 - }, - { - "epoch": 89.2, - "learning_rate": 4.414134275618374e-07, - "loss": 0.2154, - "step": 25690 - }, - { - "epoch": 89.24, - "learning_rate": 4.3999999999999997e-07, - "loss": 0.2606, - "step": 25700 - }, - { - "epoch": 89.27, - "learning_rate": 4.3858657243816254e-07, - "loss": 0.2416, - "step": 25710 - }, - { - "epoch": 89.3, - "learning_rate": 4.3717314487632505e-07, - "loss": 0.2521, - "step": 25720 - }, - { - "epoch": 89.34, - "learning_rate": 4.357597173144876e-07, - "loss": 0.2642, - "step": 25730 - }, - { - "epoch": 89.37, - "learning_rate": 4.3434628975265014e-07, - "loss": 0.247, - "step": 25740 - }, - { - "epoch": 89.41, - "learning_rate": 4.329328621908127e-07, - "loss": 0.2563, - "step": 25750 - }, - { - "epoch": 89.44, - "learning_rate": 4.315194346289752e-07, - "loss": 0.2376, - "step": 25760 - }, - { - "epoch": 89.48, - "learning_rate": 4.301060070671378e-07, - "loss": 0.2545, - "step": 25770 - }, - { - "epoch": 89.51, - "learning_rate": 4.2869257950530036e-07, - "loss": 0.2652, - "step": 25780 - }, - { - "epoch": 89.55, - "learning_rate": 4.2727915194346287e-07, - "loss": 0.2539, - "step": 25790 - }, - { - "epoch": 89.58, - "learning_rate": 4.2586572438162544e-07, - "loss": 0.2437, - "step": 25800 - }, - { - "epoch": 89.62, - "learning_rate": 4.2445229681978796e-07, - "loss": 0.2495, - "step": 25810 - }, - { - "epoch": 89.65, - "learning_rate": 4.230388692579505e-07, - "loss": 0.2779, - "step": 25820 - }, - { - "epoch": 89.69, - "learning_rate": 4.216254416961131e-07, - "loss": 0.271, - "step": 25830 - }, - { - "epoch": 89.72, - "learning_rate": 4.202120141342756e-07, - "loss": 0.2341, - "step": 25840 - }, - { - "epoch": 89.75, - "learning_rate": 4.187985865724382e-07, - "loss": 0.2561, - "step": 25850 - }, - { - "epoch": 89.79, - "learning_rate": 4.173851590106007e-07, - "loss": 0.2337, - "step": 25860 - }, - { - "epoch": 89.82, - "learning_rate": 4.1597173144876326e-07, - "loss": 0.277, - "step": 25870 - }, - { - "epoch": 89.86, - "learning_rate": 4.145583038869258e-07, - "loss": 0.2535, - "step": 25880 - }, - { - "epoch": 89.89, - "learning_rate": 4.1314487632508834e-07, - "loss": 0.2577, - "step": 25890 - }, - { - "epoch": 89.93, - "learning_rate": 4.117314487632509e-07, - "loss": 0.232, - "step": 25900 - }, - { - "epoch": 89.96, - "learning_rate": 4.103180212014134e-07, - "loss": 0.2724, - "step": 25910 - }, - { - "epoch": 90.0, - "learning_rate": 4.0890459363957594e-07, - "loss": 0.2581, - "step": 25920 - }, - { - "epoch": 90.0, - "eval_loss": 0.5159129500389099, - "eval_runtime": 134.2388, - "eval_samples_per_second": 3.963, - "eval_steps_per_second": 0.991, - "eval_wer": 0.19688886032011313, - "step": 25920 - }, - { - "epoch": 90.03, - "learning_rate": 4.0749116607773846e-07, - "loss": 0.2464, - "step": 25930 - }, - { - "epoch": 90.07, - "learning_rate": 4.0607773851590103e-07, - "loss": 0.2409, - "step": 25940 - }, - { - "epoch": 90.1, - "learning_rate": 4.0466431095406354e-07, - "loss": 0.2413, - "step": 25950 - }, - { - "epoch": 90.14, - "learning_rate": 4.032508833922261e-07, - "loss": 0.271, - "step": 25960 - }, - { - "epoch": 90.17, - "learning_rate": 4.018374558303887e-07, - "loss": 0.2487, - "step": 25970 - }, - { - "epoch": 90.21, - "learning_rate": 4.004240282685512e-07, - "loss": 0.2356, - "step": 25980 - }, - { - "epoch": 90.24, - "learning_rate": 3.9901060070671376e-07, - "loss": 0.2434, - "step": 25990 - }, - { - "epoch": 90.28, - "learning_rate": 3.975971731448763e-07, - "loss": 0.2607, - "step": 26000 - }, - { - "epoch": 90.31, - "learning_rate": 3.9618374558303885e-07, - "loss": 0.2515, - "step": 26010 - }, - { - "epoch": 90.35, - "learning_rate": 3.947703180212014e-07, - "loss": 0.2596, - "step": 26020 - }, - { - "epoch": 90.38, - "learning_rate": 3.9335689045936393e-07, - "loss": 0.2541, - "step": 26030 - }, - { - "epoch": 90.42, - "learning_rate": 3.919434628975265e-07, - "loss": 0.2471, - "step": 26040 - }, - { - "epoch": 90.45, - "learning_rate": 3.90530035335689e-07, - "loss": 0.2417, - "step": 26050 - }, - { - "epoch": 90.48, - "learning_rate": 3.891166077738516e-07, - "loss": 0.2659, - "step": 26060 - }, - { - "epoch": 90.52, - "learning_rate": 3.877031802120141e-07, - "loss": 0.2496, - "step": 26070 - }, - { - "epoch": 90.55, - "learning_rate": 3.8628975265017667e-07, - "loss": 0.2371, - "step": 26080 - }, - { - "epoch": 90.59, - "learning_rate": 3.8487632508833924e-07, - "loss": 0.2709, - "step": 26090 - }, - { - "epoch": 90.62, - "learning_rate": 3.8346289752650175e-07, - "loss": 0.238, - "step": 26100 - }, - { - "epoch": 90.66, - "learning_rate": 3.820494699646643e-07, - "loss": 0.2642, - "step": 26110 - }, - { - "epoch": 90.69, - "learning_rate": 3.8063604240282683e-07, - "loss": 0.2699, - "step": 26120 - }, - { - "epoch": 90.73, - "learning_rate": 3.792226148409894e-07, - "loss": 0.2729, - "step": 26130 - }, - { - "epoch": 90.76, - "learning_rate": 3.7780918727915197e-07, - "loss": 0.2473, - "step": 26140 - }, - { - "epoch": 90.8, - "learning_rate": 3.763957597173145e-07, - "loss": 0.27, - "step": 26150 - }, - { - "epoch": 90.83, - "learning_rate": 3.7498233215547706e-07, - "loss": 0.267, - "step": 26160 - }, - { - "epoch": 90.87, - "learning_rate": 3.7356890459363957e-07, - "loss": 0.2617, - "step": 26170 - }, - { - "epoch": 90.9, - "learning_rate": 3.721554770318021e-07, - "loss": 0.2436, - "step": 26180 - }, - { - "epoch": 90.94, - "learning_rate": 3.707420494699646e-07, - "loss": 0.2425, - "step": 26190 - }, - { - "epoch": 90.97, - "learning_rate": 3.6932862190812717e-07, - "loss": 0.26, - "step": 26200 - }, - { - "epoch": 91.0, - "eval_loss": 0.514625608921051, - "eval_runtime": 135.1986, - "eval_samples_per_second": 3.935, - "eval_steps_per_second": 0.984, - "eval_wer": 0.19688886032011313, - "step": 26208 - }, - { - "epoch": 91.01, - "learning_rate": 3.6791519434628974e-07, - "loss": 0.2532, - "step": 26210 - }, - { - "epoch": 91.04, - "learning_rate": 3.6650176678445225e-07, - "loss": 0.2408, - "step": 26220 - }, - { - "epoch": 91.08, - "learning_rate": 3.650883392226148e-07, - "loss": 0.2654, - "step": 26230 - }, - { - "epoch": 91.11, - "learning_rate": 3.6367491166077734e-07, - "loss": 0.2836, - "step": 26240 - }, - { - "epoch": 91.15, - "learning_rate": 3.622614840989399e-07, - "loss": 0.2472, - "step": 26250 - }, - { - "epoch": 91.18, - "learning_rate": 3.608480565371024e-07, - "loss": 0.2489, - "step": 26260 - }, - { - "epoch": 91.21, - "learning_rate": 3.59434628975265e-07, - "loss": 0.2713, - "step": 26270 - }, - { - "epoch": 91.25, - "learning_rate": 3.5802120141342756e-07, - "loss": 0.2338, - "step": 26280 - }, - { - "epoch": 91.28, - "learning_rate": 3.566077738515901e-07, - "loss": 0.2466, - "step": 26290 - }, - { - "epoch": 91.32, - "learning_rate": 3.5519434628975264e-07, - "loss": 0.2362, - "step": 26300 - }, - { - "epoch": 91.35, - "learning_rate": 3.5378091872791516e-07, - "loss": 0.2476, - "step": 26310 - }, - { - "epoch": 91.39, - "learning_rate": 3.523674911660777e-07, - "loss": 0.2393, - "step": 26320 - }, - { - "epoch": 91.42, - "learning_rate": 3.509540636042403e-07, - "loss": 0.2541, - "step": 26330 - }, - { - "epoch": 91.46, - "learning_rate": 3.495406360424028e-07, - "loss": 0.2439, - "step": 26340 - }, - { - "epoch": 91.49, - "learning_rate": 3.481272084805654e-07, - "loss": 0.2573, - "step": 26350 - }, - { - "epoch": 91.53, - "learning_rate": 3.467137809187279e-07, - "loss": 0.2586, - "step": 26360 - }, - { - "epoch": 91.56, - "learning_rate": 3.4530035335689046e-07, - "loss": 0.2369, - "step": 26370 - }, - { - "epoch": 91.6, - "learning_rate": 3.43886925795053e-07, - "loss": 0.2543, - "step": 26380 - }, - { - "epoch": 91.63, - "learning_rate": 3.4247349823321555e-07, - "loss": 0.2695, - "step": 26390 - }, - { - "epoch": 91.66, - "learning_rate": 3.410600706713781e-07, - "loss": 0.2457, - "step": 26400 - }, - { - "epoch": 91.7, - "learning_rate": 3.3964664310954063e-07, - "loss": 0.2456, - "step": 26410 - }, - { - "epoch": 91.73, - "learning_rate": 3.382332155477032e-07, - "loss": 0.2432, - "step": 26420 - }, - { - "epoch": 91.77, - "learning_rate": 3.368197879858657e-07, - "loss": 0.2264, - "step": 26430 - }, - { - "epoch": 91.8, - "learning_rate": 3.354063604240283e-07, - "loss": 0.242, - "step": 26440 - }, - { - "epoch": 91.84, - "learning_rate": 3.3399293286219085e-07, - "loss": 0.2651, - "step": 26450 - }, - { - "epoch": 91.87, - "learning_rate": 3.325795053003533e-07, - "loss": 0.2717, - "step": 26460 - }, - { - "epoch": 91.91, - "learning_rate": 3.311660777385159e-07, - "loss": 0.2417, - "step": 26470 - }, - { - "epoch": 91.94, - "learning_rate": 3.297526501766784e-07, - "loss": 0.2447, - "step": 26480 - }, - { - "epoch": 91.98, - "learning_rate": 3.2833922261484096e-07, - "loss": 0.2796, - "step": 26490 - }, - { - "epoch": 92.0, - "eval_loss": 0.5150091648101807, - "eval_runtime": 134.13, - "eval_samples_per_second": 3.966, - "eval_steps_per_second": 0.992, - "eval_wer": 0.1965674615928521, - "step": 26496 - }, - { - "epoch": 92.01, - "learning_rate": 3.269257950530035e-07, - "loss": 0.2811, - "step": 26500 - }, - { - "epoch": 92.05, - "learning_rate": 3.2551236749116605e-07, - "loss": 0.2589, - "step": 26510 - }, - { - "epoch": 92.08, - "learning_rate": 3.240989399293286e-07, - "loss": 0.2453, - "step": 26520 - }, - { - "epoch": 92.12, - "learning_rate": 3.2268551236749113e-07, - "loss": 0.2482, - "step": 26530 - }, - { - "epoch": 92.15, - "learning_rate": 3.212720848056537e-07, - "loss": 0.2619, - "step": 26540 - }, - { - "epoch": 92.19, - "learning_rate": 3.198586572438162e-07, - "loss": 0.2415, - "step": 26550 - }, - { - "epoch": 92.22, - "learning_rate": 3.184452296819788e-07, - "loss": 0.2459, - "step": 26560 - }, - { - "epoch": 92.26, - "learning_rate": 3.170318021201413e-07, - "loss": 0.253, - "step": 26570 - }, - { - "epoch": 92.29, - "learning_rate": 3.1561837455830387e-07, - "loss": 0.2728, - "step": 26580 - }, - { - "epoch": 92.33, - "learning_rate": 3.1420494699646644e-07, - "loss": 0.255, - "step": 26590 - }, - { - "epoch": 92.36, - "learning_rate": 3.1279151943462895e-07, - "loss": 0.2464, - "step": 26600 - }, - { - "epoch": 92.39, - "learning_rate": 3.113780918727915e-07, - "loss": 0.24, - "step": 26610 - }, - { - "epoch": 92.43, - "learning_rate": 3.0996466431095404e-07, - "loss": 0.2343, - "step": 26620 - }, - { - "epoch": 92.46, - "learning_rate": 3.085512367491166e-07, - "loss": 0.245, - "step": 26630 - }, - { - "epoch": 92.5, - "learning_rate": 3.0713780918727917e-07, - "loss": 0.2556, - "step": 26640 - }, - { - "epoch": 92.53, - "learning_rate": 3.057243816254417e-07, - "loss": 0.2431, - "step": 26650 - }, - { - "epoch": 92.57, - "learning_rate": 3.0431095406360426e-07, - "loss": 0.2274, - "step": 26660 - }, - { - "epoch": 92.6, - "learning_rate": 3.0289752650176677e-07, - "loss": 0.254, - "step": 26670 - }, - { - "epoch": 92.64, - "learning_rate": 3.0148409893992934e-07, - "loss": 0.2559, - "step": 26680 - }, - { - "epoch": 92.67, - "learning_rate": 3.0007067137809186e-07, - "loss": 0.2563, - "step": 26690 - }, - { - "epoch": 92.71, - "learning_rate": 2.986572438162544e-07, - "loss": 0.2375, - "step": 26700 - }, - { - "epoch": 92.74, - "learning_rate": 2.97243816254417e-07, - "loss": 0.2797, - "step": 26710 - }, - { - "epoch": 92.78, - "learning_rate": 2.9583038869257945e-07, - "loss": 0.2366, - "step": 26720 - }, - { - "epoch": 92.81, - "learning_rate": 2.94416961130742e-07, - "loss": 0.2638, - "step": 26730 - }, - { - "epoch": 92.85, - "learning_rate": 2.9300353356890454e-07, - "loss": 0.2595, - "step": 26740 - }, - { - "epoch": 92.88, - "learning_rate": 2.915901060070671e-07, - "loss": 0.2488, - "step": 26750 - }, - { - "epoch": 92.91, - "learning_rate": 2.901766784452297e-07, - "loss": 0.2517, - "step": 26760 - }, - { - "epoch": 92.95, - "learning_rate": 2.887632508833922e-07, - "loss": 0.2589, - "step": 26770 - }, - { - "epoch": 92.98, - "learning_rate": 2.8734982332155476e-07, - "loss": 0.2723, - "step": 26780 - }, - { - "epoch": 93.0, - "eval_loss": 0.5132827758789062, - "eval_runtime": 134.2687, - "eval_samples_per_second": 3.962, - "eval_steps_per_second": 0.991, - "eval_wer": 0.19708169955646976, - "step": 26784 - }, - { - "epoch": 93.02, - "learning_rate": 2.859363957597173e-07, - "loss": 0.2599, - "step": 26790 - }, - { - "epoch": 93.06, - "learning_rate": 2.8452296819787984e-07, - "loss": 0.2383, - "step": 26800 - }, - { - "epoch": 93.09, - "learning_rate": 2.8310954063604236e-07, - "loss": 0.2709, - "step": 26810 - }, - { - "epoch": 93.12, - "learning_rate": 2.816961130742049e-07, - "loss": 0.2514, - "step": 26820 - }, - { - "epoch": 93.16, - "learning_rate": 2.802826855123675e-07, - "loss": 0.2503, - "step": 26830 - }, - { - "epoch": 93.19, - "learning_rate": 2.7886925795053e-07, - "loss": 0.2455, - "step": 26840 - }, - { - "epoch": 93.23, - "learning_rate": 2.774558303886926e-07, - "loss": 0.2576, - "step": 26850 - }, - { - "epoch": 93.26, - "learning_rate": 2.760424028268551e-07, - "loss": 0.2415, - "step": 26860 - }, - { - "epoch": 93.3, - "learning_rate": 2.7462897526501766e-07, - "loss": 0.2765, - "step": 26870 - }, - { - "epoch": 93.33, - "learning_rate": 2.7321554770318023e-07, - "loss": 0.2527, - "step": 26880 - }, - { - "epoch": 93.37, - "learning_rate": 2.7180212014134275e-07, - "loss": 0.2404, - "step": 26890 - }, - { - "epoch": 93.4, - "learning_rate": 2.703886925795053e-07, - "loss": 0.2534, - "step": 26900 - }, - { - "epoch": 93.44, - "learning_rate": 2.6897526501766783e-07, - "loss": 0.2223, - "step": 26910 - }, - { - "epoch": 93.47, - "learning_rate": 2.675618374558304e-07, - "loss": 0.2735, - "step": 26920 - }, - { - "epoch": 93.51, - "learning_rate": 2.661484098939929e-07, - "loss": 0.2666, - "step": 26930 - }, - { - "epoch": 93.54, - "learning_rate": 2.647349823321555e-07, - "loss": 0.2513, - "step": 26940 - }, - { - "epoch": 93.57, - "learning_rate": 2.6332155477031805e-07, - "loss": 0.2531, - "step": 26950 - }, - { - "epoch": 93.61, - "learning_rate": 2.6190812720848057e-07, - "loss": 0.2438, - "step": 26960 - }, - { - "epoch": 93.64, - "learning_rate": 2.6049469964664313e-07, - "loss": 0.2672, - "step": 26970 - }, - { - "epoch": 93.68, - "learning_rate": 2.5908127208480565e-07, - "loss": 0.2743, - "step": 26980 - }, - { - "epoch": 93.71, - "learning_rate": 2.576678445229682e-07, - "loss": 0.2549, - "step": 26990 - }, - { - "epoch": 93.75, - "learning_rate": 2.562544169611307e-07, - "loss": 0.2564, - "step": 27000 - }, - { - "epoch": 93.78, - "learning_rate": 2.5484098939929325e-07, - "loss": 0.2593, - "step": 27010 - }, - { - "epoch": 93.82, - "learning_rate": 2.534275618374558e-07, - "loss": 0.2585, - "step": 27020 - }, - { - "epoch": 93.85, - "learning_rate": 2.5201413427561833e-07, - "loss": 0.2472, - "step": 27030 - }, - { - "epoch": 93.89, - "learning_rate": 2.506007067137809e-07, - "loss": 0.2225, - "step": 27040 - }, - { - "epoch": 93.92, - "learning_rate": 2.4918727915194347e-07, - "loss": 0.2766, - "step": 27050 - }, - { - "epoch": 93.96, - "learning_rate": 2.47773851590106e-07, - "loss": 0.2493, - "step": 27060 - }, - { - "epoch": 93.99, - "learning_rate": 2.4636042402826855e-07, - "loss": 0.249, - "step": 27070 - }, - { - "epoch": 94.0, - "eval_loss": 0.509568452835083, - "eval_runtime": 135.0584, - "eval_samples_per_second": 3.939, - "eval_steps_per_second": 0.985, - "eval_wer": 0.19605322362923444, - "step": 27072 - }, - { - "epoch": 94.03, - "learning_rate": 2.4494699646643107e-07, - "loss": 0.2773, - "step": 27080 - }, - { - "epoch": 94.06, - "learning_rate": 2.4353356890459364e-07, - "loss": 0.2497, - "step": 27090 - }, - { - "epoch": 94.1, - "learning_rate": 2.421201413427562e-07, - "loss": 0.2476, - "step": 27100 - }, - { - "epoch": 94.13, - "learning_rate": 2.407067137809187e-07, - "loss": 0.268, - "step": 27110 - }, - { - "epoch": 94.17, - "learning_rate": 2.392932862190813e-07, - "loss": 0.2523, - "step": 27120 - }, - { - "epoch": 94.2, - "learning_rate": 2.378798586572438e-07, - "loss": 0.2356, - "step": 27130 - }, - { - "epoch": 94.24, - "learning_rate": 2.3646643109540635e-07, - "loss": 0.2633, - "step": 27140 - }, - { - "epoch": 94.27, - "learning_rate": 2.350530035335689e-07, - "loss": 0.2345, - "step": 27150 - }, - { - "epoch": 94.3, - "learning_rate": 2.3363957597173146e-07, - "loss": 0.2828, - "step": 27160 - }, - { - "epoch": 94.34, - "learning_rate": 2.32226148409894e-07, - "loss": 0.259, - "step": 27170 - }, - { - "epoch": 94.37, - "learning_rate": 2.3081272084805654e-07, - "loss": 0.2528, - "step": 27180 - }, - { - "epoch": 94.41, - "learning_rate": 2.2939929328621908e-07, - "loss": 0.2359, - "step": 27190 - }, - { - "epoch": 94.44, - "learning_rate": 2.279858657243816e-07, - "loss": 0.2267, - "step": 27200 - }, - { - "epoch": 94.48, - "learning_rate": 2.2657243816254414e-07, - "loss": 0.2596, - "step": 27210 - }, - { - "epoch": 94.51, - "learning_rate": 2.251590106007067e-07, - "loss": 0.259, - "step": 27220 - }, - { - "epoch": 94.55, - "learning_rate": 2.2374558303886925e-07, - "loss": 0.2455, - "step": 27230 - }, - { - "epoch": 94.58, - "learning_rate": 2.223321554770318e-07, - "loss": 0.268, - "step": 27240 - }, - { - "epoch": 94.62, - "learning_rate": 2.2091872791519433e-07, - "loss": 0.2472, - "step": 27250 - }, - { - "epoch": 94.65, - "learning_rate": 2.1950530035335688e-07, - "loss": 0.2573, - "step": 27260 - }, - { - "epoch": 94.69, - "learning_rate": 2.1809187279151942e-07, - "loss": 0.2845, - "step": 27270 - }, - { - "epoch": 94.72, - "learning_rate": 2.1667844522968196e-07, - "loss": 0.2401, - "step": 27280 - }, - { - "epoch": 94.75, - "learning_rate": 2.1526501766784453e-07, - "loss": 0.2497, - "step": 27290 - }, - { - "epoch": 94.79, - "learning_rate": 2.1385159010600707e-07, - "loss": 0.2693, - "step": 27300 - }, - { - "epoch": 94.82, - "learning_rate": 2.124381625441696e-07, - "loss": 0.2634, - "step": 27310 - }, - { - "epoch": 94.86, - "learning_rate": 2.1102473498233215e-07, - "loss": 0.2539, - "step": 27320 - }, - { - "epoch": 94.89, - "learning_rate": 2.0961130742049467e-07, - "loss": 0.2747, - "step": 27330 - }, - { - "epoch": 94.93, - "learning_rate": 2.081978798586572e-07, - "loss": 0.2487, - "step": 27340 - }, - { - "epoch": 94.96, - "learning_rate": 2.0678445229681978e-07, - "loss": 0.2491, - "step": 27350 - }, - { - "epoch": 95.0, - "learning_rate": 2.0537102473498232e-07, - "loss": 0.266, - "step": 27360 - }, - { - "epoch": 95.0, - "eval_loss": 0.5116358399391174, - "eval_runtime": 134.7906, - "eval_samples_per_second": 3.947, - "eval_steps_per_second": 0.987, - "eval_wer": 0.19637462235649547, - "step": 27360 - }, - { - "epoch": 95.03, - "learning_rate": 2.0395759717314486e-07, - "loss": 0.2359, - "step": 27370 - }, - { - "epoch": 95.07, - "learning_rate": 2.025441696113074e-07, - "loss": 0.2421, - "step": 27380 - }, - { - "epoch": 95.1, - "learning_rate": 2.0113074204946995e-07, - "loss": 0.2358, - "step": 27390 - }, - { - "epoch": 95.14, - "learning_rate": 1.997173144876325e-07, - "loss": 0.2741, - "step": 27400 - }, - { - "epoch": 95.17, - "learning_rate": 1.9830388692579506e-07, - "loss": 0.2423, - "step": 27410 - }, - { - "epoch": 95.21, - "learning_rate": 1.968904593639576e-07, - "loss": 0.2617, - "step": 27420 - }, - { - "epoch": 95.24, - "learning_rate": 1.9547703180212014e-07, - "loss": 0.2387, - "step": 27430 - }, - { - "epoch": 95.28, - "learning_rate": 1.9406360424028268e-07, - "loss": 0.2223, - "step": 27440 - }, - { - "epoch": 95.31, - "learning_rate": 1.9265017667844522e-07, - "loss": 0.2613, - "step": 27450 - }, - { - "epoch": 95.35, - "learning_rate": 1.9123674911660777e-07, - "loss": 0.2723, - "step": 27460 - }, - { - "epoch": 95.38, - "learning_rate": 1.898233215547703e-07, - "loss": 0.2495, - "step": 27470 - }, - { - "epoch": 95.42, - "learning_rate": 1.8840989399293285e-07, - "loss": 0.2446, - "step": 27480 - }, - { - "epoch": 95.45, - "learning_rate": 1.869964664310954e-07, - "loss": 0.2454, - "step": 27490 - }, - { - "epoch": 95.48, - "learning_rate": 1.8558303886925793e-07, - "loss": 0.2713, - "step": 27500 - }, - { - "epoch": 95.52, - "learning_rate": 1.8416961130742048e-07, - "loss": 0.2616, - "step": 27510 - }, - { - "epoch": 95.55, - "learning_rate": 1.8275618374558302e-07, - "loss": 0.2538, - "step": 27520 - }, - { - "epoch": 95.59, - "learning_rate": 1.8134275618374559e-07, - "loss": 0.2452, - "step": 27530 - }, - { - "epoch": 95.62, - "learning_rate": 1.7992932862190813e-07, - "loss": 0.2413, - "step": 27540 - }, - { - "epoch": 95.66, - "learning_rate": 1.7851590106007067e-07, - "loss": 0.2753, - "step": 27550 - }, - { - "epoch": 95.69, - "learning_rate": 1.771024734982332e-07, - "loss": 0.2428, - "step": 27560 - }, - { - "epoch": 95.73, - "learning_rate": 1.7568904593639575e-07, - "loss": 0.2359, - "step": 27570 - }, - { - "epoch": 95.76, - "learning_rate": 1.742756183745583e-07, - "loss": 0.2472, - "step": 27580 - }, - { - "epoch": 95.8, - "learning_rate": 1.7286219081272086e-07, - "loss": 0.2241, - "step": 27590 - }, - { - "epoch": 95.83, - "learning_rate": 1.714487632508834e-07, - "loss": 0.2494, - "step": 27600 - }, - { - "epoch": 95.87, - "learning_rate": 1.7003533568904592e-07, - "loss": 0.2686, - "step": 27610 - }, - { - "epoch": 95.9, - "learning_rate": 1.6862190812720846e-07, - "loss": 0.2426, - "step": 27620 - }, - { - "epoch": 95.94, - "learning_rate": 1.67208480565371e-07, - "loss": 0.2698, - "step": 27630 - }, - { - "epoch": 95.97, - "learning_rate": 1.6579505300353355e-07, - "loss": 0.2683, - "step": 27640 - }, - { - "epoch": 96.0, - "eval_loss": 0.5132885575294495, - "eval_runtime": 135.195, - "eval_samples_per_second": 3.935, - "eval_steps_per_second": 0.984, - "eval_wer": 0.1966960210837565, - "step": 27648 - }, - { - "epoch": 96.01, - "learning_rate": 1.643816254416961e-07, - "loss": 0.2756, - "step": 27650 - }, - { - "epoch": 96.04, - "learning_rate": 1.6296819787985866e-07, - "loss": 0.264, - "step": 27660 - }, - { - "epoch": 96.08, - "learning_rate": 1.615547703180212e-07, - "loss": 0.2275, - "step": 27670 - }, - { - "epoch": 96.11, - "learning_rate": 1.6014134275618374e-07, - "loss": 0.2498, - "step": 27680 - }, - { - "epoch": 96.15, - "learning_rate": 1.5872791519434628e-07, - "loss": 0.2453, - "step": 27690 - }, - { - "epoch": 96.18, - "learning_rate": 1.5731448763250883e-07, - "loss": 0.2527, - "step": 27700 - }, - { - "epoch": 96.21, - "learning_rate": 1.5590106007067137e-07, - "loss": 0.2548, - "step": 27710 - }, - { - "epoch": 96.25, - "learning_rate": 1.5448763250883394e-07, - "loss": 0.2589, - "step": 27720 - }, - { - "epoch": 96.28, - "learning_rate": 1.5307420494699648e-07, - "loss": 0.2361, - "step": 27730 - }, - { - "epoch": 96.32, - "learning_rate": 1.51660777385159e-07, - "loss": 0.2798, - "step": 27740 - }, - { - "epoch": 96.35, - "learning_rate": 1.5024734982332153e-07, - "loss": 0.2742, - "step": 27750 - }, - { - "epoch": 96.39, - "learning_rate": 1.4883392226148408e-07, - "loss": 0.2475, - "step": 27760 - }, - { - "epoch": 96.42, - "learning_rate": 1.4742049469964662e-07, - "loss": 0.237, - "step": 27770 - }, - { - "epoch": 96.46, - "learning_rate": 1.4600706713780919e-07, - "loss": 0.2548, - "step": 27780 - }, - { - "epoch": 96.49, - "learning_rate": 1.4459363957597173e-07, - "loss": 0.2458, - "step": 27790 - }, - { - "epoch": 96.53, - "learning_rate": 1.4318021201413427e-07, - "loss": 0.2448, - "step": 27800 - }, - { - "epoch": 96.56, - "learning_rate": 1.417667844522968e-07, - "loss": 0.2604, - "step": 27810 - }, - { - "epoch": 96.6, - "learning_rate": 1.4035335689045935e-07, - "loss": 0.252, - "step": 27820 - }, - { - "epoch": 96.63, - "learning_rate": 1.389399293286219e-07, - "loss": 0.2356, - "step": 27830 - }, - { - "epoch": 96.66, - "learning_rate": 1.3752650176678446e-07, - "loss": 0.2531, - "step": 27840 - }, - { - "epoch": 96.7, - "learning_rate": 1.36113074204947e-07, - "loss": 0.2657, - "step": 27850 - }, - { - "epoch": 96.73, - "learning_rate": 1.3469964664310955e-07, - "loss": 0.2601, - "step": 27860 - }, - { - "epoch": 96.77, - "learning_rate": 1.332862190812721e-07, - "loss": 0.2507, - "step": 27870 - }, - { - "epoch": 96.8, - "learning_rate": 1.318727915194346e-07, - "loss": 0.2657, - "step": 27880 - }, - { - "epoch": 96.84, - "learning_rate": 1.3045936395759715e-07, - "loss": 0.2588, - "step": 27890 - }, - { - "epoch": 96.87, - "learning_rate": 1.2904593639575972e-07, - "loss": 0.2474, - "step": 27900 - }, - { - "epoch": 96.91, - "learning_rate": 1.2763250883392226e-07, - "loss": 0.2616, - "step": 27910 - }, - { - "epoch": 96.94, - "learning_rate": 1.262190812720848e-07, - "loss": 0.2405, - "step": 27920 - }, - { - "epoch": 96.98, - "learning_rate": 1.2480565371024734e-07, - "loss": 0.2451, - "step": 27930 - }, - { - "epoch": 97.0, - "eval_loss": 0.5141022205352783, - "eval_runtime": 134.2101, - "eval_samples_per_second": 3.964, - "eval_steps_per_second": 0.991, - "eval_wer": 0.19650318184739987, - "step": 27936 - }, - { - "epoch": 97.01, - "learning_rate": 1.2339222614840988e-07, - "loss": 0.2512, - "step": 27940 - }, - { - "epoch": 97.05, - "learning_rate": 1.2197879858657243e-07, - "loss": 0.2491, - "step": 27950 - }, - { - "epoch": 97.08, - "learning_rate": 1.2056537102473497e-07, - "loss": 0.2663, - "step": 27960 - }, - { - "epoch": 97.12, - "learning_rate": 1.1915194346289752e-07, - "loss": 0.2532, - "step": 27970 - }, - { - "epoch": 97.15, - "learning_rate": 1.1773851590106006e-07, - "loss": 0.263, - "step": 27980 - }, - { - "epoch": 97.19, - "learning_rate": 1.163250883392226e-07, - "loss": 0.2544, - "step": 27990 - }, - { - "epoch": 97.22, - "learning_rate": 1.1491166077738515e-07, - "loss": 0.2543, - "step": 28000 - }, - { - "epoch": 97.26, - "learning_rate": 1.134982332155477e-07, - "loss": 0.2582, - "step": 28010 - }, - { - "epoch": 97.29, - "learning_rate": 1.1208480565371025e-07, - "loss": 0.2577, - "step": 28020 - }, - { - "epoch": 97.33, - "learning_rate": 1.1067137809187279e-07, - "loss": 0.2445, - "step": 28030 - }, - { - "epoch": 97.36, - "learning_rate": 1.0925795053003534e-07, - "loss": 0.2692, - "step": 28040 - }, - { - "epoch": 97.39, - "learning_rate": 1.0784452296819787e-07, - "loss": 0.2461, - "step": 28050 - }, - { - "epoch": 97.43, - "learning_rate": 1.0643109540636041e-07, - "loss": 0.2136, - "step": 28060 - }, - { - "epoch": 97.46, - "learning_rate": 1.0501766784452297e-07, - "loss": 0.2604, - "step": 28070 - }, - { - "epoch": 97.5, - "learning_rate": 1.0360424028268551e-07, - "loss": 0.2517, - "step": 28080 - }, - { - "epoch": 97.53, - "learning_rate": 1.0219081272084805e-07, - "loss": 0.247, - "step": 28090 - }, - { - "epoch": 97.57, - "learning_rate": 1.0077738515901061e-07, - "loss": 0.2481, - "step": 28100 - }, - { - "epoch": 97.6, - "learning_rate": 9.936395759717315e-08, - "loss": 0.2215, - "step": 28110 - }, - { - "epoch": 97.64, - "learning_rate": 9.795053003533568e-08, - "loss": 0.2549, - "step": 28120 - }, - { - "epoch": 97.67, - "learning_rate": 9.653710247349822e-08, - "loss": 0.2656, - "step": 28130 - }, - { - "epoch": 97.71, - "learning_rate": 9.512367491166077e-08, - "loss": 0.2415, - "step": 28140 - }, - { - "epoch": 97.74, - "learning_rate": 9.371024734982332e-08, - "loss": 0.2388, - "step": 28150 - }, - { - "epoch": 97.78, - "learning_rate": 9.229681978798586e-08, - "loss": 0.2437, - "step": 28160 - }, - { - "epoch": 97.81, - "learning_rate": 9.088339222614841e-08, - "loss": 0.2621, - "step": 28170 - }, - { - "epoch": 97.85, - "learning_rate": 8.946996466431094e-08, - "loss": 0.2629, - "step": 28180 - }, - { - "epoch": 97.88, - "learning_rate": 8.805653710247348e-08, - "loss": 0.2346, - "step": 28190 - }, - { - "epoch": 97.91, - "learning_rate": 8.664310954063604e-08, - "loss": 0.2638, - "step": 28200 - }, - { - "epoch": 97.95, - "learning_rate": 8.522968197879858e-08, - "loss": 0.2465, - "step": 28210 - }, - { - "epoch": 97.98, - "learning_rate": 8.381625441696112e-08, - "loss": 0.2723, - "step": 28220 - }, - { - "epoch": 98.0, - "eval_loss": 0.5122572779655457, - "eval_runtime": 135.6766, - "eval_samples_per_second": 3.921, - "eval_steps_per_second": 0.98, - "eval_wer": 0.19624606286559104, - "step": 28224 - }, - { - "epoch": 98.02, - "learning_rate": 8.240282685512368e-08, - "loss": 0.2508, - "step": 28230 - }, - { - "epoch": 98.06, - "learning_rate": 8.098939929328622e-08, - "loss": 0.2573, - "step": 28240 - }, - { - "epoch": 98.09, - "learning_rate": 7.957597173144875e-08, - "loss": 0.2363, - "step": 28250 - }, - { - "epoch": 98.12, - "learning_rate": 7.81625441696113e-08, - "loss": 0.2677, - "step": 28260 - }, - { - "epoch": 98.16, - "learning_rate": 7.674911660777385e-08, - "loss": 0.2611, - "step": 28270 - }, - { - "epoch": 98.19, - "learning_rate": 7.533568904593639e-08, - "loss": 0.2331, - "step": 28280 - }, - { - "epoch": 98.23, - "learning_rate": 7.392226148409894e-08, - "loss": 0.2688, - "step": 28290 - }, - { - "epoch": 98.26, - "learning_rate": 7.250883392226148e-08, - "loss": 0.2321, - "step": 28300 - }, - { - "epoch": 98.3, - "learning_rate": 7.109540636042403e-08, - "loss": 0.278, - "step": 28310 - }, - { - "epoch": 98.33, - "learning_rate": 6.968197879858657e-08, - "loss": 0.2502, - "step": 28320 - }, - { - "epoch": 98.37, - "learning_rate": 6.826855123674911e-08, - "loss": 0.2497, - "step": 28330 - }, - { - "epoch": 98.4, - "learning_rate": 6.685512367491165e-08, - "loss": 0.2593, - "step": 28340 - }, - { - "epoch": 98.44, - "learning_rate": 6.544169611307421e-08, - "loss": 0.25, - "step": 28350 - }, - { - "epoch": 98.47, - "learning_rate": 6.402826855123675e-08, - "loss": 0.2518, - "step": 28360 - }, - { - "epoch": 98.51, - "learning_rate": 6.261484098939929e-08, - "loss": 0.2586, - "step": 28370 - }, - { - "epoch": 98.54, - "learning_rate": 6.120141342756183e-08, - "loss": 0.2632, - "step": 28380 - }, - { - "epoch": 98.57, - "learning_rate": 5.978798586572437e-08, - "loss": 0.2588, - "step": 28390 - }, - { - "epoch": 98.61, - "learning_rate": 5.837455830388692e-08, - "loss": 0.2575, - "step": 28400 - }, - { - "epoch": 98.64, - "learning_rate": 5.6961130742049465e-08, - "loss": 0.2669, - "step": 28410 - }, - { - "epoch": 98.68, - "learning_rate": 5.5547703180212014e-08, - "loss": 0.2753, - "step": 28420 - }, - { - "epoch": 98.71, - "learning_rate": 5.4134275618374555e-08, - "loss": 0.2383, - "step": 28430 - }, - { - "epoch": 98.75, - "learning_rate": 5.27208480565371e-08, - "loss": 0.2534, - "step": 28440 - }, - { - "epoch": 98.78, - "learning_rate": 5.1307420494699646e-08, - "loss": 0.2444, - "step": 28450 - }, - { - "epoch": 98.82, - "learning_rate": 4.989399293286219e-08, - "loss": 0.2627, - "step": 28460 - }, - { - "epoch": 98.85, - "learning_rate": 4.848056537102473e-08, - "loss": 0.2374, - "step": 28470 - }, - { - "epoch": 98.89, - "learning_rate": 4.706713780918728e-08, - "loss": 0.2649, - "step": 28480 - }, - { - "epoch": 98.92, - "learning_rate": 4.565371024734982e-08, - "loss": 0.2567, - "step": 28490 - }, - { - "epoch": 98.96, - "learning_rate": 4.424028268551237e-08, - "loss": 0.251, - "step": 28500 - }, - { - "epoch": 98.99, - "learning_rate": 4.282685512367491e-08, - "loss": 0.2527, - "step": 28510 - }, - { - "epoch": 99.0, - "eval_loss": 0.5119685530662537, - "eval_runtime": 134.8373, - "eval_samples_per_second": 3.945, - "eval_steps_per_second": 0.986, - "eval_wer": 0.1965674615928521, - "step": 28512 - }, - { - "epoch": 99.03, - "learning_rate": 4.141342756183745e-08, - "loss": 0.2849, - "step": 28520 - }, - { - "epoch": 99.06, - "learning_rate": 4e-08, - "loss": 0.2756, - "step": 28530 - }, - { - "epoch": 99.1, - "learning_rate": 3.858657243816254e-08, - "loss": 0.2378, - "step": 28540 - }, - { - "epoch": 99.13, - "learning_rate": 3.7173144876325085e-08, - "loss": 0.2709, - "step": 28550 - }, - { - "epoch": 99.17, - "learning_rate": 3.575971731448763e-08, - "loss": 0.2569, - "step": 28560 - }, - { - "epoch": 99.2, - "learning_rate": 3.4346289752650175e-08, - "loss": 0.2597, - "step": 28570 - }, - { - "epoch": 99.24, - "learning_rate": 3.293286219081272e-08, - "loss": 0.2418, - "step": 28580 - }, - { - "epoch": 99.27, - "learning_rate": 3.1519434628975265e-08, - "loss": 0.239, - "step": 28590 - }, - { - "epoch": 99.3, - "learning_rate": 3.010600706713781e-08, - "loss": 0.2535, - "step": 28600 - }, - { - "epoch": 99.34, - "learning_rate": 2.8692579505300353e-08, - "loss": 0.2642, - "step": 28610 - }, - { - "epoch": 99.37, - "learning_rate": 2.7279151943462894e-08, - "loss": 0.2302, - "step": 28620 - }, - { - "epoch": 99.41, - "learning_rate": 2.5865724381625443e-08, - "loss": 0.2619, - "step": 28630 - }, - { - "epoch": 99.44, - "learning_rate": 2.4452296819787985e-08, - "loss": 0.232, - "step": 28640 - }, - { - "epoch": 99.48, - "learning_rate": 2.3038869257950527e-08, - "loss": 0.2763, - "step": 28650 - }, - { - "epoch": 99.51, - "learning_rate": 2.1625441696113075e-08, - "loss": 0.2569, - "step": 28660 - }, - { - "epoch": 99.55, - "learning_rate": 2.0212014134275617e-08, - "loss": 0.2466, - "step": 28670 - }, - { - "epoch": 99.58, - "learning_rate": 1.8798586572438162e-08, - "loss": 0.2511, - "step": 28680 - }, - { - "epoch": 99.62, - "learning_rate": 1.7385159010600704e-08, - "loss": 0.2401, - "step": 28690 - }, - { - "epoch": 99.65, - "learning_rate": 1.597173144876325e-08, - "loss": 0.2573, - "step": 28700 - }, - { - "epoch": 99.69, - "learning_rate": 1.4558303886925795e-08, - "loss": 0.2663, - "step": 28710 - }, - { - "epoch": 99.72, - "learning_rate": 1.314487632508834e-08, - "loss": 0.2237, - "step": 28720 - }, - { - "epoch": 99.75, - "learning_rate": 1.1731448763250882e-08, - "loss": 0.2567, - "step": 28730 - }, - { - "epoch": 99.79, - "learning_rate": 1.0318021201413427e-08, - "loss": 0.2448, - "step": 28740 - }, - { - "epoch": 99.82, - "learning_rate": 8.90459363957597e-09, - "loss": 0.2673, - "step": 28750 - }, - { - "epoch": 99.86, - "learning_rate": 7.491166077738516e-09, - "loss": 0.2539, - "step": 28760 - }, - { - "epoch": 99.89, - "learning_rate": 6.077738515901059e-09, - "loss": 0.2329, - "step": 28770 - }, - { - "epoch": 99.93, - "learning_rate": 4.6643109540636045e-09, - "loss": 0.24, - "step": 28780 - }, - { - "epoch": 99.96, - "learning_rate": 3.250883392226148e-09, - "loss": 0.2402, - "step": 28790 - }, - { - "epoch": 100.0, - "learning_rate": 1.8374558303886924e-09, - "loss": 0.2604, - "step": 28800 - }, - { - "epoch": 100.0, - "eval_loss": 0.5110756158828735, - "eval_runtime": 135.2128, - "eval_samples_per_second": 3.935, - "eval_steps_per_second": 0.984, - "eval_wer": 0.19605322362923444, - "step": 28800 - }, { "epoch": 100.0, - "step": 28800, - "total_flos": 2.718335465990856e+20, - "train_loss": 0.26551002427107756, - "train_runtime": 210411.5326, - "train_samples_per_second": 2.194, - "train_steps_per_second": 0.137 + "step": 7200, + "total_flos": 2.7202925310621965e+20, + "train_loss": 0.44683600352870095, + "train_runtime": 190307.0487, + "train_samples_per_second": 2.426, + "train_steps_per_second": 0.038 } ], - "max_steps": 28800, + "max_steps": 7200, "num_train_epochs": 100, - "total_flos": 2.718335465990856e+20, + "total_flos": 2.7202925310621965e+20, "trial_name": null, "trial_params": null }