diff --git "a/trainer_state.json" "b/trainer_state.json" --- "a/trainer_state.json" +++ "b/trainer_state.json" @@ -1,5245 +1,18205 @@ { - "best_metric": 0.47944945096969604, - "best_model_checkpoint": "ai-light-dance_singing3_ft_wav2vec2-large-xlsr-53-v1-5gram/checkpoint-1512", - "epoch": 99.99653979238754, - "global_step": 7200, + "best_metric": 0.4693412184715271, + "best_model_checkpoint": "ai-light-dance_singing3_ft_wav2vec2-large-xlsr-53-v1-5gram/checkpoint-288", + "epoch": 99.9974025974026, + "global_step": 28800, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { - "epoch": 0.14, - "learning_rate": 5.000000000000001e-07, - "loss": 0.3086, + "epoch": 0.03, + "learning_rate": 8e-08, + "loss": 0.3037, "step": 10 }, { - "epoch": 0.28, - "learning_rate": 1.0000000000000002e-06, - "loss": 0.3275, + "epoch": 0.07, + "learning_rate": 1.6e-07, + "loss": 0.3044, "step": 20 }, { - "epoch": 0.42, - "learning_rate": 1.5e-06, - "loss": 0.3051, + "epoch": 0.1, + "learning_rate": 2.32e-07, + "loss": 0.2922, "step": 30 }, { - "epoch": 0.55, - "learning_rate": 2.0000000000000003e-06, - "loss": 0.3072, + "epoch": 0.14, + "learning_rate": 3.12e-07, + "loss": 0.3287, "step": 40 }, { - "epoch": 0.69, - "learning_rate": 2.5e-06, - "loss": 0.2957, + "epoch": 0.17, + "learning_rate": 3.92e-07, + "loss": 0.3189, "step": 50 }, { - "epoch": 0.83, - "learning_rate": 3e-06, - "loss": 0.2856, + "epoch": 0.21, + "learning_rate": 4.64e-07, + "loss": 0.2791, "step": 60 }, { - "epoch": 0.97, - "learning_rate": 3.5000000000000004e-06, - "loss": 0.314, + "epoch": 0.24, + "learning_rate": 5.44e-07, + "loss": 0.2892, "step": 70 }, { - "epoch": 1.0, - "eval_loss": 0.4815235435962677, - "eval_runtime": 130.4571, - "eval_samples_per_second": 4.078, - "eval_steps_per_second": 0.514, - "eval_wer": 0.20768785755608407, - "step": 72 - }, - { - "epoch": 1.11, - "learning_rate": 4.000000000000001e-06, - "loss": 0.2981, + "epoch": 0.28, + "learning_rate": 6.24e-07, + "loss": 0.3011, "step": 80 }, { - "epoch": 1.25, - "learning_rate": 4.5e-06, - "loss": 0.2972, + "epoch": 0.31, + "learning_rate": 7.04e-07, + "loss": 0.3154, "step": 90 }, { - "epoch": 1.39, - "learning_rate": 5e-06, - "loss": 0.2892, + "epoch": 0.35, + "learning_rate": 7.84e-07, + "loss": 0.3242, "step": 100 }, { - "epoch": 1.53, - "learning_rate": 5.500000000000001e-06, - "loss": 0.3014, + "epoch": 0.38, + "learning_rate": 8.639999999999999e-07, + "loss": 0.2931, "step": 110 }, { - "epoch": 1.66, - "learning_rate": 6e-06, - "loss": 0.3013, + "epoch": 0.42, + "learning_rate": 9.439999999999999e-07, + "loss": 0.2822, "step": 120 }, { - "epoch": 1.8, - "learning_rate": 6.5000000000000004e-06, - "loss": 0.315, + "epoch": 0.45, + "learning_rate": 1.024e-06, + "loss": 0.3186, "step": 130 }, { - "epoch": 1.94, - "learning_rate": 7.000000000000001e-06, - "loss": 0.3064, + "epoch": 0.48, + "learning_rate": 1.1040000000000001e-06, + "loss": 0.3111, "step": 140 }, { - "epoch": 2.0, - "eval_loss": 0.5082846283912659, - "eval_runtime": 130.0863, - "eval_samples_per_second": 4.09, - "eval_steps_per_second": 0.515, - "eval_wer": 0.2101947676287202, - "step": 144 - }, - { - "epoch": 2.08, - "learning_rate": 7.5e-06, - "loss": 0.3067, + "epoch": 0.52, + "learning_rate": 1.1839999999999998e-06, + "loss": 0.2909, "step": 150 }, { - "epoch": 2.22, - "learning_rate": 7.95e-06, - "loss": 0.304, + "epoch": 0.55, + "learning_rate": 1.2639999999999999e-06, + "loss": 0.299, "step": 160 }, { - "epoch": 2.36, - "learning_rate": 8.45e-06, - "loss": 0.3065, + "epoch": 0.59, + "learning_rate": 1.344e-06, + "loss": 0.3338, "step": 170 }, { - "epoch": 2.5, - "learning_rate": 8.95e-06, - "loss": 0.3014, + "epoch": 0.62, + "learning_rate": 1.4239999999999998e-06, + "loss": 0.2607, "step": 180 }, { - "epoch": 2.64, - "learning_rate": 9.450000000000001e-06, - "loss": 0.2938, + "epoch": 0.66, + "learning_rate": 1.504e-06, + "loss": 0.2763, "step": 190 }, { - "epoch": 2.78, - "learning_rate": 9.950000000000001e-06, - "loss": 0.3086, + "epoch": 0.69, + "learning_rate": 1.584e-06, + "loss": 0.296, "step": 200 }, { - "epoch": 2.91, - "learning_rate": 1.045e-05, - "loss": 0.2951, + "epoch": 0.73, + "learning_rate": 1.6639999999999999e-06, + "loss": 0.2896, "step": 210 }, { - "epoch": 3.0, - "eval_loss": 0.5146709680557251, - "eval_runtime": 129.1484, - "eval_samples_per_second": 4.119, - "eval_steps_per_second": 0.519, - "eval_wer": 0.2158513852285145, - "step": 216 - }, - { - "epoch": 3.06, - "learning_rate": 1.095e-05, - "loss": 0.3079, + "epoch": 0.76, + "learning_rate": 1.744e-06, + "loss": 0.2852, "step": 220 }, { - "epoch": 3.19, - "learning_rate": 1.145e-05, - "loss": 0.2984, + "epoch": 0.8, + "learning_rate": 1.824e-06, + "loss": 0.2691, "step": 230 }, { - "epoch": 3.33, - "learning_rate": 1.195e-05, - "loss": 0.3067, + "epoch": 0.83, + "learning_rate": 1.904e-06, + "loss": 0.3116, "step": 240 }, { - "epoch": 3.47, - "learning_rate": 1.2450000000000001e-05, - "loss": 0.3033, + "epoch": 0.87, + "learning_rate": 1.976e-06, + "loss": 0.3348, "step": 250 }, { - "epoch": 3.61, - "learning_rate": 1.2950000000000001e-05, - "loss": 0.2912, + "epoch": 0.9, + "learning_rate": 2.056e-06, + "loss": 0.2831, "step": 260 }, { - "epoch": 3.75, - "learning_rate": 1.3450000000000002e-05, - "loss": 0.2915, + "epoch": 0.94, + "learning_rate": 2.136e-06, + "loss": 0.2814, "step": 270 }, { - "epoch": 3.89, - "learning_rate": 1.3950000000000002e-05, - "loss": 0.2835, + "epoch": 0.97, + "learning_rate": 2.216e-06, + "loss": 0.3028, "step": 280 }, { - "epoch": 4.0, - "eval_loss": 0.515735387802124, - "eval_runtime": 128.8527, - "eval_samples_per_second": 4.129, - "eval_steps_per_second": 0.52, - "eval_wer": 0.20910201195603265, + "epoch": 1.0, + "eval_loss": 0.4693412184715271, + "eval_runtime": 130.2494, + "eval_samples_per_second": 4.084, + "eval_steps_per_second": 1.021, + "eval_wer": 0.2046024297743781, "step": 288 }, { - "epoch": 4.03, - "learning_rate": 1.4449999999999999e-05, - "loss": 0.3069, + "epoch": 1.01, + "learning_rate": 2.2959999999999997e-06, + "loss": 0.3338, "step": 290 }, { - "epoch": 4.17, - "learning_rate": 1.4950000000000001e-05, - "loss": 0.2931, + "epoch": 1.04, + "learning_rate": 2.3759999999999998e-06, + "loss": 0.2803, "step": 300 }, { - "epoch": 4.3, - "learning_rate": 1.545e-05, - "loss": 0.2916, + "epoch": 1.08, + "learning_rate": 2.456e-06, + "loss": 0.2859, "step": 310 }, { - "epoch": 4.44, - "learning_rate": 1.595e-05, - "loss": 0.304, + "epoch": 1.11, + "learning_rate": 2.536e-06, + "loss": 0.282, "step": 320 }, { - "epoch": 4.58, - "learning_rate": 1.645e-05, - "loss": 0.301, + "epoch": 1.15, + "learning_rate": 2.616e-06, + "loss": 0.2971, "step": 330 }, { - "epoch": 4.72, - "learning_rate": 1.6950000000000002e-05, - "loss": 0.3098, + "epoch": 1.18, + "learning_rate": 2.696e-06, + "loss": 0.2832, "step": 340 }, { - "epoch": 4.86, - "learning_rate": 1.745e-05, - "loss": 0.2935, + "epoch": 1.21, + "learning_rate": 2.7759999999999998e-06, + "loss": 0.2776, "step": 350 }, { - "epoch": 5.0, - "learning_rate": 1.795e-05, - "loss": 0.3011, - "step": 360 - }, - { - "epoch": 5.0, - "eval_loss": 0.495644748210907, - "eval_runtime": 129.107, - "eval_samples_per_second": 4.121, - "eval_steps_per_second": 0.519, - "eval_wer": 0.215080028283088, + "epoch": 1.25, + "learning_rate": 2.856e-06, + "loss": 0.2812, "step": 360 }, { - "epoch": 5.14, - "learning_rate": 1.845e-05, - "loss": 0.302, + "epoch": 1.28, + "learning_rate": 2.936e-06, + "loss": 0.2765, "step": 370 }, { - "epoch": 5.28, - "learning_rate": 1.895e-05, - "loss": 0.3081, + "epoch": 1.32, + "learning_rate": 3.016e-06, + "loss": 0.2905, "step": 380 }, { - "epoch": 5.42, - "learning_rate": 1.9450000000000002e-05, - "loss": 0.3041, + "epoch": 1.35, + "learning_rate": 3.096e-06, + "loss": 0.2992, "step": 390 }, { - "epoch": 5.55, - "learning_rate": 1.995e-05, - "loss": 0.3061, + "epoch": 1.39, + "learning_rate": 3.176e-06, + "loss": 0.2972, "step": 400 }, { - "epoch": 5.69, - "learning_rate": 2.045e-05, - "loss": 0.3081, + "epoch": 1.42, + "learning_rate": 3.256e-06, + "loss": 0.2884, "step": 410 }, { - "epoch": 5.83, - "learning_rate": 2.09e-05, - "loss": 0.2989, + "epoch": 1.46, + "learning_rate": 3.336e-06, + "loss": 0.2667, "step": 420 }, { - "epoch": 5.97, - "learning_rate": 2.1400000000000002e-05, - "loss": 0.3097, + "epoch": 1.49, + "learning_rate": 3.4159999999999996e-06, + "loss": 0.3059, "step": 430 }, { - "epoch": 6.0, - "eval_loss": 0.5190498232841492, - "eval_runtime": 129.2076, - "eval_samples_per_second": 4.117, - "eval_steps_per_second": 0.519, - "eval_wer": 0.21533714726489683, - "step": 432 - }, - { - "epoch": 6.11, - "learning_rate": 2.19e-05, - "loss": 0.3235, + "epoch": 1.53, + "learning_rate": 3.4959999999999996e-06, + "loss": 0.2853, "step": 440 }, { - "epoch": 6.25, - "learning_rate": 2.2400000000000002e-05, - "loss": 0.3015, + "epoch": 1.56, + "learning_rate": 3.5759999999999997e-06, + "loss": 0.2775, "step": 450 }, { - "epoch": 6.39, - "learning_rate": 2.29e-05, - "loss": 0.2979, + "epoch": 1.6, + "learning_rate": 3.656e-06, + "loss": 0.2873, "step": 460 }, { - "epoch": 6.53, - "learning_rate": 2.3400000000000003e-05, - "loss": 0.3303, + "epoch": 1.63, + "learning_rate": 3.736e-06, + "loss": 0.2874, "step": 470 }, { - "epoch": 6.66, - "learning_rate": 2.39e-05, - "loss": 0.318, + "epoch": 1.66, + "learning_rate": 3.8159999999999995e-06, + "loss": 0.2988, "step": 480 }, { - "epoch": 6.8, - "learning_rate": 2.44e-05, - "loss": 0.3111, + "epoch": 1.7, + "learning_rate": 3.896e-06, + "loss": 0.2957, "step": 490 }, { - "epoch": 6.94, - "learning_rate": 2.4900000000000002e-05, - "loss": 0.2998, + "epoch": 1.73, + "learning_rate": 3.976e-06, + "loss": 0.3037, "step": 500 }, { - "epoch": 7.0, - "eval_loss": 0.5349323153495789, - "eval_runtime": 129.2108, - "eval_samples_per_second": 4.117, - "eval_steps_per_second": 0.519, - "eval_wer": 0.22015812817381245, - "step": 504 - }, - { - "epoch": 7.08, - "learning_rate": 2.4970149253731346e-05, - "loss": 0.3216, + "epoch": 1.77, + "learning_rate": 3.999010600706714e-06, + "loss": 0.2873, "step": 510 }, { - "epoch": 7.22, - "learning_rate": 2.493283582089552e-05, - "loss": 0.3147, + "epoch": 1.8, + "learning_rate": 3.997597173144876e-06, + "loss": 0.2904, "step": 520 }, { - "epoch": 7.36, - "learning_rate": 2.4895522388059704e-05, - "loss": 0.3128, + "epoch": 1.84, + "learning_rate": 3.996183745583039e-06, + "loss": 0.3108, "step": 530 }, { - "epoch": 7.5, - "learning_rate": 2.4858208955223883e-05, - "loss": 0.3079, + "epoch": 1.87, + "learning_rate": 3.994770318021201e-06, + "loss": 0.3071, "step": 540 }, { - "epoch": 7.64, - "learning_rate": 2.482089552238806e-05, - "loss": 0.2967, + "epoch": 1.91, + "learning_rate": 3.993356890459364e-06, + "loss": 0.2944, "step": 550 }, { - "epoch": 7.78, - "learning_rate": 2.478358208955224e-05, - "loss": 0.3098, + "epoch": 1.94, + "learning_rate": 3.9919434628975264e-06, + "loss": 0.2848, "step": 560 }, { - "epoch": 7.91, - "learning_rate": 2.474626865671642e-05, - "loss": 0.3086, + "epoch": 1.98, + "learning_rate": 3.990530035335689e-06, + "loss": 0.2986, "step": 570 }, { - "epoch": 8.0, - "eval_loss": 0.5055466890335083, - "eval_runtime": 128.9787, - "eval_samples_per_second": 4.125, - "eval_steps_per_second": 0.519, - "eval_wer": 0.21450151057401812, + "epoch": 2.0, + "eval_loss": 0.48284950852394104, + "eval_runtime": 130.0663, + "eval_samples_per_second": 4.09, + "eval_steps_per_second": 1.023, + "eval_wer": 0.20575946519251784, "step": 576 }, { - "epoch": 8.06, - "learning_rate": 2.4708955223880597e-05, - "loss": 0.3243, + "epoch": 2.01, + "learning_rate": 3.989116607773851e-06, + "loss": 0.3048, "step": 580 }, { - "epoch": 8.19, - "learning_rate": 2.467164179104478e-05, - "loss": 0.3088, + "epoch": 2.05, + "learning_rate": 3.987703180212014e-06, + "loss": 0.2977, "step": 590 }, { - "epoch": 8.33, - "learning_rate": 2.4634328358208955e-05, - "loss": 0.3071, + "epoch": 2.08, + "learning_rate": 3.986289752650176e-06, + "loss": 0.2796, "step": 600 }, { - "epoch": 8.47, - "learning_rate": 2.4597014925373134e-05, - "loss": 0.3094, + "epoch": 2.12, + "learning_rate": 3.984876325088339e-06, + "loss": 0.2934, "step": 610 }, { - "epoch": 8.61, - "learning_rate": 2.4559701492537317e-05, - "loss": 0.3049, + "epoch": 2.15, + "learning_rate": 3.983462897526502e-06, + "loss": 0.3091, "step": 620 }, { - "epoch": 8.75, - "learning_rate": 2.4522388059701492e-05, - "loss": 0.3061, + "epoch": 2.19, + "learning_rate": 3.982049469964665e-06, + "loss": 0.2864, "step": 630 }, { - "epoch": 8.89, - "learning_rate": 2.448507462686567e-05, - "loss": 0.2964, + "epoch": 2.22, + "learning_rate": 3.9806360424028266e-06, + "loss": 0.2948, "step": 640 }, { - "epoch": 9.0, - "eval_loss": 0.5091516971588135, - "eval_runtime": 129.4051, - "eval_samples_per_second": 4.111, - "eval_steps_per_second": 0.518, - "eval_wer": 0.2183582953011506, - "step": 648 - }, - { - "epoch": 9.03, - "learning_rate": 2.4447761194029854e-05, - "loss": 0.3212, + "epoch": 2.26, + "learning_rate": 3.979222614840989e-06, + "loss": 0.3012, "step": 650 }, { - "epoch": 9.17, - "learning_rate": 2.441044776119403e-05, - "loss": 0.302, + "epoch": 2.29, + "learning_rate": 3.977809187279151e-06, + "loss": 0.2824, "step": 660 }, { - "epoch": 9.3, - "learning_rate": 2.437313432835821e-05, - "loss": 0.3103, + "epoch": 2.33, + "learning_rate": 3.976395759717314e-06, + "loss": 0.3008, "step": 670 }, { - "epoch": 9.44, - "learning_rate": 2.433582089552239e-05, - "loss": 0.3102, + "epoch": 2.36, + "learning_rate": 3.974982332155477e-06, + "loss": 0.3, "step": 680 }, { - "epoch": 9.58, - "learning_rate": 2.4298507462686567e-05, - "loss": 0.3045, + "epoch": 2.39, + "learning_rate": 3.97356890459364e-06, + "loss": 0.2641, "step": 690 }, { - "epoch": 9.72, - "learning_rate": 2.4261194029850746e-05, - "loss": 0.3162, + "epoch": 2.43, + "learning_rate": 3.972155477031802e-06, + "loss": 0.2677, "step": 700 }, { - "epoch": 9.86, - "learning_rate": 2.4223880597014926e-05, - "loss": 0.3186, + "epoch": 2.46, + "learning_rate": 3.970742049469965e-06, + "loss": 0.2851, "step": 710 }, { - "epoch": 10.0, - "learning_rate": 2.4186567164179105e-05, - "loss": 0.3288, - "step": 720 - }, - { - "epoch": 10.0, - "eval_loss": 0.5076370239257812, - "eval_runtime": 129.7675, - "eval_samples_per_second": 4.1, - "eval_steps_per_second": 0.516, - "eval_wer": 0.2190653725011249, + "epoch": 2.5, + "learning_rate": 3.969328621908127e-06, + "loss": 0.2923, "step": 720 }, { - "epoch": 10.14, - "learning_rate": 2.4149253731343284e-05, - "loss": 0.3037, + "epoch": 2.53, + "learning_rate": 3.9679151943462895e-06, + "loss": 0.2957, "step": 730 }, { - "epoch": 10.28, - "learning_rate": 2.4111940298507463e-05, - "loss": 0.3256, + "epoch": 2.57, + "learning_rate": 3.966501766784452e-06, + "loss": 0.2915, "step": 740 }, { - "epoch": 10.42, - "learning_rate": 2.4074626865671642e-05, - "loss": 0.3209, + "epoch": 2.6, + "learning_rate": 3.965088339222615e-06, + "loss": 0.2786, "step": 750 }, { - "epoch": 10.55, - "learning_rate": 2.403731343283582e-05, - "loss": 0.3259, + "epoch": 2.64, + "learning_rate": 3.963674911660777e-06, + "loss": 0.3032, "step": 760 }, { - "epoch": 10.69, - "learning_rate": 2.4e-05, - "loss": 0.3081, + "epoch": 2.67, + "learning_rate": 3.96226148409894e-06, + "loss": 0.3004, "step": 770 }, { - "epoch": 10.83, - "learning_rate": 2.396268656716418e-05, - "loss": 0.3153, + "epoch": 2.71, + "learning_rate": 3.960848056537102e-06, + "loss": 0.2904, "step": 780 }, { - "epoch": 10.97, - "learning_rate": 2.392537313432836e-05, - "loss": 0.3019, + "epoch": 2.74, + "learning_rate": 3.959434628975265e-06, + "loss": 0.2702, "step": 790 }, { - "epoch": 11.0, - "eval_loss": 0.5125810503959656, - "eval_runtime": 128.8657, - "eval_samples_per_second": 4.128, - "eval_steps_per_second": 0.52, - "eval_wer": 0.20916629170148487, - "step": 792 - }, - { - "epoch": 11.11, - "learning_rate": 2.3888059701492538e-05, - "loss": 0.3151, + "epoch": 2.78, + "learning_rate": 3.958021201413428e-06, + "loss": 0.2831, "step": 800 }, { - "epoch": 11.25, - "learning_rate": 2.3850746268656717e-05, - "loss": 0.3154, + "epoch": 2.81, + "learning_rate": 3.95660777385159e-06, + "loss": 0.2874, "step": 810 }, { - "epoch": 11.39, - "learning_rate": 2.3813432835820896e-05, - "loss": 0.2949, + "epoch": 2.85, + "learning_rate": 3.9551943462897525e-06, + "loss": 0.2791, "step": 820 }, { - "epoch": 11.53, - "learning_rate": 2.3776119402985076e-05, - "loss": 0.3214, + "epoch": 2.88, + "learning_rate": 3.953780918727915e-06, + "loss": 0.2896, "step": 830 }, { - "epoch": 11.66, - "learning_rate": 2.3738805970149255e-05, - "loss": 0.2946, + "epoch": 2.91, + "learning_rate": 3.952367491166077e-06, + "loss": 0.2694, "step": 840 }, { - "epoch": 11.8, - "learning_rate": 2.3701492537313434e-05, - "loss": 0.3154, + "epoch": 2.95, + "learning_rate": 3.95095406360424e-06, + "loss": 0.277, "step": 850 }, { - "epoch": 11.94, - "learning_rate": 2.3664179104477613e-05, - "loss": 0.3047, + "epoch": 2.98, + "learning_rate": 3.949540636042403e-06, + "loss": 0.297, "step": 860 }, { - "epoch": 12.0, - "eval_loss": 0.5249019861221313, - "eval_runtime": 129.2154, - "eval_samples_per_second": 4.117, - "eval_steps_per_second": 0.519, - "eval_wer": 0.2117374815195732, + "epoch": 3.0, + "eval_loss": 0.5019953846931458, + "eval_runtime": 130.2566, + "eval_samples_per_second": 4.084, + "eval_steps_per_second": 1.021, + "eval_wer": 0.2038310728289516, "step": 864 }, { - "epoch": 12.08, - "learning_rate": 2.3626865671641792e-05, - "loss": 0.2959, + "epoch": 3.02, + "learning_rate": 3.948127208480565e-06, + "loss": 0.2977, "step": 870 }, { - "epoch": 12.22, - "learning_rate": 2.358955223880597e-05, - "loss": 0.295, + "epoch": 3.06, + "learning_rate": 3.946713780918728e-06, + "loss": 0.3039, "step": 880 }, { - "epoch": 12.36, - "learning_rate": 2.355223880597015e-05, - "loss": 0.3122, + "epoch": 3.09, + "learning_rate": 3.945300353356891e-06, + "loss": 0.2913, "step": 890 }, { - "epoch": 12.5, - "learning_rate": 2.351492537313433e-05, - "loss": 0.3028, + "epoch": 3.12, + "learning_rate": 3.943886925795053e-06, + "loss": 0.307, "step": 900 }, { - "epoch": 12.64, - "learning_rate": 2.347761194029851e-05, - "loss": 0.2777, + "epoch": 3.16, + "learning_rate": 3.9424734982332154e-06, + "loss": 0.3053, "step": 910 }, { - "epoch": 12.78, - "learning_rate": 2.3440298507462688e-05, - "loss": 0.3025, + "epoch": 3.19, + "learning_rate": 3.941060070671378e-06, + "loss": 0.2781, "step": 920 }, { - "epoch": 12.91, - "learning_rate": 2.3402985074626867e-05, - "loss": 0.2998, + "epoch": 3.23, + "learning_rate": 3.93964664310954e-06, + "loss": 0.2978, "step": 930 }, { - "epoch": 13.0, - "eval_loss": 0.531330406665802, - "eval_runtime": 129.1703, - "eval_samples_per_second": 4.119, - "eval_steps_per_second": 0.519, - "eval_wer": 0.21405155235585266, - "step": 936 - }, - { - "epoch": 13.06, - "learning_rate": 2.3365671641791046e-05, - "loss": 0.3192, + "epoch": 3.26, + "learning_rate": 3.938233215547703e-06, + "loss": 0.2859, "step": 940 }, { - "epoch": 13.19, - "learning_rate": 2.3328358208955225e-05, - "loss": 0.2997, + "epoch": 3.3, + "learning_rate": 3.936819787985866e-06, + "loss": 0.3001, "step": 950 }, { - "epoch": 13.33, - "learning_rate": 2.32910447761194e-05, - "loss": 0.3163, + "epoch": 3.33, + "learning_rate": 3.935406360424028e-06, + "loss": 0.3167, "step": 960 }, { - "epoch": 13.47, - "learning_rate": 2.3253731343283584e-05, - "loss": 0.3046, + "epoch": 3.37, + "learning_rate": 3.933992932862191e-06, + "loss": 0.307, "step": 970 }, { - "epoch": 13.61, - "learning_rate": 2.3216417910447763e-05, - "loss": 0.2924, + "epoch": 3.4, + "learning_rate": 3.932579505300353e-06, + "loss": 0.3129, "step": 980 }, { - "epoch": 13.75, - "learning_rate": 2.317910447761194e-05, - "loss": 0.3161, + "epoch": 3.44, + "learning_rate": 3.9311660777385156e-06, + "loss": 0.2694, "step": 990 }, { - "epoch": 13.89, - "learning_rate": 2.314179104477612e-05, - "loss": 0.3043, + "epoch": 3.47, + "learning_rate": 3.929752650176678e-06, + "loss": 0.3088, "step": 1000 }, { - "epoch": 14.0, - "eval_loss": 0.5343348979949951, - "eval_runtime": 129.5843, - "eval_samples_per_second": 4.105, - "eval_steps_per_second": 0.517, - "eval_wer": 0.21861541428295944, - "step": 1008 - }, - { - "epoch": 14.03, - "learning_rate": 2.31044776119403e-05, - "loss": 0.3099, + "epoch": 3.51, + "learning_rate": 3.928339222614841e-06, + "loss": 0.2849, "step": 1010 }, { - "epoch": 14.17, - "learning_rate": 2.306716417910448e-05, - "loss": 0.2953, + "epoch": 3.54, + "learning_rate": 3.926925795053003e-06, + "loss": 0.3203, "step": 1020 }, { - "epoch": 14.3, - "learning_rate": 2.302985074626866e-05, - "loss": 0.3134, + "epoch": 3.57, + "learning_rate": 3.925512367491166e-06, + "loss": 0.3022, "step": 1030 }, { - "epoch": 14.44, - "learning_rate": 2.2992537313432838e-05, - "loss": 0.2917, + "epoch": 3.61, + "learning_rate": 3.924098939929328e-06, + "loss": 0.2711, "step": 1040 }, { - "epoch": 14.58, - "learning_rate": 2.2955223880597017e-05, - "loss": 0.3108, + "epoch": 3.64, + "learning_rate": 3.922685512367491e-06, + "loss": 0.2765, "step": 1050 }, { - "epoch": 14.72, - "learning_rate": 2.2917910447761196e-05, - "loss": 0.3085, + "epoch": 3.68, + "learning_rate": 3.921272084805654e-06, + "loss": 0.2897, "step": 1060 }, { - "epoch": 14.86, - "learning_rate": 2.2880597014925372e-05, - "loss": 0.2921, + "epoch": 3.71, + "learning_rate": 3.9198586572438165e-06, + "loss": 0.2561, "step": 1070 }, { - "epoch": 15.0, - "learning_rate": 2.2843283582089555e-05, - "loss": 0.3147, - "step": 1080 - }, - { - "epoch": 15.0, - "eval_loss": 0.506893515586853, - "eval_runtime": 129.0401, - "eval_samples_per_second": 4.123, - "eval_steps_per_second": 0.519, - "eval_wer": 0.21713698013755867, + "epoch": 3.75, + "learning_rate": 3.9184452296819785e-06, + "loss": 0.2596, "step": 1080 }, { - "epoch": 15.14, - "learning_rate": 2.2805970149253734e-05, - "loss": 0.307, + "epoch": 3.78, + "learning_rate": 3.917031802120141e-06, + "loss": 0.2759, "step": 1090 }, { - "epoch": 15.28, - "learning_rate": 2.276865671641791e-05, - "loss": 0.3152, + "epoch": 3.82, + "learning_rate": 3.915618374558303e-06, + "loss": 0.3017, "step": 1100 }, { - "epoch": 15.42, - "learning_rate": 2.2731343283582092e-05, - "loss": 0.3002, + "epoch": 3.85, + "learning_rate": 3.914204946996466e-06, + "loss": 0.2668, "step": 1110 }, { - "epoch": 15.55, - "learning_rate": 2.269402985074627e-05, - "loss": 0.2992, + "epoch": 3.89, + "learning_rate": 3.912791519434629e-06, + "loss": 0.284, "step": 1120 }, { - "epoch": 15.69, - "learning_rate": 2.2656716417910447e-05, - "loss": 0.2897, + "epoch": 3.92, + "learning_rate": 3.911378091872792e-06, + "loss": 0.2808, "step": 1130 }, { - "epoch": 15.83, - "learning_rate": 2.261940298507463e-05, - "loss": 0.3069, + "epoch": 3.96, + "learning_rate": 3.909964664310954e-06, + "loss": 0.2801, "step": 1140 }, { - "epoch": 15.97, - "learning_rate": 2.258208955223881e-05, - "loss": 0.3049, + "epoch": 3.99, + "learning_rate": 3.908551236749117e-06, + "loss": 0.2863, "step": 1150 }, { - "epoch": 16.0, - "eval_loss": 0.5032855272293091, - "eval_runtime": 129.2941, - "eval_samples_per_second": 4.115, - "eval_steps_per_second": 0.518, - "eval_wer": 0.20736645882882304, + "epoch": 4.0, + "eval_loss": 0.5215898752212524, + "eval_runtime": 130.8056, + "eval_samples_per_second": 4.067, + "eval_steps_per_second": 1.017, + "eval_wer": 0.20203123995628977, "step": 1152 }, { - "epoch": 16.11, - "learning_rate": 2.2544776119402984e-05, - "loss": 0.3014, + "epoch": 4.03, + "learning_rate": 3.907137809187279e-06, + "loss": 0.2845, "step": 1160 }, { - "epoch": 16.25, - "learning_rate": 2.2507462686567167e-05, - "loss": 0.3078, + "epoch": 4.06, + "learning_rate": 3.9057243816254415e-06, + "loss": 0.2787, "step": 1170 }, { - "epoch": 16.39, - "learning_rate": 2.2470149253731346e-05, - "loss": 0.2942, + "epoch": 4.1, + "learning_rate": 3.904310954063604e-06, + "loss": 0.2562, "step": 1180 }, { - "epoch": 16.53, - "learning_rate": 2.2432835820895522e-05, - "loss": 0.3168, + "epoch": 4.13, + "learning_rate": 3.902897526501767e-06, + "loss": 0.2833, "step": 1190 }, { - "epoch": 16.66, - "learning_rate": 2.2395522388059704e-05, - "loss": 0.3124, + "epoch": 4.17, + "learning_rate": 3.901484098939929e-06, + "loss": 0.2655, "step": 1200 }, { - "epoch": 16.8, - "learning_rate": 2.235820895522388e-05, - "loss": 0.2951, + "epoch": 4.2, + "learning_rate": 3.900070671378092e-06, + "loss": 0.2865, "step": 1210 }, { - "epoch": 16.94, - "learning_rate": 2.232089552238806e-05, - "loss": 0.298, + "epoch": 4.24, + "learning_rate": 3.898657243816254e-06, + "loss": 0.2702, "step": 1220 }, { - "epoch": 17.0, - "eval_loss": 0.5108718276023865, - "eval_runtime": 129.096, - "eval_samples_per_second": 4.121, - "eval_steps_per_second": 0.519, - "eval_wer": 0.20498810824709135, - "step": 1224 - }, - { - "epoch": 17.08, - "learning_rate": 2.2283582089552242e-05, - "loss": 0.3255, + "epoch": 4.27, + "learning_rate": 3.897243816254417e-06, + "loss": 0.2733, "step": 1230 }, { - "epoch": 17.22, - "learning_rate": 2.2246268656716418e-05, - "loss": 0.2867, + "epoch": 4.3, + "learning_rate": 3.89583038869258e-06, + "loss": 0.3136, "step": 1240 }, { - "epoch": 17.36, - "learning_rate": 2.2208955223880597e-05, - "loss": 0.2983, + "epoch": 4.34, + "learning_rate": 3.8944169611307424e-06, + "loss": 0.2846, "step": 1250 }, { - "epoch": 17.5, - "learning_rate": 2.217164179104478e-05, - "loss": 0.3105, + "epoch": 4.37, + "learning_rate": 3.8930035335689044e-06, + "loss": 0.2756, "step": 1260 }, { - "epoch": 17.64, - "learning_rate": 2.2134328358208955e-05, - "loss": 0.2818, + "epoch": 4.41, + "learning_rate": 3.891590106007066e-06, + "loss": 0.2934, "step": 1270 }, { - "epoch": 17.78, - "learning_rate": 2.2097014925373134e-05, - "loss": 0.3107, + "epoch": 4.44, + "learning_rate": 3.890176678445229e-06, + "loss": 0.2851, "step": 1280 }, { - "epoch": 17.91, - "learning_rate": 2.2059701492537317e-05, - "loss": 0.2948, + "epoch": 4.48, + "learning_rate": 3.888763250883392e-06, + "loss": 0.2979, "step": 1290 }, { - "epoch": 18.0, - "eval_loss": 0.5252682566642761, - "eval_runtime": 129.1692, - "eval_samples_per_second": 4.119, - "eval_steps_per_second": 0.519, - "eval_wer": 0.20993764864691136, - "step": 1296 - }, - { - "epoch": 18.06, - "learning_rate": 2.2022388059701493e-05, - "loss": 0.316, + "epoch": 4.51, + "learning_rate": 3.887349823321555e-06, + "loss": 0.2944, "step": 1300 }, { - "epoch": 18.19, - "learning_rate": 2.1985074626865672e-05, - "loss": 0.3066, + "epoch": 4.55, + "learning_rate": 3.885936395759717e-06, + "loss": 0.2839, "step": 1310 }, { - "epoch": 18.33, - "learning_rate": 2.194776119402985e-05, - "loss": 0.3031, + "epoch": 4.58, + "learning_rate": 3.88452296819788e-06, + "loss": 0.287, "step": 1320 }, { - "epoch": 18.47, - "learning_rate": 2.191044776119403e-05, - "loss": 0.3037, + "epoch": 4.62, + "learning_rate": 3.883109540636042e-06, + "loss": 0.2757, "step": 1330 }, { - "epoch": 18.61, - "learning_rate": 2.187313432835821e-05, - "loss": 0.2986, + "epoch": 4.65, + "learning_rate": 3.8816961130742046e-06, + "loss": 0.3039, "step": 1340 }, { - "epoch": 18.75, - "learning_rate": 2.183582089552239e-05, - "loss": 0.2955, + "epoch": 4.69, + "learning_rate": 3.880282685512367e-06, + "loss": 0.2852, "step": 1350 }, { - "epoch": 18.89, - "learning_rate": 2.1798507462686568e-05, - "loss": 0.2986, + "epoch": 4.72, + "learning_rate": 3.87886925795053e-06, + "loss": 0.2655, "step": 1360 }, { - "epoch": 19.0, - "eval_loss": 0.4976494014263153, - "eval_runtime": 129.378, - "eval_samples_per_second": 4.112, - "eval_steps_per_second": 0.518, - "eval_wer": 0.20209551970174197, - "step": 1368 - }, - { - "epoch": 19.03, - "learning_rate": 2.1761194029850747e-05, - "loss": 0.3021, + "epoch": 4.75, + "learning_rate": 3.877455830388692e-06, + "loss": 0.2777, "step": 1370 }, { - "epoch": 19.17, - "learning_rate": 2.1723880597014926e-05, - "loss": 0.2887, + "epoch": 4.79, + "learning_rate": 3.876042402826855e-06, + "loss": 0.2714, "step": 1380 }, { - "epoch": 19.3, - "learning_rate": 2.1686567164179105e-05, - "loss": 0.3059, + "epoch": 4.82, + "learning_rate": 3.874628975265017e-06, + "loss": 0.2803, "step": 1390 }, { - "epoch": 19.44, - "learning_rate": 2.1649253731343284e-05, - "loss": 0.2945, + "epoch": 4.86, + "learning_rate": 3.87321554770318e-06, + "loss": 0.3032, "step": 1400 }, { - "epoch": 19.58, - "learning_rate": 2.1611940298507463e-05, - "loss": 0.3006, + "epoch": 4.89, + "learning_rate": 3.871802120141343e-06, + "loss": 0.2808, "step": 1410 }, { - "epoch": 19.72, - "learning_rate": 2.1574626865671643e-05, - "loss": 0.3033, + "epoch": 4.93, + "learning_rate": 3.8703886925795055e-06, + "loss": 0.2795, "step": 1420 }, { - "epoch": 19.86, - "learning_rate": 2.153731343283582e-05, - "loss": 0.3002, + "epoch": 4.96, + "learning_rate": 3.8689752650176675e-06, + "loss": 0.2664, "step": 1430 }, { - "epoch": 20.0, - "learning_rate": 2.15e-05, - "loss": 0.2958, + "epoch": 5.0, + "learning_rate": 3.86756183745583e-06, + "loss": 0.3036, "step": 1440 }, { - "epoch": 20.0, - "eval_loss": 0.5233781933784485, - "eval_runtime": 129.422, - "eval_samples_per_second": 4.111, - "eval_steps_per_second": 0.518, - "eval_wer": 0.20935913093784148, + "epoch": 5.0, + "eval_loss": 0.49630099534988403, + "eval_runtime": 131.2377, + "eval_samples_per_second": 4.054, + "eval_steps_per_second": 1.013, + "eval_wer": 0.20080992479269782, "step": 1440 }, { - "epoch": 20.14, - "learning_rate": 2.146268656716418e-05, - "loss": 0.2982, + "epoch": 5.03, + "learning_rate": 3.866148409893992e-06, + "loss": 0.2955, "step": 1450 }, { - "epoch": 20.28, - "learning_rate": 2.142537313432836e-05, - "loss": 0.2861, + "epoch": 5.07, + "learning_rate": 3.864734982332155e-06, + "loss": 0.2806, "step": 1460 }, { - "epoch": 20.42, - "learning_rate": 2.1388059701492538e-05, - "loss": 0.293, + "epoch": 5.1, + "learning_rate": 3.863321554770318e-06, + "loss": 0.2625, "step": 1470 }, { - "epoch": 20.55, - "learning_rate": 2.1350746268656717e-05, - "loss": 0.304, + "epoch": 5.14, + "learning_rate": 3.861908127208481e-06, + "loss": 0.2775, "step": 1480 }, { - "epoch": 20.69, - "learning_rate": 2.1313432835820897e-05, - "loss": 0.2926, + "epoch": 5.17, + "learning_rate": 3.860494699646643e-06, + "loss": 0.2916, "step": 1490 }, { - "epoch": 20.83, - "learning_rate": 2.1276119402985076e-05, - "loss": 0.3092, + "epoch": 5.21, + "learning_rate": 3.859081272084806e-06, + "loss": 0.2783, "step": 1500 }, { - "epoch": 20.97, - "learning_rate": 2.1238805970149255e-05, - "loss": 0.2931, + "epoch": 5.24, + "learning_rate": 3.857667844522968e-06, + "loss": 0.2728, "step": 1510 }, { - "epoch": 21.0, - "eval_loss": 0.47944945096969604, - "eval_runtime": 130.2981, - "eval_samples_per_second": 4.083, - "eval_steps_per_second": 0.514, - "eval_wer": 0.20595230442887447, - "step": 1512 - }, - { - "epoch": 21.11, - "learning_rate": 2.1201492537313434e-05, - "loss": 0.2956, + "epoch": 5.28, + "learning_rate": 3.8562544169611305e-06, + "loss": 0.2706, "step": 1520 }, { - "epoch": 21.25, - "learning_rate": 2.1164179104477613e-05, - "loss": 0.3007, + "epoch": 5.31, + "learning_rate": 3.854840989399293e-06, + "loss": 0.2857, "step": 1530 }, { - "epoch": 21.39, - "learning_rate": 2.1126865671641792e-05, - "loss": 0.3045, + "epoch": 5.35, + "learning_rate": 3.853427561837456e-06, + "loss": 0.2956, "step": 1540 }, { - "epoch": 21.53, - "learning_rate": 2.108955223880597e-05, - "loss": 0.3002, + "epoch": 5.38, + "learning_rate": 3.852014134275618e-06, + "loss": 0.2629, "step": 1550 }, { - "epoch": 21.66, - "learning_rate": 2.105223880597015e-05, - "loss": 0.2848, + "epoch": 5.42, + "learning_rate": 3.850600706713781e-06, + "loss": 0.2656, "step": 1560 }, { - "epoch": 21.8, - "learning_rate": 2.1014925373134326e-05, - "loss": 0.286, + "epoch": 5.45, + "learning_rate": 3.849187279151943e-06, + "loss": 0.2842, "step": 1570 }, { - "epoch": 21.94, - "learning_rate": 2.097761194029851e-05, - "loss": 0.305, + "epoch": 5.48, + "learning_rate": 3.847773851590106e-06, + "loss": 0.3061, "step": 1580 }, { - "epoch": 22.0, - "eval_loss": 0.4916737377643585, - "eval_runtime": 129.0137, - "eval_samples_per_second": 4.124, - "eval_steps_per_second": 0.519, - "eval_wer": 0.20492382850163912, - "step": 1584 - }, - { - "epoch": 22.08, - "learning_rate": 2.0940298507462688e-05, - "loss": 0.3092, + "epoch": 5.52, + "learning_rate": 3.846360424028269e-06, + "loss": 0.2755, "step": 1590 }, { - "epoch": 22.22, - "learning_rate": 2.0902985074626867e-05, - "loss": 0.2979, + "epoch": 5.55, + "learning_rate": 3.844946996466431e-06, + "loss": 0.2695, "step": 1600 }, { - "epoch": 22.36, - "learning_rate": 2.0865671641791047e-05, - "loss": 0.2921, + "epoch": 5.59, + "learning_rate": 3.843533568904593e-06, + "loss": 0.2636, "step": 1610 }, { - "epoch": 22.5, - "learning_rate": 2.0828358208955226e-05, - "loss": 0.3052, + "epoch": 5.62, + "learning_rate": 3.842120141342756e-06, + "loss": 0.2822, "step": 1620 }, { - "epoch": 22.64, - "learning_rate": 2.0791044776119405e-05, - "loss": 0.2977, + "epoch": 5.66, + "learning_rate": 3.840706713780918e-06, + "loss": 0.2815, "step": 1630 }, { - "epoch": 22.78, - "learning_rate": 2.0753731343283584e-05, - "loss": 0.2938, + "epoch": 5.69, + "learning_rate": 3.839293286219081e-06, + "loss": 0.3095, "step": 1640 }, { - "epoch": 22.91, - "learning_rate": 2.0716417910447763e-05, - "loss": 0.2847, + "epoch": 5.73, + "learning_rate": 3.837879858657244e-06, + "loss": 0.2825, "step": 1650 }, { - "epoch": 23.0, - "eval_loss": 0.5089883804321289, - "eval_runtime": 129.655, - "eval_samples_per_second": 4.103, - "eval_steps_per_second": 0.517, - "eval_wer": 0.21000192839236356, - "step": 1656 - }, - { - "epoch": 23.06, - "learning_rate": 2.0679104477611942e-05, - "loss": 0.2993, + "epoch": 5.76, + "learning_rate": 3.836466431095406e-06, + "loss": 0.2883, "step": 1660 }, { - "epoch": 23.19, - "learning_rate": 2.064179104477612e-05, - "loss": 0.3081, + "epoch": 5.8, + "learning_rate": 3.835053003533569e-06, + "loss": 0.2781, "step": 1670 }, { - "epoch": 23.33, - "learning_rate": 2.0604477611940297e-05, - "loss": 0.2998, + "epoch": 5.83, + "learning_rate": 3.8336395759717316e-06, + "loss": 0.3046, "step": 1680 }, { - "epoch": 23.47, - "learning_rate": 2.056716417910448e-05, - "loss": 0.3125, + "epoch": 5.87, + "learning_rate": 3.8322261484098935e-06, + "loss": 0.2752, "step": 1690 }, { - "epoch": 23.61, - "learning_rate": 2.052985074626866e-05, - "loss": 0.3135, + "epoch": 5.9, + "learning_rate": 3.830812720848056e-06, + "loss": 0.2571, "step": 1700 }, { - "epoch": 23.75, - "learning_rate": 2.0492537313432835e-05, - "loss": 0.3039, + "epoch": 5.94, + "learning_rate": 3.829399293286218e-06, + "loss": 0.2836, "step": 1710 }, { - "epoch": 23.89, - "learning_rate": 2.0455223880597017e-05, - "loss": 0.2869, + "epoch": 5.97, + "learning_rate": 3.827985865724381e-06, + "loss": 0.3141, "step": 1720 }, { - "epoch": 24.0, - "eval_loss": 0.5296673774719238, - "eval_runtime": 132.3841, - "eval_samples_per_second": 4.019, - "eval_steps_per_second": 0.506, - "eval_wer": 0.2101947676287202, + "epoch": 6.0, + "eval_loss": 0.5004593729972839, + "eval_runtime": 130.6889, + "eval_samples_per_second": 4.071, + "eval_steps_per_second": 1.018, + "eval_wer": 0.20203123995628977, "step": 1728 }, { - "epoch": 24.03, - "learning_rate": 2.0417910447761196e-05, - "loss": 0.2958, + "epoch": 6.01, + "learning_rate": 3.826572438162544e-06, + "loss": 0.299, "step": 1730 }, { - "epoch": 24.17, - "learning_rate": 2.0380597014925372e-05, - "loss": 0.2985, + "epoch": 6.04, + "learning_rate": 3.825159010600707e-06, + "loss": 0.3013, "step": 1740 }, { - "epoch": 24.3, - "learning_rate": 2.0343283582089555e-05, - "loss": 0.2914, + "epoch": 6.08, + "learning_rate": 3.823745583038869e-06, + "loss": 0.2818, "step": 1750 }, { - "epoch": 24.44, - "learning_rate": 2.0305970149253734e-05, - "loss": 0.2975, + "epoch": 6.11, + "learning_rate": 3.822332155477032e-06, + "loss": 0.2743, "step": 1760 }, { - "epoch": 24.58, - "learning_rate": 2.026865671641791e-05, - "loss": 0.3037, + "epoch": 6.15, + "learning_rate": 3.820918727915194e-06, + "loss": 0.2774, "step": 1770 }, { - "epoch": 24.72, - "learning_rate": 2.0231343283582092e-05, - "loss": 0.294, + "epoch": 6.18, + "learning_rate": 3.8195053003533565e-06, + "loss": 0.2833, "step": 1780 }, { - "epoch": 24.86, - "learning_rate": 2.0194029850746268e-05, - "loss": 0.3024, + "epoch": 6.21, + "learning_rate": 3.818091872791519e-06, + "loss": 0.2895, "step": 1790 }, { - "epoch": 25.0, - "learning_rate": 2.0156716417910447e-05, - "loss": 0.2997, + "epoch": 6.25, + "learning_rate": 3.816678445229682e-06, + "loss": 0.2511, "step": 1800 }, { - "epoch": 25.0, - "eval_loss": 0.5185533165931702, - "eval_runtime": 132.6367, - "eval_samples_per_second": 4.011, - "eval_steps_per_second": 0.505, - "eval_wer": 0.20878061322877162, - "step": 1800 - }, - { - "epoch": 25.14, - "learning_rate": 2.011940298507463e-05, - "loss": 0.3077, + "epoch": 6.28, + "learning_rate": 3.815265017667844e-06, + "loss": 0.2567, "step": 1810 }, { - "epoch": 25.28, - "learning_rate": 2.0082089552238805e-05, - "loss": 0.2926, + "epoch": 6.32, + "learning_rate": 3.813851590106007e-06, + "loss": 0.3127, "step": 1820 }, { - "epoch": 25.42, - "learning_rate": 2.0044776119402985e-05, - "loss": 0.2924, + "epoch": 6.35, + "learning_rate": 3.8124381625441694e-06, + "loss": 0.3125, "step": 1830 }, { - "epoch": 25.55, - "learning_rate": 2.0007462686567167e-05, - "loss": 0.2969, + "epoch": 6.39, + "learning_rate": 3.811024734982332e-06, + "loss": 0.2699, "step": 1840 }, { - "epoch": 25.69, - "learning_rate": 1.9970149253731343e-05, - "loss": 0.299, + "epoch": 6.42, + "learning_rate": 3.8096113074204946e-06, + "loss": 0.2896, "step": 1850 }, { - "epoch": 25.83, - "learning_rate": 1.9932835820895522e-05, - "loss": 0.2963, + "epoch": 6.46, + "learning_rate": 3.808197879858657e-06, + "loss": 0.3067, "step": 1860 }, { - "epoch": 25.97, - "learning_rate": 1.9895522388059705e-05, - "loss": 0.2996, + "epoch": 6.49, + "learning_rate": 3.80678445229682e-06, + "loss": 0.2647, "step": 1870 }, { - "epoch": 26.0, - "eval_loss": 0.5218982100486755, - "eval_runtime": 131.3811, - "eval_samples_per_second": 4.049, - "eval_steps_per_second": 0.51, - "eval_wer": 0.20980908915600693, - "step": 1872 - }, - { - "epoch": 26.11, - "learning_rate": 1.985820895522388e-05, - "loss": 0.2972, + "epoch": 6.53, + "learning_rate": 3.805371024734982e-06, + "loss": 0.2916, "step": 1880 }, { - "epoch": 26.25, - "learning_rate": 1.982089552238806e-05, - "loss": 0.2993, + "epoch": 6.56, + "learning_rate": 3.8039575971731447e-06, + "loss": 0.2825, "step": 1890 }, { - "epoch": 26.39, - "learning_rate": 1.9783582089552242e-05, - "loss": 0.2877, + "epoch": 6.6, + "learning_rate": 3.802544169611307e-06, + "loss": 0.283, "step": 1900 }, { - "epoch": 26.53, - "learning_rate": 1.9746268656716418e-05, - "loss": 0.2864, + "epoch": 6.63, + "learning_rate": 3.80113074204947e-06, + "loss": 0.2913, "step": 1910 }, { - "epoch": 26.66, - "learning_rate": 1.9708955223880597e-05, - "loss": 0.2869, + "epoch": 6.66, + "learning_rate": 3.7997173144876324e-06, + "loss": 0.2937, "step": 1920 }, { - "epoch": 26.8, - "learning_rate": 1.9671641791044776e-05, - "loss": 0.3113, + "epoch": 6.7, + "learning_rate": 3.798303886925795e-06, + "loss": 0.2815, "step": 1930 }, { - "epoch": 26.94, - "learning_rate": 1.9634328358208955e-05, - "loss": 0.298, + "epoch": 6.73, + "learning_rate": 3.796890459363957e-06, + "loss": 0.261, "step": 1940 }, { - "epoch": 27.0, - "eval_loss": 0.506175696849823, - "eval_runtime": 132.0981, - "eval_samples_per_second": 4.027, - "eval_steps_per_second": 0.507, - "eval_wer": 0.21077328533779005, - "step": 1944 - }, - { - "epoch": 27.08, - "learning_rate": 1.9597014925373135e-05, - "loss": 0.3057, + "epoch": 6.77, + "learning_rate": 3.79547703180212e-06, + "loss": 0.2883, "step": 1950 }, { - "epoch": 27.22, - "learning_rate": 1.9559701492537314e-05, - "loss": 0.3026, + "epoch": 6.8, + "learning_rate": 3.7940636042402824e-06, + "loss": 0.2678, "step": 1960 }, { - "epoch": 27.36, - "learning_rate": 1.9522388059701493e-05, - "loss": 0.298, + "epoch": 6.84, + "learning_rate": 3.7926501766784452e-06, + "loss": 0.2959, "step": 1970 }, { - "epoch": 27.5, - "learning_rate": 1.9485074626865672e-05, - "loss": 0.3077, + "epoch": 6.87, + "learning_rate": 3.7912367491166077e-06, + "loss": 0.2933, "step": 1980 }, { - "epoch": 27.64, - "learning_rate": 1.944776119402985e-05, - "loss": 0.3073, + "epoch": 6.91, + "learning_rate": 3.7898233215547705e-06, + "loss": 0.2634, "step": 1990 }, { - "epoch": 27.78, - "learning_rate": 1.941044776119403e-05, - "loss": 0.3163, + "epoch": 6.94, + "learning_rate": 3.7884098939929325e-06, + "loss": 0.2767, "step": 2000 }, { - "epoch": 27.91, - "learning_rate": 1.9373134328358213e-05, - "loss": 0.3057, + "epoch": 6.98, + "learning_rate": 3.7869964664310953e-06, + "loss": 0.2898, "step": 2010 }, { - "epoch": 28.0, - "eval_loss": 0.5299437642097473, - "eval_runtime": 132.6119, - "eval_samples_per_second": 4.012, - "eval_steps_per_second": 0.505, - "eval_wer": 0.21366587388313943, + "epoch": 7.0, + "eval_loss": 0.4961535334587097, + "eval_runtime": 131.6974, + "eval_samples_per_second": 4.04, + "eval_steps_per_second": 1.01, + "eval_wer": 0.2029311563926207, "step": 2016 }, { - "epoch": 28.06, - "learning_rate": 1.933582089552239e-05, - "loss": 0.3058, + "epoch": 7.01, + "learning_rate": 3.7855830388692577e-06, + "loss": 0.295, "step": 2020 }, { - "epoch": 28.19, - "learning_rate": 1.9298507462686568e-05, - "loss": 0.2959, + "epoch": 7.05, + "learning_rate": 3.7841696113074206e-06, + "loss": 0.2862, "step": 2030 }, { - "epoch": 28.33, - "learning_rate": 1.9261194029850747e-05, - "loss": 0.3052, + "epoch": 7.08, + "learning_rate": 3.782756183745583e-06, + "loss": 0.2683, "step": 2040 }, { - "epoch": 28.47, - "learning_rate": 1.9223880597014926e-05, - "loss": 0.2961, + "epoch": 7.12, + "learning_rate": 3.7813427561837454e-06, + "loss": 0.2845, "step": 2050 }, { - "epoch": 28.61, - "learning_rate": 1.9186567164179105e-05, - "loss": 0.3006, + "epoch": 7.15, + "learning_rate": 3.7799293286219078e-06, + "loss": 0.2863, "step": 2060 }, { - "epoch": 28.75, - "learning_rate": 1.9149253731343284e-05, - "loss": 0.3096, + "epoch": 7.19, + "learning_rate": 3.7785159010600706e-06, + "loss": 0.2889, "step": 2070 }, { - "epoch": 28.89, - "learning_rate": 1.9111940298507464e-05, - "loss": 0.2937, + "epoch": 7.22, + "learning_rate": 3.777102473498233e-06, + "loss": 0.2837, "step": 2080 }, { - "epoch": 29.0, - "eval_loss": 0.5345147848129272, - "eval_runtime": 131.6737, - "eval_samples_per_second": 4.04, - "eval_steps_per_second": 0.509, - "eval_wer": 0.21540142701034903, - "step": 2088 - }, - { - "epoch": 29.03, - "learning_rate": 1.9074626865671643e-05, - "loss": 0.3, + "epoch": 7.26, + "learning_rate": 3.775689045936396e-06, + "loss": 0.2816, "step": 2090 }, { - "epoch": 29.17, - "learning_rate": 1.9037313432835822e-05, - "loss": 0.2895, + "epoch": 7.29, + "learning_rate": 3.7742756183745583e-06, + "loss": 0.2938, "step": 2100 }, { - "epoch": 29.3, - "learning_rate": 1.9e-05, - "loss": 0.2907, + "epoch": 7.33, + "learning_rate": 3.7728621908127207e-06, + "loss": 0.3051, "step": 2110 }, { - "epoch": 29.44, - "learning_rate": 1.896268656716418e-05, - "loss": 0.2975, + "epoch": 7.36, + "learning_rate": 3.771448763250883e-06, + "loss": 0.2662, "step": 2120 }, { - "epoch": 29.58, - "learning_rate": 1.892537313432836e-05, - "loss": 0.2945, + "epoch": 7.39, + "learning_rate": 3.770035335689046e-06, + "loss": 0.26, "step": 2130 }, { - "epoch": 29.72, - "learning_rate": 1.888805970149254e-05, - "loss": 0.3019, + "epoch": 7.43, + "learning_rate": 3.7686219081272083e-06, + "loss": 0.2823, "step": 2140 }, { - "epoch": 29.86, - "learning_rate": 1.8850746268656718e-05, - "loss": 0.2987, + "epoch": 7.46, + "learning_rate": 3.767208480565371e-06, + "loss": 0.2766, "step": 2150 }, { - "epoch": 30.0, - "learning_rate": 1.8813432835820897e-05, - "loss": 0.3064, - "step": 2160 - }, - { - "epoch": 30.0, - "eval_loss": 0.5374366044998169, - "eval_runtime": 131.625, - "eval_samples_per_second": 4.042, - "eval_steps_per_second": 0.509, - "eval_wer": 0.21160892202866877, + "epoch": 7.5, + "learning_rate": 3.7657950530035336e-06, + "loss": 0.275, "step": 2160 }, { - "epoch": 30.14, - "learning_rate": 1.8776119402985076e-05, - "loss": 0.2945, + "epoch": 7.53, + "learning_rate": 3.764381625441696e-06, + "loss": 0.2968, "step": 2170 }, { - "epoch": 30.28, - "learning_rate": 1.8738805970149255e-05, - "loss": 0.2925, + "epoch": 7.57, + "learning_rate": 3.7629681978798584e-06, + "loss": 0.2965, "step": 2180 }, { - "epoch": 30.42, - "learning_rate": 1.8701492537313434e-05, - "loss": 0.2875, + "epoch": 7.6, + "learning_rate": 3.7615547703180212e-06, + "loss": 0.2724, "step": 2190 }, { - "epoch": 30.55, - "learning_rate": 1.8664179104477613e-05, - "loss": 0.2936, + "epoch": 7.64, + "learning_rate": 3.7601413427561836e-06, + "loss": 0.2829, "step": 2200 }, { - "epoch": 30.69, - "learning_rate": 1.8626865671641793e-05, - "loss": 0.2937, + "epoch": 7.67, + "learning_rate": 3.7587279151943465e-06, + "loss": 0.2952, "step": 2210 }, { - "epoch": 30.83, - "learning_rate": 1.8589552238805972e-05, - "loss": 0.2952, + "epoch": 7.71, + "learning_rate": 3.7573144876325085e-06, + "loss": 0.2675, "step": 2220 }, { - "epoch": 30.97, - "learning_rate": 1.855223880597015e-05, - "loss": 0.2915, + "epoch": 7.74, + "learning_rate": 3.7559010600706713e-06, + "loss": 0.2608, "step": 2230 }, { - "epoch": 31.0, - "eval_loss": 0.5184913873672485, - "eval_runtime": 131.6654, - "eval_samples_per_second": 4.041, - "eval_steps_per_second": 0.509, - "eval_wer": 0.20736645882882304, - "step": 2232 - }, - { - "epoch": 31.11, - "learning_rate": 1.851492537313433e-05, - "loss": 0.3009, + "epoch": 7.78, + "learning_rate": 3.7544876325088337e-06, + "loss": 0.2701, "step": 2240 }, { - "epoch": 31.25, - "learning_rate": 1.847761194029851e-05, - "loss": 0.3002, + "epoch": 7.81, + "learning_rate": 3.7530742049469965e-06, + "loss": 0.2797, "step": 2250 }, { - "epoch": 31.39, - "learning_rate": 1.844029850746269e-05, - "loss": 0.2676, + "epoch": 7.85, + "learning_rate": 3.7518021201413426e-06, + "loss": 0.2733, "step": 2260 }, { - "epoch": 31.53, - "learning_rate": 1.8402985074626868e-05, - "loss": 0.2795, + "epoch": 7.88, + "learning_rate": 3.750388692579505e-06, + "loss": 0.3008, "step": 2270 }, { - "epoch": 31.66, - "learning_rate": 1.8365671641791047e-05, + "epoch": 7.91, + "learning_rate": 3.748975265017668e-06, "loss": 0.2855, "step": 2280 }, { - "epoch": 31.8, - "learning_rate": 1.8328358208955223e-05, - "loss": 0.2967, + "epoch": 7.95, + "learning_rate": 3.7475618374558306e-06, + "loss": 0.2587, "step": 2290 }, { - "epoch": 31.94, - "learning_rate": 1.8291044776119405e-05, - "loss": 0.2942, + "epoch": 7.98, + "learning_rate": 3.7461484098939926e-06, + "loss": 0.2922, "step": 2300 }, { - "epoch": 32.0, - "eval_loss": 0.5221661925315857, - "eval_runtime": 131.7358, - "eval_samples_per_second": 4.038, - "eval_steps_per_second": 0.509, - "eval_wer": 0.20935913093784148, + "epoch": 8.0, + "eval_loss": 0.507337212562561, + "eval_runtime": 130.1898, + "eval_samples_per_second": 4.086, + "eval_steps_per_second": 1.022, + "eval_wer": 0.2030597158835251, "step": 2304 }, { - "epoch": 32.08, - "learning_rate": 1.8253731343283584e-05, - "loss": 0.3027, + "epoch": 8.02, + "learning_rate": 3.744734982332155e-06, + "loss": 0.2721, "step": 2310 }, { - "epoch": 32.22, - "learning_rate": 1.821641791044776e-05, - "loss": 0.2919, + "epoch": 8.06, + "learning_rate": 3.743321554770318e-06, + "loss": 0.305, "step": 2320 }, { - "epoch": 32.36, - "learning_rate": 1.8179104477611943e-05, - "loss": 0.2963, + "epoch": 8.09, + "learning_rate": 3.7419081272084803e-06, + "loss": 0.2736, "step": 2330 }, { - "epoch": 32.5, - "learning_rate": 1.814179104477612e-05, - "loss": 0.2917, + "epoch": 8.12, + "learning_rate": 3.740494699646643e-06, + "loss": 0.2865, "step": 2340 }, { - "epoch": 32.64, - "learning_rate": 1.8104477611940297e-05, - "loss": 0.2753, + "epoch": 8.16, + "learning_rate": 3.739081272084805e-06, + "loss": 0.2774, "step": 2350 }, { - "epoch": 32.78, - "learning_rate": 1.806716417910448e-05, - "loss": 0.288, + "epoch": 8.19, + "learning_rate": 3.737667844522968e-06, + "loss": 0.2621, "step": 2360 }, { - "epoch": 32.91, - "learning_rate": 1.802985074626866e-05, - "loss": 0.2777, + "epoch": 8.23, + "learning_rate": 3.7362544169611303e-06, + "loss": 0.2849, "step": 2370 }, { - "epoch": 33.0, - "eval_loss": 0.5229014158248901, - "eval_runtime": 131.9614, - "eval_samples_per_second": 4.031, - "eval_steps_per_second": 0.508, - "eval_wer": 0.21077328533779005, - "step": 2376 - }, - { - "epoch": 33.06, - "learning_rate": 1.7992537313432835e-05, - "loss": 0.3004, + "epoch": 8.26, + "learning_rate": 3.734840989399293e-06, + "loss": 0.2744, "step": 2380 }, { - "epoch": 33.19, - "learning_rate": 1.7955223880597017e-05, - "loss": 0.2916, + "epoch": 8.3, + "learning_rate": 3.7334275618374556e-06, + "loss": 0.3042, "step": 2390 }, { - "epoch": 33.33, - "learning_rate": 1.7917910447761193e-05, - "loss": 0.2933, + "epoch": 8.33, + "learning_rate": 3.7320141342756184e-06, + "loss": 0.2861, "step": 2400 }, { - "epoch": 33.47, - "learning_rate": 1.7880597014925372e-05, - "loss": 0.296, + "epoch": 8.37, + "learning_rate": 3.7306007067137804e-06, + "loss": 0.2774, "step": 2410 }, { - "epoch": 33.61, - "learning_rate": 1.7843283582089555e-05, - "loss": 0.2959, + "epoch": 8.4, + "learning_rate": 3.7291872791519432e-06, + "loss": 0.2846, "step": 2420 }, { - "epoch": 33.75, - "learning_rate": 1.780597014925373e-05, - "loss": 0.2846, + "epoch": 8.44, + "learning_rate": 3.7277738515901056e-06, + "loss": 0.2448, "step": 2430 }, { - "epoch": 33.89, - "learning_rate": 1.776865671641791e-05, - "loss": 0.2821, + "epoch": 8.47, + "learning_rate": 3.7263604240282685e-06, + "loss": 0.2937, "step": 2440 }, { - "epoch": 34.0, - "eval_loss": 0.5242453813552856, - "eval_runtime": 132.7946, - "eval_samples_per_second": 4.006, - "eval_steps_per_second": 0.505, - "eval_wer": 0.2101947676287202, - "step": 2448 - }, - { - "epoch": 34.03, - "learning_rate": 1.7731343283582092e-05, - "loss": 0.2997, + "epoch": 8.51, + "learning_rate": 3.724946996466431e-06, + "loss": 0.2963, "step": 2450 }, { - "epoch": 34.17, - "learning_rate": 1.7694029850746268e-05, - "loss": 0.2872, + "epoch": 8.54, + "learning_rate": 3.7235335689045937e-06, + "loss": 0.2583, "step": 2460 }, { - "epoch": 34.3, - "learning_rate": 1.7656716417910447e-05, - "loss": 0.2826, + "epoch": 8.57, + "learning_rate": 3.7221201413427557e-06, + "loss": 0.2691, "step": 2470 }, { - "epoch": 34.44, - "learning_rate": 1.761940298507463e-05, - "loss": 0.2965, + "epoch": 8.61, + "learning_rate": 3.7207067137809185e-06, + "loss": 0.2798, "step": 2480 }, { - "epoch": 34.58, - "learning_rate": 1.7582089552238806e-05, - "loss": 0.2812, + "epoch": 8.64, + "learning_rate": 3.719293286219081e-06, + "loss": 0.2915, "step": 2490 }, { - "epoch": 34.72, - "learning_rate": 1.7548507462686566e-05, - "loss": 0.2893, + "epoch": 8.68, + "learning_rate": 3.7178798586572438e-06, + "loss": 0.2906, "step": 2500 }, { - "epoch": 34.86, - "learning_rate": 1.751119402985075e-05, - "loss": 0.2799, + "epoch": 8.71, + "learning_rate": 3.716466431095406e-06, + "loss": 0.2885, "step": 2510 }, { - "epoch": 35.0, - "learning_rate": 1.7473880597014928e-05, - "loss": 0.2859, - "step": 2520 - }, - { - "epoch": 35.0, - "eval_loss": 0.5292270183563232, - "eval_runtime": 131.3549, - "eval_samples_per_second": 4.05, - "eval_steps_per_second": 0.51, - "eval_wer": 0.2096162499196503, + "epoch": 8.75, + "learning_rate": 3.7150530035335686e-06, + "loss": 0.2899, "step": 2520 }, { - "epoch": 35.14, - "learning_rate": 1.7436567164179103e-05, - "loss": 0.2936, + "epoch": 8.78, + "learning_rate": 3.713639575971731e-06, + "loss": 0.2726, "step": 2530 }, { - "epoch": 35.28, - "learning_rate": 1.7399253731343286e-05, - "loss": 0.2941, + "epoch": 8.82, + "learning_rate": 3.712226148409894e-06, + "loss": 0.2824, "step": 2540 }, { - "epoch": 35.42, - "learning_rate": 1.7361940298507465e-05, - "loss": 0.2887, + "epoch": 8.85, + "learning_rate": 3.7108127208480563e-06, + "loss": 0.2846, "step": 2550 }, { - "epoch": 35.55, - "learning_rate": 1.732462686567164e-05, - "loss": 0.296, + "epoch": 8.89, + "learning_rate": 3.709399293286219e-06, + "loss": 0.2734, "step": 2560 }, { - "epoch": 35.69, - "learning_rate": 1.7287313432835823e-05, - "loss": 0.2905, + "epoch": 8.92, + "learning_rate": 3.7079858657243815e-06, + "loss": 0.2696, "step": 2570 }, { - "epoch": 35.83, - "learning_rate": 1.725e-05, - "loss": 0.2872, + "epoch": 8.96, + "learning_rate": 3.706572438162544e-06, + "loss": 0.2703, "step": 2580 }, { - "epoch": 35.97, - "learning_rate": 1.721268656716418e-05, - "loss": 0.283, + "epoch": 8.99, + "learning_rate": 3.7051590106007063e-06, + "loss": 0.266, "step": 2590 }, { - "epoch": 36.0, - "eval_loss": 0.5041770339012146, - "eval_runtime": 131.4728, - "eval_samples_per_second": 4.046, - "eval_steps_per_second": 0.51, - "eval_wer": 0.20665938162884875, + "epoch": 9.0, + "eval_loss": 0.5159009695053101, + "eval_runtime": 130.5433, + "eval_samples_per_second": 4.075, + "eval_steps_per_second": 1.019, + "eval_wer": 0.2023526386835508, "step": 2592 }, { - "epoch": 36.11, - "learning_rate": 1.717537313432836e-05, - "loss": 0.2914, + "epoch": 9.03, + "learning_rate": 3.703745583038869e-06, + "loss": 0.2807, "step": 2600 }, { - "epoch": 36.25, - "learning_rate": 1.7138059701492537e-05, - "loss": 0.2829, + "epoch": 9.06, + "learning_rate": 3.7023321554770316e-06, + "loss": 0.2772, "step": 2610 }, { - "epoch": 36.39, - "learning_rate": 1.7100746268656716e-05, - "loss": 0.2682, + "epoch": 9.1, + "learning_rate": 3.7009187279151944e-06, + "loss": 0.2813, "step": 2620 }, { - "epoch": 36.53, - "learning_rate": 1.70634328358209e-05, - "loss": 0.2989, + "epoch": 9.13, + "learning_rate": 3.6995053003533564e-06, + "loss": 0.2878, "step": 2630 }, { - "epoch": 36.66, - "learning_rate": 1.7026119402985074e-05, - "loss": 0.2873, + "epoch": 9.17, + "learning_rate": 3.6980918727915192e-06, + "loss": 0.2934, "step": 2640 }, { - "epoch": 36.8, - "learning_rate": 1.6992537313432834e-05, - "loss": 0.29, + "epoch": 9.2, + "learning_rate": 3.6966784452296816e-06, + "loss": 0.2755, "step": 2650 }, { - "epoch": 36.94, - "learning_rate": 1.6955223880597017e-05, - "loss": 0.2895, + "epoch": 9.24, + "learning_rate": 3.6952650176678445e-06, + "loss": 0.2921, "step": 2660 }, { - "epoch": 37.0, - "eval_loss": 0.5222975015640259, - "eval_runtime": 131.841, - "eval_samples_per_second": 4.035, - "eval_steps_per_second": 0.508, - "eval_wer": 0.2045381500289259, - "step": 2664 - }, - { - "epoch": 37.08, - "learning_rate": 1.6917910447761196e-05, - "loss": 0.2939, + "epoch": 9.27, + "learning_rate": 3.693851590106007e-06, + "loss": 0.2499, "step": 2670 }, { - "epoch": 37.22, - "learning_rate": 1.6880597014925372e-05, - "loss": 0.295, + "epoch": 9.3, + "learning_rate": 3.6924381625441697e-06, + "loss": 0.2904, "step": 2680 }, { - "epoch": 37.36, - "learning_rate": 1.6843283582089554e-05, - "loss": 0.2793, + "epoch": 9.34, + "learning_rate": 3.6910247349823317e-06, + "loss": 0.2853, "step": 2690 }, { - "epoch": 37.5, - "learning_rate": 1.6805970149253734e-05, - "loss": 0.2842, + "epoch": 9.37, + "learning_rate": 3.6896113074204945e-06, + "loss": 0.2855, "step": 2700 }, { - "epoch": 37.64, - "learning_rate": 1.676865671641791e-05, - "loss": 0.2678, + "epoch": 9.41, + "learning_rate": 3.688197879858657e-06, + "loss": 0.2839, "step": 2710 }, { - "epoch": 37.78, - "learning_rate": 1.6731343283582092e-05, - "loss": 0.2868, + "epoch": 9.44, + "learning_rate": 3.6867844522968198e-06, + "loss": 0.2615, "step": 2720 }, { - "epoch": 37.91, - "learning_rate": 1.669402985074627e-05, - "loss": 0.2822, + "epoch": 9.48, + "learning_rate": 3.685371024734982e-06, + "loss": 0.3092, "step": 2730 }, { - "epoch": 38.0, - "eval_loss": 0.5093514919281006, - "eval_runtime": 132.4112, - "eval_samples_per_second": 4.018, - "eval_steps_per_second": 0.506, - "eval_wer": 0.2071093398470142, - "step": 2736 - }, - { - "epoch": 38.06, - "learning_rate": 1.6656716417910447e-05, - "loss": 0.2914, + "epoch": 9.51, + "learning_rate": 3.683957597173145e-06, + "loss": 0.2576, "step": 2740 }, { - "epoch": 38.19, - "learning_rate": 1.661940298507463e-05, - "loss": 0.2828, + "epoch": 9.55, + "learning_rate": 3.682544169611307e-06, + "loss": 0.2947, "step": 2750 }, { - "epoch": 38.33, - "learning_rate": 1.658208955223881e-05, - "loss": 0.2637, + "epoch": 9.58, + "learning_rate": 3.68113074204947e-06, + "loss": 0.2769, "step": 2760 }, { - "epoch": 38.47, - "learning_rate": 1.6544776119402984e-05, - "loss": 0.288, + "epoch": 9.62, + "learning_rate": 3.6797173144876322e-06, + "loss": 0.2569, "step": 2770 }, { - "epoch": 38.61, - "learning_rate": 1.6507462686567167e-05, - "loss": 0.2814, + "epoch": 9.65, + "learning_rate": 3.678303886925795e-06, + "loss": 0.2908, "step": 2780 }, { - "epoch": 38.75, - "learning_rate": 1.6470149253731343e-05, - "loss": 0.2902, + "epoch": 9.69, + "learning_rate": 3.6768904593639575e-06, + "loss": 0.2975, "step": 2790 }, { - "epoch": 38.89, - "learning_rate": 1.6432835820895522e-05, - "loss": 0.2672, + "epoch": 9.72, + "learning_rate": 3.67547703180212e-06, + "loss": 0.26, "step": 2800 }, { - "epoch": 39.0, - "eval_loss": 0.5250556468963623, - "eval_runtime": 131.822, - "eval_samples_per_second": 4.036, - "eval_steps_per_second": 0.508, - "eval_wer": 0.20415247155621263, - "step": 2808 - }, - { - "epoch": 39.03, - "learning_rate": 1.6395522388059704e-05, - "loss": 0.2954, + "epoch": 9.75, + "learning_rate": 3.6740636042402823e-06, + "loss": 0.2551, "step": 2810 }, { - "epoch": 39.17, - "learning_rate": 1.635820895522388e-05, - "loss": 0.2854, + "epoch": 9.79, + "learning_rate": 3.672650176678445e-06, + "loss": 0.2701, "step": 2820 }, { - "epoch": 39.3, - "learning_rate": 1.632089552238806e-05, - "loss": 0.2874, + "epoch": 9.82, + "learning_rate": 3.6712367491166075e-06, + "loss": 0.2922, "step": 2830 }, { - "epoch": 39.44, - "learning_rate": 1.6283582089552242e-05, - "loss": 0.2671, + "epoch": 9.86, + "learning_rate": 3.6698233215547704e-06, + "loss": 0.2951, "step": 2840 }, { - "epoch": 39.58, - "learning_rate": 1.6246268656716418e-05, - "loss": 0.2761, + "epoch": 9.89, + "learning_rate": 3.6684098939929328e-06, + "loss": 0.2508, "step": 2850 }, { - "epoch": 39.72, - "learning_rate": 1.6208955223880597e-05, - "loss": 0.2904, + "epoch": 9.93, + "learning_rate": 3.666996466431095e-06, + "loss": 0.2844, "step": 2860 }, { - "epoch": 39.86, - "learning_rate": 1.617164179104478e-05, - "loss": 0.2783, + "epoch": 9.96, + "learning_rate": 3.6655830388692576e-06, + "loss": 0.2914, "step": 2870 }, { - "epoch": 40.0, - "learning_rate": 1.6134328358208955e-05, - "loss": 0.2925, + "epoch": 10.0, + "learning_rate": 3.6641696113074204e-06, + "loss": 0.2817, "step": 2880 }, { - "epoch": 40.0, - "eval_loss": 0.5071823000907898, - "eval_runtime": 132.8431, - "eval_samples_per_second": 4.005, - "eval_steps_per_second": 0.504, - "eval_wer": 0.20511666773799575, + "epoch": 10.0, + "eval_loss": 0.523847222328186, + "eval_runtime": 131.2872, + "eval_samples_per_second": 4.052, + "eval_steps_per_second": 1.013, + "eval_wer": 0.20106704377450665, "step": 2880 }, { - "epoch": 40.14, - "learning_rate": 1.6097014925373134e-05, - "loss": 0.2936, + "epoch": 10.03, + "learning_rate": 3.662756183745583e-06, + "loss": 0.2805, "step": 2890 }, { - "epoch": 40.28, - "learning_rate": 1.6059701492537313e-05, - "loss": 0.2848, + "epoch": 10.07, + "learning_rate": 3.6613427561837457e-06, + "loss": 0.2565, "step": 2900 }, { - "epoch": 40.42, - "learning_rate": 1.6022388059701492e-05, - "loss": 0.2866, + "epoch": 10.1, + "learning_rate": 3.659929328621908e-06, + "loss": 0.2575, "step": 2910 }, { - "epoch": 40.55, - "learning_rate": 1.598507462686567e-05, - "loss": 0.289, + "epoch": 10.14, + "learning_rate": 3.6585159010600705e-06, + "loss": 0.2875, "step": 2920 }, { - "epoch": 40.69, - "learning_rate": 1.594776119402985e-05, - "loss": 0.2817, + "epoch": 10.17, + "learning_rate": 3.657102473498233e-06, + "loss": 0.2961, "step": 2930 }, { - "epoch": 40.83, - "learning_rate": 1.591044776119403e-05, - "loss": 0.293, + "epoch": 10.21, + "learning_rate": 3.6556890459363957e-06, + "loss": 0.2588, "step": 2940 }, { - "epoch": 40.97, - "learning_rate": 1.587313432835821e-05, - "loss": 0.295, + "epoch": 10.24, + "learning_rate": 3.654275618374558e-06, + "loss": 0.2574, "step": 2950 }, { - "epoch": 41.0, - "eval_loss": 0.4903075695037842, - "eval_runtime": 131.5707, - "eval_samples_per_second": 4.043, - "eval_steps_per_second": 0.509, - "eval_wer": 0.2071093398470142, - "step": 2952 - }, - { - "epoch": 41.11, - "learning_rate": 1.5835820895522388e-05, - "loss": 0.2957, + "epoch": 10.28, + "learning_rate": 3.652862190812721e-06, + "loss": 0.269, "step": 2960 }, { - "epoch": 41.25, - "learning_rate": 1.5798507462686567e-05, - "loss": 0.294, + "epoch": 10.31, + "learning_rate": 3.651448763250883e-06, + "loss": 0.281, "step": 2970 }, { - "epoch": 41.39, - "learning_rate": 1.5761194029850747e-05, - "loss": 0.2779, + "epoch": 10.35, + "learning_rate": 3.650035335689046e-06, + "loss": 0.2859, "step": 2980 }, { - "epoch": 41.53, - "learning_rate": 1.5723880597014926e-05, - "loss": 0.2808, + "epoch": 10.38, + "learning_rate": 3.648621908127208e-06, + "loss": 0.2844, "step": 2990 }, { - "epoch": 41.66, - "learning_rate": 1.5686567164179105e-05, - "loss": 0.2924, + "epoch": 10.42, + "learning_rate": 3.647208480565371e-06, + "loss": 0.3113, "step": 3000 }, { - "epoch": 41.8, - "learning_rate": 1.5649253731343284e-05, - "loss": 0.2917, + "epoch": 10.45, + "learning_rate": 3.6457950530035334e-06, + "loss": 0.2806, "step": 3010 }, { - "epoch": 41.94, - "learning_rate": 1.5611940298507463e-05, - "loss": 0.2725, + "epoch": 10.48, + "learning_rate": 3.6443816254416963e-06, + "loss": 0.2926, "step": 3020 }, { - "epoch": 42.0, - "eval_loss": 0.49732398986816406, - "eval_runtime": 131.4816, - "eval_samples_per_second": 4.046, - "eval_steps_per_second": 0.51, - "eval_wer": 0.20485954875618692, - "step": 3024 - }, - { - "epoch": 42.08, - "learning_rate": 1.5574626865671642e-05, - "loss": 0.2972, + "epoch": 10.52, + "learning_rate": 3.6429681978798583e-06, + "loss": 0.3066, "step": 3030 }, { - "epoch": 42.22, - "learning_rate": 1.553731343283582e-05, - "loss": 0.2854, + "epoch": 10.55, + "learning_rate": 3.641554770318021e-06, + "loss": 0.278, "step": 3040 }, { - "epoch": 42.36, - "learning_rate": 1.55e-05, - "loss": 0.2874, + "epoch": 10.59, + "learning_rate": 3.6401413427561835e-06, + "loss": 0.276, "step": 3050 }, { - "epoch": 42.5, - "learning_rate": 1.546268656716418e-05, - "loss": 0.2928, + "epoch": 10.62, + "learning_rate": 3.6387279151943463e-06, + "loss": 0.2589, "step": 3060 }, { - "epoch": 42.64, - "learning_rate": 1.542537313432836e-05, - "loss": 0.2773, + "epoch": 10.66, + "learning_rate": 3.6373144876325088e-06, + "loss": 0.2792, "step": 3070 }, { - "epoch": 42.78, - "learning_rate": 1.5388059701492538e-05, - "loss": 0.2954, + "epoch": 10.69, + "learning_rate": 3.6359010600706716e-06, + "loss": 0.2706, "step": 3080 }, { - "epoch": 42.91, - "learning_rate": 1.5350746268656717e-05, - "loss": 0.2758, + "epoch": 10.73, + "learning_rate": 3.6344876325088336e-06, + "loss": 0.2702, "step": 3090 }, { - "epoch": 43.0, - "eval_loss": 0.5097233057022095, - "eval_runtime": 131.4822, - "eval_samples_per_second": 4.046, - "eval_steps_per_second": 0.51, - "eval_wer": 0.2015812817381243, - "step": 3096 - }, - { - "epoch": 43.06, - "learning_rate": 1.5313432835820896e-05, - "loss": 0.2904, + "epoch": 10.76, + "learning_rate": 3.6330742049469964e-06, + "loss": 0.2818, "step": 3100 }, { - "epoch": 43.19, - "learning_rate": 1.5276119402985076e-05, - "loss": 0.2831, + "epoch": 10.8, + "learning_rate": 3.631660777385159e-06, + "loss": 0.2898, "step": 3110 }, { - "epoch": 43.33, - "learning_rate": 1.5238805970149256e-05, - "loss": 0.2779, + "epoch": 10.83, + "learning_rate": 3.6302473498233216e-06, + "loss": 0.2893, "step": 3120 }, { - "epoch": 43.47, - "learning_rate": 1.5201492537313434e-05, - "loss": 0.2844, + "epoch": 10.87, + "learning_rate": 3.628833922261484e-06, + "loss": 0.275, "step": 3130 }, { - "epoch": 43.61, - "learning_rate": 1.5164179104477613e-05, - "loss": 0.2842, + "epoch": 10.9, + "learning_rate": 3.6274204946996465e-06, + "loss": 0.283, "step": 3140 }, { - "epoch": 43.75, - "learning_rate": 1.512686567164179e-05, - "loss": 0.2856, + "epoch": 10.94, + "learning_rate": 3.626007067137809e-06, + "loss": 0.2606, "step": 3150 }, { - "epoch": 43.89, - "learning_rate": 1.5089552238805971e-05, - "loss": 0.2809, + "epoch": 10.97, + "learning_rate": 3.6245936395759717e-06, + "loss": 0.2922, "step": 3160 }, { - "epoch": 44.0, - "eval_loss": 0.49982935190200806, - "eval_runtime": 131.8613, - "eval_samples_per_second": 4.035, - "eval_steps_per_second": 0.508, - "eval_wer": 0.20280259690171626, + "epoch": 11.0, + "eval_loss": 0.508041262626648, + "eval_runtime": 130.0766, + "eval_samples_per_second": 4.09, + "eval_steps_per_second": 1.022, + "eval_wer": 0.20113132351995885, "step": 3168 }, { - "epoch": 44.03, - "learning_rate": 1.505223880597015e-05, - "loss": 0.2936, + "epoch": 11.01, + "learning_rate": 3.623180212014134e-06, + "loss": 0.3119, "step": 3170 }, { - "epoch": 44.17, - "learning_rate": 1.5014925373134328e-05, - "loss": 0.285, + "epoch": 11.04, + "learning_rate": 3.621766784452297e-06, + "loss": 0.2549, "step": 3180 }, { - "epoch": 44.3, - "learning_rate": 1.4977611940298509e-05, - "loss": 0.2833, + "epoch": 11.08, + "learning_rate": 3.6203533568904594e-06, + "loss": 0.2656, "step": 3190 }, { - "epoch": 44.44, - "learning_rate": 1.4940298507462688e-05, - "loss": 0.282, + "epoch": 11.11, + "learning_rate": 3.6189399293286218e-06, + "loss": 0.2914, "step": 3200 }, { - "epoch": 44.58, - "learning_rate": 1.4902985074626866e-05, - "loss": 0.2816, + "epoch": 11.15, + "learning_rate": 3.617526501766784e-06, + "loss": 0.2861, "step": 3210 }, { - "epoch": 44.72, - "learning_rate": 1.4865671641791046e-05, - "loss": 0.2711, + "epoch": 11.18, + "learning_rate": 3.616113074204947e-06, + "loss": 0.2998, "step": 3220 }, { - "epoch": 44.86, - "learning_rate": 1.4828358208955226e-05, - "loss": 0.2702, + "epoch": 11.21, + "learning_rate": 3.6146996466431094e-06, + "loss": 0.2821, "step": 3230 }, { - "epoch": 45.0, - "learning_rate": 1.4791044776119403e-05, - "loss": 0.2804, - "step": 3240 - }, - { - "epoch": 45.0, - "eval_loss": 0.5103247761726379, - "eval_runtime": 131.3748, - "eval_samples_per_second": 4.049, - "eval_steps_per_second": 0.51, - "eval_wer": 0.20421675130166483, + "epoch": 11.25, + "learning_rate": 3.6132862190812723e-06, + "loss": 0.3008, "step": 3240 }, { - "epoch": 45.14, - "learning_rate": 1.4753731343283584e-05, - "loss": 0.2664, + "epoch": 11.28, + "learning_rate": 3.6118727915194342e-06, + "loss": 0.26, "step": 3250 }, { - "epoch": 45.28, - "learning_rate": 1.4716417910447761e-05, - "loss": 0.2755, + "epoch": 11.32, + "learning_rate": 3.610459363957597e-06, + "loss": 0.2877, "step": 3260 }, { - "epoch": 45.42, - "learning_rate": 1.467910447761194e-05, - "loss": 0.2725, + "epoch": 11.35, + "learning_rate": 3.6090459363957595e-06, + "loss": 0.3065, "step": 3270 }, { - "epoch": 45.55, - "learning_rate": 1.4641791044776121e-05, - "loss": 0.2878, + "epoch": 11.39, + "learning_rate": 3.6076325088339223e-06, + "loss": 0.2815, "step": 3280 }, { - "epoch": 45.69, - "learning_rate": 1.4604477611940299e-05, - "loss": 0.2847, + "epoch": 11.42, + "learning_rate": 3.6062190812720847e-06, + "loss": 0.2649, "step": 3290 }, { - "epoch": 45.83, - "learning_rate": 1.4567164179104478e-05, - "loss": 0.2826, + "epoch": 11.46, + "learning_rate": 3.6048056537102476e-06, + "loss": 0.2859, "step": 3300 }, { - "epoch": 45.97, - "learning_rate": 1.4529850746268659e-05, - "loss": 0.2842, + "epoch": 11.49, + "learning_rate": 3.6033922261484095e-06, + "loss": 0.2826, "step": 3310 }, { - "epoch": 46.0, - "eval_loss": 0.48608192801475525, - "eval_runtime": 131.8901, - "eval_samples_per_second": 4.034, - "eval_steps_per_second": 0.508, - "eval_wer": 0.2021597994471942, - "step": 3312 - }, - { - "epoch": 46.11, - "learning_rate": 1.4492537313432836e-05, - "loss": 0.2921, + "epoch": 11.53, + "learning_rate": 3.601978798586572e-06, + "loss": 0.2882, "step": 3320 }, { - "epoch": 46.25, - "learning_rate": 1.4455223880597015e-05, - "loss": 0.2833, + "epoch": 11.56, + "learning_rate": 3.600565371024735e-06, + "loss": 0.2772, "step": 3330 }, { - "epoch": 46.39, - "learning_rate": 1.4417910447761196e-05, - "loss": 0.2787, + "epoch": 11.6, + "learning_rate": 3.5991519434628976e-06, + "loss": 0.2678, "step": 3340 }, { - "epoch": 46.53, - "learning_rate": 1.4380597014925374e-05, - "loss": 0.2772, + "epoch": 11.63, + "learning_rate": 3.59773851590106e-06, + "loss": 0.2841, "step": 3350 }, { - "epoch": 46.66, - "learning_rate": 1.4343283582089553e-05, - "loss": 0.2756, + "epoch": 11.66, + "learning_rate": 3.596325088339223e-06, + "loss": 0.2982, "step": 3360 }, { - "epoch": 46.8, - "learning_rate": 1.430597014925373e-05, - "loss": 0.2745, + "epoch": 11.7, + "learning_rate": 3.594911660777385e-06, + "loss": 0.2904, "step": 3370 }, { - "epoch": 46.94, - "learning_rate": 1.4268656716417911e-05, - "loss": 0.2721, + "epoch": 11.73, + "learning_rate": 3.5934982332155473e-06, + "loss": 0.2908, "step": 3380 }, { - "epoch": 47.0, - "eval_loss": 0.5053983926773071, - "eval_runtime": 131.5158, - "eval_samples_per_second": 4.045, - "eval_steps_per_second": 0.509, - "eval_wer": 0.20595230442887447, - "step": 3384 - }, - { - "epoch": 47.08, - "learning_rate": 1.423134328358209e-05, - "loss": 0.2809, + "epoch": 11.77, + "learning_rate": 3.59208480565371e-06, + "loss": 0.2629, "step": 3390 }, { - "epoch": 47.22, - "learning_rate": 1.4194029850746268e-05, - "loss": 0.2767, + "epoch": 11.8, + "learning_rate": 3.5906713780918725e-06, + "loss": 0.2953, "step": 3400 }, { - "epoch": 47.36, - "learning_rate": 1.4156716417910449e-05, - "loss": 0.267, + "epoch": 11.84, + "learning_rate": 3.5892579505300353e-06, + "loss": 0.2857, "step": 3410 }, { - "epoch": 47.5, - "learning_rate": 1.4119402985074628e-05, - "loss": 0.2758, + "epoch": 11.87, + "learning_rate": 3.5878445229681973e-06, + "loss": 0.2671, "step": 3420 }, { - "epoch": 47.64, - "learning_rate": 1.4082089552238805e-05, - "loss": 0.2654, + "epoch": 11.91, + "learning_rate": 3.58643109540636e-06, + "loss": 0.2685, "step": 3430 }, { - "epoch": 47.78, - "learning_rate": 1.4044776119402986e-05, - "loss": 0.2781, + "epoch": 11.94, + "learning_rate": 3.5850176678445226e-06, + "loss": 0.287, "step": 3440 }, { - "epoch": 47.91, - "learning_rate": 1.4007462686567165e-05, - "loss": 0.2673, + "epoch": 11.98, + "learning_rate": 3.5836042402826854e-06, + "loss": 0.2869, "step": 3450 }, { - "epoch": 48.0, - "eval_loss": 0.5044223070144653, - "eval_runtime": 131.7824, - "eval_samples_per_second": 4.037, - "eval_steps_per_second": 0.508, - "eval_wer": 0.1999742881018191, + "epoch": 12.0, + "eval_loss": 0.4973689019680023, + "eval_runtime": 129.1272, + "eval_samples_per_second": 4.12, + "eval_steps_per_second": 1.03, + "eval_wer": 0.20267403741081186, "step": 3456 }, { - "epoch": 48.06, - "learning_rate": 1.3970149253731343e-05, - "loss": 0.2927, + "epoch": 12.01, + "learning_rate": 3.582190812720848e-06, + "loss": 0.2896, "step": 3460 }, { - "epoch": 48.19, - "learning_rate": 1.3932835820895524e-05, - "loss": 0.2854, + "epoch": 12.05, + "learning_rate": 3.5807773851590106e-06, + "loss": 0.2994, "step": 3470 }, { - "epoch": 48.33, - "learning_rate": 1.3895522388059703e-05, - "loss": 0.284, + "epoch": 12.08, + "learning_rate": 3.5793639575971726e-06, + "loss": 0.2556, "step": 3480 }, { - "epoch": 48.47, - "learning_rate": 1.385820895522388e-05, - "loss": 0.2675, + "epoch": 12.12, + "learning_rate": 3.5779505300353355e-06, + "loss": 0.2681, "step": 3490 }, { - "epoch": 48.61, - "learning_rate": 1.3820895522388061e-05, - "loss": 0.2719, + "epoch": 12.15, + "learning_rate": 3.576537102473498e-06, + "loss": 0.2913, "step": 3500 }, { - "epoch": 48.75, - "learning_rate": 1.3783582089552239e-05, - "loss": 0.2748, + "epoch": 12.19, + "learning_rate": 3.5751236749116607e-06, + "loss": 0.2544, "step": 3510 }, { - "epoch": 48.89, - "learning_rate": 1.3746268656716418e-05, - "loss": 0.2696, + "epoch": 12.22, + "learning_rate": 3.573710247349823e-06, + "loss": 0.2785, "step": 3520 }, { - "epoch": 49.0, - "eval_loss": 0.5187488794326782, - "eval_runtime": 131.1067, - "eval_samples_per_second": 4.058, - "eval_steps_per_second": 0.511, - "eval_wer": 0.1983030147200617, - "step": 3528 - }, - { - "epoch": 49.03, - "learning_rate": 1.3708955223880599e-05, - "loss": 0.2806, + "epoch": 12.26, + "learning_rate": 3.572296819787986e-06, + "loss": 0.2865, "step": 3530 }, { - "epoch": 49.17, - "learning_rate": 1.3671641791044776e-05, - "loss": 0.2766, + "epoch": 12.29, + "learning_rate": 3.570883392226148e-06, + "loss": 0.3012, "step": 3540 }, { - "epoch": 49.3, - "learning_rate": 1.3634328358208955e-05, - "loss": 0.2821, + "epoch": 12.33, + "learning_rate": 3.5694699646643108e-06, + "loss": 0.2854, "step": 3550 }, { - "epoch": 49.44, - "learning_rate": 1.3597014925373136e-05, - "loss": 0.2673, + "epoch": 12.36, + "learning_rate": 3.568056537102473e-06, + "loss": 0.3029, "step": 3560 }, { - "epoch": 49.58, - "learning_rate": 1.3559701492537314e-05, - "loss": 0.2794, + "epoch": 12.39, + "learning_rate": 3.566643109540636e-06, + "loss": 0.2927, "step": 3570 }, { - "epoch": 49.72, - "learning_rate": 1.3522388059701493e-05, - "loss": 0.2745, + "epoch": 12.43, + "learning_rate": 3.5652296819787984e-06, + "loss": 0.2681, "step": 3580 }, { - "epoch": 49.86, - "learning_rate": 1.3485074626865674e-05, - "loss": 0.2664, + "epoch": 12.46, + "learning_rate": 3.563816254416961e-06, + "loss": 0.2767, "step": 3590 }, { - "epoch": 50.0, - "learning_rate": 1.3447761194029851e-05, - "loss": 0.2724, - "step": 3600 - }, - { - "epoch": 50.0, - "eval_loss": 0.5234389901161194, - "eval_runtime": 131.879, - "eval_samples_per_second": 4.034, - "eval_steps_per_second": 0.508, - "eval_wer": 0.20350967410169055, + "epoch": 12.5, + "learning_rate": 3.5624028268551232e-06, + "loss": 0.2824, "step": 3600 }, { - "epoch": 50.14, - "learning_rate": 1.3410447761194032e-05, - "loss": 0.2814, + "epoch": 12.53, + "learning_rate": 3.5611307420494697e-06, + "loss": 0.2764, "step": 3610 }, { - "epoch": 50.28, - "learning_rate": 1.3373134328358208e-05, - "loss": 0.267, + "epoch": 12.57, + "learning_rate": 3.559717314487632e-06, + "loss": 0.2487, "step": 3620 }, { - "epoch": 50.42, - "learning_rate": 1.3335820895522388e-05, - "loss": 0.2681, + "epoch": 12.6, + "learning_rate": 3.558303886925795e-06, + "loss": 0.2881, "step": 3630 }, { - "epoch": 50.55, - "learning_rate": 1.329850746268657e-05, - "loss": 0.2812, + "epoch": 12.64, + "learning_rate": 3.5568904593639574e-06, + "loss": 0.2865, "step": 3640 }, { - "epoch": 50.69, - "learning_rate": 1.3261194029850745e-05, - "loss": 0.2709, + "epoch": 12.67, + "learning_rate": 3.55547703180212e-06, + "loss": 0.2817, "step": 3650 }, { - "epoch": 50.83, - "learning_rate": 1.3223880597014926e-05, - "loss": 0.2719, + "epoch": 12.71, + "learning_rate": 3.5540636042402826e-06, + "loss": 0.2677, "step": 3660 }, { - "epoch": 50.97, - "learning_rate": 1.3186567164179107e-05, - "loss": 0.2736, + "epoch": 12.74, + "learning_rate": 3.552650176678445e-06, + "loss": 0.3031, "step": 3670 }, { - "epoch": 51.0, - "eval_loss": 0.5106495022773743, - "eval_runtime": 131.9308, - "eval_samples_per_second": 4.032, - "eval_steps_per_second": 0.508, - "eval_wer": 0.2016455614835765, - "step": 3672 - }, - { - "epoch": 51.11, - "learning_rate": 1.3149253731343284e-05, - "loss": 0.2766, + "epoch": 12.78, + "learning_rate": 3.5512367491166074e-06, + "loss": 0.2787, "step": 3680 }, { - "epoch": 51.25, - "learning_rate": 1.3111940298507463e-05, - "loss": 0.2771, + "epoch": 12.81, + "learning_rate": 3.5498233215547702e-06, + "loss": 0.2761, "step": 3690 }, { - "epoch": 51.39, - "learning_rate": 1.3074626865671644e-05, - "loss": 0.2754, + "epoch": 12.85, + "learning_rate": 3.5484098939929327e-06, + "loss": 0.2749, "step": 3700 }, { - "epoch": 51.53, - "learning_rate": 1.3037313432835822e-05, - "loss": 0.2849, + "epoch": 12.88, + "learning_rate": 3.5469964664310955e-06, + "loss": 0.2977, "step": 3710 }, { - "epoch": 51.66, - "learning_rate": 1.3000000000000001e-05, - "loss": 0.2669, + "epoch": 12.91, + "learning_rate": 3.5455830388692575e-06, + "loss": 0.2686, "step": 3720 }, { - "epoch": 51.8, - "learning_rate": 1.2962686567164178e-05, - "loss": 0.2623, + "epoch": 12.95, + "learning_rate": 3.5441696113074203e-06, + "loss": 0.2724, "step": 3730 }, { - "epoch": 51.94, - "learning_rate": 1.292537313432836e-05, - "loss": 0.2662, + "epoch": 12.98, + "learning_rate": 3.5427561837455827e-06, + "loss": 0.284, "step": 3740 }, { - "epoch": 52.0, - "eval_loss": 0.5071024298667908, - "eval_runtime": 131.882, - "eval_samples_per_second": 4.034, - "eval_steps_per_second": 0.508, - "eval_wer": 0.20537378671980458, + "epoch": 13.0, + "eval_loss": 0.5104484558105469, + "eval_runtime": 128.6455, + "eval_samples_per_second": 4.135, + "eval_steps_per_second": 1.034, + "eval_wer": 0.200552805810889, "step": 3744 }, { - "epoch": 52.08, - "learning_rate": 1.2888059701492538e-05, - "loss": 0.2814, + "epoch": 13.02, + "learning_rate": 3.5413427561837456e-06, + "loss": 0.2975, "step": 3750 }, { - "epoch": 52.22, - "learning_rate": 1.2850746268656716e-05, - "loss": 0.2733, + "epoch": 13.06, + "learning_rate": 3.539929328621908e-06, + "loss": 0.2805, "step": 3760 }, { - "epoch": 52.36, - "learning_rate": 1.2813432835820897e-05, - "loss": 0.2679, + "epoch": 13.09, + "learning_rate": 3.538515901060071e-06, + "loss": 0.2694, "step": 3770 }, { - "epoch": 52.5, - "learning_rate": 1.2776119402985076e-05, - "loss": 0.2717, + "epoch": 13.12, + "learning_rate": 3.5371024734982328e-06, + "loss": 0.2523, "step": 3780 }, { - "epoch": 52.64, - "learning_rate": 1.2738805970149253e-05, - "loss": 0.2563, + "epoch": 13.16, + "learning_rate": 3.5356890459363956e-06, + "loss": 0.2933, "step": 3790 }, { - "epoch": 52.78, - "learning_rate": 1.2701492537313434e-05, - "loss": 0.2791, + "epoch": 13.19, + "learning_rate": 3.534275618374558e-06, + "loss": 0.2829, "step": 3800 }, { - "epoch": 52.91, - "learning_rate": 1.2664179104477613e-05, - "loss": 0.2701, + "epoch": 13.23, + "learning_rate": 3.532862190812721e-06, + "loss": 0.261, "step": 3810 }, { - "epoch": 53.0, - "eval_loss": 0.5253528356552124, - "eval_runtime": 131.2156, - "eval_samples_per_second": 4.054, - "eval_steps_per_second": 0.511, - "eval_wer": 0.2016455614835765, - "step": 3816 - }, - { - "epoch": 53.06, - "learning_rate": 1.262686567164179e-05, - "loss": 0.2935, + "epoch": 13.26, + "learning_rate": 3.5314487632508833e-06, + "loss": 0.2829, "step": 3820 }, { - "epoch": 53.19, - "learning_rate": 1.2589552238805972e-05, - "loss": 0.2654, + "epoch": 13.3, + "learning_rate": 3.530035335689046e-06, + "loss": 0.2911, "step": 3830 }, { - "epoch": 53.33, - "learning_rate": 1.255223880597015e-05, - "loss": 0.2768, + "epoch": 13.33, + "learning_rate": 3.528621908127208e-06, + "loss": 0.2769, "step": 3840 }, { - "epoch": 53.47, - "learning_rate": 1.2514925373134328e-05, - "loss": 0.2779, + "epoch": 13.37, + "learning_rate": 3.527208480565371e-06, + "loss": 0.2595, "step": 3850 }, { - "epoch": 53.61, - "learning_rate": 1.2477611940298509e-05, - "loss": 0.2743, + "epoch": 13.4, + "learning_rate": 3.5257950530035333e-06, + "loss": 0.2858, "step": 3860 }, { - "epoch": 53.75, - "learning_rate": 1.2440298507462687e-05, - "loss": 0.2719, + "epoch": 13.44, + "learning_rate": 3.524381625441696e-06, + "loss": 0.2498, "step": 3870 }, { - "epoch": 53.89, - "learning_rate": 1.2402985074626866e-05, - "loss": 0.261, + "epoch": 13.47, + "learning_rate": 3.5229681978798586e-06, + "loss": 0.2919, "step": 3880 }, { - "epoch": 54.0, - "eval_loss": 0.4967404007911682, - "eval_runtime": 131.9132, - "eval_samples_per_second": 4.033, - "eval_steps_per_second": 0.508, - "eval_wer": 0.19939577039274925, - "step": 3888 - }, - { - "epoch": 54.03, - "learning_rate": 1.2365671641791045e-05, - "loss": 0.2909, + "epoch": 13.51, + "learning_rate": 3.521554770318021e-06, + "loss": 0.3099, "step": 3890 }, { - "epoch": 54.17, - "learning_rate": 1.2328358208955226e-05, - "loss": 0.2642, + "epoch": 13.54, + "learning_rate": 3.5201413427561834e-06, + "loss": 0.2785, "step": 3900 }, { - "epoch": 54.3, - "learning_rate": 1.2291044776119403e-05, - "loss": 0.2746, + "epoch": 13.57, + "learning_rate": 3.5187279151943462e-06, + "loss": 0.2562, "step": 3910 }, { - "epoch": 54.44, - "learning_rate": 1.2253731343283582e-05, - "loss": 0.2655, + "epoch": 13.61, + "learning_rate": 3.5173144876325086e-06, + "loss": 0.2876, "step": 3920 }, { - "epoch": 54.58, - "learning_rate": 1.2216417910447763e-05, - "loss": 0.2722, + "epoch": 13.64, + "learning_rate": 3.5159010600706715e-06, + "loss": 0.2982, "step": 3930 }, { - "epoch": 54.72, - "learning_rate": 1.217910447761194e-05, - "loss": 0.2721, + "epoch": 13.68, + "learning_rate": 3.514487632508834e-06, + "loss": 0.2774, "step": 3940 }, { - "epoch": 54.86, - "learning_rate": 1.214179104477612e-05, - "loss": 0.2728, + "epoch": 13.71, + "learning_rate": 3.5130742049469963e-06, + "loss": 0.2651, "step": 3950 }, { - "epoch": 55.0, - "learning_rate": 1.2104477611940299e-05, - "loss": 0.2708, - "step": 3960 - }, - { - "epoch": 55.0, - "eval_loss": 0.5263388156890869, - "eval_runtime": 131.5494, - "eval_samples_per_second": 4.044, - "eval_steps_per_second": 0.509, - "eval_wer": 0.19688886032011313, + "epoch": 13.75, + "learning_rate": 3.5116607773851587e-06, + "loss": 0.2769, "step": 3960 }, { - "epoch": 55.14, - "learning_rate": 1.2067164179104478e-05, - "loss": 0.2684, + "epoch": 13.78, + "learning_rate": 3.5102473498233215e-06, + "loss": 0.2744, "step": 3970 }, { - "epoch": 55.28, - "learning_rate": 1.2029850746268657e-05, - "loss": 0.2699, + "epoch": 13.82, + "learning_rate": 3.508833922261484e-06, + "loss": 0.2922, "step": 3980 }, { - "epoch": 55.42, - "learning_rate": 1.1992537313432836e-05, - "loss": 0.2796, + "epoch": 13.85, + "learning_rate": 3.5074204946996468e-06, + "loss": 0.2784, "step": 3990 }, { - "epoch": 55.55, - "learning_rate": 1.1955223880597016e-05, - "loss": 0.2666, + "epoch": 13.89, + "learning_rate": 3.506007067137809e-06, + "loss": 0.2871, "step": 4000 }, { - "epoch": 55.69, - "learning_rate": 1.1917910447761195e-05, - "loss": 0.2702, + "epoch": 13.92, + "learning_rate": 3.5045936395759716e-06, + "loss": 0.2628, "step": 4010 }, { - "epoch": 55.83, - "learning_rate": 1.1880597014925374e-05, - "loss": 0.2711, + "epoch": 13.96, + "learning_rate": 3.503180212014134e-06, + "loss": 0.2794, "step": 4020 }, { - "epoch": 55.97, - "learning_rate": 1.1843283582089553e-05, - "loss": 0.2764, + "epoch": 13.99, + "learning_rate": 3.501766784452297e-06, + "loss": 0.2911, "step": 4030 }, { - "epoch": 56.0, - "eval_loss": 0.5201473236083984, - "eval_runtime": 131.8696, - "eval_samples_per_second": 4.034, - "eval_steps_per_second": 0.508, - "eval_wer": 0.19676030082920873, + "epoch": 14.0, + "eval_loss": 0.5025652050971985, + "eval_runtime": 129.3001, + "eval_samples_per_second": 4.114, + "eval_steps_per_second": 1.029, + "eval_wer": 0.20170984122902874, "step": 4032 }, { - "epoch": 56.11, - "learning_rate": 1.1805970149253732e-05, - "loss": 0.272, + "epoch": 14.03, + "learning_rate": 3.5003533568904592e-06, + "loss": 0.2873, "step": 4040 }, { - "epoch": 56.25, - "learning_rate": 1.1768656716417911e-05, - "loss": 0.2624, + "epoch": 14.06, + "learning_rate": 3.498939929328622e-06, + "loss": 0.2802, "step": 4050 }, { - "epoch": 56.39, - "learning_rate": 1.173134328358209e-05, - "loss": 0.2566, + "epoch": 14.1, + "learning_rate": 3.497526501766784e-06, + "loss": 0.2649, "step": 4060 }, { - "epoch": 56.53, - "learning_rate": 1.1694029850746268e-05, - "loss": 0.2789, + "epoch": 14.13, + "learning_rate": 3.496113074204947e-06, + "loss": 0.2909, "step": 4070 }, { - "epoch": 56.66, - "learning_rate": 1.1656716417910449e-05, - "loss": 0.267, + "epoch": 14.17, + "learning_rate": 3.4946996466431093e-06, + "loss": 0.2844, "step": 4080 }, { - "epoch": 56.8, - "learning_rate": 1.1619402985074628e-05, - "loss": 0.2711, + "epoch": 14.2, + "learning_rate": 3.493286219081272e-06, + "loss": 0.2669, "step": 4090 }, { - "epoch": 56.94, - "learning_rate": 1.1582089552238806e-05, - "loss": 0.268, + "epoch": 14.24, + "learning_rate": 3.4918727915194345e-06, + "loss": 0.2757, "step": 4100 }, { - "epoch": 57.0, - "eval_loss": 0.5023506879806519, - "eval_runtime": 131.2011, - "eval_samples_per_second": 4.055, - "eval_steps_per_second": 0.511, - "eval_wer": 0.19785305650189625, - "step": 4104 - }, - { - "epoch": 57.08, - "learning_rate": 1.1544776119402986e-05, - "loss": 0.2639, + "epoch": 14.27, + "learning_rate": 3.4904593639575974e-06, + "loss": 0.2774, "step": 4110 }, { - "epoch": 57.22, - "learning_rate": 1.1507462686567166e-05, - "loss": 0.2725, + "epoch": 14.3, + "learning_rate": 3.4890459363957594e-06, + "loss": 0.2773, "step": 4120 }, { - "epoch": 57.36, - "learning_rate": 1.1470149253731343e-05, - "loss": 0.271, + "epoch": 14.34, + "learning_rate": 3.487632508833922e-06, + "loss": 0.2743, "step": 4130 }, { - "epoch": 57.5, - "learning_rate": 1.1432835820895522e-05, - "loss": 0.2778, + "epoch": 14.37, + "learning_rate": 3.4862190812720846e-06, + "loss": 0.2583, "step": 4140 }, { - "epoch": 57.64, - "learning_rate": 1.1395522388059703e-05, - "loss": 0.2673, + "epoch": 14.41, + "learning_rate": 3.4848056537102474e-06, + "loss": 0.2636, "step": 4150 }, { - "epoch": 57.78, - "learning_rate": 1.135820895522388e-05, - "loss": 0.2665, + "epoch": 14.44, + "learning_rate": 3.48339222614841e-06, + "loss": 0.2344, "step": 4160 }, { - "epoch": 57.91, - "learning_rate": 1.132089552238806e-05, - "loss": 0.2536, + "epoch": 14.48, + "learning_rate": 3.4819787985865723e-06, + "loss": 0.2904, "step": 4170 }, { - "epoch": 58.0, - "eval_loss": 0.5224213600158691, - "eval_runtime": 131.5544, - "eval_samples_per_second": 4.044, - "eval_steps_per_second": 0.509, - "eval_wer": 0.19701741981101756, - "step": 4176 - }, - { - "epoch": 58.06, - "learning_rate": 1.1283582089552239e-05, - "loss": 0.2727, + "epoch": 14.51, + "learning_rate": 3.4805653710247347e-06, + "loss": 0.2892, "step": 4180 }, { - "epoch": 58.19, - "learning_rate": 1.124626865671642e-05, - "loss": 0.2596, + "epoch": 14.55, + "learning_rate": 3.4791519434628975e-06, + "loss": 0.2607, "step": 4190 }, { - "epoch": 58.33, - "learning_rate": 1.1208955223880597e-05, - "loss": 0.2671, + "epoch": 14.58, + "learning_rate": 3.47773851590106e-06, + "loss": 0.2952, "step": 4200 }, { - "epoch": 58.47, - "learning_rate": 1.1171641791044776e-05, - "loss": 0.2667, + "epoch": 14.62, + "learning_rate": 3.4763250883392227e-06, + "loss": 0.2731, "step": 4210 }, { - "epoch": 58.61, - "learning_rate": 1.1134328358208957e-05, - "loss": 0.2648, + "epoch": 14.65, + "learning_rate": 3.474911660777385e-06, + "loss": 0.2973, "step": 4220 }, { - "epoch": 58.75, - "learning_rate": 1.1097014925373135e-05, - "loss": 0.2828, + "epoch": 14.69, + "learning_rate": 3.4734982332155476e-06, + "loss": 0.2897, "step": 4230 }, { - "epoch": 58.89, - "learning_rate": 1.1059701492537314e-05, - "loss": 0.2625, + "epoch": 14.72, + "learning_rate": 3.47208480565371e-06, + "loss": 0.2761, "step": 4240 }, { - "epoch": 59.0, - "eval_loss": 0.5316326022148132, - "eval_runtime": 131.6958, - "eval_samples_per_second": 4.04, - "eval_steps_per_second": 0.509, - "eval_wer": 0.1999742881018191, - "step": 4248 - }, - { - "epoch": 59.03, - "learning_rate": 1.1022388059701493e-05, - "loss": 0.2725, + "epoch": 14.75, + "learning_rate": 3.470671378091873e-06, + "loss": 0.2716, "step": 4250 }, { - "epoch": 59.17, - "learning_rate": 1.0985074626865672e-05, - "loss": 0.2541, + "epoch": 14.79, + "learning_rate": 3.4692579505300352e-06, + "loss": 0.2473, "step": 4260 }, { - "epoch": 59.3, - "learning_rate": 1.0947761194029851e-05, - "loss": 0.2703, + "epoch": 14.82, + "learning_rate": 3.467844522968198e-06, + "loss": 0.3024, "step": 4270 }, { - "epoch": 59.44, - "learning_rate": 1.091044776119403e-05, - "loss": 0.2725, + "epoch": 14.86, + "learning_rate": 3.4664310954063605e-06, + "loss": 0.2873, "step": 4280 }, { - "epoch": 59.58, - "learning_rate": 1.087313432835821e-05, - "loss": 0.273, + "epoch": 14.89, + "learning_rate": 3.4650176678445224e-06, + "loss": 0.278, "step": 4290 }, { - "epoch": 59.72, - "learning_rate": 1.0835820895522389e-05, - "loss": 0.2793, + "epoch": 14.93, + "learning_rate": 3.4636042402826853e-06, + "loss": 0.2486, "step": 4300 }, { - "epoch": 59.86, - "learning_rate": 1.0798507462686568e-05, - "loss": 0.257, + "epoch": 14.96, + "learning_rate": 3.462190812720848e-06, + "loss": 0.2668, "step": 4310 }, { - "epoch": 60.0, - "learning_rate": 1.0761194029850747e-05, - "loss": 0.2621, + "epoch": 15.0, + "learning_rate": 3.4607773851590105e-06, + "loss": 0.2864, "step": 4320 }, { - "epoch": 60.0, - "eval_loss": 0.5173215270042419, - "eval_runtime": 131.579, - "eval_samples_per_second": 4.043, - "eval_steps_per_second": 0.509, - "eval_wer": 0.19965288937455808, + "epoch": 15.0, + "eval_loss": 0.5064656138420105, + "eval_runtime": 129.204, + "eval_samples_per_second": 4.118, + "eval_steps_per_second": 1.029, + "eval_wer": 0.20023140708362794, "step": 4320 }, { - "epoch": 60.14, - "learning_rate": 1.0723880597014926e-05, - "loss": 0.272, + "epoch": 15.03, + "learning_rate": 3.4593639575971734e-06, + "loss": 0.2883, "step": 4330 }, { - "epoch": 60.28, - "learning_rate": 1.0686567164179105e-05, - "loss": 0.2669, + "epoch": 15.07, + "learning_rate": 3.4579505300353353e-06, + "loss": 0.2741, "step": 4340 }, { - "epoch": 60.42, - "learning_rate": 1.0649253731343284e-05, - "loss": 0.2703, + "epoch": 15.1, + "learning_rate": 3.4565371024734977e-06, + "loss": 0.2775, "step": 4350 }, { - "epoch": 60.55, - "learning_rate": 1.0611940298507462e-05, - "loss": 0.2633, + "epoch": 15.14, + "learning_rate": 3.4551236749116606e-06, + "loss": 0.287, "step": 4360 }, { - "epoch": 60.69, - "learning_rate": 1.0574626865671643e-05, - "loss": 0.2657, + "epoch": 15.17, + "learning_rate": 3.453710247349823e-06, + "loss": 0.2964, "step": 4370 }, { - "epoch": 60.83, - "learning_rate": 1.0537313432835822e-05, - "loss": 0.2654, + "epoch": 15.21, + "learning_rate": 3.452296819787986e-06, + "loss": 0.2907, "step": 4380 }, { - "epoch": 60.97, - "learning_rate": 1.05e-05, - "loss": 0.2673, + "epoch": 15.24, + "learning_rate": 3.4508833922261482e-06, + "loss": 0.282, "step": 4390 }, { - "epoch": 61.0, - "eval_loss": 0.5116785764694214, - "eval_runtime": 131.1081, - "eval_samples_per_second": 4.058, - "eval_steps_per_second": 0.511, - "eval_wer": 0.20280259690171626, - "step": 4392 - }, - { - "epoch": 61.11, - "learning_rate": 1.046268656716418e-05, - "loss": 0.2678, + "epoch": 15.28, + "learning_rate": 3.4494699646643106e-06, + "loss": 0.2511, "step": 4400 }, { - "epoch": 61.25, - "learning_rate": 1.042537313432836e-05, - "loss": 0.2706, + "epoch": 15.31, + "learning_rate": 3.448056537102473e-06, + "loss": 0.284, "step": 4410 }, { - "epoch": 61.39, - "learning_rate": 1.0388059701492537e-05, - "loss": 0.2641, + "epoch": 15.35, + "learning_rate": 3.446643109540636e-06, + "loss": 0.2856, "step": 4420 }, { - "epoch": 61.53, - "learning_rate": 1.0350746268656716e-05, - "loss": 0.2596, + "epoch": 15.38, + "learning_rate": 3.4452296819787983e-06, + "loss": 0.2694, "step": 4430 }, { - "epoch": 61.66, - "learning_rate": 1.0313432835820897e-05, - "loss": 0.2562, + "epoch": 15.42, + "learning_rate": 3.443816254416961e-06, + "loss": 0.2572, "step": 4440 }, { - "epoch": 61.8, - "learning_rate": 1.0276119402985074e-05, - "loss": 0.2802, + "epoch": 15.45, + "learning_rate": 3.4424028268551235e-06, + "loss": 0.2929, "step": 4450 }, { - "epoch": 61.94, - "learning_rate": 1.0238805970149254e-05, - "loss": 0.2723, + "epoch": 15.48, + "learning_rate": 3.440989399293286e-06, + "loss": 0.2973, "step": 4460 }, { - "epoch": 62.0, - "eval_loss": 0.5285342335700989, - "eval_runtime": 131.8603, - "eval_samples_per_second": 4.035, - "eval_steps_per_second": 0.508, - "eval_wer": 0.1999742881018191, - "step": 4464 - }, - { - "epoch": 62.08, - "learning_rate": 1.0201492537313434e-05, - "loss": 0.2846, + "epoch": 15.52, + "learning_rate": 3.4395759717314484e-06, + "loss": 0.2767, "step": 4470 }, { - "epoch": 62.22, - "learning_rate": 1.0164179104477614e-05, - "loss": 0.2758, + "epoch": 15.55, + "learning_rate": 3.438162544169611e-06, + "loss": 0.26, "step": 4480 }, { - "epoch": 62.36, - "learning_rate": 1.0126865671641791e-05, - "loss": 0.277, + "epoch": 15.59, + "learning_rate": 3.4367491166077736e-06, + "loss": 0.2813, "step": 4490 }, { - "epoch": 62.5, - "learning_rate": 1.008955223880597e-05, - "loss": 0.2761, + "epoch": 15.62, + "learning_rate": 3.4353356890459364e-06, + "loss": 0.2703, "step": 4500 }, { - "epoch": 62.64, - "learning_rate": 1.0052238805970151e-05, - "loss": 0.2684, + "epoch": 15.66, + "learning_rate": 3.4339222614840984e-06, + "loss": 0.2875, "step": 4510 }, { - "epoch": 62.78, - "learning_rate": 1.0014925373134328e-05, - "loss": 0.2817, + "epoch": 15.69, + "learning_rate": 3.4325088339222613e-06, + "loss": 0.2561, "step": 4520 }, { - "epoch": 62.91, - "learning_rate": 9.977611940298508e-06, - "loss": 0.2691, + "epoch": 15.73, + "learning_rate": 3.4310954063604237e-06, + "loss": 0.271, "step": 4530 }, { - "epoch": 63.0, - "eval_loss": 0.5328835248947144, - "eval_runtime": 131.3705, - "eval_samples_per_second": 4.05, - "eval_steps_per_second": 0.51, - "eval_wer": 0.19611750337468664, - "step": 4536 - }, - { - "epoch": 63.06, - "learning_rate": 9.940298507462687e-06, - "loss": 0.2824, + "epoch": 15.76, + "learning_rate": 3.4296819787985865e-06, + "loss": 0.2934, "step": 4540 }, { - "epoch": 63.19, - "learning_rate": 9.902985074626866e-06, - "loss": 0.2772, + "epoch": 15.8, + "learning_rate": 3.428268551236749e-06, + "loss": 0.2791, "step": 4550 }, { - "epoch": 63.33, - "learning_rate": 9.865671641791045e-06, - "loss": 0.2708, + "epoch": 15.83, + "learning_rate": 3.4268551236749117e-06, + "loss": 0.2896, "step": 4560 }, { - "epoch": 63.47, - "learning_rate": 9.828358208955224e-06, - "loss": 0.2679, + "epoch": 15.87, + "learning_rate": 3.4254416961130737e-06, + "loss": 0.3179, "step": 4570 }, { - "epoch": 63.61, - "learning_rate": 9.791044776119403e-06, - "loss": 0.268, + "epoch": 15.9, + "learning_rate": 3.4240282685512366e-06, + "loss": 0.2716, "step": 4580 }, { - "epoch": 63.75, - "learning_rate": 9.753731343283583e-06, - "loss": 0.2705, + "epoch": 15.94, + "learning_rate": 3.422614840989399e-06, + "loss": 0.3019, "step": 4590 }, { - "epoch": 63.89, - "learning_rate": 9.716417910447762e-06, - "loss": 0.2668, + "epoch": 15.97, + "learning_rate": 3.421201413427562e-06, + "loss": 0.2779, "step": 4600 }, { - "epoch": 64.0, - "eval_loss": 0.5160889625549316, - "eval_runtime": 131.2903, - "eval_samples_per_second": 4.052, - "eval_steps_per_second": 0.51, - "eval_wer": 0.19643890210194767, + "epoch": 16.0, + "eval_loss": 0.5024499297142029, + "eval_runtime": 129.1181, + "eval_samples_per_second": 4.12, + "eval_steps_per_second": 1.03, + "eval_wer": 0.20100276402905445, "step": 4608 }, { - "epoch": 64.03, - "learning_rate": 9.679104477611941e-06, - "loss": 0.2774, + "epoch": 16.01, + "learning_rate": 3.419787985865724e-06, + "loss": 0.3, "step": 4610 }, { - "epoch": 64.17, - "learning_rate": 9.64179104477612e-06, - "loss": 0.2688, + "epoch": 16.04, + "learning_rate": 3.418374558303887e-06, + "loss": 0.2691, "step": 4620 }, { - "epoch": 64.3, - "learning_rate": 9.6044776119403e-06, - "loss": 0.2773, + "epoch": 16.08, + "learning_rate": 3.416961130742049e-06, + "loss": 0.2599, "step": 4630 }, { - "epoch": 64.44, - "learning_rate": 9.567164179104478e-06, - "loss": 0.2633, + "epoch": 16.11, + "learning_rate": 3.415547703180212e-06, + "loss": 0.2636, "step": 4640 }, { - "epoch": 64.58, - "learning_rate": 9.529850746268656e-06, - "loss": 0.2735, + "epoch": 16.15, + "learning_rate": 3.4141342756183743e-06, + "loss": 0.2902, "step": 4650 }, { - "epoch": 64.72, - "learning_rate": 9.492537313432837e-06, - "loss": 0.2683, + "epoch": 16.18, + "learning_rate": 3.412720848056537e-06, + "loss": 0.2577, "step": 4660 }, { - "epoch": 64.86, - "learning_rate": 9.455223880597016e-06, - "loss": 0.2719, + "epoch": 16.21, + "learning_rate": 3.4113074204946995e-06, + "loss": 0.2813, "step": 4670 }, { - "epoch": 65.0, - "learning_rate": 9.417910447761193e-06, - "loss": 0.27, - "step": 4680 - }, - { - "epoch": 65.0, - "eval_loss": 0.5026705861091614, - "eval_runtime": 131.4228, - "eval_samples_per_second": 4.048, - "eval_steps_per_second": 0.51, - "eval_wer": 0.19695314006556533, + "epoch": 16.25, + "learning_rate": 3.409893992932862e-06, + "loss": 0.2619, "step": 4680 }, { - "epoch": 65.14, - "learning_rate": 9.380597014925374e-06, - "loss": 0.2786, + "epoch": 16.28, + "learning_rate": 3.4084805653710243e-06, + "loss": 0.2685, "step": 4690 }, { - "epoch": 65.28, - "learning_rate": 9.343283582089553e-06, - "loss": 0.2731, + "epoch": 16.32, + "learning_rate": 3.407067137809187e-06, + "loss": 0.2886, "step": 4700 }, { - "epoch": 65.42, - "learning_rate": 9.30597014925373e-06, - "loss": 0.2707, + "epoch": 16.35, + "learning_rate": 3.4056537102473496e-06, + "loss": 0.2828, "step": 4710 }, { - "epoch": 65.55, - "learning_rate": 9.26865671641791e-06, - "loss": 0.2638, + "epoch": 16.39, + "learning_rate": 3.4042402826855124e-06, + "loss": 0.2643, "step": 4720 }, { - "epoch": 65.69, - "learning_rate": 9.23134328358209e-06, - "loss": 0.2605, + "epoch": 16.42, + "learning_rate": 3.402826855123675e-06, + "loss": 0.2722, "step": 4730 }, { - "epoch": 65.83, - "learning_rate": 9.194029850746268e-06, - "loss": 0.2736, + "epoch": 16.46, + "learning_rate": 3.4014134275618372e-06, + "loss": 0.2868, "step": 4740 }, { - "epoch": 65.97, - "learning_rate": 9.156716417910447e-06, - "loss": 0.257, + "epoch": 16.49, + "learning_rate": 3.3999999999999996e-06, + "loss": 0.2736, "step": 4750 }, { - "epoch": 66.0, - "eval_loss": 0.5016449689865112, - "eval_runtime": 132.0547, - "eval_samples_per_second": 4.029, - "eval_steps_per_second": 0.507, - "eval_wer": 0.19965288937455808, - "step": 4752 - }, - { - "epoch": 66.11, - "learning_rate": 9.119402985074628e-06, - "loss": 0.277, + "epoch": 16.53, + "learning_rate": 3.3985865724381625e-06, + "loss": 0.2888, "step": 4760 }, { - "epoch": 66.25, - "learning_rate": 9.082089552238807e-06, - "loss": 0.2734, + "epoch": 16.56, + "learning_rate": 3.397173144876325e-06, + "loss": 0.2616, "step": 4770 }, { - "epoch": 66.39, - "learning_rate": 9.044776119402985e-06, - "loss": 0.2679, + "epoch": 16.6, + "learning_rate": 3.3957597173144877e-06, + "loss": 0.2736, "step": 4780 }, { - "epoch": 66.53, - "learning_rate": 9.007462686567164e-06, - "loss": 0.2755, + "epoch": 16.63, + "learning_rate": 3.3943462897526497e-06, + "loss": 0.2678, "step": 4790 }, { - "epoch": 66.66, - "learning_rate": 8.970149253731345e-06, - "loss": 0.2686, + "epoch": 16.66, + "learning_rate": 3.3929328621908125e-06, + "loss": 0.2739, "step": 4800 }, { - "epoch": 66.8, - "learning_rate": 8.932835820895522e-06, - "loss": 0.2651, + "epoch": 16.7, + "learning_rate": 3.391519434628975e-06, + "loss": 0.252, "step": 4810 }, { - "epoch": 66.94, - "learning_rate": 8.895522388059702e-06, - "loss": 0.2711, + "epoch": 16.73, + "learning_rate": 3.3901060070671378e-06, + "loss": 0.2913, "step": 4820 }, { - "epoch": 67.0, - "eval_loss": 0.5059924721717834, - "eval_runtime": 131.6036, - "eval_samples_per_second": 4.042, - "eval_steps_per_second": 0.509, - "eval_wer": 0.19714597930192196, - "step": 4824 - }, - { - "epoch": 67.08, - "learning_rate": 8.85820895522388e-06, - "loss": 0.2678, + "epoch": 16.77, + "learning_rate": 3.3886925795053e-06, + "loss": 0.2935, "step": 4830 }, { - "epoch": 67.22, - "learning_rate": 8.82089552238806e-06, - "loss": 0.2676, + "epoch": 16.8, + "learning_rate": 3.387279151943463e-06, + "loss": 0.2672, "step": 4840 }, { - "epoch": 67.36, - "learning_rate": 8.783582089552239e-06, - "loss": 0.2569, + "epoch": 16.84, + "learning_rate": 3.385865724381625e-06, + "loss": 0.2693, "step": 4850 }, { - "epoch": 67.5, - "learning_rate": 8.746268656716418e-06, - "loss": 0.2681, + "epoch": 16.87, + "learning_rate": 3.384452296819788e-06, + "loss": 0.2723, "step": 4860 }, { - "epoch": 67.64, - "learning_rate": 8.708955223880597e-06, - "loss": 0.2664, + "epoch": 16.91, + "learning_rate": 3.3830388692579502e-06, + "loss": 0.2571, "step": 4870 }, { - "epoch": 67.78, - "learning_rate": 8.671641791044776e-06, - "loss": 0.2725, + "epoch": 16.94, + "learning_rate": 3.381625441696113e-06, + "loss": 0.2511, "step": 4880 }, { - "epoch": 67.91, - "learning_rate": 8.634328358208956e-06, - "loss": 0.269, + "epoch": 16.98, + "learning_rate": 3.3802120141342755e-06, + "loss": 0.2766, "step": 4890 }, { - "epoch": 68.0, - "eval_loss": 0.5219683051109314, - "eval_runtime": 131.9262, - "eval_samples_per_second": 4.033, - "eval_steps_per_second": 0.508, - "eval_wer": 0.1983030147200617, + "epoch": 17.0, + "eval_loss": 0.5078305006027222, + "eval_runtime": 129.3828, + "eval_samples_per_second": 4.112, + "eval_steps_per_second": 1.028, + "eval_wer": 0.1998457286109147, "step": 4896 }, { - "epoch": 68.06, - "learning_rate": 8.597014925373135e-06, - "loss": 0.2747, + "epoch": 17.01, + "learning_rate": 3.3787985865724383e-06, + "loss": 0.2968, "step": 4900 }, { - "epoch": 68.19, - "learning_rate": 8.559701492537314e-06, - "loss": 0.2724, + "epoch": 17.05, + "learning_rate": 3.3773851590106003e-06, + "loss": 0.2869, "step": 4910 }, { - "epoch": 68.33, - "learning_rate": 8.522388059701493e-06, - "loss": 0.2773, + "epoch": 17.08, + "learning_rate": 3.375971731448763e-06, + "loss": 0.2671, "step": 4920 }, { - "epoch": 68.47, - "learning_rate": 8.485074626865672e-06, - "loss": 0.282, + "epoch": 17.12, + "learning_rate": 3.3745583038869255e-06, + "loss": 0.2651, "step": 4930 }, { - "epoch": 68.61, - "learning_rate": 8.447761194029851e-06, - "loss": 0.2674, + "epoch": 17.15, + "learning_rate": 3.3731448763250884e-06, + "loss": 0.262, "step": 4940 }, { - "epoch": 68.75, - "learning_rate": 8.41044776119403e-06, - "loss": 0.2611, + "epoch": 17.19, + "learning_rate": 3.371731448763251e-06, + "loss": 0.2579, "step": 4950 }, { - "epoch": 68.89, - "learning_rate": 8.37313432835821e-06, - "loss": 0.2659, + "epoch": 17.22, + "learning_rate": 3.370318021201413e-06, + "loss": 0.2801, "step": 4960 }, { - "epoch": 69.0, - "eval_loss": 0.498529314994812, - "eval_runtime": 132.3204, - "eval_samples_per_second": 4.021, - "eval_steps_per_second": 0.506, - "eval_wer": 0.19856013370187053, - "step": 4968 - }, - { - "epoch": 69.03, - "learning_rate": 8.335820895522387e-06, - "loss": 0.2752, + "epoch": 17.26, + "learning_rate": 3.3689045936395756e-06, + "loss": 0.2667, "step": 4970 }, { - "epoch": 69.17, - "learning_rate": 8.298507462686568e-06, - "loss": 0.2671, + "epoch": 17.29, + "learning_rate": 3.3674911660777384e-06, + "loss": 0.2852, "step": 4980 }, { - "epoch": 69.3, - "learning_rate": 8.261194029850747e-06, - "loss": 0.2704, + "epoch": 17.33, + "learning_rate": 3.366077738515901e-06, + "loss": 0.2515, "step": 4990 }, { - "epoch": 69.44, - "learning_rate": 8.223880597014925e-06, - "loss": 0.265, + "epoch": 17.36, + "learning_rate": 3.3646643109540637e-06, + "loss": 0.2632, "step": 5000 }, { - "epoch": 69.58, - "learning_rate": 8.186567164179104e-06, - "loss": 0.2757, + "epoch": 17.39, + "learning_rate": 3.363250883392226e-06, + "loss": 0.2756, "step": 5010 }, { - "epoch": 69.72, - "learning_rate": 8.149253731343285e-06, - "loss": 0.2688, + "epoch": 17.43, + "learning_rate": 3.3618374558303885e-06, + "loss": 0.2703, "step": 5020 }, { - "epoch": 69.86, - "learning_rate": 8.111940298507462e-06, - "loss": 0.2666, + "epoch": 17.46, + "learning_rate": 3.360424028268551e-06, + "loss": 0.2706, "step": 5030 }, { - "epoch": 70.0, - "learning_rate": 8.074626865671641e-06, - "loss": 0.2669, - "step": 5040 - }, - { - "epoch": 70.0, - "eval_loss": 0.514457643032074, - "eval_runtime": 131.6706, - "eval_samples_per_second": 4.04, - "eval_steps_per_second": 0.509, - "eval_wer": 0.1958603843928778, + "epoch": 17.5, + "learning_rate": 3.3590106007067137e-06, + "loss": 0.3145, "step": 5040 }, { - "epoch": 70.14, - "learning_rate": 8.037313432835822e-06, - "loss": 0.2716, + "epoch": 17.53, + "learning_rate": 3.357597173144876e-06, + "loss": 0.2588, "step": 5050 }, { - "epoch": 70.28, - "learning_rate": 8.000000000000001e-06, - "loss": 0.2729, + "epoch": 17.57, + "learning_rate": 3.356183745583039e-06, + "loss": 0.278, "step": 5060 }, { - "epoch": 70.42, - "learning_rate": 7.962686567164179e-06, - "loss": 0.259, + "epoch": 17.6, + "learning_rate": 3.3547703180212014e-06, + "loss": 0.2612, "step": 5070 }, { - "epoch": 70.55, - "learning_rate": 7.925373134328358e-06, - "loss": 0.2651, + "epoch": 17.64, + "learning_rate": 3.353356890459364e-06, + "loss": 0.2747, "step": 5080 }, { - "epoch": 70.69, - "learning_rate": 7.888059701492539e-06, - "loss": 0.2657, + "epoch": 17.67, + "learning_rate": 3.3519434628975262e-06, + "loss": 0.2839, "step": 5090 }, { - "epoch": 70.83, - "learning_rate": 7.850746268656716e-06, - "loss": 0.2735, + "epoch": 17.71, + "learning_rate": 3.350530035335689e-06, + "loss": 0.3041, "step": 5100 }, { - "epoch": 70.97, - "learning_rate": 7.813432835820895e-06, - "loss": 0.2685, + "epoch": 17.74, + "learning_rate": 3.3491166077738515e-06, + "loss": 0.28, "step": 5110 }, { - "epoch": 71.0, - "eval_loss": 0.5079246163368225, - "eval_runtime": 131.456, - "eval_samples_per_second": 4.047, - "eval_steps_per_second": 0.51, - "eval_wer": 0.19560326541106898, - "step": 5112 - }, - { - "epoch": 71.11, - "learning_rate": 7.776119402985076e-06, - "loss": 0.2732, + "epoch": 17.78, + "learning_rate": 3.3477031802120143e-06, + "loss": 0.2479, "step": 5120 }, { - "epoch": 71.25, - "learning_rate": 7.738805970149254e-06, - "loss": 0.2568, + "epoch": 17.81, + "learning_rate": 3.3462897526501763e-06, + "loss": 0.2859, "step": 5130 }, { - "epoch": 71.39, - "learning_rate": 7.701492537313433e-06, - "loss": 0.2552, + "epoch": 17.85, + "learning_rate": 3.344876325088339e-06, + "loss": 0.2879, "step": 5140 }, { - "epoch": 71.53, - "learning_rate": 7.664179104477612e-06, - "loss": 0.2634, + "epoch": 17.88, + "learning_rate": 3.3434628975265015e-06, + "loss": 0.2668, "step": 5150 }, { - "epoch": 71.66, - "learning_rate": 7.626865671641792e-06, - "loss": 0.2663, + "epoch": 17.91, + "learning_rate": 3.3420494699646644e-06, + "loss": 0.2703, "step": 5160 }, { - "epoch": 71.8, - "learning_rate": 7.58955223880597e-06, - "loss": 0.2679, + "epoch": 17.95, + "learning_rate": 3.3406360424028268e-06, + "loss": 0.2949, "step": 5170 }, { - "epoch": 71.94, - "learning_rate": 7.5522388059701495e-06, - "loss": 0.2669, + "epoch": 17.98, + "learning_rate": 3.3392226148409896e-06, + "loss": 0.2872, "step": 5180 }, { - "epoch": 72.0, - "eval_loss": 0.49233612418174744, - "eval_runtime": 131.3756, - "eval_samples_per_second": 4.049, - "eval_steps_per_second": 0.51, - "eval_wer": 0.19361059330205052, + "epoch": 18.0, + "eval_loss": 0.5114011764526367, + "eval_runtime": 129.1607, + "eval_samples_per_second": 4.119, + "eval_steps_per_second": 1.03, + "eval_wer": 0.19811017548370508, "step": 5184 }, { - "epoch": 72.08, - "learning_rate": 7.514925373134328e-06, - "loss": 0.2722, + "epoch": 18.02, + "learning_rate": 3.3378091872791516e-06, + "loss": 0.2889, "step": 5190 }, { - "epoch": 72.22, - "learning_rate": 7.477611940298508e-06, - "loss": 0.2698, + "epoch": 18.06, + "learning_rate": 3.3363957597173144e-06, + "loss": 0.2601, "step": 5200 }, { - "epoch": 72.36, - "learning_rate": 7.440298507462687e-06, - "loss": 0.2527, + "epoch": 18.09, + "learning_rate": 3.334982332155477e-06, + "loss": 0.2864, "step": 5210 }, { - "epoch": 72.5, - "learning_rate": 7.402985074626865e-06, - "loss": 0.2658, + "epoch": 18.12, + "learning_rate": 3.3335689045936397e-06, + "loss": 0.2753, "step": 5220 }, { - "epoch": 72.64, - "learning_rate": 7.365671641791045e-06, - "loss": 0.2623, + "epoch": 18.16, + "learning_rate": 3.332155477031802e-06, + "loss": 0.298, "step": 5230 }, { - "epoch": 72.78, - "learning_rate": 7.3283582089552245e-06, - "loss": 0.2574, + "epoch": 18.19, + "learning_rate": 3.330742049469965e-06, + "loss": 0.2637, "step": 5240 }, { - "epoch": 72.91, - "learning_rate": 7.291044776119403e-06, - "loss": 0.2586, + "epoch": 18.23, + "learning_rate": 3.329328621908127e-06, + "loss": 0.2674, "step": 5250 }, { - "epoch": 73.0, - "eval_loss": 0.4957040250301361, - "eval_runtime": 131.9056, - "eval_samples_per_second": 4.033, - "eval_steps_per_second": 0.508, - "eval_wer": 0.19528186668380793, - "step": 5256 - }, - { - "epoch": 73.06, - "learning_rate": 7.253731343283582e-06, - "loss": 0.2703, + "epoch": 18.26, + "learning_rate": 3.3279151943462897e-06, + "loss": 0.2606, "step": 5260 }, { - "epoch": 73.19, - "learning_rate": 7.216417910447762e-06, - "loss": 0.2618, + "epoch": 18.3, + "learning_rate": 3.326501766784452e-06, + "loss": 0.2987, "step": 5270 }, { - "epoch": 73.33, - "learning_rate": 7.17910447761194e-06, - "loss": 0.2643, + "epoch": 18.33, + "learning_rate": 3.325088339222615e-06, + "loss": 0.2924, "step": 5280 }, { - "epoch": 73.47, - "learning_rate": 7.1417910447761194e-06, - "loss": 0.2735, + "epoch": 18.37, + "learning_rate": 3.3236749116607774e-06, + "loss": 0.3043, "step": 5290 }, { - "epoch": 73.61, - "learning_rate": 7.1044776119402994e-06, - "loss": 0.2562, + "epoch": 18.4, + "learning_rate": 3.3222614840989398e-06, + "loss": 0.2727, "step": 5300 }, { - "epoch": 73.75, - "learning_rate": 7.067164179104479e-06, - "loss": 0.2597, + "epoch": 18.44, + "learning_rate": 3.320848056537102e-06, + "loss": 0.2463, "step": 5310 }, { - "epoch": 73.89, - "learning_rate": 7.029850746268657e-06, - "loss": 0.2486, + "epoch": 18.47, + "learning_rate": 3.319434628975265e-06, + "loss": 0.3037, "step": 5320 }, { - "epoch": 74.0, - "eval_loss": 0.4974006712436676, - "eval_runtime": 132.0022, - "eval_samples_per_second": 4.03, - "eval_steps_per_second": 0.508, - "eval_wer": 0.19316063508388506, - "step": 5328 - }, - { - "epoch": 74.03, - "learning_rate": 6.992537313432835e-06, - "loss": 0.2732, + "epoch": 18.51, + "learning_rate": 3.3180212014134274e-06, + "loss": 0.2611, "step": 5330 }, { - "epoch": 74.17, - "learning_rate": 6.955223880597016e-06, - "loss": 0.2455, + "epoch": 18.54, + "learning_rate": 3.3166077738515903e-06, + "loss": 0.2597, "step": 5340 }, { - "epoch": 74.3, - "learning_rate": 6.917910447761194e-06, - "loss": 0.2517, + "epoch": 18.57, + "learning_rate": 3.3151943462897527e-06, + "loss": 0.2875, "step": 5350 }, { - "epoch": 74.44, - "learning_rate": 6.8805970149253735e-06, - "loss": 0.2618, + "epoch": 18.61, + "learning_rate": 3.313780918727915e-06, + "loss": 0.2847, "step": 5360 }, { - "epoch": 74.58, - "learning_rate": 6.843283582089552e-06, - "loss": 0.2667, + "epoch": 18.64, + "learning_rate": 3.3123674911660775e-06, + "loss": 0.2741, "step": 5370 }, { - "epoch": 74.72, - "learning_rate": 6.805970149253732e-06, - "loss": 0.2635, + "epoch": 18.68, + "learning_rate": 3.3109540636042403e-06, + "loss": 0.2683, "step": 5380 }, { - "epoch": 74.86, - "learning_rate": 6.768656716417911e-06, - "loss": 0.2667, + "epoch": 18.71, + "learning_rate": 3.3095406360424027e-06, + "loss": 0.2637, "step": 5390 }, { - "epoch": 75.0, - "learning_rate": 6.731343283582089e-06, - "loss": 0.2611, - "step": 5400 - }, - { - "epoch": 75.0, - "eval_loss": 0.5044746398925781, - "eval_runtime": 131.9706, - "eval_samples_per_second": 4.031, - "eval_steps_per_second": 0.508, - "eval_wer": 0.1948961882110947, + "epoch": 18.75, + "learning_rate": 3.3081272084805656e-06, + "loss": 0.2755, "step": 5400 }, { - "epoch": 75.14, - "learning_rate": 6.694029850746269e-06, - "loss": 0.2813, + "epoch": 18.78, + "learning_rate": 3.3067137809187276e-06, + "loss": 0.2604, "step": 5410 }, { - "epoch": 75.28, - "learning_rate": 6.6567164179104485e-06, - "loss": 0.2708, + "epoch": 18.82, + "learning_rate": 3.30530035335689e-06, + "loss": 0.3166, "step": 5420 }, { - "epoch": 75.42, - "learning_rate": 6.619402985074627e-06, - "loss": 0.2558, + "epoch": 18.85, + "learning_rate": 3.303886925795053e-06, + "loss": 0.2882, "step": 5430 }, { - "epoch": 75.55, - "learning_rate": 6.582089552238806e-06, - "loss": 0.2593, + "epoch": 18.89, + "learning_rate": 3.302473498233215e-06, + "loss": 0.2685, "step": 5440 }, { - "epoch": 75.69, - "learning_rate": 6.544776119402986e-06, - "loss": 0.2532, + "epoch": 18.92, + "learning_rate": 3.301060070671378e-06, + "loss": 0.2697, "step": 5450 }, { - "epoch": 75.83, - "learning_rate": 6.507462686567164e-06, - "loss": 0.2601, + "epoch": 18.96, + "learning_rate": 3.2996466431095405e-06, + "loss": 0.2673, "step": 5460 }, { - "epoch": 75.97, - "learning_rate": 6.4701492537313434e-06, - "loss": 0.264, + "epoch": 18.99, + "learning_rate": 3.298233215547703e-06, + "loss": 0.268, "step": 5470 }, { - "epoch": 76.0, - "eval_loss": 0.5025977492332458, - "eval_runtime": 132.0676, - "eval_samples_per_second": 4.028, - "eval_steps_per_second": 0.507, - "eval_wer": 0.1965674615928521, + "epoch": 19.0, + "eval_loss": 0.5078134536743164, + "eval_runtime": 128.8142, + "eval_samples_per_second": 4.13, + "eval_steps_per_second": 1.032, + "eval_wer": 0.19798161599280067, "step": 5472 }, { - "epoch": 76.11, - "learning_rate": 6.4328358208955234e-06, - "loss": 0.256, + "epoch": 19.03, + "learning_rate": 3.2968197879858653e-06, + "loss": 0.2845, "step": 5480 }, { - "epoch": 76.25, - "learning_rate": 6.395522388059702e-06, - "loss": 0.2661, + "epoch": 19.06, + "learning_rate": 3.295406360424028e-06, + "loss": 0.2673, "step": 5490 }, { - "epoch": 76.39, - "learning_rate": 6.358208955223881e-06, - "loss": 0.2603, + "epoch": 19.1, + "learning_rate": 3.2939929328621905e-06, + "loss": 0.2458, "step": 5500 }, { - "epoch": 76.53, - "learning_rate": 6.320895522388059e-06, - "loss": 0.2574, + "epoch": 19.13, + "learning_rate": 3.2925795053003533e-06, + "loss": 0.288, "step": 5510 }, { - "epoch": 76.66, - "learning_rate": 6.283582089552239e-06, - "loss": 0.2572, + "epoch": 19.17, + "learning_rate": 3.2911660777385158e-06, + "loss": 0.2833, "step": 5520 }, { - "epoch": 76.8, - "learning_rate": 6.246268656716418e-06, - "loss": 0.2587, + "epoch": 19.2, + "learning_rate": 3.289752650176678e-06, + "loss": 0.264, "step": 5530 }, { - "epoch": 76.94, - "learning_rate": 6.208955223880597e-06, - "loss": 0.2653, + "epoch": 19.24, + "learning_rate": 3.2883392226148406e-06, + "loss": 0.2782, "step": 5540 }, { - "epoch": 77.0, - "eval_loss": 0.5044174790382385, - "eval_runtime": 133.5324, - "eval_samples_per_second": 3.984, - "eval_steps_per_second": 0.502, - "eval_wer": 0.19361059330205052, - "step": 5544 - }, - { - "epoch": 77.08, - "learning_rate": 6.171641791044777e-06, - "loss": 0.2586, + "epoch": 19.27, + "learning_rate": 3.2869257950530034e-06, + "loss": 0.2702, "step": 5550 }, { - "epoch": 77.22, - "learning_rate": 6.134328358208956e-06, - "loss": 0.2628, + "epoch": 19.3, + "learning_rate": 3.285512367491166e-06, + "loss": 0.2908, "step": 5560 }, { - "epoch": 77.36, - "learning_rate": 6.097014925373134e-06, - "loss": 0.2637, + "epoch": 19.34, + "learning_rate": 3.2840989399293287e-06, + "loss": 0.2852, "step": 5570 }, { - "epoch": 77.5, - "learning_rate": 6.059701492537314e-06, - "loss": 0.2594, + "epoch": 19.37, + "learning_rate": 3.2826855123674906e-06, + "loss": 0.2657, "step": 5580 }, { - "epoch": 77.64, - "learning_rate": 6.0223880597014925e-06, - "loss": 0.2567, + "epoch": 19.41, + "learning_rate": 3.2812720848056535e-06, + "loss": 0.2553, "step": 5590 }, { - "epoch": 77.78, - "learning_rate": 5.9850746268656725e-06, - "loss": 0.2684, + "epoch": 19.44, + "learning_rate": 3.279858657243816e-06, + "loss": 0.2556, "step": 5600 }, { - "epoch": 77.91, - "learning_rate": 5.947761194029851e-06, - "loss": 0.2579, + "epoch": 19.48, + "learning_rate": 3.2784452296819787e-06, + "loss": 0.2677, "step": 5610 }, { - "epoch": 78.0, - "eval_loss": 0.4963833689689636, - "eval_runtime": 131.9034, - "eval_samples_per_second": 4.033, - "eval_steps_per_second": 0.508, - "eval_wer": 0.1966960210837565, - "step": 5616 - }, - { - "epoch": 78.06, - "learning_rate": 5.91044776119403e-06, - "loss": 0.2654, + "epoch": 19.51, + "learning_rate": 3.277031802120141e-06, + "loss": 0.276, "step": 5620 }, { - "epoch": 78.19, - "learning_rate": 5.873134328358209e-06, - "loss": 0.2565, + "epoch": 19.55, + "learning_rate": 3.275618374558304e-06, + "loss": 0.2622, "step": 5630 }, { - "epoch": 78.33, - "learning_rate": 5.835820895522388e-06, - "loss": 0.2647, + "epoch": 19.58, + "learning_rate": 3.274204946996466e-06, + "loss": 0.2778, "step": 5640 }, { - "epoch": 78.47, - "learning_rate": 5.7985074626865674e-06, - "loss": 0.2561, + "epoch": 19.62, + "learning_rate": 3.2727915194346288e-06, + "loss": 0.2744, "step": 5650 }, { - "epoch": 78.61, - "learning_rate": 5.761194029850747e-06, - "loss": 0.2495, + "epoch": 19.65, + "learning_rate": 3.271378091872791e-06, + "loss": 0.287, "step": 5660 }, { - "epoch": 78.75, - "learning_rate": 5.723880597014926e-06, - "loss": 0.2562, + "epoch": 19.69, + "learning_rate": 3.269964664310954e-06, + "loss": 0.2831, "step": 5670 }, { - "epoch": 78.89, - "learning_rate": 5.686567164179105e-06, - "loss": 0.26, + "epoch": 19.72, + "learning_rate": 3.2685512367491164e-06, + "loss": 0.256, "step": 5680 }, { - "epoch": 79.0, - "eval_loss": 0.4918227195739746, - "eval_runtime": 132.2622, - "eval_samples_per_second": 4.022, - "eval_steps_per_second": 0.507, - "eval_wer": 0.19373915279295495, - "step": 5688 + "epoch": 19.75, + "learning_rate": 3.2671378091872793e-06, + "loss": 0.2609, + "step": 5690 }, { - "epoch": 79.03, - "learning_rate": 5.649253731343284e-06, - "loss": 0.269, - "step": 5690 + "epoch": 19.79, + "learning_rate": 3.2657243816254412e-06, + "loss": 0.2601, + "step": 5700 }, { - "epoch": 79.17, - "learning_rate": 5.611940298507462e-06, - "loss": 0.2585, - "step": 5700 - }, - { - "epoch": 79.3, - "learning_rate": 5.574626865671642e-06, - "loss": 0.2609, + "epoch": 19.82, + "learning_rate": 3.264310954063604e-06, + "loss": 0.2834, "step": 5710 }, { - "epoch": 79.44, - "learning_rate": 5.537313432835821e-06, - "loss": 0.256, + "epoch": 19.86, + "learning_rate": 3.2628975265017665e-06, + "loss": 0.2889, "step": 5720 }, { - "epoch": 79.58, - "learning_rate": 5.500000000000001e-06, - "loss": 0.2615, + "epoch": 19.89, + "learning_rate": 3.2614840989399293e-06, + "loss": 0.2617, "step": 5730 }, { - "epoch": 79.72, - "learning_rate": 5.46268656716418e-06, - "loss": 0.2626, + "epoch": 19.93, + "learning_rate": 3.2600706713780917e-06, + "loss": 0.2747, "step": 5740 }, { - "epoch": 79.86, - "learning_rate": 5.425373134328358e-06, - "loss": 0.2545, + "epoch": 19.96, + "learning_rate": 3.258657243816254e-06, + "loss": 0.2867, "step": 5750 }, { - "epoch": 80.0, - "learning_rate": 5.388059701492538e-06, - "loss": 0.2634, + "epoch": 20.0, + "learning_rate": 3.2572438162544166e-06, + "loss": 0.2631, "step": 5760 }, { - "epoch": 80.0, - "eval_loss": 0.4841861128807068, - "eval_runtime": 131.8698, - "eval_samples_per_second": 4.034, - "eval_steps_per_second": 0.508, - "eval_wer": 0.19277495661117183, + "epoch": 20.0, + "eval_loss": 0.5262243747711182, + "eval_runtime": 129.2103, + "eval_samples_per_second": 4.117, + "eval_steps_per_second": 1.029, + "eval_wer": 0.20209551970174197, "step": 5760 }, { - "epoch": 80.14, - "learning_rate": 5.3507462686567165e-06, - "loss": 0.2575, + "epoch": 20.03, + "learning_rate": 3.2558303886925794e-06, + "loss": 0.2689, "step": 5770 }, { - "epoch": 80.28, - "learning_rate": 5.313432835820896e-06, - "loss": 0.2567, + "epoch": 20.07, + "learning_rate": 3.254416961130742e-06, + "loss": 0.2906, "step": 5780 }, { - "epoch": 80.42, - "learning_rate": 5.276119402985075e-06, - "loss": 0.2599, + "epoch": 20.1, + "learning_rate": 3.2530035335689046e-06, + "loss": 0.2586, "step": 5790 }, { - "epoch": 80.55, - "learning_rate": 5.238805970149254e-06, - "loss": 0.246, + "epoch": 20.14, + "learning_rate": 3.251590106007067e-06, + "loss": 0.2732, "step": 5800 }, { - "epoch": 80.69, - "learning_rate": 5.201492537313433e-06, - "loss": 0.2546, + "epoch": 20.17, + "learning_rate": 3.2501766784452294e-06, + "loss": 0.2528, "step": 5810 }, { - "epoch": 80.83, - "learning_rate": 5.164179104477612e-06, - "loss": 0.2675, + "epoch": 20.21, + "learning_rate": 3.248763250883392e-06, + "loss": 0.26, "step": 5820 }, { - "epoch": 80.97, - "learning_rate": 5.1268656716417914e-06, - "loss": 0.2598, + "epoch": 20.24, + "learning_rate": 3.2473498233215547e-06, + "loss": 0.279, "step": 5830 }, { - "epoch": 81.0, - "eval_loss": 0.5017235279083252, - "eval_runtime": 132.1658, - "eval_samples_per_second": 4.025, - "eval_steps_per_second": 0.507, - "eval_wer": 0.19463906922928584, - "step": 5832 - }, - { - "epoch": 81.11, - "learning_rate": 5.089552238805971e-06, - "loss": 0.2551, + "epoch": 20.28, + "learning_rate": 3.245936395759717e-06, + "loss": 0.2506, "step": 5840 }, { - "epoch": 81.25, - "learning_rate": 5.05223880597015e-06, - "loss": 0.2648, + "epoch": 20.31, + "learning_rate": 3.24452296819788e-06, + "loss": 0.2886, "step": 5850 }, { - "epoch": 81.39, - "learning_rate": 5.014925373134328e-06, - "loss": 0.2447, + "epoch": 20.35, + "learning_rate": 3.2431095406360423e-06, + "loss": 0.2779, "step": 5860 }, { - "epoch": 81.53, - "learning_rate": 4.977611940298508e-06, - "loss": 0.2561, + "epoch": 20.38, + "learning_rate": 3.2416961130742048e-06, + "loss": 0.2731, "step": 5870 }, { - "epoch": 81.66, - "learning_rate": 4.940298507462686e-06, - "loss": 0.261, + "epoch": 20.42, + "learning_rate": 3.240282685512367e-06, + "loss": 0.2575, "step": 5880 }, { - "epoch": 81.8, - "learning_rate": 4.902985074626866e-06, - "loss": 0.2653, + "epoch": 20.45, + "learning_rate": 3.23886925795053e-06, + "loss": 0.2671, "step": 5890 }, { - "epoch": 81.94, - "learning_rate": 4.865671641791045e-06, - "loss": 0.2571, + "epoch": 20.48, + "learning_rate": 3.2374558303886924e-06, + "loss": 0.2901, "step": 5900 }, { - "epoch": 82.0, - "eval_loss": 0.4997570514678955, - "eval_runtime": 131.7552, - "eval_samples_per_second": 4.038, - "eval_steps_per_second": 0.509, - "eval_wer": 0.1983672944655139, - "step": 5904 - }, - { - "epoch": 82.08, - "learning_rate": 4.828358208955224e-06, - "loss": 0.2628, + "epoch": 20.52, + "learning_rate": 3.2360424028268552e-06, + "loss": 0.2778, "step": 5910 }, { - "epoch": 82.22, - "learning_rate": 4.791044776119404e-06, - "loss": 0.2625, + "epoch": 20.55, + "learning_rate": 3.2346289752650172e-06, + "loss": 0.2629, "step": 5920 }, { - "epoch": 82.36, - "learning_rate": 4.753731343283582e-06, - "loss": 0.2396, + "epoch": 20.59, + "learning_rate": 3.23321554770318e-06, + "loss": 0.2539, "step": 5930 }, { - "epoch": 82.5, - "learning_rate": 4.716417910447761e-06, - "loss": 0.2698, + "epoch": 20.62, + "learning_rate": 3.2318021201413425e-06, + "loss": 0.2697, "step": 5940 }, { - "epoch": 82.64, - "learning_rate": 4.6791044776119405e-06, - "loss": 0.2571, + "epoch": 20.66, + "learning_rate": 3.2303886925795053e-06, + "loss": 0.279, "step": 5950 }, { - "epoch": 82.78, - "learning_rate": 4.64179104477612e-06, - "loss": 0.2592, + "epoch": 20.69, + "learning_rate": 3.2289752650176677e-06, + "loss": 0.2869, "step": 5960 }, { - "epoch": 82.91, - "learning_rate": 4.604477611940299e-06, - "loss": 0.2564, + "epoch": 20.73, + "learning_rate": 3.2275618374558305e-06, + "loss": 0.2761, "step": 5970 }, { - "epoch": 83.0, - "eval_loss": 0.4961981475353241, - "eval_runtime": 132.3751, - "eval_samples_per_second": 4.019, - "eval_steps_per_second": 0.506, - "eval_wer": 0.19393199202931155, - "step": 5976 - }, - { - "epoch": 83.06, - "learning_rate": 4.567164179104478e-06, - "loss": 0.2661, + "epoch": 20.76, + "learning_rate": 3.2261484098939925e-06, + "loss": 0.2775, "step": 5980 }, { - "epoch": 83.19, - "learning_rate": 4.529850746268656e-06, - "loss": 0.2602, + "epoch": 20.8, + "learning_rate": 3.2247349823321554e-06, + "loss": 0.2639, "step": 5990 }, { - "epoch": 83.33, - "learning_rate": 4.492537313432836e-06, - "loss": 0.2515, + "epoch": 20.83, + "learning_rate": 3.2233215547703178e-06, + "loss": 0.2925, "step": 6000 }, { - "epoch": 83.47, - "learning_rate": 4.4552238805970154e-06, - "loss": 0.2607, + "epoch": 20.87, + "learning_rate": 3.2219081272084806e-06, + "loss": 0.2851, "step": 6010 }, { - "epoch": 83.61, - "learning_rate": 4.417910447761195e-06, - "loss": 0.2457, + "epoch": 20.9, + "learning_rate": 3.220494699646643e-06, + "loss": 0.2682, "step": 6020 }, { - "epoch": 83.75, - "learning_rate": 4.380597014925374e-06, - "loss": 0.2613, + "epoch": 20.94, + "learning_rate": 3.2190812720848054e-06, + "loss": 0.2541, "step": 6030 }, { - "epoch": 83.89, - "learning_rate": 4.343283582089552e-06, - "loss": 0.2606, + "epoch": 20.97, + "learning_rate": 3.217667844522968e-06, + "loss": 0.2753, "step": 6040 }, { - "epoch": 84.0, - "eval_loss": 0.49531611800193787, - "eval_runtime": 131.4182, - "eval_samples_per_second": 4.048, - "eval_steps_per_second": 0.51, - "eval_wer": 0.19155364144757986, + "epoch": 21.0, + "eval_loss": 0.5161154866218567, + "eval_runtime": 128.857, + "eval_samples_per_second": 4.129, + "eval_steps_per_second": 1.032, + "eval_wer": 0.19913865141094042, "step": 6048 }, { - "epoch": 84.03, - "learning_rate": 4.305970149253732e-06, - "loss": 0.2655, + "epoch": 21.01, + "learning_rate": 3.2162544169611307e-06, + "loss": 0.296, "step": 6050 }, { - "epoch": 84.17, - "learning_rate": 4.26865671641791e-06, - "loss": 0.2488, + "epoch": 21.04, + "learning_rate": 3.214840989399293e-06, + "loss": 0.2774, "step": 6060 }, { - "epoch": 84.3, - "learning_rate": 4.2313432835820895e-06, - "loss": 0.258, + "epoch": 21.08, + "learning_rate": 3.213427561837456e-06, + "loss": 0.2601, "step": 6070 }, { - "epoch": 84.44, - "learning_rate": 4.194029850746269e-06, - "loss": 0.2644, + "epoch": 21.11, + "learning_rate": 3.2120141342756183e-06, + "loss": 0.2738, "step": 6080 }, { - "epoch": 84.58, - "learning_rate": 4.156716417910448e-06, - "loss": 0.2573, + "epoch": 21.15, + "learning_rate": 3.2106007067137807e-06, + "loss": 0.2756, "step": 6090 }, { - "epoch": 84.72, - "learning_rate": 4.119402985074627e-06, - "loss": 0.243, + "epoch": 21.18, + "learning_rate": 3.209187279151943e-06, + "loss": 0.2851, "step": 6100 }, { - "epoch": 84.86, - "learning_rate": 4.082089552238806e-06, - "loss": 0.2581, + "epoch": 21.21, + "learning_rate": 3.207773851590106e-06, + "loss": 0.2786, "step": 6110 }, { - "epoch": 85.0, - "learning_rate": 4.044776119402985e-06, - "loss": 0.2587, - "step": 6120 - }, - { - "epoch": 85.0, - "eval_loss": 0.4982677400112152, - "eval_runtime": 132.0294, - "eval_samples_per_second": 4.029, - "eval_steps_per_second": 0.507, - "eval_wer": 0.19463906922928584, + "epoch": 21.25, + "learning_rate": 3.2063604240282684e-06, + "loss": 0.2685, "step": 6120 }, { - "epoch": 85.14, - "learning_rate": 4.0074626865671645e-06, - "loss": 0.2455, + "epoch": 21.28, + "learning_rate": 3.204946996466431e-06, + "loss": 0.2652, "step": 6130 }, { - "epoch": 85.28, - "learning_rate": 3.970149253731344e-06, - "loss": 0.2532, + "epoch": 21.32, + "learning_rate": 3.2035335689045936e-06, + "loss": 0.278, "step": 6140 }, { - "epoch": 85.42, - "learning_rate": 3.932835820895522e-06, - "loss": 0.2608, + "epoch": 21.35, + "learning_rate": 3.202120141342756e-06, + "loss": 0.2855, "step": 6150 }, { - "epoch": 85.55, - "learning_rate": 3.895522388059702e-06, - "loss": 0.2604, + "epoch": 21.39, + "learning_rate": 3.2007067137809184e-06, + "loss": 0.2757, "step": 6160 }, { - "epoch": 85.69, - "learning_rate": 3.85820895522388e-06, - "loss": 0.2489, + "epoch": 21.42, + "learning_rate": 3.1992932862190813e-06, + "loss": 0.2702, "step": 6170 }, { - "epoch": 85.83, - "learning_rate": 3.82089552238806e-06, - "loss": 0.2594, + "epoch": 21.46, + "learning_rate": 3.1978798586572437e-06, + "loss": 0.2765, "step": 6180 }, { - "epoch": 85.97, - "learning_rate": 3.7835820895522394e-06, - "loss": 0.2499, + "epoch": 21.49, + "learning_rate": 3.1964664310954065e-06, + "loss": 0.2616, "step": 6190 }, { - "epoch": 86.0, - "eval_loss": 0.5027219653129578, - "eval_runtime": 131.6359, - "eval_samples_per_second": 4.041, - "eval_steps_per_second": 0.509, - "eval_wer": 0.19534614642926015, - "step": 6192 - }, - { - "epoch": 86.11, - "learning_rate": 3.746268656716418e-06, - "loss": 0.2499, + "epoch": 21.53, + "learning_rate": 3.1950530035335685e-06, + "loss": 0.2795, "step": 6200 }, { - "epoch": 86.25, - "learning_rate": 3.7089552238805973e-06, - "loss": 0.2627, + "epoch": 21.56, + "learning_rate": 3.1936395759717313e-06, + "loss": 0.2716, "step": 6210 }, { - "epoch": 86.39, - "learning_rate": 3.671641791044776e-06, - "loss": 0.2471, + "epoch": 21.6, + "learning_rate": 3.1922261484098937e-06, + "loss": 0.2697, "step": 6220 }, { - "epoch": 86.53, - "learning_rate": 3.6343283582089557e-06, - "loss": 0.2538, + "epoch": 21.63, + "learning_rate": 3.1908127208480566e-06, + "loss": 0.2416, "step": 6230 }, { - "epoch": 86.66, - "learning_rate": 3.5970149253731344e-06, - "loss": 0.2432, + "epoch": 21.66, + "learning_rate": 3.189399293286219e-06, + "loss": 0.2782, "step": 6240 }, { - "epoch": 86.8, - "learning_rate": 3.5597014925373135e-06, - "loss": 0.2625, + "epoch": 21.7, + "learning_rate": 3.187985865724382e-06, + "loss": 0.2617, "step": 6250 }, { - "epoch": 86.94, - "learning_rate": 3.5223880597014923e-06, - "loss": 0.253, + "epoch": 21.73, + "learning_rate": 3.186572438162544e-06, + "loss": 0.2701, "step": 6260 }, { - "epoch": 87.0, - "eval_loss": 0.5000377297401428, - "eval_runtime": 132.268, - "eval_samples_per_second": 4.022, - "eval_steps_per_second": 0.507, - "eval_wer": 0.19515330719290352, - "step": 6264 - }, - { - "epoch": 87.08, - "learning_rate": 3.485074626865672e-06, - "loss": 0.2605, + "epoch": 21.77, + "learning_rate": 3.1851590106007066e-06, + "loss": 0.2894, "step": 6270 }, { - "epoch": 87.22, - "learning_rate": 3.4477611940298506e-06, - "loss": 0.2625, + "epoch": 21.8, + "learning_rate": 3.183745583038869e-06, + "loss": 0.2634, "step": 6280 }, { - "epoch": 87.36, - "learning_rate": 3.41044776119403e-06, - "loss": 0.2449, + "epoch": 21.84, + "learning_rate": 3.182332155477032e-06, + "loss": 0.2928, "step": 6290 }, { - "epoch": 87.5, - "learning_rate": 3.3731343283582093e-06, - "loss": 0.2529, + "epoch": 21.87, + "learning_rate": 3.1809187279151943e-06, + "loss": 0.2425, "step": 6300 }, { - "epoch": 87.64, - "learning_rate": 3.335820895522388e-06, - "loss": 0.2388, + "epoch": 21.91, + "learning_rate": 3.179505300353357e-06, + "loss": 0.272, "step": 6310 }, { - "epoch": 87.78, - "learning_rate": 3.2985074626865677e-06, - "loss": 0.2504, + "epoch": 21.94, + "learning_rate": 3.178091872791519e-06, + "loss": 0.2818, "step": 6320 }, { - "epoch": 87.91, - "learning_rate": 3.2611940298507464e-06, - "loss": 0.2614, + "epoch": 21.98, + "learning_rate": 3.176678445229682e-06, + "loss": 0.2797, "step": 6330 }, { - "epoch": 88.0, - "eval_loss": 0.4974157512187958, - "eval_runtime": 132.0096, - "eval_samples_per_second": 4.03, - "eval_steps_per_second": 0.508, - "eval_wer": 0.19354631355659832, + "epoch": 22.0, + "eval_loss": 0.5096527338027954, + "eval_runtime": 129.6264, + "eval_samples_per_second": 4.104, + "eval_steps_per_second": 1.026, + "eval_wer": 0.20093848428360223, "step": 6336 }, { - "epoch": 88.06, - "learning_rate": 3.2238805970149255e-06, - "loss": 0.2682, + "epoch": 22.01, + "learning_rate": 3.1752650176678444e-06, + "loss": 0.3083, "step": 6340 }, { - "epoch": 88.19, - "learning_rate": 3.1865671641791043e-06, - "loss": 0.2494, + "epoch": 22.05, + "learning_rate": 3.173851590106007e-06, + "loss": 0.2683, "step": 6350 }, { - "epoch": 88.33, - "learning_rate": 3.149253731343284e-06, - "loss": 0.2554, + "epoch": 22.08, + "learning_rate": 3.1724381625441696e-06, + "loss": 0.2614, "step": 6360 }, { - "epoch": 88.47, - "learning_rate": 3.111940298507463e-06, - "loss": 0.2546, + "epoch": 22.12, + "learning_rate": 3.171024734982332e-06, + "loss": 0.2664, "step": 6370 }, { - "epoch": 88.61, - "learning_rate": 3.0746268656716418e-06, - "loss": 0.2447, + "epoch": 22.15, + "learning_rate": 3.1696113074204944e-06, + "loss": 0.2813, "step": 6380 }, { - "epoch": 88.75, - "learning_rate": 3.037313432835821e-06, - "loss": 0.257, + "epoch": 22.19, + "learning_rate": 3.1681978798586572e-06, + "loss": 0.2609, "step": 6390 }, { - "epoch": 88.89, - "learning_rate": 3e-06, - "loss": 0.2533, + "epoch": 22.22, + "learning_rate": 3.1667844522968197e-06, + "loss": 0.2811, "step": 6400 }, { - "epoch": 89.0, - "eval_loss": 0.4969758987426758, - "eval_runtime": 132.51, - "eval_samples_per_second": 4.015, - "eval_steps_per_second": 0.506, - "eval_wer": 0.1948961882110947, - "step": 6408 - }, - { - "epoch": 89.03, - "learning_rate": 2.9626865671641792e-06, - "loss": 0.2591, + "epoch": 22.26, + "learning_rate": 3.1653710247349825e-06, + "loss": 0.2664, "step": 6410 }, { - "epoch": 89.17, - "learning_rate": 2.9253731343283584e-06, - "loss": 0.2604, + "epoch": 22.29, + "learning_rate": 3.163957597173145e-06, + "loss": 0.3003, "step": 6420 }, { - "epoch": 89.3, - "learning_rate": 2.8880597014925376e-06, - "loss": 0.2445, + "epoch": 22.33, + "learning_rate": 3.1625441696113073e-06, + "loss": 0.2665, "step": 6430 }, { - "epoch": 89.44, - "learning_rate": 2.8507462686567167e-06, - "loss": 0.2494, + "epoch": 22.36, + "learning_rate": 3.1611307420494697e-06, + "loss": 0.2603, "step": 6440 }, { - "epoch": 89.58, - "learning_rate": 2.813432835820896e-06, - "loss": 0.255, + "epoch": 22.39, + "learning_rate": 3.1597173144876326e-06, + "loss": 0.2702, "step": 6450 }, { - "epoch": 89.72, - "learning_rate": 2.7761194029850746e-06, - "loss": 0.2512, + "epoch": 22.43, + "learning_rate": 3.158303886925795e-06, + "loss": 0.2403, "step": 6460 }, { - "epoch": 89.86, - "learning_rate": 2.7388059701492538e-06, - "loss": 0.253, + "epoch": 22.46, + "learning_rate": 3.156890459363958e-06, + "loss": 0.272, "step": 6470 }, { - "epoch": 90.0, - "learning_rate": 2.701492537313433e-06, - "loss": 0.2553, - "step": 6480 - }, - { - "epoch": 90.0, - "eval_loss": 0.5005418658256531, - "eval_runtime": 131.5872, - "eval_samples_per_second": 4.043, - "eval_steps_per_second": 0.509, - "eval_wer": 0.19296779584752843, + "epoch": 22.5, + "learning_rate": 3.15547703180212e-06, + "loss": 0.308, "step": 6480 }, { - "epoch": 90.14, - "learning_rate": 2.664179104477612e-06, - "loss": 0.2521, + "epoch": 22.53, + "learning_rate": 3.154063604240282e-06, + "loss": 0.275, "step": 6490 }, { - "epoch": 90.28, - "learning_rate": 2.626865671641791e-06, - "loss": 0.2599, + "epoch": 22.57, + "learning_rate": 3.152650176678445e-06, + "loss": 0.2824, "step": 6500 }, { - "epoch": 90.42, - "learning_rate": 2.5895522388059704e-06, - "loss": 0.256, + "epoch": 22.6, + "learning_rate": 3.1512367491166074e-06, + "loss": 0.2734, "step": 6510 }, { - "epoch": 90.55, - "learning_rate": 2.5522388059701496e-06, - "loss": 0.2559, + "epoch": 22.64, + "learning_rate": 3.1498233215547703e-06, + "loss": 0.2686, "step": 6520 }, { - "epoch": 90.69, - "learning_rate": 2.5149253731343287e-06, - "loss": 0.2507, + "epoch": 22.67, + "learning_rate": 3.148409893992933e-06, + "loss": 0.2826, "step": 6530 }, { - "epoch": 90.83, - "learning_rate": 2.4776119402985074e-06, - "loss": 0.2525, + "epoch": 22.71, + "learning_rate": 3.146996466431095e-06, + "loss": 0.2878, "step": 6540 }, { - "epoch": 90.97, - "learning_rate": 2.4402985074626866e-06, - "loss": 0.2518, + "epoch": 22.74, + "learning_rate": 3.1455830388692575e-06, + "loss": 0.2793, "step": 6550 }, { - "epoch": 91.0, - "eval_loss": 0.5009539127349854, - "eval_runtime": 131.4903, - "eval_samples_per_second": 4.046, - "eval_steps_per_second": 0.51, - "eval_wer": 0.1948961882110947, - "step": 6552 - }, - { - "epoch": 91.11, - "learning_rate": 2.4029850746268658e-06, - "loss": 0.2618, + "epoch": 22.78, + "learning_rate": 3.1441696113074203e-06, + "loss": 0.2574, "step": 6560 }, { - "epoch": 91.25, - "learning_rate": 2.365671641791045e-06, - "loss": 0.2592, + "epoch": 22.81, + "learning_rate": 3.1427561837455827e-06, + "loss": 0.2733, "step": 6570 }, { - "epoch": 91.39, - "learning_rate": 2.328358208955224e-06, - "loss": 0.2505, + "epoch": 22.85, + "learning_rate": 3.1413427561837456e-06, + "loss": 0.2887, "step": 6580 }, { - "epoch": 91.53, - "learning_rate": 2.291044776119403e-06, - "loss": 0.2539, + "epoch": 22.88, + "learning_rate": 3.139929328621908e-06, + "loss": 0.2801, "step": 6590 }, { - "epoch": 91.66, - "learning_rate": 2.2537313432835824e-06, - "loss": 0.249, + "epoch": 22.91, + "learning_rate": 3.1385159010600704e-06, + "loss": 0.2739, "step": 6600 }, { - "epoch": 91.8, - "learning_rate": 2.2164179104477616e-06, - "loss": 0.2428, + "epoch": 22.95, + "learning_rate": 3.137102473498233e-06, + "loss": 0.2622, "step": 6610 }, { - "epoch": 91.94, - "learning_rate": 2.1791044776119403e-06, - "loss": 0.2481, + "epoch": 22.98, + "learning_rate": 3.1356890459363956e-06, + "loss": 0.2667, "step": 6620 }, { - "epoch": 92.0, - "eval_loss": 0.4958493113517761, - "eval_runtime": 131.9046, - "eval_samples_per_second": 4.033, - "eval_steps_per_second": 0.508, - "eval_wer": 0.1918107604293887, + "epoch": 23.0, + "eval_loss": 0.5130947828292847, + "eval_runtime": 130.2324, + "eval_samples_per_second": 4.085, + "eval_steps_per_second": 1.021, + "eval_wer": 0.19952432988365365, "step": 6624 }, { - "epoch": 92.08, - "learning_rate": 2.1417910447761194e-06, + "epoch": 23.02, + "learning_rate": 3.134275618374558e-06, "loss": 0.2649, "step": 6630 }, { - "epoch": 92.22, - "learning_rate": 2.1044776119402986e-06, - "loss": 0.2549, + "epoch": 23.06, + "learning_rate": 3.132862190812721e-06, + "loss": 0.2847, "step": 6640 }, { - "epoch": 92.36, - "learning_rate": 2.0671641791044778e-06, - "loss": 0.2425, + "epoch": 23.09, + "learning_rate": 3.131448763250883e-06, + "loss": 0.2679, "step": 6650 }, { - "epoch": 92.5, - "learning_rate": 2.029850746268657e-06, - "loss": 0.2598, + "epoch": 23.12, + "learning_rate": 3.1300353356890457e-06, + "loss": 0.284, "step": 6660 }, { - "epoch": 92.64, - "learning_rate": 1.9925373134328357e-06, - "loss": 0.2429, + "epoch": 23.16, + "learning_rate": 3.128621908127208e-06, + "loss": 0.2729, "step": 6670 }, { - "epoch": 92.78, - "learning_rate": 1.955223880597015e-06, - "loss": 0.2596, + "epoch": 23.19, + "learning_rate": 3.127208480565371e-06, + "loss": 0.2708, "step": 6680 }, { - "epoch": 92.91, - "learning_rate": 1.9179104477611944e-06, - "loss": 0.2491, + "epoch": 23.23, + "learning_rate": 3.1257950530035333e-06, + "loss": 0.2851, "step": 6690 }, { - "epoch": 93.0, - "eval_loss": 0.4932185709476471, - "eval_runtime": 131.4467, - "eval_samples_per_second": 4.047, - "eval_steps_per_second": 0.51, - "eval_wer": 0.1909108439930578, - "step": 6696 - }, - { - "epoch": 93.06, - "learning_rate": 1.8805970149253733e-06, - "loss": 0.2682, + "epoch": 23.26, + "learning_rate": 3.124381625441696e-06, + "loss": 0.262, "step": 6700 }, { - "epoch": 93.19, - "learning_rate": 1.8432835820895525e-06, - "loss": 0.2455, + "epoch": 23.3, + "learning_rate": 3.122968197879858e-06, + "loss": 0.2997, "step": 6710 }, { - "epoch": 93.33, - "learning_rate": 1.8059701492537314e-06, - "loss": 0.2456, + "epoch": 23.33, + "learning_rate": 3.121554770318021e-06, + "loss": 0.2653, "step": 6720 }, { - "epoch": 93.47, - "learning_rate": 1.7686567164179106e-06, - "loss": 0.2493, + "epoch": 23.37, + "learning_rate": 3.1201413427561834e-06, + "loss": 0.2544, "step": 6730 }, { - "epoch": 93.61, - "learning_rate": 1.7313432835820896e-06, - "loss": 0.2526, + "epoch": 23.4, + "learning_rate": 3.1187279151943462e-06, + "loss": 0.2888, "step": 6740 }, { - "epoch": 93.75, - "learning_rate": 1.6940298507462687e-06, - "loss": 0.2599, + "epoch": 23.44, + "learning_rate": 3.1173144876325086e-06, + "loss": 0.2837, "step": 6750 }, { - "epoch": 93.89, - "learning_rate": 1.6567164179104477e-06, - "loss": 0.2455, + "epoch": 23.47, + "learning_rate": 3.1159010600706715e-06, + "loss": 0.2824, "step": 6760 }, { - "epoch": 94.0, - "eval_loss": 0.493074506521225, - "eval_runtime": 131.6855, - "eval_samples_per_second": 4.04, - "eval_steps_per_second": 0.509, - "eval_wer": 0.19123224272031883, - "step": 6768 - }, - { - "epoch": 94.03, - "learning_rate": 1.6194029850746268e-06, - "loss": 0.2531, + "epoch": 23.51, + "learning_rate": 3.1144876325088335e-06, + "loss": 0.3101, "step": 6770 }, { - "epoch": 94.17, - "learning_rate": 1.5820895522388062e-06, - "loss": 0.2513, + "epoch": 23.54, + "learning_rate": 3.1130742049469963e-06, + "loss": 0.2965, "step": 6780 }, { - "epoch": 94.3, - "learning_rate": 1.5447761194029851e-06, - "loss": 0.2534, + "epoch": 23.57, + "learning_rate": 3.1116607773851587e-06, + "loss": 0.2739, "step": 6790 }, { - "epoch": 94.44, - "learning_rate": 1.5111940298507464e-06, - "loss": 0.2418, + "epoch": 23.61, + "learning_rate": 3.1102473498233215e-06, + "loss": 0.2697, "step": 6800 }, { - "epoch": 94.58, - "learning_rate": 1.4738805970149254e-06, - "loss": 0.2407, + "epoch": 23.64, + "learning_rate": 3.108833922261484e-06, + "loss": 0.2837, "step": 6810 }, { - "epoch": 94.72, - "learning_rate": 1.4365671641791045e-06, - "loss": 0.251, + "epoch": 23.68, + "learning_rate": 3.1074204946996464e-06, + "loss": 0.277, "step": 6820 }, { - "epoch": 94.86, - "learning_rate": 1.3992537313432837e-06, - "loss": 0.2494, + "epoch": 23.71, + "learning_rate": 3.1060070671378088e-06, + "loss": 0.2887, "step": 6830 }, { - "epoch": 95.0, - "learning_rate": 1.3619402985074628e-06, - "loss": 0.2581, - "step": 6840 - }, - { - "epoch": 95.0, - "eval_loss": 0.49741461873054504, - "eval_runtime": 132.2805, - "eval_samples_per_second": 4.022, - "eval_steps_per_second": 0.506, - "eval_wer": 0.19148936170212766, + "epoch": 23.75, + "learning_rate": 3.1045936395759716e-06, + "loss": 0.2765, "step": 6840 }, { - "epoch": 95.14, - "learning_rate": 1.3246268656716418e-06, - "loss": 0.2415, + "epoch": 23.78, + "learning_rate": 3.103180212014134e-06, + "loss": 0.2468, "step": 6850 }, { - "epoch": 95.28, - "learning_rate": 1.287313432835821e-06, - "loss": 0.2474, + "epoch": 23.82, + "learning_rate": 3.101766784452297e-06, + "loss": 0.2786, "step": 6860 }, { - "epoch": 95.42, - "learning_rate": 1.25e-06, - "loss": 0.2488, + "epoch": 23.85, + "learning_rate": 3.1003533568904593e-06, + "loss": 0.2561, "step": 6870 }, { - "epoch": 95.55, - "learning_rate": 1.2126865671641793e-06, - "loss": 0.2566, + "epoch": 23.89, + "learning_rate": 3.0989399293286217e-06, + "loss": 0.2494, "step": 6880 }, { - "epoch": 95.69, - "learning_rate": 1.1753731343283582e-06, - "loss": 0.2457, + "epoch": 23.92, + "learning_rate": 3.097526501766784e-06, + "loss": 0.2619, "step": 6890 }, { - "epoch": 95.83, - "learning_rate": 1.1380597014925374e-06, - "loss": 0.2489, + "epoch": 23.96, + "learning_rate": 3.096113074204947e-06, + "loss": 0.2629, "step": 6900 }, { - "epoch": 95.97, - "learning_rate": 1.1007462686567163e-06, - "loss": 0.2578, + "epoch": 23.99, + "learning_rate": 3.0946996466431093e-06, + "loss": 0.2722, "step": 6910 }, { - "epoch": 96.0, - "eval_loss": 0.4990382492542267, - "eval_runtime": 131.6402, - "eval_samples_per_second": 4.041, - "eval_steps_per_second": 0.509, - "eval_wer": 0.1909108439930578, + "epoch": 24.0, + "eval_loss": 0.5097522735595703, + "eval_runtime": 129.544, + "eval_samples_per_second": 4.107, + "eval_steps_per_second": 1.027, + "eval_wer": 0.199010091920036, "step": 6912 }, { - "epoch": 96.11, - "learning_rate": 1.0634328358208957e-06, - "loss": 0.2528, + "epoch": 24.03, + "learning_rate": 3.093286219081272e-06, + "loss": 0.2714, "step": 6920 }, { - "epoch": 96.25, - "learning_rate": 1.0261194029850746e-06, - "loss": 0.2517, + "epoch": 24.06, + "learning_rate": 3.0918727915194346e-06, + "loss": 0.2682, "step": 6930 }, { - "epoch": 96.39, - "learning_rate": 9.888059701492538e-07, - "loss": 0.2358, + "epoch": 24.1, + "learning_rate": 3.090459363957597e-06, + "loss": 0.2623, "step": 6940 }, { - "epoch": 96.53, - "learning_rate": 9.514925373134328e-07, - "loss": 0.254, + "epoch": 24.13, + "learning_rate": 3.0890459363957594e-06, + "loss": 0.279, "step": 6950 }, { - "epoch": 96.66, - "learning_rate": 9.141791044776121e-07, - "loss": 0.2491, + "epoch": 24.17, + "learning_rate": 3.0876325088339222e-06, + "loss": 0.2612, "step": 6960 }, { - "epoch": 96.8, - "learning_rate": 8.768656716417912e-07, - "loss": 0.2494, + "epoch": 24.2, + "learning_rate": 3.0862190812720846e-06, + "loss": 0.2505, "step": 6970 }, { - "epoch": 96.94, - "learning_rate": 8.395522388059702e-07, - "loss": 0.2503, + "epoch": 24.24, + "learning_rate": 3.0848056537102475e-06, + "loss": 0.281, "step": 6980 }, { - "epoch": 97.0, - "eval_loss": 0.4989832937717438, - "eval_runtime": 131.556, - "eval_samples_per_second": 4.044, - "eval_steps_per_second": 0.509, - "eval_wer": 0.19136080221122323, - "step": 6984 - }, - { - "epoch": 97.08, - "learning_rate": 8.022388059701493e-07, - "loss": 0.2468, + "epoch": 24.27, + "learning_rate": 3.0833922261484094e-06, + "loss": 0.2653, "step": 6990 }, { - "epoch": 97.22, - "learning_rate": 7.649253731343284e-07, - "loss": 0.2519, + "epoch": 24.3, + "learning_rate": 3.0819787985865723e-06, + "loss": 0.2881, "step": 7000 }, { - "epoch": 97.36, - "learning_rate": 7.276119402985075e-07, - "loss": 0.2464, + "epoch": 24.34, + "learning_rate": 3.0805653710247347e-06, + "loss": 0.2596, "step": 7010 }, { - "epoch": 97.5, - "learning_rate": 6.902985074626866e-07, - "loss": 0.2423, + "epoch": 24.37, + "learning_rate": 3.0791519434628975e-06, + "loss": 0.2459, "step": 7020 }, { - "epoch": 97.64, - "learning_rate": 6.529850746268657e-07, - "loss": 0.2327, + "epoch": 24.41, + "learning_rate": 3.07773851590106e-06, + "loss": 0.2838, "step": 7030 }, { - "epoch": 97.78, - "learning_rate": 6.156716417910448e-07, - "loss": 0.2523, + "epoch": 24.44, + "learning_rate": 3.0763250883392228e-06, + "loss": 0.2497, "step": 7040 }, { - "epoch": 97.91, - "learning_rate": 5.783582089552239e-07, - "loss": 0.2544, + "epoch": 24.48, + "learning_rate": 3.0749116607773847e-06, + "loss": 0.2907, "step": 7050 }, { - "epoch": 98.0, - "eval_loss": 0.4931636154651642, - "eval_runtime": 132.145, - "eval_samples_per_second": 4.026, - "eval_steps_per_second": 0.507, - "eval_wer": 0.1903323262839879, - "step": 7056 - }, - { - "epoch": 98.06, - "learning_rate": 5.41044776119403e-07, - "loss": 0.2491, + "epoch": 24.51, + "learning_rate": 3.0734982332155476e-06, + "loss": 0.2954, "step": 7060 }, { - "epoch": 98.19, - "learning_rate": 5.037313432835821e-07, - "loss": 0.2483, + "epoch": 24.55, + "learning_rate": 3.07208480565371e-06, + "loss": 0.2536, "step": 7070 }, { - "epoch": 98.33, - "learning_rate": 4.6641791044776116e-07, - "loss": 0.2478, + "epoch": 24.58, + "learning_rate": 3.070671378091873e-06, + "loss": 0.2554, "step": 7080 }, { - "epoch": 98.47, - "learning_rate": 4.291044776119403e-07, - "loss": 0.255, + "epoch": 24.62, + "learning_rate": 3.0692579505300352e-06, + "loss": 0.2779, "step": 7090 }, { - "epoch": 98.61, - "learning_rate": 3.9179104477611937e-07, - "loss": 0.2429, + "epoch": 24.65, + "learning_rate": 3.067844522968198e-06, + "loss": 0.2681, "step": 7100 }, { - "epoch": 98.75, - "learning_rate": 3.544776119402985e-07, - "loss": 0.2524, + "epoch": 24.69, + "learning_rate": 3.06643109540636e-06, + "loss": 0.2715, "step": 7110 }, { - "epoch": 98.89, - "learning_rate": 3.1716417910447763e-07, - "loss": 0.2391, + "epoch": 24.72, + "learning_rate": 3.065017667844523e-06, + "loss": 0.2692, "step": 7120 }, { - "epoch": 99.0, - "eval_loss": 0.49354514479637146, - "eval_runtime": 131.8773, - "eval_samples_per_second": 4.034, - "eval_steps_per_second": 0.508, - "eval_wer": 0.1903966060294401, - "step": 7128 - }, - { - "epoch": 99.03, - "learning_rate": 2.7985074626865674e-07, - "loss": 0.265, + "epoch": 24.75, + "learning_rate": 3.0636042402826853e-06, + "loss": 0.2646, "step": 7130 }, { - "epoch": 99.17, - "learning_rate": 2.4253731343283584e-07, - "loss": 0.2477, + "epoch": 24.79, + "learning_rate": 3.062190812720848e-06, + "loss": 0.2585, "step": 7140 }, { - "epoch": 99.3, - "learning_rate": 2.0522388059701492e-07, - "loss": 0.2497, + "epoch": 24.82, + "learning_rate": 3.0607773851590105e-06, + "loss": 0.2706, "step": 7150 }, { - "epoch": 99.44, - "learning_rate": 1.6791044776119403e-07, - "loss": 0.2535, + "epoch": 24.86, + "learning_rate": 3.059363957597173e-06, + "loss": 0.2796, "step": 7160 }, { - "epoch": 99.58, - "learning_rate": 1.3059701492537316e-07, - "loss": 0.2511, + "epoch": 24.89, + "learning_rate": 3.0579505300353354e-06, + "loss": 0.2645, "step": 7170 }, { - "epoch": 99.72, - "learning_rate": 9.328358208955224e-08, - "loss": 0.2441, + "epoch": 24.93, + "learning_rate": 3.056537102473498e-06, + "loss": 0.2374, "step": 7180 }, { - "epoch": 99.86, - "learning_rate": 5.597014925373135e-08, - "loss": 0.2413, + "epoch": 24.96, + "learning_rate": 3.0551236749116606e-06, + "loss": 0.285, "step": 7190 }, { - "epoch": 100.0, - "learning_rate": 1.8656716417910447e-08, - "loss": 0.2498, + "epoch": 25.0, + "learning_rate": 3.0537102473498234e-06, + "loss": 0.3026, "step": 7200 }, { - "epoch": 100.0, - "eval_loss": 0.4945172667503357, - "eval_runtime": 132.2872, - "eval_samples_per_second": 4.022, - "eval_steps_per_second": 0.506, - "eval_wer": 0.1909108439930578, + "epoch": 25.0, + "eval_loss": 0.5193008780479431, + "eval_runtime": 129.4939, + "eval_samples_per_second": 4.108, + "eval_steps_per_second": 1.027, + "eval_wer": 0.200552805810889, "step": 7200 }, + { + "epoch": 25.03, + "learning_rate": 3.052296819787986e-06, + "loss": 0.3016, + "step": 7210 + }, + { + "epoch": 25.07, + "learning_rate": 3.0508833922261483e-06, + "loss": 0.2787, + "step": 7220 + }, + { + "epoch": 25.1, + "learning_rate": 3.0494699646643107e-06, + "loss": 0.2695, + "step": 7230 + }, + { + "epoch": 25.14, + "learning_rate": 3.048197879858657e-06, + "loss": 0.2666, + "step": 7240 + }, + { + "epoch": 25.17, + "learning_rate": 3.0467844522968195e-06, + "loss": 0.2892, + "step": 7250 + }, + { + "epoch": 25.21, + "learning_rate": 3.0453710247349824e-06, + "loss": 0.262, + "step": 7260 + }, + { + "epoch": 25.24, + "learning_rate": 3.0439575971731448e-06, + "loss": 0.2557, + "step": 7270 + }, + { + "epoch": 25.28, + "learning_rate": 3.0425441696113076e-06, + "loss": 0.255, + "step": 7280 + }, + { + "epoch": 25.31, + "learning_rate": 3.0411307420494696e-06, + "loss": 0.2848, + "step": 7290 + }, + { + "epoch": 25.35, + "learning_rate": 3.0397173144876324e-06, + "loss": 0.2734, + "step": 7300 + }, + { + "epoch": 25.38, + "learning_rate": 3.038303886925795e-06, + "loss": 0.2719, + "step": 7310 + }, + { + "epoch": 25.42, + "learning_rate": 3.0368904593639577e-06, + "loss": 0.2672, + "step": 7320 + }, + { + "epoch": 25.45, + "learning_rate": 3.03547703180212e-06, + "loss": 0.266, + "step": 7330 + }, + { + "epoch": 25.48, + "learning_rate": 3.034063604240283e-06, + "loss": 0.3005, + "step": 7340 + }, + { + "epoch": 25.52, + "learning_rate": 3.032650176678445e-06, + "loss": 0.2512, + "step": 7350 + }, + { + "epoch": 25.55, + "learning_rate": 3.0312367491166077e-06, + "loss": 0.2525, + "step": 7360 + }, + { + "epoch": 25.59, + "learning_rate": 3.02982332155477e-06, + "loss": 0.2543, + "step": 7370 + }, + { + "epoch": 25.62, + "learning_rate": 3.028409893992933e-06, + "loss": 0.2881, + "step": 7380 + }, + { + "epoch": 25.66, + "learning_rate": 3.0269964664310954e-06, + "loss": 0.2569, + "step": 7390 + }, + { + "epoch": 25.69, + "learning_rate": 3.0255830388692582e-06, + "loss": 0.2721, + "step": 7400 + }, + { + "epoch": 25.73, + "learning_rate": 3.02416961130742e-06, + "loss": 0.2717, + "step": 7410 + }, + { + "epoch": 25.76, + "learning_rate": 3.022756183745583e-06, + "loss": 0.2897, + "step": 7420 + }, + { + "epoch": 25.8, + "learning_rate": 3.0213427561837454e-06, + "loss": 0.2652, + "step": 7430 + }, + { + "epoch": 25.83, + "learning_rate": 3.0199293286219083e-06, + "loss": 0.2545, + "step": 7440 + }, + { + "epoch": 25.87, + "learning_rate": 3.0185159010600707e-06, + "loss": 0.2826, + "step": 7450 + }, + { + "epoch": 25.9, + "learning_rate": 3.0171024734982327e-06, + "loss": 0.2638, + "step": 7460 + }, + { + "epoch": 25.94, + "learning_rate": 3.0156890459363955e-06, + "loss": 0.2592, + "step": 7470 + }, + { + "epoch": 25.97, + "learning_rate": 3.014275618374558e-06, + "loss": 0.2888, + "step": 7480 + }, + { + "epoch": 26.0, + "eval_loss": 0.49870219826698303, + "eval_runtime": 130.4803, + "eval_samples_per_second": 4.077, + "eval_steps_per_second": 1.019, + "eval_wer": 0.19856013370187053, + "step": 7488 + }, + { + "epoch": 26.01, + "learning_rate": 3.0128621908127208e-06, + "loss": 0.2858, + "step": 7490 + }, + { + "epoch": 26.04, + "learning_rate": 3.011448763250883e-06, + "loss": 0.28, + "step": 7500 + }, + { + "epoch": 26.08, + "learning_rate": 3.010035335689046e-06, + "loss": 0.2725, + "step": 7510 + }, + { + "epoch": 26.11, + "learning_rate": 3.008621908127208e-06, + "loss": 0.271, + "step": 7520 + }, + { + "epoch": 26.15, + "learning_rate": 3.007208480565371e-06, + "loss": 0.2829, + "step": 7530 + }, + { + "epoch": 26.18, + "learning_rate": 3.0057950530035332e-06, + "loss": 0.2639, + "step": 7540 + }, + { + "epoch": 26.21, + "learning_rate": 3.004381625441696e-06, + "loss": 0.256, + "step": 7550 + }, + { + "epoch": 26.25, + "learning_rate": 3.0029681978798585e-06, + "loss": 0.2738, + "step": 7560 + }, + { + "epoch": 26.28, + "learning_rate": 3.001554770318021e-06, + "loss": 0.2642, + "step": 7570 + }, + { + "epoch": 26.32, + "learning_rate": 3.0001413427561833e-06, + "loss": 0.2953, + "step": 7580 + }, + { + "epoch": 26.35, + "learning_rate": 2.998727915194346e-06, + "loss": 0.2696, + "step": 7590 + }, + { + "epoch": 26.39, + "learning_rate": 2.9973144876325085e-06, + "loss": 0.2801, + "step": 7600 + }, + { + "epoch": 26.42, + "learning_rate": 2.9959010600706714e-06, + "loss": 0.2846, + "step": 7610 + }, + { + "epoch": 26.46, + "learning_rate": 2.9944876325088338e-06, + "loss": 0.2726, + "step": 7620 + }, + { + "epoch": 26.49, + "learning_rate": 2.993074204946996e-06, + "loss": 0.2773, + "step": 7630 + }, + { + "epoch": 26.53, + "learning_rate": 2.9916607773851586e-06, + "loss": 0.2555, + "step": 7640 + }, + { + "epoch": 26.56, + "learning_rate": 2.9902473498233214e-06, + "loss": 0.2797, + "step": 7650 + }, + { + "epoch": 26.6, + "learning_rate": 2.988833922261484e-06, + "loss": 0.2519, + "step": 7660 + }, + { + "epoch": 26.63, + "learning_rate": 2.9874204946996467e-06, + "loss": 0.2665, + "step": 7670 + }, + { + "epoch": 26.66, + "learning_rate": 2.986007067137809e-06, + "loss": 0.2618, + "step": 7680 + }, + { + "epoch": 26.7, + "learning_rate": 2.9845936395759715e-06, + "loss": 0.2807, + "step": 7690 + }, + { + "epoch": 26.73, + "learning_rate": 2.983180212014134e-06, + "loss": 0.2786, + "step": 7700 + }, + { + "epoch": 26.77, + "learning_rate": 2.9817667844522967e-06, + "loss": 0.2579, + "step": 7710 + }, + { + "epoch": 26.8, + "learning_rate": 2.980353356890459e-06, + "loss": 0.2748, + "step": 7720 + }, + { + "epoch": 26.84, + "learning_rate": 2.978939929328622e-06, + "loss": 0.2755, + "step": 7730 + }, + { + "epoch": 26.87, + "learning_rate": 2.977526501766784e-06, + "loss": 0.2483, + "step": 7740 + }, + { + "epoch": 26.91, + "learning_rate": 2.9761130742049468e-06, + "loss": 0.2753, + "step": 7750 + }, + { + "epoch": 26.94, + "learning_rate": 2.974699646643109e-06, + "loss": 0.2455, + "step": 7760 + }, + { + "epoch": 26.98, + "learning_rate": 2.973286219081272e-06, + "loss": 0.2732, + "step": 7770 + }, + { + "epoch": 27.0, + "eval_loss": 0.5063392519950867, + "eval_runtime": 129.9156, + "eval_samples_per_second": 4.095, + "eval_steps_per_second": 1.024, + "eval_wer": 0.20074564504724562, + "step": 7776 + }, + { + "epoch": 27.01, + "learning_rate": 2.9718727915194344e-06, + "loss": 0.2939, + "step": 7780 + }, + { + "epoch": 27.05, + "learning_rate": 2.9704593639575973e-06, + "loss": 0.2713, + "step": 7790 + }, + { + "epoch": 27.08, + "learning_rate": 2.9690459363957593e-06, + "loss": 0.2683, + "step": 7800 + }, + { + "epoch": 27.12, + "learning_rate": 2.967632508833922e-06, + "loss": 0.2905, + "step": 7810 + }, + { + "epoch": 27.15, + "learning_rate": 2.9662190812720845e-06, + "loss": 0.2755, + "step": 7820 + }, + { + "epoch": 27.19, + "learning_rate": 2.9648056537102473e-06, + "loss": 0.2745, + "step": 7830 + }, + { + "epoch": 27.22, + "learning_rate": 2.9633922261484097e-06, + "loss": 0.2813, + "step": 7840 + }, + { + "epoch": 27.26, + "learning_rate": 2.9619787985865726e-06, + "loss": 0.2405, + "step": 7850 + }, + { + "epoch": 27.29, + "learning_rate": 2.9605653710247346e-06, + "loss": 0.2778, + "step": 7860 + }, + { + "epoch": 27.33, + "learning_rate": 2.9591519434628974e-06, + "loss": 0.2785, + "step": 7870 + }, + { + "epoch": 27.36, + "learning_rate": 2.95773851590106e-06, + "loss": 0.2665, + "step": 7880 + }, + { + "epoch": 27.39, + "learning_rate": 2.9563250883392226e-06, + "loss": 0.2905, + "step": 7890 + }, + { + "epoch": 27.43, + "learning_rate": 2.954911660777385e-06, + "loss": 0.2611, + "step": 7900 + }, + { + "epoch": 27.46, + "learning_rate": 2.9534982332155475e-06, + "loss": 0.2633, + "step": 7910 + }, + { + "epoch": 27.5, + "learning_rate": 2.95208480565371e-06, + "loss": 0.2525, + "step": 7920 + }, + { + "epoch": 27.53, + "learning_rate": 2.9506713780918727e-06, + "loss": 0.2627, + "step": 7930 + }, + { + "epoch": 27.57, + "learning_rate": 2.949257950530035e-06, + "loss": 0.2834, + "step": 7940 + }, + { + "epoch": 27.6, + "learning_rate": 2.947844522968198e-06, + "loss": 0.2709, + "step": 7950 + }, + { + "epoch": 27.64, + "learning_rate": 2.9464310954063604e-06, + "loss": 0.2637, + "step": 7960 + }, + { + "epoch": 27.67, + "learning_rate": 2.9450176678445228e-06, + "loss": 0.304, + "step": 7970 + }, + { + "epoch": 27.71, + "learning_rate": 2.943604240282685e-06, + "loss": 0.2664, + "step": 7980 + }, + { + "epoch": 27.74, + "learning_rate": 2.942190812720848e-06, + "loss": 0.2684, + "step": 7990 + }, + { + "epoch": 27.78, + "learning_rate": 2.9407773851590104e-06, + "loss": 0.2641, + "step": 8000 + }, + { + "epoch": 27.81, + "learning_rate": 2.9393639575971732e-06, + "loss": 0.2767, + "step": 8010 + }, + { + "epoch": 27.85, + "learning_rate": 2.9379505300353357e-06, + "loss": 0.2825, + "step": 8020 + }, + { + "epoch": 27.88, + "learning_rate": 2.936537102473498e-06, + "loss": 0.2747, + "step": 8030 + }, + { + "epoch": 27.91, + "learning_rate": 2.9351236749116605e-06, + "loss": 0.2877, + "step": 8040 + }, + { + "epoch": 27.95, + "learning_rate": 2.9337102473498233e-06, + "loss": 0.2703, + "step": 8050 + }, + { + "epoch": 27.98, + "learning_rate": 2.9322968197879857e-06, + "loss": 0.2567, + "step": 8060 + }, + { + "epoch": 28.0, + "eval_loss": 0.5102671980857849, + "eval_runtime": 130.0784, + "eval_samples_per_second": 4.09, + "eval_steps_per_second": 1.022, + "eval_wer": 0.2015170019926721, + "step": 8064 + }, + { + "epoch": 28.02, + "learning_rate": 2.9308833922261486e-06, + "loss": 0.2758, + "step": 8070 + }, + { + "epoch": 28.06, + "learning_rate": 2.9294699646643105e-06, + "loss": 0.2866, + "step": 8080 + }, + { + "epoch": 28.09, + "learning_rate": 2.9280565371024734e-06, + "loss": 0.2397, + "step": 8090 + }, + { + "epoch": 28.12, + "learning_rate": 2.9266431095406358e-06, + "loss": 0.2718, + "step": 8100 + }, + { + "epoch": 28.16, + "learning_rate": 2.9252296819787986e-06, + "loss": 0.2795, + "step": 8110 + }, + { + "epoch": 28.19, + "learning_rate": 2.923816254416961e-06, + "loss": 0.258, + "step": 8120 + }, + { + "epoch": 28.23, + "learning_rate": 2.922402826855124e-06, + "loss": 0.2651, + "step": 8130 + }, + { + "epoch": 28.26, + "learning_rate": 2.920989399293286e-06, + "loss": 0.2741, + "step": 8140 + }, + { + "epoch": 28.3, + "learning_rate": 2.9195759717314487e-06, + "loss": 0.286, + "step": 8150 + }, + { + "epoch": 28.33, + "learning_rate": 2.918162544169611e-06, + "loss": 0.2716, + "step": 8160 + }, + { + "epoch": 28.37, + "learning_rate": 2.916749116607774e-06, + "loss": 0.2594, + "step": 8170 + }, + { + "epoch": 28.4, + "learning_rate": 2.9153356890459363e-06, + "loss": 0.2958, + "step": 8180 + }, + { + "epoch": 28.44, + "learning_rate": 2.9139222614840987e-06, + "loss": 0.2742, + "step": 8190 + }, + { + "epoch": 28.47, + "learning_rate": 2.912508833922261e-06, + "loss": 0.2678, + "step": 8200 + }, + { + "epoch": 28.51, + "learning_rate": 2.911095406360424e-06, + "loss": 0.2961, + "step": 8210 + }, + { + "epoch": 28.54, + "learning_rate": 2.9096819787985864e-06, + "loss": 0.2675, + "step": 8220 + }, + { + "epoch": 28.57, + "learning_rate": 2.9082685512367492e-06, + "loss": 0.2722, + "step": 8230 + }, + { + "epoch": 28.61, + "learning_rate": 2.9068551236749116e-06, + "loss": 0.257, + "step": 8240 + }, + { + "epoch": 28.64, + "learning_rate": 2.905441696113074e-06, + "loss": 0.3073, + "step": 8250 + }, + { + "epoch": 28.68, + "learning_rate": 2.9040282685512365e-06, + "loss": 0.2852, + "step": 8260 + }, + { + "epoch": 28.71, + "learning_rate": 2.9026148409893993e-06, + "loss": 0.275, + "step": 8270 + }, + { + "epoch": 28.75, + "learning_rate": 2.9012014134275617e-06, + "loss": 0.272, + "step": 8280 + }, + { + "epoch": 28.78, + "learning_rate": 2.8997879858657245e-06, + "loss": 0.2732, + "step": 8290 + }, + { + "epoch": 28.82, + "learning_rate": 2.898374558303887e-06, + "loss": 0.2734, + "step": 8300 + }, + { + "epoch": 28.85, + "learning_rate": 2.8969611307420493e-06, + "loss": 0.2581, + "step": 8310 + }, + { + "epoch": 28.89, + "learning_rate": 2.8955477031802118e-06, + "loss": 0.2689, + "step": 8320 + }, + { + "epoch": 28.92, + "learning_rate": 2.8941342756183746e-06, + "loss": 0.2592, + "step": 8330 + }, + { + "epoch": 28.96, + "learning_rate": 2.892720848056537e-06, + "loss": 0.261, + "step": 8340 + }, + { + "epoch": 28.99, + "learning_rate": 2.8913074204947e-06, + "loss": 0.2845, + "step": 8350 + }, + { + "epoch": 29.0, + "eval_loss": 0.5084418058395386, + "eval_runtime": 129.7694, + "eval_samples_per_second": 4.1, + "eval_steps_per_second": 1.025, + "eval_wer": 0.20203123995628977, + "step": 8352 + }, + { + "epoch": 29.03, + "learning_rate": 2.889893992932862e-06, + "loss": 0.2541, + "step": 8360 + }, + { + "epoch": 29.06, + "learning_rate": 2.8884805653710247e-06, + "loss": 0.2822, + "step": 8370 + }, + { + "epoch": 29.1, + "learning_rate": 2.887067137809187e-06, + "loss": 0.2498, + "step": 8380 + }, + { + "epoch": 29.13, + "learning_rate": 2.88565371024735e-06, + "loss": 0.2908, + "step": 8390 + }, + { + "epoch": 29.17, + "learning_rate": 2.8842402826855123e-06, + "loss": 0.2679, + "step": 8400 + }, + { + "epoch": 29.2, + "learning_rate": 2.882826855123675e-06, + "loss": 0.2352, + "step": 8410 + }, + { + "epoch": 29.24, + "learning_rate": 2.881413427561837e-06, + "loss": 0.2733, + "step": 8420 + }, + { + "epoch": 29.27, + "learning_rate": 2.88e-06, + "loss": 0.2427, + "step": 8430 + }, + { + "epoch": 29.3, + "learning_rate": 2.8785865724381624e-06, + "loss": 0.2692, + "step": 8440 + }, + { + "epoch": 29.34, + "learning_rate": 2.877173144876325e-06, + "loss": 0.27, + "step": 8450 + }, + { + "epoch": 29.37, + "learning_rate": 2.8757597173144876e-06, + "loss": 0.2465, + "step": 8460 + }, + { + "epoch": 29.41, + "learning_rate": 2.8743462897526504e-06, + "loss": 0.2853, + "step": 8470 + }, + { + "epoch": 29.44, + "learning_rate": 2.8729328621908124e-06, + "loss": 0.2536, + "step": 8480 + }, + { + "epoch": 29.48, + "learning_rate": 2.8715194346289753e-06, + "loss": 0.2824, + "step": 8490 + }, + { + "epoch": 29.51, + "learning_rate": 2.8701060070671377e-06, + "loss": 0.2749, + "step": 8500 + }, + { + "epoch": 29.55, + "learning_rate": 2.8686925795053005e-06, + "loss": 0.2399, + "step": 8510 + }, + { + "epoch": 29.58, + "learning_rate": 2.867279151943463e-06, + "loss": 0.2557, + "step": 8520 + }, + { + "epoch": 29.62, + "learning_rate": 2.865865724381625e-06, + "loss": 0.2561, + "step": 8530 + }, + { + "epoch": 29.65, + "learning_rate": 2.8644522968197877e-06, + "loss": 0.2758, + "step": 8540 + }, + { + "epoch": 29.69, + "learning_rate": 2.86303886925795e-06, + "loss": 0.2755, + "step": 8550 + }, + { + "epoch": 29.72, + "learning_rate": 2.861625441696113e-06, + "loss": 0.2732, + "step": 8560 + }, + { + "epoch": 29.75, + "learning_rate": 2.860212014134276e-06, + "loss": 0.282, + "step": 8570 + }, + { + "epoch": 29.79, + "learning_rate": 2.8587985865724382e-06, + "loss": 0.2516, + "step": 8580 + }, + { + "epoch": 29.82, + "learning_rate": 2.8573851590106e-06, + "loss": 0.2953, + "step": 8590 + }, + { + "epoch": 29.86, + "learning_rate": 2.855971731448763e-06, + "loss": 0.3114, + "step": 8600 + }, + { + "epoch": 29.89, + "learning_rate": 2.8545583038869254e-06, + "loss": 0.2853, + "step": 8610 + }, + { + "epoch": 29.93, + "learning_rate": 2.8531448763250883e-06, + "loss": 0.2648, + "step": 8620 + }, + { + "epoch": 29.96, + "learning_rate": 2.8517314487632507e-06, + "loss": 0.2812, + "step": 8630 + }, + { + "epoch": 30.0, + "learning_rate": 2.8503180212014135e-06, + "loss": 0.2591, + "step": 8640 + }, + { + "epoch": 30.0, + "eval_loss": 0.5109365582466125, + "eval_runtime": 129.6483, + "eval_samples_per_second": 4.103, + "eval_steps_per_second": 1.026, + "eval_wer": 0.1989458121745838, + "step": 8640 + }, + { + "epoch": 30.03, + "learning_rate": 2.8489045936395755e-06, + "loss": 0.272, + "step": 8650 + }, + { + "epoch": 30.07, + "learning_rate": 2.8474911660777383e-06, + "loss": 0.2787, + "step": 8660 + }, + { + "epoch": 30.1, + "learning_rate": 2.8460777385159007e-06, + "loss": 0.2711, + "step": 8670 + }, + { + "epoch": 30.14, + "learning_rate": 2.8446643109540636e-06, + "loss": 0.2828, + "step": 8680 + }, + { + "epoch": 30.17, + "learning_rate": 2.843250883392226e-06, + "loss": 0.2688, + "step": 8690 + }, + { + "epoch": 30.21, + "learning_rate": 2.8418374558303884e-06, + "loss": 0.2588, + "step": 8700 + }, + { + "epoch": 30.24, + "learning_rate": 2.840424028268551e-06, + "loss": 0.2539, + "step": 8710 + }, + { + "epoch": 30.28, + "learning_rate": 2.8390106007067136e-06, + "loss": 0.2443, + "step": 8720 + }, + { + "epoch": 30.31, + "learning_rate": 2.837597173144876e-06, + "loss": 0.2713, + "step": 8730 + }, + { + "epoch": 30.35, + "learning_rate": 2.836183745583039e-06, + "loss": 0.2811, + "step": 8740 + }, + { + "epoch": 30.38, + "learning_rate": 2.8347703180212013e-06, + "loss": 0.2653, + "step": 8750 + }, + { + "epoch": 30.42, + "learning_rate": 2.8333568904593637e-06, + "loss": 0.276, + "step": 8760 + }, + { + "epoch": 30.45, + "learning_rate": 2.831943462897526e-06, + "loss": 0.2519, + "step": 8770 + }, + { + "epoch": 30.48, + "learning_rate": 2.830530035335689e-06, + "loss": 0.2805, + "step": 8780 + }, + { + "epoch": 30.52, + "learning_rate": 2.8291166077738514e-06, + "loss": 0.2823, + "step": 8790 + }, + { + "epoch": 30.55, + "learning_rate": 2.827703180212014e-06, + "loss": 0.2714, + "step": 8800 + }, + { + "epoch": 30.59, + "learning_rate": 2.826289752650176e-06, + "loss": 0.2786, + "step": 8810 + }, + { + "epoch": 30.62, + "learning_rate": 2.824876325088339e-06, + "loss": 0.2636, + "step": 8820 + }, + { + "epoch": 30.66, + "learning_rate": 2.8234628975265014e-06, + "loss": 0.2723, + "step": 8830 + }, + { + "epoch": 30.69, + "learning_rate": 2.8220494699646643e-06, + "loss": 0.2795, + "step": 8840 + }, + { + "epoch": 30.73, + "learning_rate": 2.8206360424028267e-06, + "loss": 0.2547, + "step": 8850 + }, + { + "epoch": 30.76, + "learning_rate": 2.8192226148409895e-06, + "loss": 0.256, + "step": 8860 + }, + { + "epoch": 30.8, + "learning_rate": 2.8178091872791515e-06, + "loss": 0.2494, + "step": 8870 + }, + { + "epoch": 30.83, + "learning_rate": 2.8163957597173143e-06, + "loss": 0.2634, + "step": 8880 + }, + { + "epoch": 30.87, + "learning_rate": 2.8149823321554767e-06, + "loss": 0.2868, + "step": 8890 + }, + { + "epoch": 30.9, + "learning_rate": 2.8135689045936396e-06, + "loss": 0.247, + "step": 8900 + }, + { + "epoch": 30.94, + "learning_rate": 2.812155477031802e-06, + "loss": 0.2527, + "step": 8910 + }, + { + "epoch": 30.97, + "learning_rate": 2.810742049469965e-06, + "loss": 0.2777, + "step": 8920 + }, + { + "epoch": 31.0, + "eval_loss": 0.5179172158241272, + "eval_runtime": 129.9918, + "eval_samples_per_second": 4.093, + "eval_steps_per_second": 1.023, + "eval_wer": 0.19939577039274925, + "step": 8928 + }, + { + "epoch": 31.01, + "learning_rate": 2.8093286219081268e-06, + "loss": 0.2692, + "step": 8930 + }, + { + "epoch": 31.04, + "learning_rate": 2.8079151943462896e-06, + "loss": 0.2848, + "step": 8940 + }, + { + "epoch": 31.08, + "learning_rate": 2.806501766784452e-06, + "loss": 0.2704, + "step": 8950 + }, + { + "epoch": 31.11, + "learning_rate": 2.805088339222615e-06, + "loss": 0.253, + "step": 8960 + }, + { + "epoch": 31.15, + "learning_rate": 2.8036749116607773e-06, + "loss": 0.3008, + "step": 8970 + }, + { + "epoch": 31.18, + "learning_rate": 2.8022614840989397e-06, + "loss": 0.2674, + "step": 8980 + }, + { + "epoch": 31.21, + "learning_rate": 2.800848056537102e-06, + "loss": 0.2581, + "step": 8990 + }, + { + "epoch": 31.25, + "learning_rate": 2.799434628975265e-06, + "loss": 0.2539, + "step": 9000 + }, + { + "epoch": 31.28, + "learning_rate": 2.7980212014134273e-06, + "loss": 0.2625, + "step": 9010 + }, + { + "epoch": 31.32, + "learning_rate": 2.79660777385159e-06, + "loss": 0.2533, + "step": 9020 + }, + { + "epoch": 31.35, + "learning_rate": 2.7951943462897526e-06, + "loss": 0.2822, + "step": 9030 + }, + { + "epoch": 31.39, + "learning_rate": 2.793780918727915e-06, + "loss": 0.2678, + "step": 9040 + }, + { + "epoch": 31.42, + "learning_rate": 2.7923674911660774e-06, + "loss": 0.26, + "step": 9050 + }, + { + "epoch": 31.46, + "learning_rate": 2.7909540636042402e-06, + "loss": 0.2568, + "step": 9060 + }, + { + "epoch": 31.49, + "learning_rate": 2.7895406360424026e-06, + "loss": 0.2713, + "step": 9070 + }, + { + "epoch": 31.53, + "learning_rate": 2.7881272084805655e-06, + "loss": 0.2664, + "step": 9080 + }, + { + "epoch": 31.56, + "learning_rate": 2.786713780918728e-06, + "loss": 0.2682, + "step": 9090 + }, + { + "epoch": 31.6, + "learning_rate": 2.7853003533568903e-06, + "loss": 0.2739, + "step": 9100 + }, + { + "epoch": 31.63, + "learning_rate": 2.7838869257950527e-06, + "loss": 0.2553, + "step": 9110 + }, + { + "epoch": 31.66, + "learning_rate": 2.7824734982332155e-06, + "loss": 0.2882, + "step": 9120 + }, + { + "epoch": 31.7, + "learning_rate": 2.781060070671378e-06, + "loss": 0.252, + "step": 9130 + }, + { + "epoch": 31.73, + "learning_rate": 2.7796466431095408e-06, + "loss": 0.257, + "step": 9140 + }, + { + "epoch": 31.77, + "learning_rate": 2.7782332155477028e-06, + "loss": 0.271, + "step": 9150 + }, + { + "epoch": 31.8, + "learning_rate": 2.7768197879858656e-06, + "loss": 0.263, + "step": 9160 + }, + { + "epoch": 31.84, + "learning_rate": 2.775406360424028e-06, + "loss": 0.2663, + "step": 9170 + }, + { + "epoch": 31.87, + "learning_rate": 2.773992932862191e-06, + "loss": 0.274, + "step": 9180 + }, + { + "epoch": 31.91, + "learning_rate": 2.7725795053003532e-06, + "loss": 0.2567, + "step": 9190 + }, + { + "epoch": 31.94, + "learning_rate": 2.771166077738516e-06, + "loss": 0.2676, + "step": 9200 + }, + { + "epoch": 31.98, + "learning_rate": 2.769752650176678e-06, + "loss": 0.2784, + "step": 9210 + }, + { + "epoch": 32.0, + "eval_loss": 0.518265962600708, + "eval_runtime": 129.4613, + "eval_samples_per_second": 4.109, + "eval_steps_per_second": 1.027, + "eval_wer": 0.1989458121745838, + "step": 9216 + }, + { + "epoch": 32.01, + "learning_rate": 2.768339222614841e-06, + "loss": 0.2617, + "step": 9220 + }, + { + "epoch": 32.05, + "learning_rate": 2.7669257950530033e-06, + "loss": 0.2787, + "step": 9230 + }, + { + "epoch": 32.08, + "learning_rate": 2.765512367491166e-06, + "loss": 0.2495, + "step": 9240 + }, + { + "epoch": 32.12, + "learning_rate": 2.7640989399293285e-06, + "loss": 0.249, + "step": 9250 + }, + { + "epoch": 32.15, + "learning_rate": 2.7626855123674914e-06, + "loss": 0.2824, + "step": 9260 + }, + { + "epoch": 32.19, + "learning_rate": 2.7612720848056534e-06, + "loss": 0.2872, + "step": 9270 + }, + { + "epoch": 32.22, + "learning_rate": 2.759858657243816e-06, + "loss": 0.2743, + "step": 9280 + }, + { + "epoch": 32.26, + "learning_rate": 2.7585865724381622e-06, + "loss": 0.2752, + "step": 9290 + }, + { + "epoch": 32.29, + "learning_rate": 2.757173144876325e-06, + "loss": 0.2671, + "step": 9300 + }, + { + "epoch": 32.33, + "learning_rate": 2.7557597173144875e-06, + "loss": 0.2559, + "step": 9310 + }, + { + "epoch": 32.36, + "learning_rate": 2.7543462897526503e-06, + "loss": 0.2762, + "step": 9320 + }, + { + "epoch": 32.39, + "learning_rate": 2.7529328621908127e-06, + "loss": 0.2633, + "step": 9330 + }, + { + "epoch": 32.43, + "learning_rate": 2.751519434628975e-06, + "loss": 0.2554, + "step": 9340 + }, + { + "epoch": 32.46, + "learning_rate": 2.7501060070671375e-06, + "loss": 0.2922, + "step": 9350 + }, + { + "epoch": 32.5, + "learning_rate": 2.7486925795053004e-06, + "loss": 0.2827, + "step": 9360 + }, + { + "epoch": 32.53, + "learning_rate": 2.747279151943463e-06, + "loss": 0.2491, + "step": 9370 + }, + { + "epoch": 32.57, + "learning_rate": 2.7458657243816256e-06, + "loss": 0.2386, + "step": 9380 + }, + { + "epoch": 32.6, + "learning_rate": 2.744452296819788e-06, + "loss": 0.2375, + "step": 9390 + }, + { + "epoch": 32.64, + "learning_rate": 2.7430388692579504e-06, + "loss": 0.2663, + "step": 9400 + }, + { + "epoch": 32.67, + "learning_rate": 2.741625441696113e-06, + "loss": 0.2674, + "step": 9410 + }, + { + "epoch": 32.71, + "learning_rate": 2.7402120141342757e-06, + "loss": 0.2609, + "step": 9420 + }, + { + "epoch": 32.74, + "learning_rate": 2.738798586572438e-06, + "loss": 0.2538, + "step": 9430 + }, + { + "epoch": 32.78, + "learning_rate": 2.737385159010601e-06, + "loss": 0.268, + "step": 9440 + }, + { + "epoch": 32.81, + "learning_rate": 2.735971731448763e-06, + "loss": 0.2698, + "step": 9450 + }, + { + "epoch": 32.85, + "learning_rate": 2.7345583038869257e-06, + "loss": 0.2826, + "step": 9460 + }, + { + "epoch": 32.88, + "learning_rate": 2.733144876325088e-06, + "loss": 0.249, + "step": 9470 + }, + { + "epoch": 32.91, + "learning_rate": 2.731731448763251e-06, + "loss": 0.2555, + "step": 9480 + }, + { + "epoch": 32.95, + "learning_rate": 2.7303180212014134e-06, + "loss": 0.243, + "step": 9490 + }, + { + "epoch": 32.98, + "learning_rate": 2.7289045936395762e-06, + "loss": 0.2801, + "step": 9500 + }, + { + "epoch": 33.0, + "eval_loss": 0.5222018957138062, + "eval_runtime": 129.2645, + "eval_samples_per_second": 4.116, + "eval_steps_per_second": 1.029, + "eval_wer": 0.20029568682908017, + "step": 9504 + }, + { + "epoch": 33.02, + "learning_rate": 2.7274911660777382e-06, + "loss": 0.2721, + "step": 9510 + }, + { + "epoch": 33.06, + "learning_rate": 2.7260777385159006e-06, + "loss": 0.2799, + "step": 9520 + }, + { + "epoch": 33.09, + "learning_rate": 2.7246643109540635e-06, + "loss": 0.2719, + "step": 9530 + }, + { + "epoch": 33.12, + "learning_rate": 2.7232508833922263e-06, + "loss": 0.2716, + "step": 9540 + }, + { + "epoch": 33.16, + "learning_rate": 2.7218374558303887e-06, + "loss": 0.2768, + "step": 9550 + }, + { + "epoch": 33.19, + "learning_rate": 2.7204240282685515e-06, + "loss": 0.2619, + "step": 9560 + }, + { + "epoch": 33.23, + "learning_rate": 2.7190106007067135e-06, + "loss": 0.2864, + "step": 9570 + }, + { + "epoch": 33.26, + "learning_rate": 2.717597173144876e-06, + "loss": 0.2651, + "step": 9580 + }, + { + "epoch": 33.3, + "learning_rate": 2.7161837455830388e-06, + "loss": 0.2799, + "step": 9590 + }, + { + "epoch": 33.33, + "learning_rate": 2.714770318021201e-06, + "loss": 0.2821, + "step": 9600 + }, + { + "epoch": 33.37, + "learning_rate": 2.713356890459364e-06, + "loss": 0.2742, + "step": 9610 + }, + { + "epoch": 33.4, + "learning_rate": 2.711943462897526e-06, + "loss": 0.267, + "step": 9620 + }, + { + "epoch": 33.44, + "learning_rate": 2.710530035335689e-06, + "loss": 0.2676, + "step": 9630 + }, + { + "epoch": 33.47, + "learning_rate": 2.7091166077738512e-06, + "loss": 0.2992, + "step": 9640 + }, + { + "epoch": 33.51, + "learning_rate": 2.707703180212014e-06, + "loss": 0.3028, + "step": 9650 + }, + { + "epoch": 33.54, + "learning_rate": 2.7062897526501765e-06, + "loss": 0.2624, + "step": 9660 + }, + { + "epoch": 33.57, + "learning_rate": 2.7048763250883393e-06, + "loss": 0.2673, + "step": 9670 + }, + { + "epoch": 33.61, + "learning_rate": 2.7034628975265013e-06, + "loss": 0.2599, + "step": 9680 + }, + { + "epoch": 33.64, + "learning_rate": 2.702049469964664e-06, + "loss": 0.2548, + "step": 9690 + }, + { + "epoch": 33.68, + "learning_rate": 2.7006360424028265e-06, + "loss": 0.2647, + "step": 9700 + }, + { + "epoch": 33.71, + "learning_rate": 2.6992226148409894e-06, + "loss": 0.264, + "step": 9710 + }, + { + "epoch": 33.75, + "learning_rate": 2.6978091872791518e-06, + "loss": 0.2615, + "step": 9720 + }, + { + "epoch": 33.78, + "learning_rate": 2.696395759717314e-06, + "loss": 0.2579, + "step": 9730 + }, + { + "epoch": 33.82, + "learning_rate": 2.6949823321554766e-06, + "loss": 0.2806, + "step": 9740 + }, + { + "epoch": 33.85, + "learning_rate": 2.6935689045936394e-06, + "loss": 0.2679, + "step": 9750 + }, + { + "epoch": 33.89, + "learning_rate": 2.692155477031802e-06, + "loss": 0.2415, + "step": 9760 + }, + { + "epoch": 33.92, + "learning_rate": 2.6907420494699647e-06, + "loss": 0.2645, + "step": 9770 + }, + { + "epoch": 33.96, + "learning_rate": 2.689328621908127e-06, + "loss": 0.2602, + "step": 9780 + }, + { + "epoch": 33.99, + "learning_rate": 2.6879151943462895e-06, + "loss": 0.2554, + "step": 9790 + }, + { + "epoch": 34.0, + "eval_loss": 0.5137259364128113, + "eval_runtime": 129.6969, + "eval_samples_per_second": 4.102, + "eval_steps_per_second": 1.025, + "eval_wer": 0.199010091920036, + "step": 9792 + }, + { + "epoch": 34.03, + "learning_rate": 2.686501766784452e-06, + "loss": 0.2962, + "step": 9800 + }, + { + "epoch": 34.06, + "learning_rate": 2.6850883392226147e-06, + "loss": 0.2692, + "step": 9810 + }, + { + "epoch": 34.1, + "learning_rate": 2.683674911660777e-06, + "loss": 0.2522, + "step": 9820 + }, + { + "epoch": 34.13, + "learning_rate": 2.68226148409894e-06, + "loss": 0.2894, + "step": 9830 + }, + { + "epoch": 34.17, + "learning_rate": 2.6808480565371024e-06, + "loss": 0.2864, + "step": 9840 + }, + { + "epoch": 34.2, + "learning_rate": 2.679434628975265e-06, + "loss": 0.2564, + "step": 9850 + }, + { + "epoch": 34.24, + "learning_rate": 2.678021201413427e-06, + "loss": 0.2632, + "step": 9860 + }, + { + "epoch": 34.27, + "learning_rate": 2.67660777385159e-06, + "loss": 0.2442, + "step": 9870 + }, + { + "epoch": 34.3, + "learning_rate": 2.6751943462897525e-06, + "loss": 0.2923, + "step": 9880 + }, + { + "epoch": 34.34, + "learning_rate": 2.6737809187279153e-06, + "loss": 0.2789, + "step": 9890 + }, + { + "epoch": 34.37, + "learning_rate": 2.6723674911660773e-06, + "loss": 0.2835, + "step": 9900 + }, + { + "epoch": 34.41, + "learning_rate": 2.67095406360424e-06, + "loss": 0.2634, + "step": 9910 + }, + { + "epoch": 34.44, + "learning_rate": 2.6695406360424025e-06, + "loss": 0.2771, + "step": 9920 + }, + { + "epoch": 34.48, + "learning_rate": 2.6681272084805653e-06, + "loss": 0.2659, + "step": 9930 + }, + { + "epoch": 34.51, + "learning_rate": 2.6667137809187278e-06, + "loss": 0.2556, + "step": 9940 + }, + { + "epoch": 34.55, + "learning_rate": 2.6653003533568906e-06, + "loss": 0.2524, + "step": 9950 + }, + { + "epoch": 34.58, + "learning_rate": 2.6638869257950526e-06, + "loss": 0.2783, + "step": 9960 + }, + { + "epoch": 34.62, + "learning_rate": 2.6624734982332154e-06, + "loss": 0.245, + "step": 9970 + }, + { + "epoch": 34.65, + "learning_rate": 2.661060070671378e-06, + "loss": 0.2642, + "step": 9980 + }, + { + "epoch": 34.69, + "learning_rate": 2.6596466431095407e-06, + "loss": 0.2945, + "step": 9990 + }, + { + "epoch": 34.72, + "learning_rate": 2.658233215547703e-06, + "loss": 0.25, + "step": 10000 + }, + { + "epoch": 34.75, + "learning_rate": 2.656819787985866e-06, + "loss": 0.2635, + "step": 10010 + }, + { + "epoch": 34.79, + "learning_rate": 2.655406360424028e-06, + "loss": 0.2492, + "step": 10020 + }, + { + "epoch": 34.82, + "learning_rate": 2.6539929328621907e-06, + "loss": 0.2789, + "step": 10030 + }, + { + "epoch": 34.86, + "learning_rate": 2.652579505300353e-06, + "loss": 0.2797, + "step": 10040 + }, + { + "epoch": 34.89, + "learning_rate": 2.651166077738516e-06, + "loss": 0.2378, + "step": 10050 + }, + { + "epoch": 34.93, + "learning_rate": 2.6497526501766784e-06, + "loss": 0.2545, + "step": 10060 + }, + { + "epoch": 34.96, + "learning_rate": 2.6483392226148408e-06, + "loss": 0.2677, + "step": 10070 + }, + { + "epoch": 35.0, + "learning_rate": 2.646925795053003e-06, + "loss": 0.2708, + "step": 10080 + }, + { + "epoch": 35.0, + "eval_loss": 0.5093948841094971, + "eval_runtime": 129.527, + "eval_samples_per_second": 4.107, + "eval_steps_per_second": 1.027, + "eval_wer": 0.19643890210194767, + "step": 10080 + }, + { + "epoch": 35.03, + "learning_rate": 2.645512367491166e-06, + "loss": 0.2628, + "step": 10090 + }, + { + "epoch": 35.07, + "learning_rate": 2.6440989399293284e-06, + "loss": 0.263, + "step": 10100 + }, + { + "epoch": 35.1, + "learning_rate": 2.6426855123674913e-06, + "loss": 0.241, + "step": 10110 + }, + { + "epoch": 35.14, + "learning_rate": 2.6412720848056537e-06, + "loss": 0.2802, + "step": 10120 + }, + { + "epoch": 35.17, + "learning_rate": 2.639858657243816e-06, + "loss": 0.2675, + "step": 10130 + }, + { + "epoch": 35.21, + "learning_rate": 2.6384452296819785e-06, + "loss": 0.2626, + "step": 10140 + }, + { + "epoch": 35.24, + "learning_rate": 2.6370318021201413e-06, + "loss": 0.2853, + "step": 10150 + }, + { + "epoch": 35.28, + "learning_rate": 2.6356183745583037e-06, + "loss": 0.2683, + "step": 10160 + }, + { + "epoch": 35.31, + "learning_rate": 2.6342049469964666e-06, + "loss": 0.269, + "step": 10170 + }, + { + "epoch": 35.35, + "learning_rate": 2.632791519434629e-06, + "loss": 0.2872, + "step": 10180 + }, + { + "epoch": 35.38, + "learning_rate": 2.6313780918727914e-06, + "loss": 0.2519, + "step": 10190 + }, + { + "epoch": 35.42, + "learning_rate": 2.629964664310954e-06, + "loss": 0.2554, + "step": 10200 + }, + { + "epoch": 35.45, + "learning_rate": 2.6285512367491166e-06, + "loss": 0.2548, + "step": 10210 + }, + { + "epoch": 35.48, + "learning_rate": 2.627137809187279e-06, + "loss": 0.291, + "step": 10220 + }, + { + "epoch": 35.52, + "learning_rate": 2.625724381625442e-06, + "loss": 0.2507, + "step": 10230 + }, + { + "epoch": 35.55, + "learning_rate": 2.624310954063604e-06, + "loss": 0.2681, + "step": 10240 + }, + { + "epoch": 35.59, + "learning_rate": 2.6228975265017667e-06, + "loss": 0.2637, + "step": 10250 + }, + { + "epoch": 35.62, + "learning_rate": 2.621484098939929e-06, + "loss": 0.2707, + "step": 10260 + }, + { + "epoch": 35.66, + "learning_rate": 2.620070671378092e-06, + "loss": 0.2784, + "step": 10270 + }, + { + "epoch": 35.69, + "learning_rate": 2.6186572438162543e-06, + "loss": 0.28, + "step": 10280 + }, + { + "epoch": 35.73, + "learning_rate": 2.617243816254417e-06, + "loss": 0.2459, + "step": 10290 + }, + { + "epoch": 35.76, + "learning_rate": 2.615830388692579e-06, + "loss": 0.2663, + "step": 10300 + }, + { + "epoch": 35.8, + "learning_rate": 2.614416961130742e-06, + "loss": 0.2546, + "step": 10310 + }, + { + "epoch": 35.83, + "learning_rate": 2.6130035335689044e-06, + "loss": 0.2632, + "step": 10320 + }, + { + "epoch": 35.87, + "learning_rate": 2.6115901060070672e-06, + "loss": 0.2692, + "step": 10330 + }, + { + "epoch": 35.9, + "learning_rate": 2.6101766784452296e-06, + "loss": 0.292, + "step": 10340 + }, + { + "epoch": 35.94, + "learning_rate": 2.608763250883392e-06, + "loss": 0.2487, + "step": 10350 + }, + { + "epoch": 35.97, + "learning_rate": 2.6073498233215545e-06, + "loss": 0.27, + "step": 10360 + }, + { + "epoch": 36.0, + "eval_loss": 0.5076168775558472, + "eval_runtime": 129.8583, + "eval_samples_per_second": 4.097, + "eval_steps_per_second": 1.024, + "eval_wer": 0.19798161599280067, + "step": 10368 + }, + { + "epoch": 36.01, + "learning_rate": 2.6059363957597173e-06, + "loss": 0.2559, + "step": 10370 + }, + { + "epoch": 36.04, + "learning_rate": 2.6045229681978797e-06, + "loss": 0.2505, + "step": 10380 + }, + { + "epoch": 36.08, + "learning_rate": 2.6031095406360425e-06, + "loss": 0.279, + "step": 10390 + }, + { + "epoch": 36.11, + "learning_rate": 2.601696113074205e-06, + "loss": 0.2585, + "step": 10400 + }, + { + "epoch": 36.15, + "learning_rate": 2.6002826855123674e-06, + "loss": 0.2484, + "step": 10410 + }, + { + "epoch": 36.18, + "learning_rate": 2.5988692579505298e-06, + "loss": 0.2734, + "step": 10420 + }, + { + "epoch": 36.21, + "learning_rate": 2.5974558303886926e-06, + "loss": 0.2707, + "step": 10430 + }, + { + "epoch": 36.25, + "learning_rate": 2.596042402826855e-06, + "loss": 0.2594, + "step": 10440 + }, + { + "epoch": 36.28, + "learning_rate": 2.594628975265018e-06, + "loss": 0.248, + "step": 10450 + }, + { + "epoch": 36.32, + "learning_rate": 2.5932155477031803e-06, + "loss": 0.2647, + "step": 10460 + }, + { + "epoch": 36.35, + "learning_rate": 2.5918021201413427e-06, + "loss": 0.2599, + "step": 10470 + }, + { + "epoch": 36.39, + "learning_rate": 2.590388692579505e-06, + "loss": 0.267, + "step": 10480 + }, + { + "epoch": 36.42, + "learning_rate": 2.588975265017668e-06, + "loss": 0.2639, + "step": 10490 + }, + { + "epoch": 36.46, + "learning_rate": 2.5875618374558303e-06, + "loss": 0.2715, + "step": 10500 + }, + { + "epoch": 36.49, + "learning_rate": 2.586148409893993e-06, + "loss": 0.3031, + "step": 10510 + }, + { + "epoch": 36.53, + "learning_rate": 2.584734982332155e-06, + "loss": 0.2996, + "step": 10520 + }, + { + "epoch": 36.56, + "learning_rate": 2.583321554770318e-06, + "loss": 0.2586, + "step": 10530 + }, + { + "epoch": 36.6, + "learning_rate": 2.5819081272084804e-06, + "loss": 0.2514, + "step": 10540 + }, + { + "epoch": 36.63, + "learning_rate": 2.580494699646643e-06, + "loss": 0.255, + "step": 10550 + }, + { + "epoch": 36.66, + "learning_rate": 2.5790812720848056e-06, + "loss": 0.2765, + "step": 10560 + }, + { + "epoch": 36.7, + "learning_rate": 2.5776678445229685e-06, + "loss": 0.2721, + "step": 10570 + }, + { + "epoch": 36.73, + "learning_rate": 2.5762544169611304e-06, + "loss": 0.2704, + "step": 10580 + }, + { + "epoch": 36.77, + "learning_rate": 2.5748409893992933e-06, + "loss": 0.2613, + "step": 10590 + }, + { + "epoch": 36.8, + "learning_rate": 2.5734275618374557e-06, + "loss": 0.2711, + "step": 10600 + }, + { + "epoch": 36.84, + "learning_rate": 2.5720141342756185e-06, + "loss": 0.2769, + "step": 10610 + }, + { + "epoch": 36.87, + "learning_rate": 2.570600706713781e-06, + "loss": 0.2635, + "step": 10620 + }, + { + "epoch": 36.91, + "learning_rate": 2.5691872791519438e-06, + "loss": 0.2655, + "step": 10630 + }, + { + "epoch": 36.94, + "learning_rate": 2.5677738515901057e-06, + "loss": 0.2689, + "step": 10640 + }, + { + "epoch": 36.98, + "learning_rate": 2.566360424028268e-06, + "loss": 0.2706, + "step": 10650 + }, + { + "epoch": 37.0, + "eval_loss": 0.5178768038749695, + "eval_runtime": 130.9202, + "eval_samples_per_second": 4.064, + "eval_steps_per_second": 1.016, + "eval_wer": 0.1983030147200617, + "step": 10656 + }, + { + "epoch": 37.01, + "learning_rate": 2.564946996466431e-06, + "loss": 0.2868, + "step": 10660 + }, + { + "epoch": 37.05, + "learning_rate": 2.5635335689045934e-06, + "loss": 0.2749, + "step": 10670 + }, + { + "epoch": 37.08, + "learning_rate": 2.5621201413427562e-06, + "loss": 0.2454, + "step": 10680 + }, + { + "epoch": 37.12, + "learning_rate": 2.5607067137809182e-06, + "loss": 0.283, + "step": 10690 + }, + { + "epoch": 37.15, + "learning_rate": 2.559293286219081e-06, + "loss": 0.2709, + "step": 10700 + }, + { + "epoch": 37.19, + "learning_rate": 2.5578798586572435e-06, + "loss": 0.2623, + "step": 10710 + }, + { + "epoch": 37.22, + "learning_rate": 2.5564664310954063e-06, + "loss": 0.2742, + "step": 10720 + }, + { + "epoch": 37.26, + "learning_rate": 2.5550530035335687e-06, + "loss": 0.2683, + "step": 10730 + }, + { + "epoch": 37.29, + "learning_rate": 2.5536395759717315e-06, + "loss": 0.251, + "step": 10740 + }, + { + "epoch": 37.33, + "learning_rate": 2.5522261484098935e-06, + "loss": 0.2613, + "step": 10750 + }, + { + "epoch": 37.36, + "learning_rate": 2.5508127208480564e-06, + "loss": 0.2655, + "step": 10760 + }, + { + "epoch": 37.39, + "learning_rate": 2.5493992932862188e-06, + "loss": 0.2723, + "step": 10770 + }, + { + "epoch": 37.43, + "learning_rate": 2.5479858657243816e-06, + "loss": 0.2675, + "step": 10780 + }, + { + "epoch": 37.46, + "learning_rate": 2.546572438162544e-06, + "loss": 0.2732, + "step": 10790 + }, + { + "epoch": 37.5, + "learning_rate": 2.545159010600707e-06, + "loss": 0.2773, + "step": 10800 + }, + { + "epoch": 37.53, + "learning_rate": 2.543745583038869e-06, + "loss": 0.2536, + "step": 10810 + }, + { + "epoch": 37.57, + "learning_rate": 2.5423321554770317e-06, + "loss": 0.2693, + "step": 10820 + }, + { + "epoch": 37.6, + "learning_rate": 2.540918727915194e-06, + "loss": 0.2498, + "step": 10830 + }, + { + "epoch": 37.64, + "learning_rate": 2.539505300353357e-06, + "loss": 0.2603, + "step": 10840 + }, + { + "epoch": 37.67, + "learning_rate": 2.5380918727915193e-06, + "loss": 0.2798, + "step": 10850 + }, + { + "epoch": 37.71, + "learning_rate": 2.5366784452296817e-06, + "loss": 0.2911, + "step": 10860 + }, + { + "epoch": 37.74, + "learning_rate": 2.535265017667844e-06, + "loss": 0.2625, + "step": 10870 + }, + { + "epoch": 37.78, + "learning_rate": 2.533851590106007e-06, + "loss": 0.2744, + "step": 10880 + }, + { + "epoch": 37.81, + "learning_rate": 2.5324381625441694e-06, + "loss": 0.2753, + "step": 10890 + }, + { + "epoch": 37.85, + "learning_rate": 2.531024734982332e-06, + "loss": 0.267, + "step": 10900 + }, + { + "epoch": 37.88, + "learning_rate": 2.5296113074204946e-06, + "loss": 0.2572, + "step": 10910 + }, + { + "epoch": 37.91, + "learning_rate": 2.528197879858657e-06, + "loss": 0.2551, + "step": 10920 + }, + { + "epoch": 37.95, + "learning_rate": 2.5267844522968194e-06, + "loss": 0.2469, + "step": 10930 + }, + { + "epoch": 37.98, + "learning_rate": 2.5253710247349823e-06, + "loss": 0.2791, + "step": 10940 + }, + { + "epoch": 38.0, + "eval_loss": 0.515429675579071, + "eval_runtime": 130.0554, + "eval_samples_per_second": 4.091, + "eval_steps_per_second": 1.023, + "eval_wer": 0.19759593752008742, + "step": 10944 + }, + { + "epoch": 38.02, + "learning_rate": 2.5239575971731447e-06, + "loss": 0.2944, + "step": 10950 + }, + { + "epoch": 38.06, + "learning_rate": 2.5225441696113075e-06, + "loss": 0.264, + "step": 10960 + }, + { + "epoch": 38.09, + "learning_rate": 2.52113074204947e-06, + "loss": 0.2722, + "step": 10970 + }, + { + "epoch": 38.12, + "learning_rate": 2.5197173144876323e-06, + "loss": 0.2692, + "step": 10980 + }, + { + "epoch": 38.16, + "learning_rate": 2.5183038869257947e-06, + "loss": 0.2607, + "step": 10990 + }, + { + "epoch": 38.19, + "learning_rate": 2.5168904593639576e-06, + "loss": 0.2412, + "step": 11000 + }, + { + "epoch": 38.23, + "learning_rate": 2.51547703180212e-06, + "loss": 0.2621, + "step": 11010 + }, + { + "epoch": 38.26, + "learning_rate": 2.514063604240283e-06, + "loss": 0.2383, + "step": 11020 + }, + { + "epoch": 38.3, + "learning_rate": 2.512650176678445e-06, + "loss": 0.2608, + "step": 11030 + }, + { + "epoch": 38.33, + "learning_rate": 2.5112367491166076e-06, + "loss": 0.2865, + "step": 11040 + }, + { + "epoch": 38.37, + "learning_rate": 2.50982332155477e-06, + "loss": 0.2529, + "step": 11050 + }, + { + "epoch": 38.4, + "learning_rate": 2.508409893992933e-06, + "loss": 0.2468, + "step": 11060 + }, + { + "epoch": 38.44, + "learning_rate": 2.5069964664310953e-06, + "loss": 0.2767, + "step": 11070 + }, + { + "epoch": 38.47, + "learning_rate": 2.505583038869258e-06, + "loss": 0.2832, + "step": 11080 + }, + { + "epoch": 38.51, + "learning_rate": 2.50416961130742e-06, + "loss": 0.2732, + "step": 11090 + }, + { + "epoch": 38.54, + "learning_rate": 2.502756183745583e-06, + "loss": 0.2604, + "step": 11100 + }, + { + "epoch": 38.57, + "learning_rate": 2.5013427561837453e-06, + "loss": 0.2797, + "step": 11110 + }, + { + "epoch": 38.61, + "learning_rate": 2.499929328621908e-06, + "loss": 0.2548, + "step": 11120 + }, + { + "epoch": 38.64, + "learning_rate": 2.4985159010600706e-06, + "loss": 0.2735, + "step": 11130 + }, + { + "epoch": 38.68, + "learning_rate": 2.497102473498233e-06, + "loss": 0.2544, + "step": 11140 + }, + { + "epoch": 38.71, + "learning_rate": 2.4956890459363954e-06, + "loss": 0.2744, + "step": 11150 + }, + { + "epoch": 38.75, + "learning_rate": 2.4942756183745582e-06, + "loss": 0.2696, + "step": 11160 + }, + { + "epoch": 38.78, + "learning_rate": 2.4928621908127206e-06, + "loss": 0.2339, + "step": 11170 + }, + { + "epoch": 38.82, + "learning_rate": 2.4914487632508835e-06, + "loss": 0.2658, + "step": 11180 + }, + { + "epoch": 38.85, + "learning_rate": 2.490035335689046e-06, + "loss": 0.2626, + "step": 11190 + }, + { + "epoch": 38.89, + "learning_rate": 2.4886219081272083e-06, + "loss": 0.2592, + "step": 11200 + }, + { + "epoch": 38.92, + "learning_rate": 2.4872084805653707e-06, + "loss": 0.2644, + "step": 11210 + }, + { + "epoch": 38.96, + "learning_rate": 2.4857950530035335e-06, + "loss": 0.2661, + "step": 11220 + }, + { + "epoch": 38.99, + "learning_rate": 2.484381625441696e-06, + "loss": 0.3148, + "step": 11230 + }, + { + "epoch": 39.0, + "eval_loss": 0.5082433223724365, + "eval_runtime": 132.6404, + "eval_samples_per_second": 4.011, + "eval_steps_per_second": 1.003, + "eval_wer": 0.199010091920036, + "step": 11232 + }, + { + "epoch": 39.03, + "learning_rate": 2.4829681978798588e-06, + "loss": 0.261, + "step": 11240 + }, + { + "epoch": 39.06, + "learning_rate": 2.481554770318021e-06, + "loss": 0.2706, + "step": 11250 + }, + { + "epoch": 39.1, + "learning_rate": 2.4801413427561836e-06, + "loss": 0.2532, + "step": 11260 + }, + { + "epoch": 39.13, + "learning_rate": 2.478727915194346e-06, + "loss": 0.2841, + "step": 11270 + }, + { + "epoch": 39.17, + "learning_rate": 2.477314487632509e-06, + "loss": 0.2502, + "step": 11280 + }, + { + "epoch": 39.2, + "learning_rate": 2.4759010600706713e-06, + "loss": 0.2579, + "step": 11290 + }, + { + "epoch": 39.24, + "learning_rate": 2.474487632508834e-06, + "loss": 0.2768, + "step": 11300 + }, + { + "epoch": 39.27, + "learning_rate": 2.473074204946996e-06, + "loss": 0.2351, + "step": 11310 + }, + { + "epoch": 39.3, + "learning_rate": 2.471660777385159e-06, + "loss": 0.2888, + "step": 11320 + }, + { + "epoch": 39.34, + "learning_rate": 2.4702473498233213e-06, + "loss": 0.2852, + "step": 11330 + }, + { + "epoch": 39.37, + "learning_rate": 2.468833922261484e-06, + "loss": 0.2604, + "step": 11340 + }, + { + "epoch": 39.41, + "learning_rate": 2.4674204946996466e-06, + "loss": 0.2629, + "step": 11350 + }, + { + "epoch": 39.44, + "learning_rate": 2.4660070671378094e-06, + "loss": 0.2291, + "step": 11360 + }, + { + "epoch": 39.48, + "learning_rate": 2.4645936395759714e-06, + "loss": 0.2684, + "step": 11370 + }, + { + "epoch": 39.51, + "learning_rate": 2.4631802120141342e-06, + "loss": 0.2635, + "step": 11380 + }, + { + "epoch": 39.55, + "learning_rate": 2.4617667844522966e-06, + "loss": 0.2524, + "step": 11390 + }, + { + "epoch": 39.58, + "learning_rate": 2.4603533568904595e-06, + "loss": 0.2813, + "step": 11400 + }, + { + "epoch": 39.62, + "learning_rate": 2.458939929328622e-06, + "loss": 0.2778, + "step": 11410 + }, + { + "epoch": 39.65, + "learning_rate": 2.4575265017667847e-06, + "loss": 0.2845, + "step": 11420 + }, + { + "epoch": 39.69, + "learning_rate": 2.4561130742049467e-06, + "loss": 0.2779, + "step": 11430 + }, + { + "epoch": 39.72, + "learning_rate": 2.4546996466431095e-06, + "loss": 0.2418, + "step": 11440 + }, + { + "epoch": 39.75, + "learning_rate": 2.453286219081272e-06, + "loss": 0.2493, + "step": 11450 + }, + { + "epoch": 39.79, + "learning_rate": 2.4518727915194348e-06, + "loss": 0.2677, + "step": 11460 + }, + { + "epoch": 39.82, + "learning_rate": 2.450459363957597e-06, + "loss": 0.2747, + "step": 11470 + }, + { + "epoch": 39.86, + "learning_rate": 2.4490459363957596e-06, + "loss": 0.2768, + "step": 11480 + }, + { + "epoch": 39.89, + "learning_rate": 2.447632508833922e-06, + "loss": 0.2705, + "step": 11490 + }, + { + "epoch": 39.93, + "learning_rate": 2.446219081272085e-06, + "loss": 0.2486, + "step": 11500 + }, + { + "epoch": 39.96, + "learning_rate": 2.4448056537102472e-06, + "loss": 0.2852, + "step": 11510 + }, + { + "epoch": 40.0, + "learning_rate": 2.44339222614841e-06, + "loss": 0.2834, + "step": 11520 + }, + { + "epoch": 40.0, + "eval_loss": 0.5106706023216248, + "eval_runtime": 132.6333, + "eval_samples_per_second": 4.011, + "eval_steps_per_second": 1.003, + "eval_wer": 0.19804589573825288, + "step": 11520 + }, + { + "epoch": 40.03, + "learning_rate": 2.4419787985865725e-06, + "loss": 0.2684, + "step": 11530 + }, + { + "epoch": 40.07, + "learning_rate": 2.440565371024735e-06, + "loss": 0.2851, + "step": 11540 + }, + { + "epoch": 40.1, + "learning_rate": 2.4391519434628973e-06, + "loss": 0.2619, + "step": 11550 + }, + { + "epoch": 40.14, + "learning_rate": 2.43773851590106e-06, + "loss": 0.2778, + "step": 11560 + }, + { + "epoch": 40.17, + "learning_rate": 2.4363250883392225e-06, + "loss": 0.2822, + "step": 11570 + }, + { + "epoch": 40.21, + "learning_rate": 2.4349116607773854e-06, + "loss": 0.2447, + "step": 11580 + }, + { + "epoch": 40.24, + "learning_rate": 2.4334982332155478e-06, + "loss": 0.2741, + "step": 11590 + }, + { + "epoch": 40.28, + "learning_rate": 2.43208480565371e-06, + "loss": 0.2678, + "step": 11600 + }, + { + "epoch": 40.31, + "learning_rate": 2.4306713780918726e-06, + "loss": 0.2677, + "step": 11610 + }, + { + "epoch": 40.35, + "learning_rate": 2.4292579505300354e-06, + "loss": 0.2553, + "step": 11620 + }, + { + "epoch": 40.38, + "learning_rate": 2.427844522968198e-06, + "loss": 0.262, + "step": 11630 + }, + { + "epoch": 40.42, + "learning_rate": 2.4264310954063607e-06, + "loss": 0.2346, + "step": 11640 + }, + { + "epoch": 40.45, + "learning_rate": 2.4250176678445227e-06, + "loss": 0.2454, + "step": 11650 + }, + { + "epoch": 40.48, + "learning_rate": 2.4236042402826855e-06, + "loss": 0.2916, + "step": 11660 + }, + { + "epoch": 40.52, + "learning_rate": 2.422190812720848e-06, + "loss": 0.2796, + "step": 11670 + }, + { + "epoch": 40.55, + "learning_rate": 2.4207773851590107e-06, + "loss": 0.2665, + "step": 11680 + }, + { + "epoch": 40.59, + "learning_rate": 2.419363957597173e-06, + "loss": 0.2589, + "step": 11690 + }, + { + "epoch": 40.62, + "learning_rate": 2.417950530035336e-06, + "loss": 0.2391, + "step": 11700 + }, + { + "epoch": 40.66, + "learning_rate": 2.416537102473498e-06, + "loss": 0.2641, + "step": 11710 + }, + { + "epoch": 40.69, + "learning_rate": 2.4151236749116604e-06, + "loss": 0.2821, + "step": 11720 + }, + { + "epoch": 40.73, + "learning_rate": 2.413710247349823e-06, + "loss": 0.2595, + "step": 11730 + }, + { + "epoch": 40.76, + "learning_rate": 2.4122968197879856e-06, + "loss": 0.2632, + "step": 11740 + }, + { + "epoch": 40.8, + "learning_rate": 2.4108833922261484e-06, + "loss": 0.2707, + "step": 11750 + }, + { + "epoch": 40.83, + "learning_rate": 2.4094699646643104e-06, + "loss": 0.2821, + "step": 11760 + }, + { + "epoch": 40.87, + "learning_rate": 2.4080565371024733e-06, + "loss": 0.27, + "step": 11770 + }, + { + "epoch": 40.9, + "learning_rate": 2.4066431095406357e-06, + "loss": 0.2556, + "step": 11780 + }, + { + "epoch": 40.94, + "learning_rate": 2.4052296819787985e-06, + "loss": 0.2552, + "step": 11790 + }, + { + "epoch": 40.97, + "learning_rate": 2.403816254416961e-06, + "loss": 0.2739, + "step": 11800 + }, + { + "epoch": 41.0, + "eval_loss": 0.5009294152259827, + "eval_runtime": 134.0218, + "eval_samples_per_second": 3.97, + "eval_steps_per_second": 0.992, + "eval_wer": 0.199010091920036, + "step": 11808 + }, + { + "epoch": 41.01, + "learning_rate": 2.4024028268551238e-06, + "loss": 0.2686, + "step": 11810 + }, + { + "epoch": 41.04, + "learning_rate": 2.4009893992932857e-06, + "loss": 0.2519, + "step": 11820 + }, + { + "epoch": 41.08, + "learning_rate": 2.3995759717314486e-06, + "loss": 0.2594, + "step": 11830 + }, + { + "epoch": 41.11, + "learning_rate": 2.398162544169611e-06, + "loss": 0.2581, + "step": 11840 + }, + { + "epoch": 41.15, + "learning_rate": 2.396749116607774e-06, + "loss": 0.2805, + "step": 11850 + }, + { + "epoch": 41.18, + "learning_rate": 2.3953356890459362e-06, + "loss": 0.2676, + "step": 11860 + }, + { + "epoch": 41.21, + "learning_rate": 2.393922261484099e-06, + "loss": 0.266, + "step": 11870 + }, + { + "epoch": 41.25, + "learning_rate": 2.392508833922261e-06, + "loss": 0.2659, + "step": 11880 + }, + { + "epoch": 41.28, + "learning_rate": 2.391095406360424e-06, + "loss": 0.2744, + "step": 11890 + }, + { + "epoch": 41.32, + "learning_rate": 2.3896819787985863e-06, + "loss": 0.2645, + "step": 11900 + }, + { + "epoch": 41.35, + "learning_rate": 2.388268551236749e-06, + "loss": 0.2566, + "step": 11910 + }, + { + "epoch": 41.39, + "learning_rate": 2.3868551236749115e-06, + "loss": 0.2739, + "step": 11920 + }, + { + "epoch": 41.42, + "learning_rate": 2.385441696113074e-06, + "loss": 0.2716, + "step": 11930 + }, + { + "epoch": 41.46, + "learning_rate": 2.3840282685512363e-06, + "loss": 0.2489, + "step": 11940 + }, + { + "epoch": 41.49, + "learning_rate": 2.382614840989399e-06, + "loss": 0.2852, + "step": 11950 + }, + { + "epoch": 41.53, + "learning_rate": 2.3812014134275616e-06, + "loss": 0.2709, + "step": 11960 + }, + { + "epoch": 41.56, + "learning_rate": 2.3797879858657244e-06, + "loss": 0.274, + "step": 11970 + }, + { + "epoch": 41.6, + "learning_rate": 2.378374558303887e-06, + "loss": 0.2656, + "step": 11980 + }, + { + "epoch": 41.63, + "learning_rate": 2.3769611307420492e-06, + "loss": 0.2745, + "step": 11990 + }, + { + "epoch": 41.66, + "learning_rate": 2.3755477031802117e-06, + "loss": 0.2757, + "step": 12000 + }, + { + "epoch": 41.7, + "learning_rate": 2.3741342756183745e-06, + "loss": 0.2799, + "step": 12010 + }, + { + "epoch": 41.73, + "learning_rate": 2.372720848056537e-06, + "loss": 0.2521, + "step": 12020 + }, + { + "epoch": 41.77, + "learning_rate": 2.3713074204946997e-06, + "loss": 0.2568, + "step": 12030 + }, + { + "epoch": 41.8, + "learning_rate": 2.369893992932862e-06, + "loss": 0.2557, + "step": 12040 + }, + { + "epoch": 41.84, + "learning_rate": 2.3684805653710245e-06, + "loss": 0.2617, + "step": 12050 + }, + { + "epoch": 41.87, + "learning_rate": 2.367067137809187e-06, + "loss": 0.2595, + "step": 12060 + }, + { + "epoch": 41.91, + "learning_rate": 2.36565371024735e-06, + "loss": 0.2647, + "step": 12070 + }, + { + "epoch": 41.94, + "learning_rate": 2.364240282685512e-06, + "loss": 0.2544, + "step": 12080 + }, + { + "epoch": 41.98, + "learning_rate": 2.362826855123675e-06, + "loss": 0.2687, + "step": 12090 + }, + { + "epoch": 42.0, + "eval_loss": 0.5231707692146301, + "eval_runtime": 133.0554, + "eval_samples_per_second": 3.998, + "eval_steps_per_second": 1.0, + "eval_wer": 0.20113132351995885, + "step": 12096 + }, + { + "epoch": 42.01, + "learning_rate": 2.361413427561837e-06, + "loss": 0.288, + "step": 12100 + }, + { + "epoch": 42.05, + "learning_rate": 2.36e-06, + "loss": 0.2828, + "step": 12110 + }, + { + "epoch": 42.08, + "learning_rate": 2.3585865724381623e-06, + "loss": 0.267, + "step": 12120 + }, + { + "epoch": 42.12, + "learning_rate": 2.357173144876325e-06, + "loss": 0.2614, + "step": 12130 + }, + { + "epoch": 42.15, + "learning_rate": 2.3557597173144875e-06, + "loss": 0.2614, + "step": 12140 + }, + { + "epoch": 42.19, + "learning_rate": 2.3543462897526503e-06, + "loss": 0.2936, + "step": 12150 + }, + { + "epoch": 42.22, + "learning_rate": 2.3529328621908123e-06, + "loss": 0.2661, + "step": 12160 + }, + { + "epoch": 42.26, + "learning_rate": 2.351519434628975e-06, + "loss": 0.2655, + "step": 12170 + }, + { + "epoch": 42.29, + "learning_rate": 2.3501060070671376e-06, + "loss": 0.2874, + "step": 12180 + }, + { + "epoch": 42.33, + "learning_rate": 2.3486925795053004e-06, + "loss": 0.2629, + "step": 12190 + }, + { + "epoch": 42.36, + "learning_rate": 2.347279151943463e-06, + "loss": 0.2498, + "step": 12200 + }, + { + "epoch": 42.39, + "learning_rate": 2.3458657243816256e-06, + "loss": 0.2821, + "step": 12210 + }, + { + "epoch": 42.43, + "learning_rate": 2.3444522968197876e-06, + "loss": 0.2461, + "step": 12220 + }, + { + "epoch": 42.46, + "learning_rate": 2.3430388692579505e-06, + "loss": 0.2809, + "step": 12230 + }, + { + "epoch": 42.5, + "learning_rate": 2.341625441696113e-06, + "loss": 0.2653, + "step": 12240 + }, + { + "epoch": 42.53, + "learning_rate": 2.3402120141342757e-06, + "loss": 0.2616, + "step": 12250 + }, + { + "epoch": 42.57, + "learning_rate": 2.338798586572438e-06, + "loss": 0.261, + "step": 12260 + }, + { + "epoch": 42.6, + "learning_rate": 2.3373851590106005e-06, + "loss": 0.2511, + "step": 12270 + }, + { + "epoch": 42.64, + "learning_rate": 2.335971731448763e-06, + "loss": 0.2572, + "step": 12280 + }, + { + "epoch": 42.67, + "learning_rate": 2.3345583038869258e-06, + "loss": 0.2928, + "step": 12290 + }, + { + "epoch": 42.71, + "learning_rate": 2.333144876325088e-06, + "loss": 0.2539, + "step": 12300 + }, + { + "epoch": 42.74, + "learning_rate": 2.331731448763251e-06, + "loss": 0.2707, + "step": 12310 + }, + { + "epoch": 42.78, + "learning_rate": 2.3303180212014134e-06, + "loss": 0.2607, + "step": 12320 + }, + { + "epoch": 42.81, + "learning_rate": 2.328904593639576e-06, + "loss": 0.2695, + "step": 12330 + }, + { + "epoch": 42.85, + "learning_rate": 2.3274911660777382e-06, + "loss": 0.2836, + "step": 12340 + }, + { + "epoch": 42.88, + "learning_rate": 2.326077738515901e-06, + "loss": 0.2677, + "step": 12350 + }, + { + "epoch": 42.91, + "learning_rate": 2.3246643109540635e-06, + "loss": 0.2583, + "step": 12360 + }, + { + "epoch": 42.95, + "learning_rate": 2.3232508833922263e-06, + "loss": 0.2554, + "step": 12370 + }, + { + "epoch": 42.98, + "learning_rate": 2.3218374558303883e-06, + "loss": 0.2696, + "step": 12380 + }, + { + "epoch": 43.0, + "eval_loss": 0.5108169913291931, + "eval_runtime": 133.4619, + "eval_samples_per_second": 3.986, + "eval_steps_per_second": 0.997, + "eval_wer": 0.19862441344732276, + "step": 12384 + }, + { + "epoch": 43.02, + "learning_rate": 2.320424028268551e-06, + "loss": 0.2739, + "step": 12390 + }, + { + "epoch": 43.06, + "learning_rate": 2.3190106007067135e-06, + "loss": 0.2612, + "step": 12400 + }, + { + "epoch": 43.09, + "learning_rate": 2.3175971731448764e-06, + "loss": 0.2596, + "step": 12410 + }, + { + "epoch": 43.12, + "learning_rate": 2.3161837455830388e-06, + "loss": 0.2777, + "step": 12420 + }, + { + "epoch": 43.16, + "learning_rate": 2.3147703180212016e-06, + "loss": 0.2487, + "step": 12430 + }, + { + "epoch": 43.19, + "learning_rate": 2.3133568904593636e-06, + "loss": 0.2452, + "step": 12440 + }, + { + "epoch": 43.23, + "learning_rate": 2.3119434628975264e-06, + "loss": 0.2495, + "step": 12450 + }, + { + "epoch": 43.26, + "learning_rate": 2.310530035335689e-06, + "loss": 0.2412, + "step": 12460 + }, + { + "epoch": 43.3, + "learning_rate": 2.3091166077738517e-06, + "loss": 0.2515, + "step": 12470 + }, + { + "epoch": 43.33, + "learning_rate": 2.307703180212014e-06, + "loss": 0.2955, + "step": 12480 + }, + { + "epoch": 43.37, + "learning_rate": 2.306289752650177e-06, + "loss": 0.2725, + "step": 12490 + }, + { + "epoch": 43.4, + "learning_rate": 2.304876325088339e-06, + "loss": 0.2414, + "step": 12500 + }, + { + "epoch": 43.44, + "learning_rate": 2.3034628975265017e-06, + "loss": 0.251, + "step": 12510 + }, + { + "epoch": 43.47, + "learning_rate": 2.302049469964664e-06, + "loss": 0.2579, + "step": 12520 + }, + { + "epoch": 43.51, + "learning_rate": 2.300636042402827e-06, + "loss": 0.2531, + "step": 12530 + }, + { + "epoch": 43.54, + "learning_rate": 2.2992226148409894e-06, + "loss": 0.247, + "step": 12540 + }, + { + "epoch": 43.57, + "learning_rate": 2.297809187279152e-06, + "loss": 0.278, + "step": 12550 + }, + { + "epoch": 43.61, + "learning_rate": 2.296395759717314e-06, + "loss": 0.2435, + "step": 12560 + }, + { + "epoch": 43.64, + "learning_rate": 2.294982332155477e-06, + "loss": 0.258, + "step": 12570 + }, + { + "epoch": 43.68, + "learning_rate": 2.2935689045936395e-06, + "loss": 0.2659, + "step": 12580 + }, + { + "epoch": 43.71, + "learning_rate": 2.2921554770318023e-06, + "loss": 0.2554, + "step": 12590 + }, + { + "epoch": 43.75, + "learning_rate": 2.2907420494699647e-06, + "loss": 0.2671, + "step": 12600 + }, + { + "epoch": 43.78, + "learning_rate": 2.289328621908127e-06, + "loss": 0.26, + "step": 12610 + }, + { + "epoch": 43.82, + "learning_rate": 2.2879151943462895e-06, + "loss": 0.2791, + "step": 12620 + }, + { + "epoch": 43.85, + "learning_rate": 2.2865017667844523e-06, + "loss": 0.2532, + "step": 12630 + }, + { + "epoch": 43.89, + "learning_rate": 2.2850883392226148e-06, + "loss": 0.2759, + "step": 12640 + }, + { + "epoch": 43.92, + "learning_rate": 2.2836749116607776e-06, + "loss": 0.2659, + "step": 12650 + }, + { + "epoch": 43.96, + "learning_rate": 2.28226148409894e-06, + "loss": 0.2672, + "step": 12660 + }, + { + "epoch": 43.99, + "learning_rate": 2.2808480565371024e-06, + "loss": 0.2729, + "step": 12670 + }, + { + "epoch": 44.0, + "eval_loss": 0.5158911943435669, + "eval_runtime": 133.2183, + "eval_samples_per_second": 3.993, + "eval_steps_per_second": 0.998, + "eval_wer": 0.1990743716654882, + "step": 12672 + }, + { + "epoch": 44.03, + "learning_rate": 2.279434628975265e-06, + "loss": 0.2755, + "step": 12680 + }, + { + "epoch": 44.06, + "learning_rate": 2.2780212014134277e-06, + "loss": 0.2787, + "step": 12690 + }, + { + "epoch": 44.1, + "learning_rate": 2.27660777385159e-06, + "loss": 0.2539, + "step": 12700 + }, + { + "epoch": 44.13, + "learning_rate": 2.275194346289753e-06, + "loss": 0.2686, + "step": 12710 + }, + { + "epoch": 44.17, + "learning_rate": 2.273780918727915e-06, + "loss": 0.2883, + "step": 12720 + }, + { + "epoch": 44.2, + "learning_rate": 2.2723674911660777e-06, + "loss": 0.2573, + "step": 12730 + }, + { + "epoch": 44.24, + "learning_rate": 2.27095406360424e-06, + "loss": 0.2739, + "step": 12740 + }, + { + "epoch": 44.27, + "learning_rate": 2.269540636042403e-06, + "loss": 0.2749, + "step": 12750 + }, + { + "epoch": 44.3, + "learning_rate": 2.2681272084805654e-06, + "loss": 0.275, + "step": 12760 + }, + { + "epoch": 44.34, + "learning_rate": 2.266713780918728e-06, + "loss": 0.2766, + "step": 12770 + }, + { + "epoch": 44.37, + "learning_rate": 2.26530035335689e-06, + "loss": 0.2475, + "step": 12780 + }, + { + "epoch": 44.41, + "learning_rate": 2.2638869257950526e-06, + "loss": 0.2739, + "step": 12790 + }, + { + "epoch": 44.44, + "learning_rate": 2.2624734982332154e-06, + "loss": 0.2448, + "step": 12800 + }, + { + "epoch": 44.48, + "learning_rate": 2.2610600706713783e-06, + "loss": 0.2801, + "step": 12810 + }, + { + "epoch": 44.51, + "learning_rate": 2.2596466431095407e-06, + "loss": 0.2575, + "step": 12820 + }, + { + "epoch": 44.55, + "learning_rate": 2.2582332155477035e-06, + "loss": 0.249, + "step": 12830 + }, + { + "epoch": 44.58, + "learning_rate": 2.2568197879858655e-06, + "loss": 0.2546, + "step": 12840 + }, + { + "epoch": 44.62, + "learning_rate": 2.255406360424028e-06, + "loss": 0.2462, + "step": 12850 + }, + { + "epoch": 44.65, + "learning_rate": 2.2539929328621907e-06, + "loss": 0.2588, + "step": 12860 + }, + { + "epoch": 44.69, + "learning_rate": 2.252579505300353e-06, + "loss": 0.2569, + "step": 12870 + }, + { + "epoch": 44.72, + "learning_rate": 2.251166077738516e-06, + "loss": 0.2515, + "step": 12880 + }, + { + "epoch": 44.75, + "learning_rate": 2.249752650176678e-06, + "loss": 0.2564, + "step": 12890 + }, + { + "epoch": 44.79, + "learning_rate": 2.248339222614841e-06, + "loss": 0.2579, + "step": 12900 + }, + { + "epoch": 44.82, + "learning_rate": 2.246925795053003e-06, + "loss": 0.2831, + "step": 12910 + }, + { + "epoch": 44.86, + "learning_rate": 2.245512367491166e-06, + "loss": 0.2546, + "step": 12920 + }, + { + "epoch": 44.89, + "learning_rate": 2.2440989399293284e-06, + "loss": 0.2653, + "step": 12930 + }, + { + "epoch": 44.93, + "learning_rate": 2.2426855123674913e-06, + "loss": 0.2527, + "step": 12940 + }, + { + "epoch": 44.96, + "learning_rate": 2.2412720848056533e-06, + "loss": 0.2692, + "step": 12950 + }, + { + "epoch": 45.0, + "learning_rate": 2.239858657243816e-06, + "loss": 0.2579, + "step": 12960 + }, + { + "epoch": 45.0, + "eval_loss": 0.516213059425354, + "eval_runtime": 133.2787, + "eval_samples_per_second": 3.992, + "eval_steps_per_second": 0.998, + "eval_wer": 0.19913865141094042, + "step": 12960 + }, + { + "epoch": 45.03, + "learning_rate": 2.2384452296819785e-06, + "loss": 0.273, + "step": 12970 + }, + { + "epoch": 45.07, + "learning_rate": 2.2370318021201413e-06, + "loss": 0.2757, + "step": 12980 + }, + { + "epoch": 45.1, + "learning_rate": 2.2356183745583037e-06, + "loss": 0.2461, + "step": 12990 + }, + { + "epoch": 45.14, + "learning_rate": 2.234204946996466e-06, + "loss": 0.2693, + "step": 13000 + }, + { + "epoch": 45.17, + "learning_rate": 2.2327915194346286e-06, + "loss": 0.2596, + "step": 13010 + }, + { + "epoch": 45.21, + "learning_rate": 2.2313780918727914e-06, + "loss": 0.2436, + "step": 13020 + }, + { + "epoch": 45.24, + "learning_rate": 2.229964664310954e-06, + "loss": 0.2484, + "step": 13030 + }, + { + "epoch": 45.28, + "learning_rate": 2.2285512367491166e-06, + "loss": 0.2378, + "step": 13040 + }, + { + "epoch": 45.31, + "learning_rate": 2.227137809187279e-06, + "loss": 0.2688, + "step": 13050 + }, + { + "epoch": 45.35, + "learning_rate": 2.2257243816254415e-06, + "loss": 0.2768, + "step": 13060 + }, + { + "epoch": 45.38, + "learning_rate": 2.224310954063604e-06, + "loss": 0.2626, + "step": 13070 + }, + { + "epoch": 45.42, + "learning_rate": 2.2228975265017667e-06, + "loss": 0.2602, + "step": 13080 + }, + { + "epoch": 45.45, + "learning_rate": 2.221484098939929e-06, + "loss": 0.2623, + "step": 13090 + }, + { + "epoch": 45.48, + "learning_rate": 2.220070671378092e-06, + "loss": 0.2782, + "step": 13100 + }, + { + "epoch": 45.52, + "learning_rate": 2.2186572438162544e-06, + "loss": 0.2689, + "step": 13110 + }, + { + "epoch": 45.55, + "learning_rate": 2.2172438162544168e-06, + "loss": 0.2642, + "step": 13120 + }, + { + "epoch": 45.59, + "learning_rate": 2.215830388692579e-06, + "loss": 0.2557, + "step": 13130 + }, + { + "epoch": 45.62, + "learning_rate": 2.214416961130742e-06, + "loss": 0.2737, + "step": 13140 + }, + { + "epoch": 45.66, + "learning_rate": 2.2130035335689044e-06, + "loss": 0.2703, + "step": 13150 + }, + { + "epoch": 45.69, + "learning_rate": 2.2115901060070673e-06, + "loss": 0.2737, + "step": 13160 + }, + { + "epoch": 45.73, + "learning_rate": 2.2101766784452292e-06, + "loss": 0.264, + "step": 13170 + }, + { + "epoch": 45.76, + "learning_rate": 2.208763250883392e-06, + "loss": 0.2595, + "step": 13180 + }, + { + "epoch": 45.8, + "learning_rate": 2.2073498233215545e-06, + "loss": 0.2488, + "step": 13190 + }, + { + "epoch": 45.83, + "learning_rate": 2.2059363957597173e-06, + "loss": 0.2766, + "step": 13200 + }, + { + "epoch": 45.87, + "learning_rate": 2.2045229681978797e-06, + "loss": 0.253, + "step": 13210 + }, + { + "epoch": 45.9, + "learning_rate": 2.2031095406360426e-06, + "loss": 0.2589, + "step": 13220 + }, + { + "epoch": 45.94, + "learning_rate": 2.2016961130742045e-06, + "loss": 0.2794, + "step": 13230 + }, + { + "epoch": 45.97, + "learning_rate": 2.2002826855123674e-06, + "loss": 0.283, + "step": 13240 + }, + { + "epoch": 46.0, + "eval_loss": 0.5031996369361877, + "eval_runtime": 133.0395, + "eval_samples_per_second": 3.999, + "eval_steps_per_second": 1.0, + "eval_wer": 0.1981744552291573, + "step": 13248 + }, + { + "epoch": 46.01, + "learning_rate": 2.1988692579505298e-06, + "loss": 0.2882, + "step": 13250 + }, + { + "epoch": 46.04, + "learning_rate": 2.1974558303886926e-06, + "loss": 0.2563, + "step": 13260 + }, + { + "epoch": 46.08, + "learning_rate": 2.196042402826855e-06, + "loss": 0.2821, + "step": 13270 + }, + { + "epoch": 46.11, + "learning_rate": 2.194628975265018e-06, + "loss": 0.2555, + "step": 13280 + }, + { + "epoch": 46.15, + "learning_rate": 2.19321554770318e-06, + "loss": 0.2765, + "step": 13290 + }, + { + "epoch": 46.18, + "learning_rate": 2.1918021201413427e-06, + "loss": 0.2745, + "step": 13300 + }, + { + "epoch": 46.21, + "learning_rate": 2.190388692579505e-06, + "loss": 0.2667, + "step": 13310 + }, + { + "epoch": 46.25, + "learning_rate": 2.188975265017668e-06, + "loss": 0.2759, + "step": 13320 + }, + { + "epoch": 46.28, + "learning_rate": 2.1875618374558303e-06, + "loss": 0.2642, + "step": 13330 + }, + { + "epoch": 46.32, + "learning_rate": 2.1861484098939927e-06, + "loss": 0.2702, + "step": 13340 + }, + { + "epoch": 46.35, + "learning_rate": 2.184734982332155e-06, + "loss": 0.2689, + "step": 13350 + }, + { + "epoch": 46.39, + "learning_rate": 2.183321554770318e-06, + "loss": 0.2657, + "step": 13360 + }, + { + "epoch": 46.42, + "learning_rate": 2.1819081272084804e-06, + "loss": 0.2431, + "step": 13370 + }, + { + "epoch": 46.46, + "learning_rate": 2.1804946996466432e-06, + "loss": 0.2472, + "step": 13380 + }, + { + "epoch": 46.49, + "learning_rate": 2.1790812720848056e-06, + "loss": 0.2774, + "step": 13390 + }, + { + "epoch": 46.53, + "learning_rate": 2.177667844522968e-06, + "loss": 0.2459, + "step": 13400 + }, + { + "epoch": 46.56, + "learning_rate": 2.1762544169611305e-06, + "loss": 0.269, + "step": 13410 + }, + { + "epoch": 46.6, + "learning_rate": 2.1748409893992933e-06, + "loss": 0.2489, + "step": 13420 + }, + { + "epoch": 46.63, + "learning_rate": 2.1734275618374557e-06, + "loss": 0.2567, + "step": 13430 + }, + { + "epoch": 46.66, + "learning_rate": 2.1720141342756185e-06, + "loss": 0.2636, + "step": 13440 + }, + { + "epoch": 46.7, + "learning_rate": 2.170600706713781e-06, + "loss": 0.2421, + "step": 13450 + }, + { + "epoch": 46.73, + "learning_rate": 2.1691872791519434e-06, + "loss": 0.2446, + "step": 13460 + }, + { + "epoch": 46.77, + "learning_rate": 2.1677738515901058e-06, + "loss": 0.2593, + "step": 13470 + }, + { + "epoch": 46.8, + "learning_rate": 2.1663604240282686e-06, + "loss": 0.2525, + "step": 13480 + }, + { + "epoch": 46.84, + "learning_rate": 2.164946996466431e-06, + "loss": 0.2719, + "step": 13490 + }, + { + "epoch": 46.87, + "learning_rate": 2.163533568904594e-06, + "loss": 0.2601, + "step": 13500 + }, + { + "epoch": 46.91, + "learning_rate": 2.162120141342756e-06, + "loss": 0.2798, + "step": 13510 + }, + { + "epoch": 46.94, + "learning_rate": 2.1608480565371027e-06, + "loss": 0.2435, + "step": 13520 + }, + { + "epoch": 46.98, + "learning_rate": 2.1594346289752647e-06, + "loss": 0.282, + "step": 13530 + }, + { + "epoch": 47.0, + "eval_loss": 0.5107125639915466, + "eval_runtime": 133.7168, + "eval_samples_per_second": 3.979, + "eval_steps_per_second": 0.995, + "eval_wer": 0.19804589573825288, + "step": 13536 + }, + { + "epoch": 47.01, + "learning_rate": 2.1580212014134275e-06, + "loss": 0.2783, + "step": 13540 + }, + { + "epoch": 47.05, + "learning_rate": 2.15660777385159e-06, + "loss": 0.2695, + "step": 13550 + }, + { + "epoch": 47.08, + "learning_rate": 2.1551943462897528e-06, + "loss": 0.2469, + "step": 13560 + }, + { + "epoch": 47.12, + "learning_rate": 2.153780918727915e-06, + "loss": 0.2757, + "step": 13570 + }, + { + "epoch": 47.15, + "learning_rate": 2.152367491166078e-06, + "loss": 0.2721, + "step": 13580 + }, + { + "epoch": 47.19, + "learning_rate": 2.15095406360424e-06, + "loss": 0.2529, + "step": 13590 + }, + { + "epoch": 47.22, + "learning_rate": 2.149540636042403e-06, + "loss": 0.2562, + "step": 13600 + }, + { + "epoch": 47.26, + "learning_rate": 2.1481272084805652e-06, + "loss": 0.2712, + "step": 13610 + }, + { + "epoch": 47.29, + "learning_rate": 2.146713780918728e-06, + "loss": 0.2696, + "step": 13620 + }, + { + "epoch": 47.33, + "learning_rate": 2.1453003533568905e-06, + "loss": 0.2698, + "step": 13630 + }, + { + "epoch": 47.36, + "learning_rate": 2.143886925795053e-06, + "loss": 0.2528, + "step": 13640 + }, + { + "epoch": 47.39, + "learning_rate": 2.1424734982332153e-06, + "loss": 0.2671, + "step": 13650 + }, + { + "epoch": 47.43, + "learning_rate": 2.141060070671378e-06, + "loss": 0.2542, + "step": 13660 + }, + { + "epoch": 47.46, + "learning_rate": 2.1396466431095405e-06, + "loss": 0.2696, + "step": 13670 + }, + { + "epoch": 47.5, + "learning_rate": 2.1382332155477034e-06, + "loss": 0.2652, + "step": 13680 + }, + { + "epoch": 47.53, + "learning_rate": 2.136819787985866e-06, + "loss": 0.2518, + "step": 13690 + }, + { + "epoch": 47.57, + "learning_rate": 2.135406360424028e-06, + "loss": 0.2353, + "step": 13700 + }, + { + "epoch": 47.6, + "learning_rate": 2.1339929328621906e-06, + "loss": 0.2568, + "step": 13710 + }, + { + "epoch": 47.64, + "learning_rate": 2.1325795053003534e-06, + "loss": 0.2935, + "step": 13720 + }, + { + "epoch": 47.67, + "learning_rate": 2.131166077738516e-06, + "loss": 0.2511, + "step": 13730 + }, + { + "epoch": 47.71, + "learning_rate": 2.1297526501766787e-06, + "loss": 0.2768, + "step": 13740 + }, + { + "epoch": 47.74, + "learning_rate": 2.128339222614841e-06, + "loss": 0.2525, + "step": 13750 + }, + { + "epoch": 47.78, + "learning_rate": 2.126925795053003e-06, + "loss": 0.2236, + "step": 13760 + }, + { + "epoch": 47.81, + "learning_rate": 2.125512367491166e-06, + "loss": 0.2719, + "step": 13770 + }, + { + "epoch": 47.85, + "learning_rate": 2.1240989399293287e-06, + "loss": 0.2772, + "step": 13780 + }, + { + "epoch": 47.88, + "learning_rate": 2.122685512367491e-06, + "loss": 0.2682, + "step": 13790 + }, + { + "epoch": 47.91, + "learning_rate": 2.121272084805654e-06, + "loss": 0.2631, + "step": 13800 + }, + { + "epoch": 47.95, + "learning_rate": 2.119858657243816e-06, + "loss": 0.2571, + "step": 13810 + }, + { + "epoch": 47.98, + "learning_rate": 2.1184452296819784e-06, + "loss": 0.2708, + "step": 13820 + }, + { + "epoch": 48.0, + "eval_loss": 0.5127933025360107, + "eval_runtime": 133.2709, + "eval_samples_per_second": 3.992, + "eval_steps_per_second": 0.998, + "eval_wer": 0.1982387349746095, + "step": 13824 + }, + { + "epoch": 48.02, + "learning_rate": 2.1170318021201412e-06, + "loss": 0.2812, + "step": 13830 + }, + { + "epoch": 48.06, + "learning_rate": 2.1156183745583036e-06, + "loss": 0.2673, + "step": 13840 + }, + { + "epoch": 48.09, + "learning_rate": 2.1142049469964665e-06, + "loss": 0.2529, + "step": 13850 + }, + { + "epoch": 48.12, + "learning_rate": 2.112791519434629e-06, + "loss": 0.2602, + "step": 13860 + }, + { + "epoch": 48.16, + "learning_rate": 2.1113780918727913e-06, + "loss": 0.2634, + "step": 13870 + }, + { + "epoch": 48.19, + "learning_rate": 2.1099646643109537e-06, + "loss": 0.2439, + "step": 13880 + }, + { + "epoch": 48.23, + "learning_rate": 2.1085512367491165e-06, + "loss": 0.2744, + "step": 13890 + }, + { + "epoch": 48.26, + "learning_rate": 2.107137809187279e-06, + "loss": 0.2572, + "step": 13900 + }, + { + "epoch": 48.3, + "learning_rate": 2.1057243816254418e-06, + "loss": 0.2838, + "step": 13910 + }, + { + "epoch": 48.33, + "learning_rate": 2.1043109540636038e-06, + "loss": 0.2746, + "step": 13920 + }, + { + "epoch": 48.37, + "learning_rate": 2.1028975265017666e-06, + "loss": 0.2663, + "step": 13930 + }, + { + "epoch": 48.4, + "learning_rate": 2.101484098939929e-06, + "loss": 0.2817, + "step": 13940 + }, + { + "epoch": 48.44, + "learning_rate": 2.100070671378092e-06, + "loss": 0.2583, + "step": 13950 + }, + { + "epoch": 48.47, + "learning_rate": 2.0986572438162542e-06, + "loss": 0.2796, + "step": 13960 + }, + { + "epoch": 48.51, + "learning_rate": 2.097243816254417e-06, + "loss": 0.266, + "step": 13970 + }, + { + "epoch": 48.54, + "learning_rate": 2.095830388692579e-06, + "loss": 0.2757, + "step": 13980 + }, + { + "epoch": 48.57, + "learning_rate": 2.094416961130742e-06, + "loss": 0.262, + "step": 13990 + }, + { + "epoch": 48.61, + "learning_rate": 2.0930035335689043e-06, + "loss": 0.2463, + "step": 14000 + }, + { + "epoch": 48.64, + "learning_rate": 2.091590106007067e-06, + "loss": 0.2763, + "step": 14010 + }, + { + "epoch": 48.68, + "learning_rate": 2.0901766784452295e-06, + "loss": 0.2746, + "step": 14020 + }, + { + "epoch": 48.71, + "learning_rate": 2.0887632508833924e-06, + "loss": 0.2459, + "step": 14030 + }, + { + "epoch": 48.75, + "learning_rate": 2.0873498233215544e-06, + "loss": 0.2657, + "step": 14040 + }, + { + "epoch": 48.78, + "learning_rate": 2.085936395759717e-06, + "loss": 0.2599, + "step": 14050 + }, + { + "epoch": 48.82, + "learning_rate": 2.0845229681978796e-06, + "loss": 0.2634, + "step": 14060 + }, + { + "epoch": 48.85, + "learning_rate": 2.0831095406360424e-06, + "loss": 0.2551, + "step": 14070 + }, + { + "epoch": 48.89, + "learning_rate": 2.081696113074205e-06, + "loss": 0.2322, + "step": 14080 + }, + { + "epoch": 48.92, + "learning_rate": 2.0802826855123673e-06, + "loss": 0.2524, + "step": 14090 + }, + { + "epoch": 48.96, + "learning_rate": 2.0788692579505297e-06, + "loss": 0.2667, + "step": 14100 + }, + { + "epoch": 48.99, + "learning_rate": 2.0774558303886925e-06, + "loss": 0.2562, + "step": 14110 + }, + { + "epoch": 49.0, + "eval_loss": 0.5162803530693054, + "eval_runtime": 133.3898, + "eval_samples_per_second": 3.988, + "eval_steps_per_second": 0.997, + "eval_wer": 0.1990743716654882, + "step": 14112 + }, + { + "epoch": 49.03, + "learning_rate": 2.076042402826855e-06, + "loss": 0.2776, + "step": 14120 + }, + { + "epoch": 49.06, + "learning_rate": 2.0746289752650177e-06, + "loss": 0.2473, + "step": 14130 + }, + { + "epoch": 49.1, + "learning_rate": 2.07321554770318e-06, + "loss": 0.2626, + "step": 14140 + }, + { + "epoch": 49.13, + "learning_rate": 2.0718021201413426e-06, + "loss": 0.2602, + "step": 14150 + }, + { + "epoch": 49.17, + "learning_rate": 2.070388692579505e-06, + "loss": 0.2707, + "step": 14160 + }, + { + "epoch": 49.2, + "learning_rate": 2.068975265017668e-06, + "loss": 0.2423, + "step": 14170 + }, + { + "epoch": 49.24, + "learning_rate": 2.06756183745583e-06, + "loss": 0.2965, + "step": 14180 + }, + { + "epoch": 49.27, + "learning_rate": 2.066148409893993e-06, + "loss": 0.2602, + "step": 14190 + }, + { + "epoch": 49.3, + "learning_rate": 2.0647349823321555e-06, + "loss": 0.2547, + "step": 14200 + }, + { + "epoch": 49.34, + "learning_rate": 2.063321554770318e-06, + "loss": 0.2702, + "step": 14210 + }, + { + "epoch": 49.37, + "learning_rate": 2.0619081272084803e-06, + "loss": 0.2806, + "step": 14220 + }, + { + "epoch": 49.41, + "learning_rate": 2.060494699646643e-06, + "loss": 0.2648, + "step": 14230 + }, + { + "epoch": 49.44, + "learning_rate": 2.0590812720848055e-06, + "loss": 0.2396, + "step": 14240 + }, + { + "epoch": 49.48, + "learning_rate": 2.0576678445229683e-06, + "loss": 0.2837, + "step": 14250 + }, + { + "epoch": 49.51, + "learning_rate": 2.0562544169611303e-06, + "loss": 0.281, + "step": 14260 + }, + { + "epoch": 49.55, + "learning_rate": 2.054840989399293e-06, + "loss": 0.235, + "step": 14270 + }, + { + "epoch": 49.58, + "learning_rate": 2.0534275618374556e-06, + "loss": 0.2556, + "step": 14280 + }, + { + "epoch": 49.62, + "learning_rate": 2.0520141342756184e-06, + "loss": 0.2675, + "step": 14290 + }, + { + "epoch": 49.65, + "learning_rate": 2.050600706713781e-06, + "loss": 0.2774, + "step": 14300 + }, + { + "epoch": 49.69, + "learning_rate": 2.0491872791519437e-06, + "loss": 0.2742, + "step": 14310 + }, + { + "epoch": 49.72, + "learning_rate": 2.0477738515901056e-06, + "loss": 0.2665, + "step": 14320 + }, + { + "epoch": 49.75, + "learning_rate": 2.0463604240282685e-06, + "loss": 0.2664, + "step": 14330 + }, + { + "epoch": 49.79, + "learning_rate": 2.044946996466431e-06, + "loss": 0.2496, + "step": 14340 + }, + { + "epoch": 49.82, + "learning_rate": 2.0435335689045937e-06, + "loss": 0.2725, + "step": 14350 + }, + { + "epoch": 49.86, + "learning_rate": 2.042120141342756e-06, + "loss": 0.2581, + "step": 14360 + }, + { + "epoch": 49.89, + "learning_rate": 2.040706713780919e-06, + "loss": 0.2582, + "step": 14370 + }, + { + "epoch": 49.93, + "learning_rate": 2.039293286219081e-06, + "loss": 0.2514, + "step": 14380 + }, + { + "epoch": 49.96, + "learning_rate": 2.0378798586572438e-06, + "loss": 0.2765, + "step": 14390 + }, + { + "epoch": 50.0, + "learning_rate": 2.036466431095406e-06, + "loss": 0.2675, + "step": 14400 + }, + { + "epoch": 50.0, + "eval_loss": 0.5062453150749207, + "eval_runtime": 133.1193, + "eval_samples_per_second": 3.996, + "eval_steps_per_second": 0.999, + "eval_wer": 0.19939577039274925, + "step": 14400 + }, + { + "epoch": 50.03, + "learning_rate": 2.035053003533569e-06, + "loss": 0.2766, + "step": 14410 + }, + { + "epoch": 50.07, + "learning_rate": 2.0336395759717314e-06, + "loss": 0.2511, + "step": 14420 + }, + { + "epoch": 50.1, + "learning_rate": 2.032226148409894e-06, + "loss": 0.2459, + "step": 14430 + }, + { + "epoch": 50.14, + "learning_rate": 2.0308127208480562e-06, + "loss": 0.2715, + "step": 14440 + }, + { + "epoch": 50.17, + "learning_rate": 2.029399293286219e-06, + "loss": 0.2912, + "step": 14450 + }, + { + "epoch": 50.21, + "learning_rate": 2.0279858657243815e-06, + "loss": 0.2606, + "step": 14460 + }, + { + "epoch": 50.24, + "learning_rate": 2.0265724381625443e-06, + "loss": 0.2685, + "step": 14470 + }, + { + "epoch": 50.28, + "learning_rate": 2.0251590106007067e-06, + "loss": 0.2354, + "step": 14480 + }, + { + "epoch": 50.31, + "learning_rate": 2.023745583038869e-06, + "loss": 0.2725, + "step": 14490 + }, + { + "epoch": 50.35, + "learning_rate": 2.0223321554770316e-06, + "loss": 0.2681, + "step": 14500 + }, + { + "epoch": 50.38, + "learning_rate": 2.0209187279151944e-06, + "loss": 0.242, + "step": 14510 + }, + { + "epoch": 50.42, + "learning_rate": 2.019505300353357e-06, + "loss": 0.2646, + "step": 14520 + }, + { + "epoch": 50.45, + "learning_rate": 2.0180918727915196e-06, + "loss": 0.2415, + "step": 14530 + }, + { + "epoch": 50.48, + "learning_rate": 2.0166784452296816e-06, + "loss": 0.2905, + "step": 14540 + }, + { + "epoch": 50.52, + "learning_rate": 2.0152650176678444e-06, + "loss": 0.2674, + "step": 14550 + }, + { + "epoch": 50.55, + "learning_rate": 2.013851590106007e-06, + "loss": 0.2427, + "step": 14560 + }, + { + "epoch": 50.59, + "learning_rate": 2.0124381625441697e-06, + "loss": 0.2535, + "step": 14570 + }, + { + "epoch": 50.62, + "learning_rate": 2.011024734982332e-06, + "loss": 0.252, + "step": 14580 + }, + { + "epoch": 50.66, + "learning_rate": 2.009611307420495e-06, + "loss": 0.2764, + "step": 14590 + }, + { + "epoch": 50.69, + "learning_rate": 2.008197879858657e-06, + "loss": 0.2632, + "step": 14600 + }, + { + "epoch": 50.73, + "learning_rate": 2.0067844522968198e-06, + "loss": 0.2551, + "step": 14610 + }, + { + "epoch": 50.76, + "learning_rate": 2.005371024734982e-06, + "loss": 0.2657, + "step": 14620 + }, + { + "epoch": 50.8, + "learning_rate": 2.003957597173145e-06, + "loss": 0.2655, + "step": 14630 + }, + { + "epoch": 50.83, + "learning_rate": 2.0025441696113074e-06, + "loss": 0.2512, + "step": 14640 + }, + { + "epoch": 50.87, + "learning_rate": 2.0011307420494702e-06, + "loss": 0.2607, + "step": 14650 + }, + { + "epoch": 50.9, + "learning_rate": 1.9997173144876326e-06, + "loss": 0.2681, + "step": 14660 + }, + { + "epoch": 50.94, + "learning_rate": 1.998303886925795e-06, + "loss": 0.2625, + "step": 14670 + }, + { + "epoch": 50.97, + "learning_rate": 1.9968904593639575e-06, + "loss": 0.285, + "step": 14680 + }, + { + "epoch": 51.0, + "eval_loss": 0.4999462068080902, + "eval_runtime": 133.4245, + "eval_samples_per_second": 3.987, + "eval_steps_per_second": 0.997, + "eval_wer": 0.19875297293822716, + "step": 14688 + }, + { + "epoch": 51.01, + "learning_rate": 1.9954770318021203e-06, + "loss": 0.2801, + "step": 14690 + }, + { + "epoch": 51.04, + "learning_rate": 1.9940636042402827e-06, + "loss": 0.2528, + "step": 14700 + }, + { + "epoch": 51.08, + "learning_rate": 1.992650176678445e-06, + "loss": 0.2613, + "step": 14710 + }, + { + "epoch": 51.11, + "learning_rate": 1.991236749116608e-06, + "loss": 0.2647, + "step": 14720 + }, + { + "epoch": 51.15, + "learning_rate": 1.9898233215547704e-06, + "loss": 0.2629, + "step": 14730 + }, + { + "epoch": 51.18, + "learning_rate": 1.9884098939929328e-06, + "loss": 0.2848, + "step": 14740 + }, + { + "epoch": 51.21, + "learning_rate": 1.9869964664310956e-06, + "loss": 0.25, + "step": 14750 + }, + { + "epoch": 51.25, + "learning_rate": 1.985583038869258e-06, + "loss": 0.2707, + "step": 14760 + }, + { + "epoch": 51.28, + "learning_rate": 1.9841696113074204e-06, + "loss": 0.2287, + "step": 14770 + }, + { + "epoch": 51.32, + "learning_rate": 1.982756183745583e-06, + "loss": 0.2822, + "step": 14780 + }, + { + "epoch": 51.35, + "learning_rate": 1.9813427561837457e-06, + "loss": 0.2816, + "step": 14790 + }, + { + "epoch": 51.39, + "learning_rate": 1.979929328621908e-06, + "loss": 0.2655, + "step": 14800 + }, + { + "epoch": 51.42, + "learning_rate": 1.9785159010600705e-06, + "loss": 0.2573, + "step": 14810 + }, + { + "epoch": 51.46, + "learning_rate": 1.9771024734982333e-06, + "loss": 0.2674, + "step": 14820 + }, + { + "epoch": 51.49, + "learning_rate": 1.9756890459363957e-06, + "loss": 0.2745, + "step": 14830 + }, + { + "epoch": 51.53, + "learning_rate": 1.974275618374558e-06, + "loss": 0.2586, + "step": 14840 + }, + { + "epoch": 51.56, + "learning_rate": 1.972862190812721e-06, + "loss": 0.2439, + "step": 14850 + }, + { + "epoch": 51.6, + "learning_rate": 1.9714487632508834e-06, + "loss": 0.2376, + "step": 14860 + }, + { + "epoch": 51.63, + "learning_rate": 1.9700353356890458e-06, + "loss": 0.248, + "step": 14870 + }, + { + "epoch": 51.66, + "learning_rate": 1.968621908127208e-06, + "loss": 0.2522, + "step": 14880 + }, + { + "epoch": 51.7, + "learning_rate": 1.967208480565371e-06, + "loss": 0.2599, + "step": 14890 + }, + { + "epoch": 51.73, + "learning_rate": 1.9657950530035334e-06, + "loss": 0.2678, + "step": 14900 + }, + { + "epoch": 51.77, + "learning_rate": 1.964381625441696e-06, + "loss": 0.2662, + "step": 14910 + }, + { + "epoch": 51.8, + "learning_rate": 1.9629681978798587e-06, + "loss": 0.2576, + "step": 14920 + }, + { + "epoch": 51.84, + "learning_rate": 1.961554770318021e-06, + "loss": 0.2788, + "step": 14930 + }, + { + "epoch": 51.87, + "learning_rate": 1.9601413427561835e-06, + "loss": 0.2517, + "step": 14940 + }, + { + "epoch": 51.91, + "learning_rate": 1.958727915194346e-06, + "loss": 0.2728, + "step": 14950 + }, + { + "epoch": 51.94, + "learning_rate": 1.9573144876325087e-06, + "loss": 0.2538, + "step": 14960 + }, + { + "epoch": 51.98, + "learning_rate": 1.955901060070671e-06, + "loss": 0.2756, + "step": 14970 + }, + { + "epoch": 52.0, + "eval_loss": 0.5029511451721191, + "eval_runtime": 133.7467, + "eval_samples_per_second": 3.978, + "eval_steps_per_second": 0.994, + "eval_wer": 0.19862441344732276, + "step": 14976 + }, + { + "epoch": 52.01, + "learning_rate": 1.9544876325088336e-06, + "loss": 0.2558, + "step": 14980 + }, + { + "epoch": 52.05, + "learning_rate": 1.9530742049469964e-06, + "loss": 0.2658, + "step": 14990 + }, + { + "epoch": 52.08, + "learning_rate": 1.951660777385159e-06, + "loss": 0.255, + "step": 15000 + }, + { + "epoch": 52.12, + "learning_rate": 1.9503886925795053e-06, + "loss": 0.2528, + "step": 15010 + }, + { + "epoch": 52.15, + "learning_rate": 1.9489752650176677e-06, + "loss": 0.2853, + "step": 15020 + }, + { + "epoch": 52.19, + "learning_rate": 1.94756183745583e-06, + "loss": 0.2631, + "step": 15030 + }, + { + "epoch": 52.22, + "learning_rate": 1.946148409893993e-06, + "loss": 0.2424, + "step": 15040 + }, + { + "epoch": 52.26, + "learning_rate": 1.9447349823321553e-06, + "loss": 0.2537, + "step": 15050 + }, + { + "epoch": 52.29, + "learning_rate": 1.9433215547703177e-06, + "loss": 0.2686, + "step": 15060 + }, + { + "epoch": 52.33, + "learning_rate": 1.9419081272084806e-06, + "loss": 0.259, + "step": 15070 + }, + { + "epoch": 52.36, + "learning_rate": 1.940494699646643e-06, + "loss": 0.2609, + "step": 15080 + }, + { + "epoch": 52.39, + "learning_rate": 1.9390812720848054e-06, + "loss": 0.2807, + "step": 15090 + }, + { + "epoch": 52.43, + "learning_rate": 1.9376678445229682e-06, + "loss": 0.2633, + "step": 15100 + }, + { + "epoch": 52.46, + "learning_rate": 1.9362544169611306e-06, + "loss": 0.2583, + "step": 15110 + }, + { + "epoch": 52.5, + "learning_rate": 1.934840989399293e-06, + "loss": 0.2656, + "step": 15120 + }, + { + "epoch": 52.53, + "learning_rate": 1.933427561837456e-06, + "loss": 0.2534, + "step": 15130 + }, + { + "epoch": 52.57, + "learning_rate": 1.9320141342756183e-06, + "loss": 0.2639, + "step": 15140 + }, + { + "epoch": 52.6, + "learning_rate": 1.9306007067137807e-06, + "loss": 0.2408, + "step": 15150 + }, + { + "epoch": 52.64, + "learning_rate": 1.9291872791519435e-06, + "loss": 0.2493, + "step": 15160 + }, + { + "epoch": 52.67, + "learning_rate": 1.927773851590106e-06, + "loss": 0.2729, + "step": 15170 + }, + { + "epoch": 52.71, + "learning_rate": 1.9263604240282684e-06, + "loss": 0.2708, + "step": 15180 + }, + { + "epoch": 52.74, + "learning_rate": 1.924946996466431e-06, + "loss": 0.2759, + "step": 15190 + }, + { + "epoch": 52.78, + "learning_rate": 1.9235335689045936e-06, + "loss": 0.254, + "step": 15200 + }, + { + "epoch": 52.81, + "learning_rate": 1.922120141342756e-06, + "loss": 0.2598, + "step": 15210 + }, + { + "epoch": 52.85, + "learning_rate": 1.9207067137809184e-06, + "loss": 0.2672, + "step": 15220 + }, + { + "epoch": 52.88, + "learning_rate": 1.9192932862190812e-06, + "loss": 0.2436, + "step": 15230 + }, + { + "epoch": 52.91, + "learning_rate": 1.9178798586572437e-06, + "loss": 0.2741, + "step": 15240 + }, + { + "epoch": 52.95, + "learning_rate": 1.916466431095406e-06, + "loss": 0.2601, + "step": 15250 + }, + { + "epoch": 52.98, + "learning_rate": 1.915053003533569e-06, + "loss": 0.2888, + "step": 15260 + }, + { + "epoch": 53.0, + "eval_loss": 0.5042588114738464, + "eval_runtime": 133.2498, + "eval_samples_per_second": 3.993, + "eval_steps_per_second": 0.998, + "eval_wer": 0.19746737802918302, + "step": 15264 + }, + { + "epoch": 53.02, + "learning_rate": 1.9136395759717313e-06, + "loss": 0.2853, + "step": 15270 + }, + { + "epoch": 53.06, + "learning_rate": 1.9122261484098937e-06, + "loss": 0.2504, + "step": 15280 + }, + { + "epoch": 53.09, + "learning_rate": 1.9108127208480565e-06, + "loss": 0.2608, + "step": 15290 + }, + { + "epoch": 53.12, + "learning_rate": 1.909399293286219e-06, + "loss": 0.2486, + "step": 15300 + }, + { + "epoch": 53.16, + "learning_rate": 1.9079858657243814e-06, + "loss": 0.2576, + "step": 15310 + }, + { + "epoch": 53.19, + "learning_rate": 1.906572438162544e-06, + "loss": 0.2678, + "step": 15320 + }, + { + "epoch": 53.23, + "learning_rate": 1.9051590106007068e-06, + "loss": 0.271, + "step": 15330 + }, + { + "epoch": 53.26, + "learning_rate": 1.903745583038869e-06, + "loss": 0.2528, + "step": 15340 + }, + { + "epoch": 53.3, + "learning_rate": 1.9023321554770316e-06, + "loss": 0.2786, + "step": 15350 + }, + { + "epoch": 53.33, + "learning_rate": 1.9009187279151943e-06, + "loss": 0.2634, + "step": 15360 + }, + { + "epoch": 53.37, + "learning_rate": 1.8995053003533567e-06, + "loss": 0.2764, + "step": 15370 + }, + { + "epoch": 53.4, + "learning_rate": 1.8980918727915193e-06, + "loss": 0.2592, + "step": 15380 + }, + { + "epoch": 53.44, + "learning_rate": 1.8966784452296817e-06, + "loss": 0.2503, + "step": 15390 + }, + { + "epoch": 53.47, + "learning_rate": 1.8952650176678443e-06, + "loss": 0.2712, + "step": 15400 + }, + { + "epoch": 53.51, + "learning_rate": 1.893851590106007e-06, + "loss": 0.2914, + "step": 15410 + }, + { + "epoch": 53.54, + "learning_rate": 1.8924381625441694e-06, + "loss": 0.2474, + "step": 15420 + }, + { + "epoch": 53.57, + "learning_rate": 1.891024734982332e-06, + "loss": 0.2733, + "step": 15430 + }, + { + "epoch": 53.61, + "learning_rate": 1.8896113074204946e-06, + "loss": 0.2511, + "step": 15440 + }, + { + "epoch": 53.64, + "learning_rate": 1.888197879858657e-06, + "loss": 0.2564, + "step": 15450 + }, + { + "epoch": 53.68, + "learning_rate": 1.8867844522968196e-06, + "loss": 0.2475, + "step": 15460 + }, + { + "epoch": 53.71, + "learning_rate": 1.8853710247349823e-06, + "loss": 0.2616, + "step": 15470 + }, + { + "epoch": 53.75, + "learning_rate": 1.8839575971731447e-06, + "loss": 0.2788, + "step": 15480 + }, + { + "epoch": 53.78, + "learning_rate": 1.8825441696113073e-06, + "loss": 0.2476, + "step": 15490 + }, + { + "epoch": 53.82, + "learning_rate": 1.88113074204947e-06, + "loss": 0.2713, + "step": 15500 + }, + { + "epoch": 53.85, + "learning_rate": 1.8797173144876323e-06, + "loss": 0.2638, + "step": 15510 + }, + { + "epoch": 53.89, + "learning_rate": 1.878303886925795e-06, + "loss": 0.2478, + "step": 15520 + }, + { + "epoch": 53.92, + "learning_rate": 1.8768904593639573e-06, + "loss": 0.2535, + "step": 15530 + }, + { + "epoch": 53.96, + "learning_rate": 1.87547703180212e-06, + "loss": 0.2804, + "step": 15540 + }, + { + "epoch": 53.99, + "learning_rate": 1.8740636042402826e-06, + "loss": 0.2778, + "step": 15550 + }, + { + "epoch": 54.0, + "eval_loss": 0.5110978484153748, + "eval_runtime": 133.5788, + "eval_samples_per_second": 3.983, + "eval_steps_per_second": 0.996, + "eval_wer": 0.19804589573825288, + "step": 15552 + }, + { + "epoch": 54.03, + "learning_rate": 1.872650176678445e-06, + "loss": 0.2538, + "step": 15560 + }, + { + "epoch": 54.06, + "learning_rate": 1.8712367491166076e-06, + "loss": 0.2607, + "step": 15570 + }, + { + "epoch": 54.1, + "learning_rate": 1.8698233215547702e-06, + "loss": 0.2557, + "step": 15580 + }, + { + "epoch": 54.13, + "learning_rate": 1.8684098939929326e-06, + "loss": 0.2918, + "step": 15590 + }, + { + "epoch": 54.17, + "learning_rate": 1.8669964664310953e-06, + "loss": 0.3063, + "step": 15600 + }, + { + "epoch": 54.2, + "learning_rate": 1.8655830388692579e-06, + "loss": 0.2604, + "step": 15610 + }, + { + "epoch": 54.24, + "learning_rate": 1.8641696113074203e-06, + "loss": 0.263, + "step": 15620 + }, + { + "epoch": 54.27, + "learning_rate": 1.862756183745583e-06, + "loss": 0.2506, + "step": 15630 + }, + { + "epoch": 54.3, + "learning_rate": 1.8613427561837455e-06, + "loss": 0.271, + "step": 15640 + }, + { + "epoch": 54.34, + "learning_rate": 1.859929328621908e-06, + "loss": 0.2591, + "step": 15650 + }, + { + "epoch": 54.37, + "learning_rate": 1.8585159010600706e-06, + "loss": 0.2762, + "step": 15660 + }, + { + "epoch": 54.41, + "learning_rate": 1.8571024734982332e-06, + "loss": 0.2877, + "step": 15670 + }, + { + "epoch": 54.44, + "learning_rate": 1.8556890459363956e-06, + "loss": 0.2491, + "step": 15680 + }, + { + "epoch": 54.48, + "learning_rate": 1.8542756183745582e-06, + "loss": 0.2738, + "step": 15690 + }, + { + "epoch": 54.51, + "learning_rate": 1.8528621908127206e-06, + "loss": 0.2679, + "step": 15700 + }, + { + "epoch": 54.55, + "learning_rate": 1.8514487632508833e-06, + "loss": 0.2627, + "step": 15710 + }, + { + "epoch": 54.58, + "learning_rate": 1.8500353356890459e-06, + "loss": 0.2609, + "step": 15720 + }, + { + "epoch": 54.62, + "learning_rate": 1.8486219081272083e-06, + "loss": 0.2451, + "step": 15730 + }, + { + "epoch": 54.65, + "learning_rate": 1.847208480565371e-06, + "loss": 0.2622, + "step": 15740 + }, + { + "epoch": 54.69, + "learning_rate": 1.8457950530035335e-06, + "loss": 0.2716, + "step": 15750 + }, + { + "epoch": 54.72, + "learning_rate": 1.844381625441696e-06, + "loss": 0.2604, + "step": 15760 + }, + { + "epoch": 54.75, + "learning_rate": 1.8429681978798586e-06, + "loss": 0.2488, + "step": 15770 + }, + { + "epoch": 54.79, + "learning_rate": 1.8415547703180212e-06, + "loss": 0.2716, + "step": 15780 + }, + { + "epoch": 54.82, + "learning_rate": 1.8401413427561836e-06, + "loss": 0.2795, + "step": 15790 + }, + { + "epoch": 54.86, + "learning_rate": 1.8387279151943462e-06, + "loss": 0.2662, + "step": 15800 + }, + { + "epoch": 54.89, + "learning_rate": 1.8373144876325088e-06, + "loss": 0.2475, + "step": 15810 + }, + { + "epoch": 54.93, + "learning_rate": 1.8359010600706712e-06, + "loss": 0.2695, + "step": 15820 + }, + { + "epoch": 54.96, + "learning_rate": 1.8344876325088339e-06, + "loss": 0.2605, + "step": 15830 + }, + { + "epoch": 55.0, + "learning_rate": 1.8330742049469965e-06, + "loss": 0.2707, + "step": 15840 + }, + { + "epoch": 55.0, + "eval_loss": 0.5116538405418396, + "eval_runtime": 133.5286, + "eval_samples_per_second": 3.984, + "eval_steps_per_second": 0.996, + "eval_wer": 0.19946005013820145, + "step": 15840 + }, + { + "epoch": 55.03, + "learning_rate": 1.831660777385159e-06, + "loss": 0.2439, + "step": 15850 + }, + { + "epoch": 55.07, + "learning_rate": 1.8302473498233215e-06, + "loss": 0.2534, + "step": 15860 + }, + { + "epoch": 55.1, + "learning_rate": 1.828833922261484e-06, + "loss": 0.2465, + "step": 15870 + }, + { + "epoch": 55.14, + "learning_rate": 1.8274204946996465e-06, + "loss": 0.2705, + "step": 15880 + }, + { + "epoch": 55.17, + "learning_rate": 1.8260070671378092e-06, + "loss": 0.2686, + "step": 15890 + }, + { + "epoch": 55.21, + "learning_rate": 1.8245936395759716e-06, + "loss": 0.2646, + "step": 15900 + }, + { + "epoch": 55.24, + "learning_rate": 1.8231802120141342e-06, + "loss": 0.2688, + "step": 15910 + }, + { + "epoch": 55.28, + "learning_rate": 1.8217667844522968e-06, + "loss": 0.2504, + "step": 15920 + }, + { + "epoch": 55.31, + "learning_rate": 1.8203533568904592e-06, + "loss": 0.2696, + "step": 15930 + }, + { + "epoch": 55.35, + "learning_rate": 1.8189399293286219e-06, + "loss": 0.2634, + "step": 15940 + }, + { + "epoch": 55.38, + "learning_rate": 1.8175265017667845e-06, + "loss": 0.281, + "step": 15950 + }, + { + "epoch": 55.42, + "learning_rate": 1.8161130742049469e-06, + "loss": 0.2617, + "step": 15960 + }, + { + "epoch": 55.45, + "learning_rate": 1.8146996466431095e-06, + "loss": 0.2631, + "step": 15970 + }, + { + "epoch": 55.48, + "learning_rate": 1.8132862190812721e-06, + "loss": 0.2646, + "step": 15980 + }, + { + "epoch": 55.52, + "learning_rate": 1.8118727915194345e-06, + "loss": 0.2597, + "step": 15990 + }, + { + "epoch": 55.55, + "learning_rate": 1.8104593639575972e-06, + "loss": 0.2723, + "step": 16000 + }, + { + "epoch": 55.59, + "learning_rate": 1.8090459363957596e-06, + "loss": 0.2507, + "step": 16010 + }, + { + "epoch": 55.62, + "learning_rate": 1.8076325088339222e-06, + "loss": 0.2457, + "step": 16020 + }, + { + "epoch": 55.66, + "learning_rate": 1.8062190812720848e-06, + "loss": 0.2963, + "step": 16030 + }, + { + "epoch": 55.69, + "learning_rate": 1.8048056537102472e-06, + "loss": 0.2469, + "step": 16040 + }, + { + "epoch": 55.73, + "learning_rate": 1.8033922261484098e-06, + "loss": 0.2333, + "step": 16050 + }, + { + "epoch": 55.76, + "learning_rate": 1.8019787985865725e-06, + "loss": 0.2694, + "step": 16060 + }, + { + "epoch": 55.8, + "learning_rate": 1.8005653710247349e-06, + "loss": 0.2568, + "step": 16070 + }, + { + "epoch": 55.83, + "learning_rate": 1.7991519434628975e-06, + "loss": 0.277, + "step": 16080 + }, + { + "epoch": 55.87, + "learning_rate": 1.7977385159010601e-06, + "loss": 0.2871, + "step": 16090 + }, + { + "epoch": 55.9, + "learning_rate": 1.7963250883392225e-06, + "loss": 0.2669, + "step": 16100 + }, + { + "epoch": 55.94, + "learning_rate": 1.7949116607773851e-06, + "loss": 0.2684, + "step": 16110 + }, + { + "epoch": 55.97, + "learning_rate": 1.7934982332155478e-06, + "loss": 0.2566, + "step": 16120 + }, + { + "epoch": 56.0, + "eval_loss": 0.5196597576141357, + "eval_runtime": 133.3522, + "eval_samples_per_second": 3.989, + "eval_steps_per_second": 0.997, + "eval_wer": 0.20023140708362794, + "step": 16128 + }, + { + "epoch": 56.01, + "learning_rate": 1.7920848056537102e-06, + "loss": 0.2742, + "step": 16130 + }, + { + "epoch": 56.04, + "learning_rate": 1.7906713780918728e-06, + "loss": 0.2635, + "step": 16140 + }, + { + "epoch": 56.08, + "learning_rate": 1.7892579505300354e-06, + "loss": 0.263, + "step": 16150 + }, + { + "epoch": 56.11, + "learning_rate": 1.7878445229681978e-06, + "loss": 0.2578, + "step": 16160 + }, + { + "epoch": 56.15, + "learning_rate": 1.7864310954063604e-06, + "loss": 0.26, + "step": 16170 + }, + { + "epoch": 56.18, + "learning_rate": 1.7850176678445229e-06, + "loss": 0.2523, + "step": 16180 + }, + { + "epoch": 56.21, + "learning_rate": 1.7836042402826855e-06, + "loss": 0.2663, + "step": 16190 + }, + { + "epoch": 56.25, + "learning_rate": 1.782190812720848e-06, + "loss": 0.2493, + "step": 16200 + }, + { + "epoch": 56.28, + "learning_rate": 1.7807773851590105e-06, + "loss": 0.2407, + "step": 16210 + }, + { + "epoch": 56.32, + "learning_rate": 1.7793639575971731e-06, + "loss": 0.2565, + "step": 16220 + }, + { + "epoch": 56.35, + "learning_rate": 1.7779505300353358e-06, + "loss": 0.2673, + "step": 16230 + }, + { + "epoch": 56.39, + "learning_rate": 1.7765371024734982e-06, + "loss": 0.2487, + "step": 16240 + }, + { + "epoch": 56.42, + "learning_rate": 1.7751236749116608e-06, + "loss": 0.2539, + "step": 16250 + }, + { + "epoch": 56.46, + "learning_rate": 1.7737102473498234e-06, + "loss": 0.267, + "step": 16260 + }, + { + "epoch": 56.49, + "learning_rate": 1.7722968197879858e-06, + "loss": 0.2649, + "step": 16270 + }, + { + "epoch": 56.53, + "learning_rate": 1.7708833922261484e-06, + "loss": 0.2514, + "step": 16280 + }, + { + "epoch": 56.56, + "learning_rate": 1.769469964664311e-06, + "loss": 0.2652, + "step": 16290 + }, + { + "epoch": 56.6, + "learning_rate": 1.7680565371024735e-06, + "loss": 0.2702, + "step": 16300 + }, + { + "epoch": 56.63, + "learning_rate": 1.766643109540636e-06, + "loss": 0.2674, + "step": 16310 + }, + { + "epoch": 56.66, + "learning_rate": 1.7652296819787985e-06, + "loss": 0.3018, + "step": 16320 + }, + { + "epoch": 56.7, + "learning_rate": 1.7638162544169611e-06, + "loss": 0.2583, + "step": 16330 + }, + { + "epoch": 56.73, + "learning_rate": 1.7624028268551237e-06, + "loss": 0.262, + "step": 16340 + }, + { + "epoch": 56.77, + "learning_rate": 1.7609893992932861e-06, + "loss": 0.2863, + "step": 16350 + }, + { + "epoch": 56.8, + "learning_rate": 1.7595759717314488e-06, + "loss": 0.2632, + "step": 16360 + }, + { + "epoch": 56.84, + "learning_rate": 1.7581625441696114e-06, + "loss": 0.2861, + "step": 16370 + }, + { + "epoch": 56.87, + "learning_rate": 1.7567491166077738e-06, + "loss": 0.2588, + "step": 16380 + }, + { + "epoch": 56.91, + "learning_rate": 1.7553356890459364e-06, + "loss": 0.2594, + "step": 16390 + }, + { + "epoch": 56.94, + "learning_rate": 1.753922261484099e-06, + "loss": 0.2593, + "step": 16400 + }, + { + "epoch": 56.98, + "learning_rate": 1.7525088339222612e-06, + "loss": 0.2517, + "step": 16410 + }, + { + "epoch": 57.0, + "eval_loss": 0.5210915803909302, + "eval_runtime": 133.6955, + "eval_samples_per_second": 3.979, + "eval_steps_per_second": 0.995, + "eval_wer": 0.19766021726553962, + "step": 16416 + }, + { + "epoch": 57.01, + "learning_rate": 1.7510954063604239e-06, + "loss": 0.2697, + "step": 16420 + }, + { + "epoch": 57.05, + "learning_rate": 1.7496819787985865e-06, + "loss": 0.2594, + "step": 16430 + }, + { + "epoch": 57.08, + "learning_rate": 1.7482685512367489e-06, + "loss": 0.255, + "step": 16440 + }, + { + "epoch": 57.12, + "learning_rate": 1.7468551236749115e-06, + "loss": 0.2831, + "step": 16450 + }, + { + "epoch": 57.15, + "learning_rate": 1.7454416961130741e-06, + "loss": 0.2727, + "step": 16460 + }, + { + "epoch": 57.19, + "learning_rate": 1.7440282685512365e-06, + "loss": 0.2516, + "step": 16470 + }, + { + "epoch": 57.22, + "learning_rate": 1.7426148409893992e-06, + "loss": 0.2602, + "step": 16480 + }, + { + "epoch": 57.26, + "learning_rate": 1.7412014134275616e-06, + "loss": 0.2567, + "step": 16490 + }, + { + "epoch": 57.29, + "learning_rate": 1.7397879858657242e-06, + "loss": 0.2625, + "step": 16500 + }, + { + "epoch": 57.33, + "learning_rate": 1.7383745583038868e-06, + "loss": 0.2711, + "step": 16510 + }, + { + "epoch": 57.36, + "learning_rate": 1.7369611307420492e-06, + "loss": 0.2688, + "step": 16520 + }, + { + "epoch": 57.39, + "learning_rate": 1.7355477031802119e-06, + "loss": 0.2677, + "step": 16530 + }, + { + "epoch": 57.43, + "learning_rate": 1.7341342756183745e-06, + "loss": 0.2636, + "step": 16540 + }, + { + "epoch": 57.46, + "learning_rate": 1.7327208480565369e-06, + "loss": 0.2531, + "step": 16550 + }, + { + "epoch": 57.5, + "learning_rate": 1.7313074204946995e-06, + "loss": 0.2769, + "step": 16560 + }, + { + "epoch": 57.53, + "learning_rate": 1.7298939929328621e-06, + "loss": 0.2666, + "step": 16570 + }, + { + "epoch": 57.57, + "learning_rate": 1.7284805653710245e-06, + "loss": 0.2544, + "step": 16580 + }, + { + "epoch": 57.6, + "learning_rate": 1.7270671378091872e-06, + "loss": 0.2544, + "step": 16590 + }, + { + "epoch": 57.64, + "learning_rate": 1.7256537102473498e-06, + "loss": 0.2738, + "step": 16600 + }, + { + "epoch": 57.67, + "learning_rate": 1.7242402826855122e-06, + "loss": 0.274, + "step": 16610 + }, + { + "epoch": 57.71, + "learning_rate": 1.7228268551236748e-06, + "loss": 0.2501, + "step": 16620 + }, + { + "epoch": 57.74, + "learning_rate": 1.7214134275618372e-06, + "loss": 0.2516, + "step": 16630 + }, + { + "epoch": 57.78, + "learning_rate": 1.7199999999999998e-06, + "loss": 0.2444, + "step": 16640 + }, + { + "epoch": 57.81, + "learning_rate": 1.7185865724381625e-06, + "loss": 0.2728, + "step": 16650 + }, + { + "epoch": 57.85, + "learning_rate": 1.7171731448763249e-06, + "loss": 0.2628, + "step": 16660 + }, + { + "epoch": 57.88, + "learning_rate": 1.7157597173144875e-06, + "loss": 0.2577, + "step": 16670 + }, + { + "epoch": 57.91, + "learning_rate": 1.7143462897526501e-06, + "loss": 0.2769, + "step": 16680 + }, + { + "epoch": 57.95, + "learning_rate": 1.7129328621908125e-06, + "loss": 0.2379, + "step": 16690 + }, + { + "epoch": 57.98, + "learning_rate": 1.7115194346289751e-06, + "loss": 0.2629, + "step": 16700 + }, + { + "epoch": 58.0, + "eval_loss": 0.5079585313796997, + "eval_runtime": 133.0035, + "eval_samples_per_second": 4.0, + "eval_steps_per_second": 1.0, + "eval_wer": 0.19856013370187053, + "step": 16704 + }, + { + "epoch": 58.02, + "learning_rate": 1.7101060070671378e-06, + "loss": 0.2771, + "step": 16710 + }, + { + "epoch": 58.06, + "learning_rate": 1.7086925795053002e-06, + "loss": 0.2628, + "step": 16720 + }, + { + "epoch": 58.09, + "learning_rate": 1.7072791519434628e-06, + "loss": 0.278, + "step": 16730 + }, + { + "epoch": 58.12, + "learning_rate": 1.7058657243816254e-06, + "loss": 0.2515, + "step": 16740 + }, + { + "epoch": 58.16, + "learning_rate": 1.7044522968197878e-06, + "loss": 0.2736, + "step": 16750 + }, + { + "epoch": 58.19, + "learning_rate": 1.7030388692579504e-06, + "loss": 0.263, + "step": 16760 + }, + { + "epoch": 58.23, + "learning_rate": 1.701625441696113e-06, + "loss": 0.2649, + "step": 16770 + }, + { + "epoch": 58.26, + "learning_rate": 1.7002120141342755e-06, + "loss": 0.2387, + "step": 16780 + }, + { + "epoch": 58.3, + "learning_rate": 1.698798586572438e-06, + "loss": 0.2654, + "step": 16790 + }, + { + "epoch": 58.33, + "learning_rate": 1.6973851590106005e-06, + "loss": 0.2658, + "step": 16800 + }, + { + "epoch": 58.37, + "learning_rate": 1.6959717314487631e-06, + "loss": 0.2685, + "step": 16810 + }, + { + "epoch": 58.4, + "learning_rate": 1.6945583038869258e-06, + "loss": 0.2531, + "step": 16820 + }, + { + "epoch": 58.44, + "learning_rate": 1.6931448763250882e-06, + "loss": 0.2577, + "step": 16830 + }, + { + "epoch": 58.47, + "learning_rate": 1.6917314487632508e-06, + "loss": 0.2636, + "step": 16840 + }, + { + "epoch": 58.51, + "learning_rate": 1.6903180212014134e-06, + "loss": 0.2856, + "step": 16850 + }, + { + "epoch": 58.54, + "learning_rate": 1.6889045936395758e-06, + "loss": 0.2475, + "step": 16860 + }, + { + "epoch": 58.57, + "learning_rate": 1.6874911660777384e-06, + "loss": 0.2671, + "step": 16870 + }, + { + "epoch": 58.61, + "learning_rate": 1.686077738515901e-06, + "loss": 0.2512, + "step": 16880 + }, + { + "epoch": 58.64, + "learning_rate": 1.6846643109540635e-06, + "loss": 0.2786, + "step": 16890 + }, + { + "epoch": 58.68, + "learning_rate": 1.683250883392226e-06, + "loss": 0.2816, + "step": 16900 + }, + { + "epoch": 58.71, + "learning_rate": 1.6818374558303887e-06, + "loss": 0.2577, + "step": 16910 + }, + { + "epoch": 58.75, + "learning_rate": 1.6804240282685511e-06, + "loss": 0.2604, + "step": 16920 + }, + { + "epoch": 58.78, + "learning_rate": 1.6790106007067137e-06, + "loss": 0.2746, + "step": 16930 + }, + { + "epoch": 58.82, + "learning_rate": 1.6775971731448761e-06, + "loss": 0.269, + "step": 16940 + }, + { + "epoch": 58.85, + "learning_rate": 1.6761837455830388e-06, + "loss": 0.2399, + "step": 16950 + }, + { + "epoch": 58.89, + "learning_rate": 1.6747703180212014e-06, + "loss": 0.275, + "step": 16960 + }, + { + "epoch": 58.92, + "learning_rate": 1.6733568904593638e-06, + "loss": 0.2616, + "step": 16970 + }, + { + "epoch": 58.96, + "learning_rate": 1.6719434628975264e-06, + "loss": 0.2533, + "step": 16980 + }, + { + "epoch": 58.99, + "learning_rate": 1.670530035335689e-06, + "loss": 0.2787, + "step": 16990 + }, + { + "epoch": 59.0, + "eval_loss": 0.5133015513420105, + "eval_runtime": 133.197, + "eval_samples_per_second": 3.994, + "eval_steps_per_second": 0.999, + "eval_wer": 0.19798161599280067, + "step": 16992 + }, + { + "epoch": 59.03, + "learning_rate": 1.6691166077738515e-06, + "loss": 0.2536, + "step": 17000 + }, + { + "epoch": 59.06, + "learning_rate": 1.667703180212014e-06, + "loss": 0.2524, + "step": 17010 + }, + { + "epoch": 59.1, + "learning_rate": 1.6662897526501767e-06, + "loss": 0.2374, + "step": 17020 + }, + { + "epoch": 59.13, + "learning_rate": 1.664876325088339e-06, + "loss": 0.2744, + "step": 17030 + }, + { + "epoch": 59.17, + "learning_rate": 1.6634628975265017e-06, + "loss": 0.2803, + "step": 17040 + }, + { + "epoch": 59.2, + "learning_rate": 1.6620494699646643e-06, + "loss": 0.2857, + "step": 17050 + }, + { + "epoch": 59.24, + "learning_rate": 1.6606360424028268e-06, + "loss": 0.2656, + "step": 17060 + }, + { + "epoch": 59.27, + "learning_rate": 1.6592226148409894e-06, + "loss": 0.2608, + "step": 17070 + }, + { + "epoch": 59.3, + "learning_rate": 1.657809187279152e-06, + "loss": 0.2826, + "step": 17080 + }, + { + "epoch": 59.34, + "learning_rate": 1.6563957597173144e-06, + "loss": 0.2972, + "step": 17090 + }, + { + "epoch": 59.37, + "learning_rate": 1.654982332155477e-06, + "loss": 0.2681, + "step": 17100 + }, + { + "epoch": 59.41, + "learning_rate": 1.6535689045936394e-06, + "loss": 0.2643, + "step": 17110 + }, + { + "epoch": 59.44, + "learning_rate": 1.652155477031802e-06, + "loss": 0.255, + "step": 17120 + }, + { + "epoch": 59.48, + "learning_rate": 1.6507420494699647e-06, + "loss": 0.2737, + "step": 17130 + }, + { + "epoch": 59.51, + "learning_rate": 1.649328621908127e-06, + "loss": 0.2642, + "step": 17140 + }, + { + "epoch": 59.55, + "learning_rate": 1.6479151943462897e-06, + "loss": 0.2459, + "step": 17150 + }, + { + "epoch": 59.58, + "learning_rate": 1.6465017667844523e-06, + "loss": 0.2693, + "step": 17160 + }, + { + "epoch": 59.62, + "learning_rate": 1.6450883392226147e-06, + "loss": 0.2648, + "step": 17170 + }, + { + "epoch": 59.65, + "learning_rate": 1.6436749116607774e-06, + "loss": 0.2467, + "step": 17180 + }, + { + "epoch": 59.69, + "learning_rate": 1.64226148409894e-06, + "loss": 0.2732, + "step": 17190 + }, + { + "epoch": 59.72, + "learning_rate": 1.6408480565371024e-06, + "loss": 0.2362, + "step": 17200 + }, + { + "epoch": 59.75, + "learning_rate": 1.639434628975265e-06, + "loss": 0.2591, + "step": 17210 + }, + { + "epoch": 59.79, + "learning_rate": 1.6380212014134276e-06, + "loss": 0.2481, + "step": 17220 + }, + { + "epoch": 59.82, + "learning_rate": 1.63660777385159e-06, + "loss": 0.2918, + "step": 17230 + }, + { + "epoch": 59.86, + "learning_rate": 1.6351943462897527e-06, + "loss": 0.2633, + "step": 17240 + }, + { + "epoch": 59.89, + "learning_rate": 1.633780918727915e-06, + "loss": 0.2691, + "step": 17250 + }, + { + "epoch": 59.93, + "learning_rate": 1.6323674911660777e-06, + "loss": 0.2457, + "step": 17260 + }, + { + "epoch": 59.96, + "learning_rate": 1.6309540636042403e-06, + "loss": 0.2563, + "step": 17270 + }, + { + "epoch": 60.0, + "learning_rate": 1.6295406360424027e-06, + "loss": 0.269, + "step": 17280 + }, + { + "epoch": 60.0, + "eval_loss": 0.5155569314956665, + "eval_runtime": 133.7176, + "eval_samples_per_second": 3.979, + "eval_steps_per_second": 0.995, + "eval_wer": 0.1972745387928264, + "step": 17280 + }, + { + "epoch": 60.03, + "learning_rate": 1.6281272084805654e-06, + "loss": 0.2982, + "step": 17290 + }, + { + "epoch": 60.07, + "learning_rate": 1.626713780918728e-06, + "loss": 0.2651, + "step": 17300 + }, + { + "epoch": 60.1, + "learning_rate": 1.6253003533568904e-06, + "loss": 0.2533, + "step": 17310 + }, + { + "epoch": 60.14, + "learning_rate": 1.623886925795053e-06, + "loss": 0.2531, + "step": 17320 + }, + { + "epoch": 60.17, + "learning_rate": 1.6224734982332156e-06, + "loss": 0.2584, + "step": 17330 + }, + { + "epoch": 60.21, + "learning_rate": 1.621060070671378e-06, + "loss": 0.2649, + "step": 17340 + }, + { + "epoch": 60.24, + "learning_rate": 1.6196466431095407e-06, + "loss": 0.2601, + "step": 17350 + }, + { + "epoch": 60.28, + "learning_rate": 1.6182332155477033e-06, + "loss": 0.2509, + "step": 17360 + }, + { + "epoch": 60.31, + "learning_rate": 1.6168197879858657e-06, + "loss": 0.2647, + "step": 17370 + }, + { + "epoch": 60.35, + "learning_rate": 1.6154063604240283e-06, + "loss": 0.259, + "step": 17380 + }, + { + "epoch": 60.38, + "learning_rate": 1.613992932862191e-06, + "loss": 0.2466, + "step": 17390 + }, + { + "epoch": 60.42, + "learning_rate": 1.6125795053003533e-06, + "loss": 0.2568, + "step": 17400 + }, + { + "epoch": 60.45, + "learning_rate": 1.611166077738516e-06, + "loss": 0.2427, + "step": 17410 + }, + { + "epoch": 60.48, + "learning_rate": 1.6097526501766784e-06, + "loss": 0.265, + "step": 17420 + }, + { + "epoch": 60.52, + "learning_rate": 1.608339222614841e-06, + "loss": 0.2602, + "step": 17430 + }, + { + "epoch": 60.55, + "learning_rate": 1.6069257950530036e-06, + "loss": 0.2419, + "step": 17440 + }, + { + "epoch": 60.59, + "learning_rate": 1.605512367491166e-06, + "loss": 0.2363, + "step": 17450 + }, + { + "epoch": 60.62, + "learning_rate": 1.6040989399293286e-06, + "loss": 0.2614, + "step": 17460 + }, + { + "epoch": 60.66, + "learning_rate": 1.6026855123674913e-06, + "loss": 0.288, + "step": 17470 + }, + { + "epoch": 60.69, + "learning_rate": 1.6012720848056535e-06, + "loss": 0.2746, + "step": 17480 + }, + { + "epoch": 60.73, + "learning_rate": 1.5998586572438163e-06, + "loss": 0.2442, + "step": 17490 + }, + { + "epoch": 60.76, + "learning_rate": 1.598445229681979e-06, + "loss": 0.2789, + "step": 17500 + }, + { + "epoch": 60.8, + "learning_rate": 1.5970318021201411e-06, + "loss": 0.2478, + "step": 17510 + }, + { + "epoch": 60.83, + "learning_rate": 1.5956183745583037e-06, + "loss": 0.2833, + "step": 17520 + }, + { + "epoch": 60.87, + "learning_rate": 1.5942049469964664e-06, + "loss": 0.2829, + "step": 17530 + }, + { + "epoch": 60.9, + "learning_rate": 1.5927915194346288e-06, + "loss": 0.2482, + "step": 17540 + }, + { + "epoch": 60.94, + "learning_rate": 1.5913780918727914e-06, + "loss": 0.2772, + "step": 17550 + }, + { + "epoch": 60.97, + "learning_rate": 1.5899646643109538e-06, + "loss": 0.2664, + "step": 17560 + }, + { + "epoch": 61.0, + "eval_loss": 0.5191646814346313, + "eval_runtime": 133.5584, + "eval_samples_per_second": 3.983, + "eval_steps_per_second": 0.996, + "eval_wer": 0.1948961882110947, + "step": 17568 + }, + { + "epoch": 61.01, + "learning_rate": 1.5885512367491164e-06, + "loss": 0.2819, + "step": 17570 + }, + { + "epoch": 61.04, + "learning_rate": 1.587137809187279e-06, + "loss": 0.2615, + "step": 17580 + }, + { + "epoch": 61.08, + "learning_rate": 1.5857243816254414e-06, + "loss": 0.2556, + "step": 17590 + }, + { + "epoch": 61.11, + "learning_rate": 1.584310954063604e-06, + "loss": 0.2771, + "step": 17600 + }, + { + "epoch": 61.15, + "learning_rate": 1.5828975265017667e-06, + "loss": 0.2854, + "step": 17610 + }, + { + "epoch": 61.18, + "learning_rate": 1.581484098939929e-06, + "loss": 0.2554, + "step": 17620 + }, + { + "epoch": 61.21, + "learning_rate": 1.5800706713780917e-06, + "loss": 0.2597, + "step": 17630 + }, + { + "epoch": 61.25, + "learning_rate": 1.5786572438162543e-06, + "loss": 0.2422, + "step": 17640 + }, + { + "epoch": 61.28, + "learning_rate": 1.5772438162544168e-06, + "loss": 0.268, + "step": 17650 + }, + { + "epoch": 61.32, + "learning_rate": 1.5758303886925794e-06, + "loss": 0.2665, + "step": 17660 + }, + { + "epoch": 61.35, + "learning_rate": 1.574416961130742e-06, + "loss": 0.2504, + "step": 17670 + }, + { + "epoch": 61.39, + "learning_rate": 1.5730035335689044e-06, + "loss": 0.256, + "step": 17680 + }, + { + "epoch": 61.42, + "learning_rate": 1.571590106007067e-06, + "loss": 0.2634, + "step": 17690 + }, + { + "epoch": 61.46, + "learning_rate": 1.5701766784452296e-06, + "loss": 0.2538, + "step": 17700 + }, + { + "epoch": 61.49, + "learning_rate": 1.568763250883392e-06, + "loss": 0.2518, + "step": 17710 + }, + { + "epoch": 61.53, + "learning_rate": 1.5673498233215547e-06, + "loss": 0.2623, + "step": 17720 + }, + { + "epoch": 61.56, + "learning_rate": 1.565936395759717e-06, + "loss": 0.2741, + "step": 17730 + }, + { + "epoch": 61.6, + "learning_rate": 1.5645229681978797e-06, + "loss": 0.2519, + "step": 17740 + }, + { + "epoch": 61.63, + "learning_rate": 1.5631095406360423e-06, + "loss": 0.2381, + "step": 17750 + }, + { + "epoch": 61.66, + "learning_rate": 1.5616961130742047e-06, + "loss": 0.26, + "step": 17760 + }, + { + "epoch": 61.7, + "learning_rate": 1.5602826855123674e-06, + "loss": 0.2751, + "step": 17770 + }, + { + "epoch": 61.73, + "learning_rate": 1.55886925795053e-06, + "loss": 0.2536, + "step": 17780 + }, + { + "epoch": 61.77, + "learning_rate": 1.5574558303886924e-06, + "loss": 0.2614, + "step": 17790 + }, + { + "epoch": 61.8, + "learning_rate": 1.556042402826855e-06, + "loss": 0.2669, + "step": 17800 + }, + { + "epoch": 61.84, + "learning_rate": 1.5546289752650176e-06, + "loss": 0.2653, + "step": 17810 + }, + { + "epoch": 61.87, + "learning_rate": 1.55321554770318e-06, + "loss": 0.2641, + "step": 17820 + }, + { + "epoch": 61.91, + "learning_rate": 1.5518021201413427e-06, + "loss": 0.267, + "step": 17830 + }, + { + "epoch": 61.94, + "learning_rate": 1.5503886925795053e-06, + "loss": 0.2447, + "step": 17840 + }, + { + "epoch": 61.98, + "learning_rate": 1.5489752650176677e-06, + "loss": 0.2605, + "step": 17850 + }, + { + "epoch": 62.0, + "eval_loss": 0.5094706416130066, + "eval_runtime": 133.5482, + "eval_samples_per_second": 3.984, + "eval_steps_per_second": 0.996, + "eval_wer": 0.19701741981101756, + "step": 17856 + }, + { + "epoch": 62.01, + "learning_rate": 1.5475618374558303e-06, + "loss": 0.2882, + "step": 17860 + }, + { + "epoch": 62.05, + "learning_rate": 1.5461484098939927e-06, + "loss": 0.2536, + "step": 17870 + }, + { + "epoch": 62.08, + "learning_rate": 1.5447349823321554e-06, + "loss": 0.2642, + "step": 17880 + }, + { + "epoch": 62.12, + "learning_rate": 1.543321554770318e-06, + "loss": 0.2723, + "step": 17890 + }, + { + "epoch": 62.15, + "learning_rate": 1.5419081272084804e-06, + "loss": 0.2688, + "step": 17900 + }, + { + "epoch": 62.19, + "learning_rate": 1.540494699646643e-06, + "loss": 0.2406, + "step": 17910 + }, + { + "epoch": 62.22, + "learning_rate": 1.5390812720848056e-06, + "loss": 0.2617, + "step": 17920 + }, + { + "epoch": 62.26, + "learning_rate": 1.537667844522968e-06, + "loss": 0.259, + "step": 17930 + }, + { + "epoch": 62.29, + "learning_rate": 1.5362544169611307e-06, + "loss": 0.25, + "step": 17940 + }, + { + "epoch": 62.33, + "learning_rate": 1.5348409893992933e-06, + "loss": 0.2976, + "step": 17950 + }, + { + "epoch": 62.36, + "learning_rate": 1.5334275618374557e-06, + "loss": 0.2654, + "step": 17960 + }, + { + "epoch": 62.39, + "learning_rate": 1.5320141342756183e-06, + "loss": 0.2781, + "step": 17970 + }, + { + "epoch": 62.43, + "learning_rate": 1.530600706713781e-06, + "loss": 0.2588, + "step": 17980 + }, + { + "epoch": 62.46, + "learning_rate": 1.5291872791519433e-06, + "loss": 0.2336, + "step": 17990 + }, + { + "epoch": 62.5, + "learning_rate": 1.527773851590106e-06, + "loss": 0.2496, + "step": 18000 + }, + { + "epoch": 62.53, + "learning_rate": 1.5263604240282686e-06, + "loss": 0.2469, + "step": 18010 + }, + { + "epoch": 62.57, + "learning_rate": 1.524946996466431e-06, + "loss": 0.2624, + "step": 18020 + }, + { + "epoch": 62.6, + "learning_rate": 1.5235335689045936e-06, + "loss": 0.2382, + "step": 18030 + }, + { + "epoch": 62.64, + "learning_rate": 1.522120141342756e-06, + "loss": 0.2812, + "step": 18040 + }, + { + "epoch": 62.67, + "learning_rate": 1.5207067137809186e-06, + "loss": 0.2653, + "step": 18050 + }, + { + "epoch": 62.71, + "learning_rate": 1.519434628975265e-06, + "loss": 0.2644, + "step": 18060 + }, + { + "epoch": 62.74, + "learning_rate": 1.5180212014134275e-06, + "loss": 0.2725, + "step": 18070 + }, + { + "epoch": 62.78, + "learning_rate": 1.5166077738515901e-06, + "loss": 0.2444, + "step": 18080 + }, + { + "epoch": 62.81, + "learning_rate": 1.5151943462897525e-06, + "loss": 0.276, + "step": 18090 + }, + { + "epoch": 62.85, + "learning_rate": 1.5137809187279152e-06, + "loss": 0.2724, + "step": 18100 + }, + { + "epoch": 62.88, + "learning_rate": 1.5123674911660778e-06, + "loss": 0.2495, + "step": 18110 + }, + { + "epoch": 62.91, + "learning_rate": 1.5109540636042402e-06, + "loss": 0.2311, + "step": 18120 + }, + { + "epoch": 62.95, + "learning_rate": 1.5095406360424028e-06, + "loss": 0.2443, + "step": 18130 + }, + { + "epoch": 62.98, + "learning_rate": 1.5081272084805654e-06, + "loss": 0.2649, + "step": 18140 + }, + { + "epoch": 63.0, + "eval_loss": 0.5149233937263489, + "eval_runtime": 133.9576, + "eval_samples_per_second": 3.971, + "eval_steps_per_second": 0.993, + "eval_wer": 0.19695314006556533, + "step": 18144 + }, + { + "epoch": 63.02, + "learning_rate": 1.5067137809187279e-06, + "loss": 0.2642, + "step": 18150 + }, + { + "epoch": 63.06, + "learning_rate": 1.5053003533568905e-06, + "loss": 0.2526, + "step": 18160 + }, + { + "epoch": 63.09, + "learning_rate": 1.5038869257950529e-06, + "loss": 0.2483, + "step": 18170 + }, + { + "epoch": 63.12, + "learning_rate": 1.5024734982332155e-06, + "loss": 0.2617, + "step": 18180 + }, + { + "epoch": 63.16, + "learning_rate": 1.5010600706713781e-06, + "loss": 0.2942, + "step": 18190 + }, + { + "epoch": 63.19, + "learning_rate": 1.4996466431095405e-06, + "loss": 0.2672, + "step": 18200 + }, + { + "epoch": 63.23, + "learning_rate": 1.4982332155477032e-06, + "loss": 0.2541, + "step": 18210 + }, + { + "epoch": 63.26, + "learning_rate": 1.4968197879858658e-06, + "loss": 0.2403, + "step": 18220 + }, + { + "epoch": 63.3, + "learning_rate": 1.4954063604240282e-06, + "loss": 0.2749, + "step": 18230 + }, + { + "epoch": 63.33, + "learning_rate": 1.4939929328621908e-06, + "loss": 0.2812, + "step": 18240 + }, + { + "epoch": 63.37, + "learning_rate": 1.4925795053003534e-06, + "loss": 0.2279, + "step": 18250 + }, + { + "epoch": 63.4, + "learning_rate": 1.4911660777385158e-06, + "loss": 0.2552, + "step": 18260 + }, + { + "epoch": 63.44, + "learning_rate": 1.4897526501766785e-06, + "loss": 0.2594, + "step": 18270 + }, + { + "epoch": 63.47, + "learning_rate": 1.488339222614841e-06, + "loss": 0.2593, + "step": 18280 + }, + { + "epoch": 63.51, + "learning_rate": 1.4869257950530035e-06, + "loss": 0.2681, + "step": 18290 + }, + { + "epoch": 63.54, + "learning_rate": 1.4855123674911661e-06, + "loss": 0.239, + "step": 18300 + }, + { + "epoch": 63.57, + "learning_rate": 1.4840989399293287e-06, + "loss": 0.2505, + "step": 18310 + }, + { + "epoch": 63.61, + "learning_rate": 1.4826855123674911e-06, + "loss": 0.2526, + "step": 18320 + }, + { + "epoch": 63.64, + "learning_rate": 1.4812720848056538e-06, + "loss": 0.2672, + "step": 18330 + }, + { + "epoch": 63.68, + "learning_rate": 1.4798586572438162e-06, + "loss": 0.2715, + "step": 18340 + }, + { + "epoch": 63.71, + "learning_rate": 1.4784452296819788e-06, + "loss": 0.2519, + "step": 18350 + }, + { + "epoch": 63.75, + "learning_rate": 1.4770318021201414e-06, + "loss": 0.2712, + "step": 18360 + }, + { + "epoch": 63.78, + "learning_rate": 1.4756183745583038e-06, + "loss": 0.2385, + "step": 18370 + }, + { + "epoch": 63.82, + "learning_rate": 1.4742049469964664e-06, + "loss": 0.2732, + "step": 18380 + }, + { + "epoch": 63.85, + "learning_rate": 1.472791519434629e-06, + "loss": 0.2835, + "step": 18390 + }, + { + "epoch": 63.89, + "learning_rate": 1.4713780918727915e-06, + "loss": 0.2812, + "step": 18400 + }, + { + "epoch": 63.92, + "learning_rate": 1.469964664310954e-06, + "loss": 0.2488, + "step": 18410 + }, + { + "epoch": 63.96, + "learning_rate": 1.4685512367491167e-06, + "loss": 0.2607, + "step": 18420 + }, + { + "epoch": 63.99, + "learning_rate": 1.4671378091872791e-06, + "loss": 0.246, + "step": 18430 + }, + { + "epoch": 64.0, + "eval_loss": 0.5164635181427002, + "eval_runtime": 134.1849, + "eval_samples_per_second": 3.965, + "eval_steps_per_second": 0.991, + "eval_wer": 0.19753165777463522, + "step": 18432 + }, + { + "epoch": 64.03, + "learning_rate": 1.4657243816254418e-06, + "loss": 0.2641, + "step": 18440 + }, + { + "epoch": 64.06, + "learning_rate": 1.4643109540636044e-06, + "loss": 0.268, + "step": 18450 + }, + { + "epoch": 64.1, + "learning_rate": 1.4628975265017666e-06, + "loss": 0.2544, + "step": 18460 + }, + { + "epoch": 64.13, + "learning_rate": 1.4614840989399294e-06, + "loss": 0.299, + "step": 18470 + }, + { + "epoch": 64.17, + "learning_rate": 1.4600706713780916e-06, + "loss": 0.27, + "step": 18480 + }, + { + "epoch": 64.2, + "learning_rate": 1.4586572438162542e-06, + "loss": 0.2475, + "step": 18490 + }, + { + "epoch": 64.24, + "learning_rate": 1.4572438162544168e-06, + "loss": 0.262, + "step": 18500 + }, + { + "epoch": 64.27, + "learning_rate": 1.4558303886925793e-06, + "loss": 0.2591, + "step": 18510 + }, + { + "epoch": 64.3, + "learning_rate": 1.4544169611307419e-06, + "loss": 0.2448, + "step": 18520 + }, + { + "epoch": 64.34, + "learning_rate": 1.4530035335689045e-06, + "loss": 0.263, + "step": 18530 + }, + { + "epoch": 64.37, + "learning_rate": 1.451590106007067e-06, + "loss": 0.2527, + "step": 18540 + }, + { + "epoch": 64.41, + "learning_rate": 1.4501766784452295e-06, + "loss": 0.2668, + "step": 18550 + }, + { + "epoch": 64.44, + "learning_rate": 1.4487632508833921e-06, + "loss": 0.2316, + "step": 18560 + }, + { + "epoch": 64.48, + "learning_rate": 1.4473498233215546e-06, + "loss": 0.2757, + "step": 18570 + }, + { + "epoch": 64.51, + "learning_rate": 1.4459363957597172e-06, + "loss": 0.2749, + "step": 18580 + }, + { + "epoch": 64.55, + "learning_rate": 1.4445229681978798e-06, + "loss": 0.2537, + "step": 18590 + }, + { + "epoch": 64.58, + "learning_rate": 1.4431095406360422e-06, + "loss": 0.2663, + "step": 18600 + }, + { + "epoch": 64.62, + "learning_rate": 1.4416961130742048e-06, + "loss": 0.2525, + "step": 18610 + }, + { + "epoch": 64.65, + "learning_rate": 1.4402826855123675e-06, + "loss": 0.2669, + "step": 18620 + }, + { + "epoch": 64.69, + "learning_rate": 1.4388692579505299e-06, + "loss": 0.2724, + "step": 18630 + }, + { + "epoch": 64.72, + "learning_rate": 1.4374558303886925e-06, + "loss": 0.2506, + "step": 18640 + }, + { + "epoch": 64.75, + "learning_rate": 1.4360424028268549e-06, + "loss": 0.2458, + "step": 18650 + }, + { + "epoch": 64.79, + "learning_rate": 1.4346289752650175e-06, + "loss": 0.2545, + "step": 18660 + }, + { + "epoch": 64.82, + "learning_rate": 1.4332155477031801e-06, + "loss": 0.2623, + "step": 18670 + }, + { + "epoch": 64.86, + "learning_rate": 1.4318021201413425e-06, + "loss": 0.2512, + "step": 18680 + }, + { + "epoch": 64.89, + "learning_rate": 1.4303886925795052e-06, + "loss": 0.2394, + "step": 18690 + }, + { + "epoch": 64.93, + "learning_rate": 1.4289752650176678e-06, + "loss": 0.2602, + "step": 18700 + }, + { + "epoch": 64.96, + "learning_rate": 1.4275618374558302e-06, + "loss": 0.2483, + "step": 18710 + }, + { + "epoch": 65.0, + "learning_rate": 1.4261484098939928e-06, + "loss": 0.2567, + "step": 18720 + }, + { + "epoch": 65.0, + "eval_loss": 0.5072118043899536, + "eval_runtime": 134.0915, + "eval_samples_per_second": 3.967, + "eval_steps_per_second": 0.992, + "eval_wer": 0.19811017548370508, + "step": 18720 + }, + { + "epoch": 65.03, + "learning_rate": 1.4247349823321554e-06, + "loss": 0.2677, + "step": 18730 + }, + { + "epoch": 65.07, + "learning_rate": 1.4233215547703178e-06, + "loss": 0.2524, + "step": 18740 + }, + { + "epoch": 65.1, + "learning_rate": 1.4219081272084805e-06, + "loss": 0.2628, + "step": 18750 + }, + { + "epoch": 65.14, + "learning_rate": 1.420494699646643e-06, + "loss": 0.2743, + "step": 18760 + }, + { + "epoch": 65.17, + "learning_rate": 1.4190812720848055e-06, + "loss": 0.2692, + "step": 18770 + }, + { + "epoch": 65.21, + "learning_rate": 1.4176678445229681e-06, + "loss": 0.2551, + "step": 18780 + }, + { + "epoch": 65.24, + "learning_rate": 1.4162544169611305e-06, + "loss": 0.2416, + "step": 18790 + }, + { + "epoch": 65.28, + "learning_rate": 1.4148409893992932e-06, + "loss": 0.2516, + "step": 18800 + }, + { + "epoch": 65.31, + "learning_rate": 1.4134275618374558e-06, + "loss": 0.2842, + "step": 18810 + }, + { + "epoch": 65.35, + "learning_rate": 1.4120141342756182e-06, + "loss": 0.263, + "step": 18820 + }, + { + "epoch": 65.38, + "learning_rate": 1.4106007067137808e-06, + "loss": 0.2531, + "step": 18830 + }, + { + "epoch": 65.42, + "learning_rate": 1.4091872791519434e-06, + "loss": 0.2536, + "step": 18840 + }, + { + "epoch": 65.45, + "learning_rate": 1.4077738515901058e-06, + "loss": 0.2741, + "step": 18850 + }, + { + "epoch": 65.48, + "learning_rate": 1.4063604240282685e-06, + "loss": 0.2675, + "step": 18860 + }, + { + "epoch": 65.52, + "learning_rate": 1.404946996466431e-06, + "loss": 0.2597, + "step": 18870 + }, + { + "epoch": 65.55, + "learning_rate": 1.4035335689045935e-06, + "loss": 0.259, + "step": 18880 + }, + { + "epoch": 65.59, + "learning_rate": 1.4021201413427561e-06, + "loss": 0.2586, + "step": 18890 + }, + { + "epoch": 65.62, + "learning_rate": 1.4007067137809187e-06, + "loss": 0.2473, + "step": 18900 + }, + { + "epoch": 65.66, + "learning_rate": 1.3992932862190811e-06, + "loss": 0.2679, + "step": 18910 + }, + { + "epoch": 65.69, + "learning_rate": 1.3978798586572438e-06, + "loss": 0.2429, + "step": 18920 + }, + { + "epoch": 65.73, + "learning_rate": 1.3964664310954064e-06, + "loss": 0.2521, + "step": 18930 + }, + { + "epoch": 65.76, + "learning_rate": 1.3950530035335688e-06, + "loss": 0.2651, + "step": 18940 + }, + { + "epoch": 65.8, + "learning_rate": 1.3936395759717314e-06, + "loss": 0.243, + "step": 18950 + }, + { + "epoch": 65.83, + "learning_rate": 1.3922261484098938e-06, + "loss": 0.26, + "step": 18960 + }, + { + "epoch": 65.87, + "learning_rate": 1.3908127208480564e-06, + "loss": 0.2509, + "step": 18970 + }, + { + "epoch": 65.9, + "learning_rate": 1.389399293286219e-06, + "loss": 0.2528, + "step": 18980 + }, + { + "epoch": 65.94, + "learning_rate": 1.3879858657243815e-06, + "loss": 0.2602, + "step": 18990 + }, + { + "epoch": 65.97, + "learning_rate": 1.386572438162544e-06, + "loss": 0.2509, + "step": 19000 + }, + { + "epoch": 66.0, + "eval_loss": 0.5061087012290955, + "eval_runtime": 133.4932, + "eval_samples_per_second": 3.985, + "eval_steps_per_second": 0.996, + "eval_wer": 0.19778877675644405, + "step": 19008 + }, + { + "epoch": 66.01, + "learning_rate": 1.3851590106007067e-06, + "loss": 0.2801, + "step": 19010 + }, + { + "epoch": 66.04, + "learning_rate": 1.3837455830388691e-06, + "loss": 0.256, + "step": 19020 + }, + { + "epoch": 66.08, + "learning_rate": 1.3823321554770318e-06, + "loss": 0.2356, + "step": 19030 + }, + { + "epoch": 66.11, + "learning_rate": 1.3809187279151944e-06, + "loss": 0.2594, + "step": 19040 + }, + { + "epoch": 66.15, + "learning_rate": 1.3795053003533568e-06, + "loss": 0.2468, + "step": 19050 + }, + { + "epoch": 66.18, + "learning_rate": 1.3780918727915194e-06, + "loss": 0.2661, + "step": 19060 + }, + { + "epoch": 66.21, + "learning_rate": 1.376678445229682e-06, + "loss": 0.2664, + "step": 19070 + }, + { + "epoch": 66.25, + "learning_rate": 1.3752650176678444e-06, + "loss": 0.266, + "step": 19080 + }, + { + "epoch": 66.28, + "learning_rate": 1.373851590106007e-06, + "loss": 0.2531, + "step": 19090 + }, + { + "epoch": 66.32, + "learning_rate": 1.3724381625441695e-06, + "loss": 0.2631, + "step": 19100 + }, + { + "epoch": 66.35, + "learning_rate": 1.371024734982332e-06, + "loss": 0.2732, + "step": 19110 + }, + { + "epoch": 66.39, + "learning_rate": 1.3696113074204947e-06, + "loss": 0.2584, + "step": 19120 + }, + { + "epoch": 66.42, + "learning_rate": 1.3681978798586571e-06, + "loss": 0.2374, + "step": 19130 + }, + { + "epoch": 66.46, + "learning_rate": 1.3667844522968197e-06, + "loss": 0.2653, + "step": 19140 + }, + { + "epoch": 66.49, + "learning_rate": 1.3653710247349824e-06, + "loss": 0.2614, + "step": 19150 + }, + { + "epoch": 66.53, + "learning_rate": 1.3639575971731448e-06, + "loss": 0.2625, + "step": 19160 + }, + { + "epoch": 66.56, + "learning_rate": 1.3625441696113074e-06, + "loss": 0.2558, + "step": 19170 + }, + { + "epoch": 66.6, + "learning_rate": 1.36113074204947e-06, + "loss": 0.2759, + "step": 19180 + }, + { + "epoch": 66.63, + "learning_rate": 1.3597173144876324e-06, + "loss": 0.238, + "step": 19190 + }, + { + "epoch": 66.66, + "learning_rate": 1.358303886925795e-06, + "loss": 0.2661, + "step": 19200 + }, + { + "epoch": 66.7, + "learning_rate": 1.3568904593639577e-06, + "loss": 0.2439, + "step": 19210 + }, + { + "epoch": 66.73, + "learning_rate": 1.35547703180212e-06, + "loss": 0.251, + "step": 19220 + }, + { + "epoch": 66.77, + "learning_rate": 1.3540636042402827e-06, + "loss": 0.2693, + "step": 19230 + }, + { + "epoch": 66.8, + "learning_rate": 1.3526501766784453e-06, + "loss": 0.2361, + "step": 19240 + }, + { + "epoch": 66.84, + "learning_rate": 1.3512367491166077e-06, + "loss": 0.2761, + "step": 19250 + }, + { + "epoch": 66.87, + "learning_rate": 1.3498233215547703e-06, + "loss": 0.2546, + "step": 19260 + }, + { + "epoch": 66.91, + "learning_rate": 1.3484098939929328e-06, + "loss": 0.251, + "step": 19270 + }, + { + "epoch": 66.94, + "learning_rate": 1.3469964664310954e-06, + "loss": 0.2381, + "step": 19280 + }, + { + "epoch": 66.98, + "learning_rate": 1.345583038869258e-06, + "loss": 0.289, + "step": 19290 + }, + { + "epoch": 67.0, + "eval_loss": 0.5087379217147827, + "eval_runtime": 134.753, + "eval_samples_per_second": 3.948, + "eval_steps_per_second": 0.987, + "eval_wer": 0.19573182490197338, + "step": 19296 + }, + { + "epoch": 67.01, + "learning_rate": 1.3441696113074204e-06, + "loss": 0.255, + "step": 19300 + }, + { + "epoch": 67.05, + "learning_rate": 1.342756183745583e-06, + "loss": 0.2501, + "step": 19310 + }, + { + "epoch": 67.08, + "learning_rate": 1.3413427561837457e-06, + "loss": 0.2529, + "step": 19320 + }, + { + "epoch": 67.12, + "learning_rate": 1.339929328621908e-06, + "loss": 0.2559, + "step": 19330 + }, + { + "epoch": 67.15, + "learning_rate": 1.3385159010600707e-06, + "loss": 0.2783, + "step": 19340 + }, + { + "epoch": 67.19, + "learning_rate": 1.3371024734982333e-06, + "loss": 0.2495, + "step": 19350 + }, + { + "epoch": 67.22, + "learning_rate": 1.3356890459363957e-06, + "loss": 0.2414, + "step": 19360 + }, + { + "epoch": 67.26, + "learning_rate": 1.3342756183745583e-06, + "loss": 0.2584, + "step": 19370 + }, + { + "epoch": 67.29, + "learning_rate": 1.332862190812721e-06, + "loss": 0.2553, + "step": 19380 + }, + { + "epoch": 67.33, + "learning_rate": 1.3314487632508834e-06, + "loss": 0.2712, + "step": 19390 + }, + { + "epoch": 67.36, + "learning_rate": 1.330035335689046e-06, + "loss": 0.2593, + "step": 19400 + }, + { + "epoch": 67.39, + "learning_rate": 1.3286219081272084e-06, + "loss": 0.2656, + "step": 19410 + }, + { + "epoch": 67.43, + "learning_rate": 1.327208480565371e-06, + "loss": 0.237, + "step": 19420 + }, + { + "epoch": 67.46, + "learning_rate": 1.3257950530035336e-06, + "loss": 0.262, + "step": 19430 + }, + { + "epoch": 67.5, + "learning_rate": 1.324381625441696e-06, + "loss": 0.2545, + "step": 19440 + }, + { + "epoch": 67.53, + "learning_rate": 1.3229681978798587e-06, + "loss": 0.2582, + "step": 19450 + }, + { + "epoch": 67.57, + "learning_rate": 1.3215547703180213e-06, + "loss": 0.2508, + "step": 19460 + }, + { + "epoch": 67.6, + "learning_rate": 1.3201413427561837e-06, + "loss": 0.2401, + "step": 19470 + }, + { + "epoch": 67.64, + "learning_rate": 1.3187279151943463e-06, + "loss": 0.2543, + "step": 19480 + }, + { + "epoch": 67.67, + "learning_rate": 1.317314487632509e-06, + "loss": 0.2467, + "step": 19490 + }, + { + "epoch": 67.71, + "learning_rate": 1.3159010600706714e-06, + "loss": 0.2675, + "step": 19500 + }, + { + "epoch": 67.74, + "learning_rate": 1.314487632508834e-06, + "loss": 0.2792, + "step": 19510 + }, + { + "epoch": 67.78, + "learning_rate": 1.3130742049469966e-06, + "loss": 0.2734, + "step": 19520 + }, + { + "epoch": 67.81, + "learning_rate": 1.311660777385159e-06, + "loss": 0.2645, + "step": 19530 + }, + { + "epoch": 67.85, + "learning_rate": 1.3102473498233216e-06, + "loss": 0.284, + "step": 19540 + }, + { + "epoch": 67.88, + "learning_rate": 1.3088339222614842e-06, + "loss": 0.2687, + "step": 19550 + }, + { + "epoch": 67.91, + "learning_rate": 1.3074204946996464e-06, + "loss": 0.2661, + "step": 19560 + }, + { + "epoch": 67.95, + "learning_rate": 1.306007067137809e-06, + "loss": 0.2568, + "step": 19570 + }, + { + "epoch": 67.98, + "learning_rate": 1.3045936395759715e-06, + "loss": 0.2511, + "step": 19580 + }, + { + "epoch": 68.0, + "eval_loss": 0.516753077507019, + "eval_runtime": 134.5773, + "eval_samples_per_second": 3.953, + "eval_steps_per_second": 0.988, + "eval_wer": 0.1981744552291573, + "step": 19584 + }, + { + "epoch": 68.02, + "learning_rate": 1.303180212014134e-06, + "loss": 0.2656, + "step": 19590 + }, + { + "epoch": 68.06, + "learning_rate": 1.3017667844522967e-06, + "loss": 0.2578, + "step": 19600 + }, + { + "epoch": 68.09, + "learning_rate": 1.3003533568904591e-06, + "loss": 0.2424, + "step": 19610 + }, + { + "epoch": 68.12, + "learning_rate": 1.2989399293286217e-06, + "loss": 0.264, + "step": 19620 + }, + { + "epoch": 68.16, + "learning_rate": 1.2975265017667844e-06, + "loss": 0.2589, + "step": 19630 + }, + { + "epoch": 68.19, + "learning_rate": 1.2961130742049468e-06, + "loss": 0.2536, + "step": 19640 + }, + { + "epoch": 68.23, + "learning_rate": 1.2946996466431094e-06, + "loss": 0.2713, + "step": 19650 + }, + { + "epoch": 68.26, + "learning_rate": 1.293286219081272e-06, + "loss": 0.2517, + "step": 19660 + }, + { + "epoch": 68.3, + "learning_rate": 1.2918727915194344e-06, + "loss": 0.271, + "step": 19670 + }, + { + "epoch": 68.33, + "learning_rate": 1.290459363957597e-06, + "loss": 0.2754, + "step": 19680 + }, + { + "epoch": 68.37, + "learning_rate": 1.2890459363957597e-06, + "loss": 0.2486, + "step": 19690 + }, + { + "epoch": 68.4, + "learning_rate": 1.287632508833922e-06, + "loss": 0.2627, + "step": 19700 + }, + { + "epoch": 68.44, + "learning_rate": 1.2862190812720847e-06, + "loss": 0.2434, + "step": 19710 + }, + { + "epoch": 68.47, + "learning_rate": 1.2848056537102471e-06, + "loss": 0.2685, + "step": 19720 + }, + { + "epoch": 68.51, + "learning_rate": 1.2833922261484097e-06, + "loss": 0.2677, + "step": 19730 + }, + { + "epoch": 68.54, + "learning_rate": 1.2819787985865724e-06, + "loss": 0.2783, + "step": 19740 + }, + { + "epoch": 68.57, + "learning_rate": 1.2805653710247348e-06, + "loss": 0.2518, + "step": 19750 + }, + { + "epoch": 68.61, + "learning_rate": 1.2791519434628974e-06, + "loss": 0.2521, + "step": 19760 + }, + { + "epoch": 68.64, + "learning_rate": 1.27773851590106e-06, + "loss": 0.2613, + "step": 19770 + }, + { + "epoch": 68.68, + "learning_rate": 1.2763250883392224e-06, + "loss": 0.2718, + "step": 19780 + }, + { + "epoch": 68.71, + "learning_rate": 1.274911660777385e-06, + "loss": 0.2337, + "step": 19790 + }, + { + "epoch": 68.75, + "learning_rate": 1.2734982332155477e-06, + "loss": 0.2617, + "step": 19800 + }, + { + "epoch": 68.78, + "learning_rate": 1.27208480565371e-06, + "loss": 0.2588, + "step": 19810 + }, + { + "epoch": 68.82, + "learning_rate": 1.2706713780918727e-06, + "loss": 0.254, + "step": 19820 + }, + { + "epoch": 68.85, + "learning_rate": 1.2692579505300353e-06, + "loss": 0.2595, + "step": 19830 + }, + { + "epoch": 68.89, + "learning_rate": 1.2678445229681977e-06, + "loss": 0.2418, + "step": 19840 + }, + { + "epoch": 68.92, + "learning_rate": 1.2664310954063603e-06, + "loss": 0.2567, + "step": 19850 + }, + { + "epoch": 68.96, + "learning_rate": 1.265017667844523e-06, + "loss": 0.2671, + "step": 19860 + }, + { + "epoch": 68.99, + "learning_rate": 1.2636042402826854e-06, + "loss": 0.2623, + "step": 19870 + }, + { + "epoch": 69.0, + "eval_loss": 0.5109707117080688, + "eval_runtime": 133.3708, + "eval_samples_per_second": 3.989, + "eval_steps_per_second": 0.997, + "eval_wer": 0.1958603843928778, + "step": 19872 + }, + { + "epoch": 69.03, + "learning_rate": 1.262190812720848e-06, + "loss": 0.2721, + "step": 19880 + }, + { + "epoch": 69.06, + "learning_rate": 1.2607773851590104e-06, + "loss": 0.2508, + "step": 19890 + }, + { + "epoch": 69.1, + "learning_rate": 1.259363957597173e-06, + "loss": 0.2522, + "step": 19900 + }, + { + "epoch": 69.13, + "learning_rate": 1.2579505300353356e-06, + "loss": 0.2842, + "step": 19910 + }, + { + "epoch": 69.17, + "learning_rate": 1.256537102473498e-06, + "loss": 0.2641, + "step": 19920 + }, + { + "epoch": 69.2, + "learning_rate": 1.2551236749116607e-06, + "loss": 0.2427, + "step": 19930 + }, + { + "epoch": 69.24, + "learning_rate": 1.2537102473498233e-06, + "loss": 0.2805, + "step": 19940 + }, + { + "epoch": 69.27, + "learning_rate": 1.2522968197879857e-06, + "loss": 0.254, + "step": 19950 + }, + { + "epoch": 69.3, + "learning_rate": 1.2508833922261483e-06, + "loss": 0.2651, + "step": 19960 + }, + { + "epoch": 69.34, + "learning_rate": 1.249469964664311e-06, + "loss": 0.2748, + "step": 19970 + }, + { + "epoch": 69.37, + "learning_rate": 1.2480565371024734e-06, + "loss": 0.2592, + "step": 19980 + }, + { + "epoch": 69.41, + "learning_rate": 1.246643109540636e-06, + "loss": 0.2652, + "step": 19990 + }, + { + "epoch": 69.44, + "learning_rate": 1.2452296819787986e-06, + "loss": 0.2382, + "step": 20000 + }, + { + "epoch": 69.48, + "learning_rate": 1.243816254416961e-06, + "loss": 0.2769, + "step": 20010 + }, + { + "epoch": 69.51, + "learning_rate": 1.2424028268551236e-06, + "loss": 0.2448, + "step": 20020 + }, + { + "epoch": 69.55, + "learning_rate": 1.240989399293286e-06, + "loss": 0.2392, + "step": 20030 + }, + { + "epoch": 69.58, + "learning_rate": 1.2395759717314487e-06, + "loss": 0.2546, + "step": 20040 + }, + { + "epoch": 69.62, + "learning_rate": 1.2381625441696113e-06, + "loss": 0.2472, + "step": 20050 + }, + { + "epoch": 69.65, + "learning_rate": 1.2367491166077737e-06, + "loss": 0.2772, + "step": 20060 + }, + { + "epoch": 69.69, + "learning_rate": 1.2353356890459363e-06, + "loss": 0.2799, + "step": 20070 + }, + { + "epoch": 69.72, + "learning_rate": 1.233922261484099e-06, + "loss": 0.2458, + "step": 20080 + }, + { + "epoch": 69.75, + "learning_rate": 1.2325088339222613e-06, + "loss": 0.2776, + "step": 20090 + }, + { + "epoch": 69.79, + "learning_rate": 1.231095406360424e-06, + "loss": 0.2571, + "step": 20100 + }, + { + "epoch": 69.82, + "learning_rate": 1.2296819787985866e-06, + "loss": 0.2464, + "step": 20110 + }, + { + "epoch": 69.86, + "learning_rate": 1.228268551236749e-06, + "loss": 0.2765, + "step": 20120 + }, + { + "epoch": 69.89, + "learning_rate": 1.2268551236749116e-06, + "loss": 0.2443, + "step": 20130 + }, + { + "epoch": 69.93, + "learning_rate": 1.2254416961130742e-06, + "loss": 0.2432, + "step": 20140 + }, + { + "epoch": 69.96, + "learning_rate": 1.2240282685512367e-06, + "loss": 0.2482, + "step": 20150 + }, + { + "epoch": 70.0, + "learning_rate": 1.2226148409893993e-06, + "loss": 0.2762, + "step": 20160 + }, + { + "epoch": 70.0, + "eval_loss": 0.5123195648193359, + "eval_runtime": 133.6748, + "eval_samples_per_second": 3.98, + "eval_steps_per_second": 0.995, + "eval_wer": 0.19592466413833, + "step": 20160 + }, + { + "epoch": 70.03, + "learning_rate": 1.221201413427562e-06, + "loss": 0.2698, + "step": 20170 + }, + { + "epoch": 70.07, + "learning_rate": 1.2197879858657243e-06, + "loss": 0.231, + "step": 20180 + }, + { + "epoch": 70.1, + "learning_rate": 1.218374558303887e-06, + "loss": 0.2392, + "step": 20190 + }, + { + "epoch": 70.14, + "learning_rate": 1.2169611307420493e-06, + "loss": 0.2549, + "step": 20200 + }, + { + "epoch": 70.17, + "learning_rate": 1.215547703180212e-06, + "loss": 0.2701, + "step": 20210 + }, + { + "epoch": 70.21, + "learning_rate": 1.2141342756183746e-06, + "loss": 0.2526, + "step": 20220 + }, + { + "epoch": 70.24, + "learning_rate": 1.212720848056537e-06, + "loss": 0.2654, + "step": 20230 + }, + { + "epoch": 70.28, + "learning_rate": 1.2113074204946996e-06, + "loss": 0.2659, + "step": 20240 + }, + { + "epoch": 70.31, + "learning_rate": 1.2098939929328622e-06, + "loss": 0.2583, + "step": 20250 + }, + { + "epoch": 70.35, + "learning_rate": 1.2084805653710246e-06, + "loss": 0.2559, + "step": 20260 + }, + { + "epoch": 70.38, + "learning_rate": 1.2070671378091873e-06, + "loss": 0.2498, + "step": 20270 + }, + { + "epoch": 70.42, + "learning_rate": 1.2056537102473499e-06, + "loss": 0.2515, + "step": 20280 + }, + { + "epoch": 70.45, + "learning_rate": 1.2042402826855123e-06, + "loss": 0.2389, + "step": 20290 + }, + { + "epoch": 70.48, + "learning_rate": 1.202826855123675e-06, + "loss": 0.2793, + "step": 20300 + }, + { + "epoch": 70.52, + "learning_rate": 1.2014134275618375e-06, + "loss": 0.2548, + "step": 20310 + }, + { + "epoch": 70.55, + "learning_rate": 1.2e-06, + "loss": 0.243, + "step": 20320 + }, + { + "epoch": 70.59, + "learning_rate": 1.1985865724381626e-06, + "loss": 0.2314, + "step": 20330 + }, + { + "epoch": 70.62, + "learning_rate": 1.197173144876325e-06, + "loss": 0.2416, + "step": 20340 + }, + { + "epoch": 70.66, + "learning_rate": 1.1957597173144876e-06, + "loss": 0.2705, + "step": 20350 + }, + { + "epoch": 70.69, + "learning_rate": 1.1943462897526502e-06, + "loss": 0.2564, + "step": 20360 + }, + { + "epoch": 70.73, + "learning_rate": 1.1929328621908126e-06, + "loss": 0.2683, + "step": 20370 + }, + { + "epoch": 70.76, + "learning_rate": 1.1915194346289753e-06, + "loss": 0.2626, + "step": 20380 + }, + { + "epoch": 70.8, + "learning_rate": 1.1901060070671379e-06, + "loss": 0.2484, + "step": 20390 + }, + { + "epoch": 70.83, + "learning_rate": 1.1886925795053003e-06, + "loss": 0.2649, + "step": 20400 + }, + { + "epoch": 70.87, + "learning_rate": 1.187279151943463e-06, + "loss": 0.255, + "step": 20410 + }, + { + "epoch": 70.9, + "learning_rate": 1.1858657243816255e-06, + "loss": 0.253, + "step": 20420 + }, + { + "epoch": 70.94, + "learning_rate": 1.184452296819788e-06, + "loss": 0.2373, + "step": 20430 + }, + { + "epoch": 70.97, + "learning_rate": 1.1830388692579506e-06, + "loss": 0.2704, + "step": 20440 + }, + { + "epoch": 71.0, + "eval_loss": 0.5117577314376831, + "eval_runtime": 133.058, + "eval_samples_per_second": 3.998, + "eval_steps_per_second": 1.0, + "eval_wer": 0.1965674615928521, + "step": 20448 + }, + { + "epoch": 71.01, + "learning_rate": 1.1816254416961132e-06, + "loss": 0.2783, + "step": 20450 + }, + { + "epoch": 71.04, + "learning_rate": 1.1802120141342756e-06, + "loss": 0.2665, + "step": 20460 + }, + { + "epoch": 71.08, + "learning_rate": 1.1787985865724382e-06, + "loss": 0.2626, + "step": 20470 + }, + { + "epoch": 71.11, + "learning_rate": 1.1773851590106008e-06, + "loss": 0.2544, + "step": 20480 + }, + { + "epoch": 71.15, + "learning_rate": 1.1759717314487632e-06, + "loss": 0.2526, + "step": 20490 + }, + { + "epoch": 71.18, + "learning_rate": 1.1745583038869259e-06, + "loss": 0.2749, + "step": 20500 + }, + { + "epoch": 71.21, + "learning_rate": 1.1731448763250883e-06, + "loss": 0.2545, + "step": 20510 + }, + { + "epoch": 71.25, + "learning_rate": 1.1717314487632509e-06, + "loss": 0.2475, + "step": 20520 + }, + { + "epoch": 71.28, + "learning_rate": 1.1703180212014135e-06, + "loss": 0.2502, + "step": 20530 + }, + { + "epoch": 71.32, + "learning_rate": 1.168904593639576e-06, + "loss": 0.2452, + "step": 20540 + }, + { + "epoch": 71.35, + "learning_rate": 1.1676325088339224e-06, + "loss": 0.2562, + "step": 20550 + }, + { + "epoch": 71.39, + "learning_rate": 1.1662190812720846e-06, + "loss": 0.2364, + "step": 20560 + }, + { + "epoch": 71.42, + "learning_rate": 1.1648056537102472e-06, + "loss": 0.2529, + "step": 20570 + }, + { + "epoch": 71.46, + "learning_rate": 1.1633922261484098e-06, + "loss": 0.2561, + "step": 20580 + }, + { + "epoch": 71.49, + "learning_rate": 1.1619787985865722e-06, + "loss": 0.2726, + "step": 20590 + }, + { + "epoch": 71.53, + "learning_rate": 1.1605653710247349e-06, + "loss": 0.2774, + "step": 20600 + }, + { + "epoch": 71.56, + "learning_rate": 1.1591519434628975e-06, + "loss": 0.2541, + "step": 20610 + }, + { + "epoch": 71.6, + "learning_rate": 1.1577385159010599e-06, + "loss": 0.2512, + "step": 20620 + }, + { + "epoch": 71.63, + "learning_rate": 1.1563250883392225e-06, + "loss": 0.2532, + "step": 20630 + }, + { + "epoch": 71.66, + "learning_rate": 1.154911660777385e-06, + "loss": 0.2639, + "step": 20640 + }, + { + "epoch": 71.7, + "learning_rate": 1.1534982332155475e-06, + "loss": 0.2573, + "step": 20650 + }, + { + "epoch": 71.73, + "learning_rate": 1.1520848056537102e-06, + "loss": 0.2662, + "step": 20660 + }, + { + "epoch": 71.77, + "learning_rate": 1.1506713780918726e-06, + "loss": 0.2486, + "step": 20670 + }, + { + "epoch": 71.8, + "learning_rate": 1.1492579505300352e-06, + "loss": 0.2563, + "step": 20680 + }, + { + "epoch": 71.84, + "learning_rate": 1.1478445229681978e-06, + "loss": 0.2631, + "step": 20690 + }, + { + "epoch": 71.87, + "learning_rate": 1.1464310954063602e-06, + "loss": 0.2697, + "step": 20700 + }, + { + "epoch": 71.91, + "learning_rate": 1.1450176678445228e-06, + "loss": 0.2478, + "step": 20710 + }, + { + "epoch": 71.94, + "learning_rate": 1.1436042402826855e-06, + "loss": 0.2436, + "step": 20720 + }, + { + "epoch": 71.98, + "learning_rate": 1.1421908127208479e-06, + "loss": 0.2854, + "step": 20730 + }, + { + "epoch": 72.0, + "eval_loss": 0.5127651691436768, + "eval_runtime": 133.8804, + "eval_samples_per_second": 3.974, + "eval_steps_per_second": 0.993, + "eval_wer": 0.1948961882110947, + "step": 20736 + }, + { + "epoch": 72.01, + "learning_rate": 1.1407773851590105e-06, + "loss": 0.2796, + "step": 20740 + }, + { + "epoch": 72.05, + "learning_rate": 1.1393639575971731e-06, + "loss": 0.2772, + "step": 20750 + }, + { + "epoch": 72.08, + "learning_rate": 1.1379505300353355e-06, + "loss": 0.2524, + "step": 20760 + }, + { + "epoch": 72.12, + "learning_rate": 1.1365371024734981e-06, + "loss": 0.2331, + "step": 20770 + }, + { + "epoch": 72.15, + "learning_rate": 1.1351236749116608e-06, + "loss": 0.2678, + "step": 20780 + }, + { + "epoch": 72.19, + "learning_rate": 1.1337102473498232e-06, + "loss": 0.2769, + "step": 20790 + }, + { + "epoch": 72.22, + "learning_rate": 1.1322968197879858e-06, + "loss": 0.2535, + "step": 20800 + }, + { + "epoch": 72.26, + "learning_rate": 1.1308833922261482e-06, + "loss": 0.2478, + "step": 20810 + }, + { + "epoch": 72.29, + "learning_rate": 1.1294699646643108e-06, + "loss": 0.2383, + "step": 20820 + }, + { + "epoch": 72.33, + "learning_rate": 1.1280565371024735e-06, + "loss": 0.2699, + "step": 20830 + }, + { + "epoch": 72.36, + "learning_rate": 1.1266431095406359e-06, + "loss": 0.2635, + "step": 20840 + }, + { + "epoch": 72.39, + "learning_rate": 1.1252296819787985e-06, + "loss": 0.2566, + "step": 20850 + }, + { + "epoch": 72.43, + "learning_rate": 1.123816254416961e-06, + "loss": 0.2414, + "step": 20860 + }, + { + "epoch": 72.46, + "learning_rate": 1.1224028268551235e-06, + "loss": 0.2522, + "step": 20870 + }, + { + "epoch": 72.5, + "learning_rate": 1.1209893992932861e-06, + "loss": 0.2483, + "step": 20880 + }, + { + "epoch": 72.53, + "learning_rate": 1.1195759717314488e-06, + "loss": 0.2597, + "step": 20890 + }, + { + "epoch": 72.57, + "learning_rate": 1.1181625441696112e-06, + "loss": 0.2576, + "step": 20900 + }, + { + "epoch": 72.6, + "learning_rate": 1.1167491166077738e-06, + "loss": 0.2525, + "step": 20910 + }, + { + "epoch": 72.64, + "learning_rate": 1.1153356890459364e-06, + "loss": 0.2679, + "step": 20920 + }, + { + "epoch": 72.67, + "learning_rate": 1.1139222614840988e-06, + "loss": 0.2634, + "step": 20930 + }, + { + "epoch": 72.71, + "learning_rate": 1.1125088339222614e-06, + "loss": 0.2325, + "step": 20940 + }, + { + "epoch": 72.74, + "learning_rate": 1.1110954063604238e-06, + "loss": 0.2625, + "step": 20950 + }, + { + "epoch": 72.78, + "learning_rate": 1.1096819787985865e-06, + "loss": 0.2442, + "step": 20960 + }, + { + "epoch": 72.81, + "learning_rate": 1.108268551236749e-06, + "loss": 0.2651, + "step": 20970 + }, + { + "epoch": 72.85, + "learning_rate": 1.1068551236749115e-06, + "loss": 0.2531, + "step": 20980 + }, + { + "epoch": 72.88, + "learning_rate": 1.1054416961130741e-06, + "loss": 0.2444, + "step": 20990 + }, + { + "epoch": 72.91, + "learning_rate": 1.1040282685512367e-06, + "loss": 0.2735, + "step": 21000 + }, + { + "epoch": 72.95, + "learning_rate": 1.1026148409893992e-06, + "loss": 0.2528, + "step": 21010 + }, + { + "epoch": 72.98, + "learning_rate": 1.1012014134275618e-06, + "loss": 0.2602, + "step": 21020 + }, + { + "epoch": 73.0, + "eval_loss": 0.5094349384307861, + "eval_runtime": 134.0533, + "eval_samples_per_second": 3.969, + "eval_steps_per_second": 0.992, + "eval_wer": 0.1966317413383043, + "step": 21024 + }, + { + "epoch": 73.02, + "learning_rate": 1.0997879858657244e-06, + "loss": 0.2639, + "step": 21030 + }, + { + "epoch": 73.06, + "learning_rate": 1.0983745583038868e-06, + "loss": 0.2614, + "step": 21040 + }, + { + "epoch": 73.09, + "learning_rate": 1.0969611307420494e-06, + "loss": 0.2265, + "step": 21050 + }, + { + "epoch": 73.12, + "learning_rate": 1.095547703180212e-06, + "loss": 0.2721, + "step": 21060 + }, + { + "epoch": 73.16, + "learning_rate": 1.0941342756183745e-06, + "loss": 0.2645, + "step": 21070 + }, + { + "epoch": 73.19, + "learning_rate": 1.092720848056537e-06, + "loss": 0.2381, + "step": 21080 + }, + { + "epoch": 73.23, + "learning_rate": 1.0913074204946997e-06, + "loss": 0.2458, + "step": 21090 + }, + { + "epoch": 73.26, + "learning_rate": 1.0898939929328621e-06, + "loss": 0.2378, + "step": 21100 + }, + { + "epoch": 73.3, + "learning_rate": 1.0884805653710247e-06, + "loss": 0.2567, + "step": 21110 + }, + { + "epoch": 73.33, + "learning_rate": 1.0870671378091871e-06, + "loss": 0.264, + "step": 21120 + }, + { + "epoch": 73.37, + "learning_rate": 1.0856537102473498e-06, + "loss": 0.2563, + "step": 21130 + }, + { + "epoch": 73.4, + "learning_rate": 1.0842402826855124e-06, + "loss": 0.2683, + "step": 21140 + }, + { + "epoch": 73.44, + "learning_rate": 1.0828268551236748e-06, + "loss": 0.2692, + "step": 21150 + }, + { + "epoch": 73.47, + "learning_rate": 1.0814134275618374e-06, + "loss": 0.2751, + "step": 21160 + }, + { + "epoch": 73.51, + "learning_rate": 1.08e-06, + "loss": 0.2638, + "step": 21170 + }, + { + "epoch": 73.54, + "learning_rate": 1.0785865724381624e-06, + "loss": 0.2333, + "step": 21180 + }, + { + "epoch": 73.57, + "learning_rate": 1.077173144876325e-06, + "loss": 0.2784, + "step": 21190 + }, + { + "epoch": 73.61, + "learning_rate": 1.0757597173144877e-06, + "loss": 0.2539, + "step": 21200 + }, + { + "epoch": 73.64, + "learning_rate": 1.07434628975265e-06, + "loss": 0.2442, + "step": 21210 + }, + { + "epoch": 73.68, + "learning_rate": 1.0729328621908127e-06, + "loss": 0.2633, + "step": 21220 + }, + { + "epoch": 73.71, + "learning_rate": 1.0715194346289753e-06, + "loss": 0.2318, + "step": 21230 + }, + { + "epoch": 73.75, + "learning_rate": 1.0701060070671377e-06, + "loss": 0.259, + "step": 21240 + }, + { + "epoch": 73.78, + "learning_rate": 1.0686925795053004e-06, + "loss": 0.2351, + "step": 21250 + }, + { + "epoch": 73.82, + "learning_rate": 1.0672791519434628e-06, + "loss": 0.2904, + "step": 21260 + }, + { + "epoch": 73.85, + "learning_rate": 1.0658657243816254e-06, + "loss": 0.2636, + "step": 21270 + }, + { + "epoch": 73.89, + "learning_rate": 1.064452296819788e-06, + "loss": 0.2746, + "step": 21280 + }, + { + "epoch": 73.92, + "learning_rate": 1.0630388692579504e-06, + "loss": 0.2249, + "step": 21290 + }, + { + "epoch": 73.96, + "learning_rate": 1.061625441696113e-06, + "loss": 0.257, + "step": 21300 + }, + { + "epoch": 73.99, + "learning_rate": 1.0602120141342757e-06, + "loss": 0.2675, + "step": 21310 + }, + { + "epoch": 74.0, + "eval_loss": 0.5058467388153076, + "eval_runtime": 133.957, + "eval_samples_per_second": 3.971, + "eval_steps_per_second": 0.993, + "eval_wer": 0.19605322362923444, + "step": 21312 + }, + { + "epoch": 74.03, + "learning_rate": 1.058798586572438e-06, + "loss": 0.2531, + "step": 21320 + }, + { + "epoch": 74.06, + "learning_rate": 1.0573851590106007e-06, + "loss": 0.241, + "step": 21330 + }, + { + "epoch": 74.1, + "learning_rate": 1.0559717314487633e-06, + "loss": 0.2388, + "step": 21340 + }, + { + "epoch": 74.13, + "learning_rate": 1.0545583038869257e-06, + "loss": 0.2513, + "step": 21350 + }, + { + "epoch": 74.17, + "learning_rate": 1.0531448763250884e-06, + "loss": 0.2672, + "step": 21360 + }, + { + "epoch": 74.2, + "learning_rate": 1.051731448763251e-06, + "loss": 0.2415, + "step": 21370 + }, + { + "epoch": 74.24, + "learning_rate": 1.0503180212014134e-06, + "loss": 0.2492, + "step": 21380 + }, + { + "epoch": 74.27, + "learning_rate": 1.048904593639576e-06, + "loss": 0.2421, + "step": 21390 + }, + { + "epoch": 74.3, + "learning_rate": 1.0474911660777386e-06, + "loss": 0.2926, + "step": 21400 + }, + { + "epoch": 74.34, + "learning_rate": 1.046077738515901e-06, + "loss": 0.2639, + "step": 21410 + }, + { + "epoch": 74.37, + "learning_rate": 1.0446643109540637e-06, + "loss": 0.2357, + "step": 21420 + }, + { + "epoch": 74.41, + "learning_rate": 1.043250883392226e-06, + "loss": 0.2707, + "step": 21430 + }, + { + "epoch": 74.44, + "learning_rate": 1.0418374558303887e-06, + "loss": 0.2426, + "step": 21440 + }, + { + "epoch": 74.48, + "learning_rate": 1.0404240282685513e-06, + "loss": 0.2743, + "step": 21450 + }, + { + "epoch": 74.51, + "learning_rate": 1.0390106007067137e-06, + "loss": 0.2739, + "step": 21460 + }, + { + "epoch": 74.55, + "learning_rate": 1.0375971731448763e-06, + "loss": 0.2391, + "step": 21470 + }, + { + "epoch": 74.58, + "learning_rate": 1.036183745583039e-06, + "loss": 0.2781, + "step": 21480 + }, + { + "epoch": 74.62, + "learning_rate": 1.0347703180212014e-06, + "loss": 0.2666, + "step": 21490 + }, + { + "epoch": 74.65, + "learning_rate": 1.033356890459364e-06, + "loss": 0.2484, + "step": 21500 + }, + { + "epoch": 74.69, + "learning_rate": 1.0319434628975266e-06, + "loss": 0.2529, + "step": 21510 + }, + { + "epoch": 74.72, + "learning_rate": 1.030530035335689e-06, + "loss": 0.2447, + "step": 21520 + }, + { + "epoch": 74.75, + "learning_rate": 1.0291166077738516e-06, + "loss": 0.2399, + "step": 21530 + }, + { + "epoch": 74.79, + "learning_rate": 1.0277031802120143e-06, + "loss": 0.2519, + "step": 21540 + }, + { + "epoch": 74.82, + "learning_rate": 1.0262897526501767e-06, + "loss": 0.2689, + "step": 21550 + }, + { + "epoch": 74.86, + "learning_rate": 1.0248763250883393e-06, + "loss": 0.2558, + "step": 21560 + }, + { + "epoch": 74.89, + "learning_rate": 1.0234628975265017e-06, + "loss": 0.2466, + "step": 21570 + }, + { + "epoch": 74.93, + "learning_rate": 1.0220494699646643e-06, + "loss": 0.2463, + "step": 21580 + }, + { + "epoch": 74.96, + "learning_rate": 1.020636042402827e-06, + "loss": 0.2776, + "step": 21590 + }, + { + "epoch": 75.0, + "learning_rate": 1.0192226148409894e-06, + "loss": 0.2519, + "step": 21600 + }, + { + "epoch": 75.0, + "eval_loss": 0.5216230750083923, + "eval_runtime": 133.9162, + "eval_samples_per_second": 3.973, + "eval_steps_per_second": 0.993, + "eval_wer": 0.19875297293822716, + "step": 21600 + }, + { + "epoch": 75.03, + "learning_rate": 1.017809187279152e-06, + "loss": 0.2963, + "step": 21610 + }, + { + "epoch": 75.07, + "learning_rate": 1.0163957597173146e-06, + "loss": 0.2578, + "step": 21620 + }, + { + "epoch": 75.1, + "learning_rate": 1.0149823321554768e-06, + "loss": 0.2693, + "step": 21630 + }, + { + "epoch": 75.14, + "learning_rate": 1.0135689045936394e-06, + "loss": 0.2924, + "step": 21640 + }, + { + "epoch": 75.17, + "learning_rate": 1.012155477031802e-06, + "loss": 0.2423, + "step": 21650 + }, + { + "epoch": 75.21, + "learning_rate": 1.0107420494699645e-06, + "loss": 0.2563, + "step": 21660 + }, + { + "epoch": 75.24, + "learning_rate": 1.009328621908127e-06, + "loss": 0.267, + "step": 21670 + }, + { + "epoch": 75.28, + "learning_rate": 1.0079151943462897e-06, + "loss": 0.2634, + "step": 21680 + }, + { + "epoch": 75.31, + "learning_rate": 1.0065017667844521e-06, + "loss": 0.2661, + "step": 21690 + }, + { + "epoch": 75.35, + "learning_rate": 1.0050883392226147e-06, + "loss": 0.2425, + "step": 21700 + }, + { + "epoch": 75.38, + "learning_rate": 1.0036749116607774e-06, + "loss": 0.2592, + "step": 21710 + }, + { + "epoch": 75.42, + "learning_rate": 1.0022614840989398e-06, + "loss": 0.236, + "step": 21720 + }, + { + "epoch": 75.45, + "learning_rate": 1.0008480565371024e-06, + "loss": 0.2506, + "step": 21730 + }, + { + "epoch": 75.48, + "learning_rate": 9.99434628975265e-07, + "loss": 0.2746, + "step": 21740 + }, + { + "epoch": 75.52, + "learning_rate": 9.980212014134274e-07, + "loss": 0.2696, + "step": 21750 + }, + { + "epoch": 75.55, + "learning_rate": 9.9660777385159e-07, + "loss": 0.249, + "step": 21760 + }, + { + "epoch": 75.59, + "learning_rate": 9.951943462897527e-07, + "loss": 0.2845, + "step": 21770 + }, + { + "epoch": 75.62, + "learning_rate": 9.93780918727915e-07, + "loss": 0.2298, + "step": 21780 + }, + { + "epoch": 75.66, + "learning_rate": 9.923674911660777e-07, + "loss": 0.2675, + "step": 21790 + }, + { + "epoch": 75.69, + "learning_rate": 9.909540636042403e-07, + "loss": 0.2734, + "step": 21800 + }, + { + "epoch": 75.73, + "learning_rate": 9.895406360424027e-07, + "loss": 0.244, + "step": 21810 + }, + { + "epoch": 75.76, + "learning_rate": 9.881272084805653e-07, + "loss": 0.2333, + "step": 21820 + }, + { + "epoch": 75.8, + "learning_rate": 9.86713780918728e-07, + "loss": 0.226, + "step": 21830 + }, + { + "epoch": 75.83, + "learning_rate": 9.853003533568904e-07, + "loss": 0.2542, + "step": 21840 + }, + { + "epoch": 75.87, + "learning_rate": 9.83886925795053e-07, + "loss": 0.283, + "step": 21850 + }, + { + "epoch": 75.9, + "learning_rate": 9.824734982332154e-07, + "loss": 0.2332, + "step": 21860 + }, + { + "epoch": 75.94, + "learning_rate": 9.81060070671378e-07, + "loss": 0.2518, + "step": 21870 + }, + { + "epoch": 75.97, + "learning_rate": 9.796466431095406e-07, + "loss": 0.2666, + "step": 21880 + }, + { + "epoch": 76.0, + "eval_loss": 0.5116772651672363, + "eval_runtime": 134.0532, + "eval_samples_per_second": 3.969, + "eval_steps_per_second": 0.992, + "eval_wer": 0.1958603843928778, + "step": 21888 + }, + { + "epoch": 76.01, + "learning_rate": 9.78233215547703e-07, + "loss": 0.2766, + "step": 21890 + }, + { + "epoch": 76.04, + "learning_rate": 9.768197879858657e-07, + "loss": 0.2281, + "step": 21900 + }, + { + "epoch": 76.08, + "learning_rate": 9.754063604240283e-07, + "loss": 0.2703, + "step": 21910 + }, + { + "epoch": 76.11, + "learning_rate": 9.739929328621907e-07, + "loss": 0.258, + "step": 21920 + }, + { + "epoch": 76.15, + "learning_rate": 9.725795053003533e-07, + "loss": 0.2614, + "step": 21930 + }, + { + "epoch": 76.18, + "learning_rate": 9.71166077738516e-07, + "loss": 0.2773, + "step": 21940 + }, + { + "epoch": 76.21, + "learning_rate": 9.697526501766784e-07, + "loss": 0.2701, + "step": 21950 + }, + { + "epoch": 76.25, + "learning_rate": 9.68339222614841e-07, + "loss": 0.2416, + "step": 21960 + }, + { + "epoch": 76.28, + "learning_rate": 9.669257950530036e-07, + "loss": 0.2547, + "step": 21970 + }, + { + "epoch": 76.32, + "learning_rate": 9.65512367491166e-07, + "loss": 0.2483, + "step": 21980 + }, + { + "epoch": 76.35, + "learning_rate": 9.640989399293286e-07, + "loss": 0.2473, + "step": 21990 + }, + { + "epoch": 76.39, + "learning_rate": 9.62685512367491e-07, + "loss": 0.2471, + "step": 22000 + }, + { + "epoch": 76.42, + "learning_rate": 9.612720848056537e-07, + "loss": 0.2323, + "step": 22010 + }, + { + "epoch": 76.46, + "learning_rate": 9.598586572438163e-07, + "loss": 0.276, + "step": 22020 + }, + { + "epoch": 76.49, + "learning_rate": 9.584452296819787e-07, + "loss": 0.2644, + "step": 22030 + }, + { + "epoch": 76.53, + "learning_rate": 9.570318021201413e-07, + "loss": 0.2605, + "step": 22040 + }, + { + "epoch": 76.56, + "learning_rate": 9.55618374558304e-07, + "loss": 0.2717, + "step": 22050 + }, + { + "epoch": 76.6, + "learning_rate": 9.542049469964663e-07, + "loss": 0.2534, + "step": 22060 + }, + { + "epoch": 76.63, + "learning_rate": 9.52791519434629e-07, + "loss": 0.2359, + "step": 22070 + }, + { + "epoch": 76.66, + "learning_rate": 9.513780918727915e-07, + "loss": 0.2806, + "step": 22080 + }, + { + "epoch": 76.7, + "learning_rate": 9.49964664310954e-07, + "loss": 0.2575, + "step": 22090 + }, + { + "epoch": 76.73, + "learning_rate": 9.485512367491165e-07, + "loss": 0.2439, + "step": 22100 + }, + { + "epoch": 76.77, + "learning_rate": 9.471378091872791e-07, + "loss": 0.2618, + "step": 22110 + }, + { + "epoch": 76.8, + "learning_rate": 9.457243816254416e-07, + "loss": 0.2445, + "step": 22120 + }, + { + "epoch": 76.84, + "learning_rate": 9.443109540636042e-07, + "loss": 0.2525, + "step": 22130 + }, + { + "epoch": 76.87, + "learning_rate": 9.428975265017668e-07, + "loss": 0.2441, + "step": 22140 + }, + { + "epoch": 76.91, + "learning_rate": 9.414840989399293e-07, + "loss": 0.259, + "step": 22150 + }, + { + "epoch": 76.94, + "learning_rate": 9.400706713780918e-07, + "loss": 0.2506, + "step": 22160 + }, + { + "epoch": 76.98, + "learning_rate": 9.386572438162543e-07, + "loss": 0.2637, + "step": 22170 + }, + { + "epoch": 77.0, + "eval_loss": 0.5057582259178162, + "eval_runtime": 134.4046, + "eval_samples_per_second": 3.958, + "eval_steps_per_second": 0.99, + "eval_wer": 0.19566754515652118, + "step": 22176 + }, + { + "epoch": 77.01, + "learning_rate": 9.37243816254417e-07, + "loss": 0.2561, + "step": 22180 + }, + { + "epoch": 77.05, + "learning_rate": 9.358303886925795e-07, + "loss": 0.2573, + "step": 22190 + }, + { + "epoch": 77.08, + "learning_rate": 9.34416961130742e-07, + "loss": 0.2447, + "step": 22200 + }, + { + "epoch": 77.12, + "learning_rate": 9.330035335689046e-07, + "loss": 0.2532, + "step": 22210 + }, + { + "epoch": 77.15, + "learning_rate": 9.315901060070671e-07, + "loss": 0.2602, + "step": 22220 + }, + { + "epoch": 77.19, + "learning_rate": 9.301766784452296e-07, + "loss": 0.2541, + "step": 22230 + }, + { + "epoch": 77.22, + "learning_rate": 9.287632508833922e-07, + "loss": 0.2406, + "step": 22240 + }, + { + "epoch": 77.26, + "learning_rate": 9.273498233215548e-07, + "loss": 0.2469, + "step": 22250 + }, + { + "epoch": 77.29, + "learning_rate": 9.259363957597173e-07, + "loss": 0.2633, + "step": 22260 + }, + { + "epoch": 77.33, + "learning_rate": 9.245229681978798e-07, + "loss": 0.2607, + "step": 22270 + }, + { + "epoch": 77.36, + "learning_rate": 9.231095406360424e-07, + "loss": 0.2627, + "step": 22280 + }, + { + "epoch": 77.39, + "learning_rate": 9.216961130742049e-07, + "loss": 0.2787, + "step": 22290 + }, + { + "epoch": 77.43, + "learning_rate": 9.202826855123675e-07, + "loss": 0.2381, + "step": 22300 + }, + { + "epoch": 77.46, + "learning_rate": 9.1886925795053e-07, + "loss": 0.2736, + "step": 22310 + }, + { + "epoch": 77.5, + "learning_rate": 9.174558303886926e-07, + "loss": 0.2599, + "step": 22320 + }, + { + "epoch": 77.53, + "learning_rate": 9.160424028268551e-07, + "loss": 0.2563, + "step": 22330 + }, + { + "epoch": 77.57, + "learning_rate": 9.146289752650176e-07, + "loss": 0.2467, + "step": 22340 + }, + { + "epoch": 77.6, + "learning_rate": 9.132155477031802e-07, + "loss": 0.2582, + "step": 22350 + }, + { + "epoch": 77.64, + "learning_rate": 9.118021201413428e-07, + "loss": 0.2677, + "step": 22360 + }, + { + "epoch": 77.67, + "learning_rate": 9.103886925795053e-07, + "loss": 0.2752, + "step": 22370 + }, + { + "epoch": 77.71, + "learning_rate": 9.089752650176679e-07, + "loss": 0.2373, + "step": 22380 + }, + { + "epoch": 77.74, + "learning_rate": 9.075618374558304e-07, + "loss": 0.2476, + "step": 22390 + }, + { + "epoch": 77.78, + "learning_rate": 9.061484098939929e-07, + "loss": 0.2542, + "step": 22400 + }, + { + "epoch": 77.81, + "learning_rate": 9.047349823321554e-07, + "loss": 0.2466, + "step": 22410 + }, + { + "epoch": 77.85, + "learning_rate": 9.033215547703181e-07, + "loss": 0.2581, + "step": 22420 + }, + { + "epoch": 77.88, + "learning_rate": 9.019081272084806e-07, + "loss": 0.2594, + "step": 22430 + }, + { + "epoch": 77.91, + "learning_rate": 9.00494699646643e-07, + "loss": 0.2615, + "step": 22440 + }, + { + "epoch": 77.95, + "learning_rate": 8.990812720848057e-07, + "loss": 0.2566, + "step": 22450 + }, + { + "epoch": 77.98, + "learning_rate": 8.976678445229681e-07, + "loss": 0.273, + "step": 22460 + }, + { + "epoch": 78.0, + "eval_loss": 0.5186824798583984, + "eval_runtime": 133.6981, + "eval_samples_per_second": 3.979, + "eval_steps_per_second": 0.995, + "eval_wer": 0.1966317413383043, + "step": 22464 + }, + { + "epoch": 78.02, + "learning_rate": 8.962544169611306e-07, + "loss": 0.2666, + "step": 22470 + }, + { + "epoch": 78.06, + "learning_rate": 8.948409893992932e-07, + "loss": 0.2591, + "step": 22480 + }, + { + "epoch": 78.09, + "learning_rate": 8.934275618374558e-07, + "loss": 0.2377, + "step": 22490 + }, + { + "epoch": 78.12, + "learning_rate": 8.920141342756183e-07, + "loss": 0.2836, + "step": 22500 + }, + { + "epoch": 78.16, + "learning_rate": 8.906007067137808e-07, + "loss": 0.2657, + "step": 22510 + }, + { + "epoch": 78.19, + "learning_rate": 8.891872791519434e-07, + "loss": 0.2613, + "step": 22520 + }, + { + "epoch": 78.23, + "learning_rate": 8.877738515901059e-07, + "loss": 0.2644, + "step": 22530 + }, + { + "epoch": 78.26, + "learning_rate": 8.863604240282685e-07, + "loss": 0.2435, + "step": 22540 + }, + { + "epoch": 78.3, + "learning_rate": 8.84946996466431e-07, + "loss": 0.2693, + "step": 22550 + }, + { + "epoch": 78.33, + "learning_rate": 8.835335689045936e-07, + "loss": 0.2531, + "step": 22560 + }, + { + "epoch": 78.37, + "learning_rate": 8.821201413427561e-07, + "loss": 0.2535, + "step": 22570 + }, + { + "epoch": 78.4, + "learning_rate": 8.807067137809186e-07, + "loss": 0.2645, + "step": 22580 + }, + { + "epoch": 78.44, + "learning_rate": 8.792932862190812e-07, + "loss": 0.2336, + "step": 22590 + }, + { + "epoch": 78.47, + "learning_rate": 8.778798586572438e-07, + "loss": 0.2474, + "step": 22600 + }, + { + "epoch": 78.51, + "learning_rate": 8.764664310954063e-07, + "loss": 0.2524, + "step": 22610 + }, + { + "epoch": 78.54, + "learning_rate": 8.750530035335688e-07, + "loss": 0.2246, + "step": 22620 + }, + { + "epoch": 78.57, + "learning_rate": 8.736395759717314e-07, + "loss": 0.2573, + "step": 22630 + }, + { + "epoch": 78.61, + "learning_rate": 8.722261484098939e-07, + "loss": 0.2482, + "step": 22640 + }, + { + "epoch": 78.64, + "learning_rate": 8.708127208480564e-07, + "loss": 0.272, + "step": 22650 + }, + { + "epoch": 78.68, + "learning_rate": 8.693992932862191e-07, + "loss": 0.266, + "step": 22660 + }, + { + "epoch": 78.71, + "learning_rate": 8.679858657243816e-07, + "loss": 0.262, + "step": 22670 + }, + { + "epoch": 78.75, + "learning_rate": 8.665724381625441e-07, + "loss": 0.2503, + "step": 22680 + }, + { + "epoch": 78.78, + "learning_rate": 8.651590106007067e-07, + "loss": 0.2554, + "step": 22690 + }, + { + "epoch": 78.82, + "learning_rate": 8.637455830388692e-07, + "loss": 0.263, + "step": 22700 + }, + { + "epoch": 78.85, + "learning_rate": 8.623321554770318e-07, + "loss": 0.269, + "step": 22710 + }, + { + "epoch": 78.89, + "learning_rate": 8.609187279151943e-07, + "loss": 0.262, + "step": 22720 + }, + { + "epoch": 78.92, + "learning_rate": 8.595053003533569e-07, + "loss": 0.2698, + "step": 22730 + }, + { + "epoch": 78.96, + "learning_rate": 8.580918727915194e-07, + "loss": 0.255, + "step": 22740 + }, + { + "epoch": 78.99, + "learning_rate": 8.566784452296819e-07, + "loss": 0.2666, + "step": 22750 + }, + { + "epoch": 79.0, + "eval_loss": 0.5175613760948181, + "eval_runtime": 134.3104, + "eval_samples_per_second": 3.961, + "eval_steps_per_second": 0.99, + "eval_wer": 0.19579610464742558, + "step": 22752 + }, + { + "epoch": 79.03, + "learning_rate": 8.552650176678445e-07, + "loss": 0.2381, + "step": 22760 + }, + { + "epoch": 79.06, + "learning_rate": 8.538515901060071e-07, + "loss": 0.2487, + "step": 22770 + }, + { + "epoch": 79.1, + "learning_rate": 8.524381625441696e-07, + "loss": 0.2621, + "step": 22780 + }, + { + "epoch": 79.13, + "learning_rate": 8.510247349823321e-07, + "loss": 0.271, + "step": 22790 + }, + { + "epoch": 79.17, + "learning_rate": 8.496113074204947e-07, + "loss": 0.2689, + "step": 22800 + }, + { + "epoch": 79.2, + "learning_rate": 8.481978798586572e-07, + "loss": 0.2351, + "step": 22810 + }, + { + "epoch": 79.24, + "learning_rate": 8.467844522968197e-07, + "loss": 0.2733, + "step": 22820 + }, + { + "epoch": 79.27, + "learning_rate": 8.453710247349824e-07, + "loss": 0.2436, + "step": 22830 + }, + { + "epoch": 79.3, + "learning_rate": 8.439575971731449e-07, + "loss": 0.2628, + "step": 22840 + }, + { + "epoch": 79.34, + "learning_rate": 8.425441696113074e-07, + "loss": 0.251, + "step": 22850 + }, + { + "epoch": 79.37, + "learning_rate": 8.411307420494699e-07, + "loss": 0.258, + "step": 22860 + }, + { + "epoch": 79.41, + "learning_rate": 8.397173144876325e-07, + "loss": 0.242, + "step": 22870 + }, + { + "epoch": 79.44, + "learning_rate": 8.38303886925795e-07, + "loss": 0.2446, + "step": 22880 + }, + { + "epoch": 79.48, + "learning_rate": 8.368904593639576e-07, + "loss": 0.2683, + "step": 22890 + }, + { + "epoch": 79.51, + "learning_rate": 8.354770318021202e-07, + "loss": 0.2686, + "step": 22900 + }, + { + "epoch": 79.55, + "learning_rate": 8.340636042402827e-07, + "loss": 0.2717, + "step": 22910 + }, + { + "epoch": 79.58, + "learning_rate": 8.326501766784452e-07, + "loss": 0.2373, + "step": 22920 + }, + { + "epoch": 79.62, + "learning_rate": 8.312367491166077e-07, + "loss": 0.2399, + "step": 22930 + }, + { + "epoch": 79.65, + "learning_rate": 8.298233215547703e-07, + "loss": 0.2867, + "step": 22940 + }, + { + "epoch": 79.69, + "learning_rate": 8.284098939929329e-07, + "loss": 0.277, + "step": 22950 + }, + { + "epoch": 79.72, + "learning_rate": 8.269964664310954e-07, + "loss": 0.2399, + "step": 22960 + }, + { + "epoch": 79.75, + "learning_rate": 8.25583038869258e-07, + "loss": 0.2537, + "step": 22970 + }, + { + "epoch": 79.79, + "learning_rate": 8.241696113074205e-07, + "loss": 0.2491, + "step": 22980 + }, + { + "epoch": 79.82, + "learning_rate": 8.227561837455829e-07, + "loss": 0.2747, + "step": 22990 + }, + { + "epoch": 79.86, + "learning_rate": 8.213427561837457e-07, + "loss": 0.2612, + "step": 23000 + }, + { + "epoch": 79.89, + "learning_rate": 8.199293286219081e-07, + "loss": 0.2455, + "step": 23010 + }, + { + "epoch": 79.93, + "learning_rate": 8.185159010600706e-07, + "loss": 0.2593, + "step": 23020 + }, + { + "epoch": 79.96, + "learning_rate": 8.171024734982331e-07, + "loss": 0.258, + "step": 23030 + }, + { + "epoch": 80.0, + "learning_rate": 8.156890459363957e-07, + "loss": 0.2627, + "step": 23040 + }, + { + "epoch": 80.0, + "eval_loss": 0.5141689777374268, + "eval_runtime": 133.6944, + "eval_samples_per_second": 3.979, + "eval_steps_per_second": 0.995, + "eval_wer": 0.1949604679565469, + "step": 23040 + }, + { + "epoch": 80.03, + "learning_rate": 8.142756183745582e-07, + "loss": 0.2598, + "step": 23050 + }, + { + "epoch": 80.07, + "learning_rate": 8.128621908127207e-07, + "loss": 0.2679, + "step": 23060 + }, + { + "epoch": 80.1, + "learning_rate": 8.114487632508834e-07, + "loss": 0.223, + "step": 23070 + }, + { + "epoch": 80.14, + "learning_rate": 8.100353356890459e-07, + "loss": 0.2692, + "step": 23080 + }, + { + "epoch": 80.17, + "learning_rate": 8.086219081272084e-07, + "loss": 0.2647, + "step": 23090 + }, + { + "epoch": 80.21, + "learning_rate": 8.072084805653709e-07, + "loss": 0.2544, + "step": 23100 + }, + { + "epoch": 80.24, + "learning_rate": 8.057950530035335e-07, + "loss": 0.2579, + "step": 23110 + }, + { + "epoch": 80.28, + "learning_rate": 8.04381625441696e-07, + "loss": 0.246, + "step": 23120 + }, + { + "epoch": 80.31, + "learning_rate": 8.029681978798586e-07, + "loss": 0.2714, + "step": 23130 + }, + { + "epoch": 80.35, + "learning_rate": 8.015547703180212e-07, + "loss": 0.2763, + "step": 23140 + }, + { + "epoch": 80.38, + "learning_rate": 8.001413427561837e-07, + "loss": 0.2489, + "step": 23150 + }, + { + "epoch": 80.42, + "learning_rate": 7.987279151943462e-07, + "loss": 0.2382, + "step": 23160 + }, + { + "epoch": 80.45, + "learning_rate": 7.973144876325087e-07, + "loss": 0.2712, + "step": 23170 + }, + { + "epoch": 80.48, + "learning_rate": 7.959010600706714e-07, + "loss": 0.2612, + "step": 23180 + }, + { + "epoch": 80.52, + "learning_rate": 7.944876325088339e-07, + "loss": 0.2573, + "step": 23190 + }, + { + "epoch": 80.55, + "learning_rate": 7.930742049469964e-07, + "loss": 0.2412, + "step": 23200 + }, + { + "epoch": 80.59, + "learning_rate": 7.91660777385159e-07, + "loss": 0.262, + "step": 23210 + }, + { + "epoch": 80.62, + "learning_rate": 7.902473498233215e-07, + "loss": 0.2555, + "step": 23220 + }, + { + "epoch": 80.66, + "learning_rate": 7.88833922261484e-07, + "loss": 0.2685, + "step": 23230 + }, + { + "epoch": 80.69, + "learning_rate": 7.874204946996466e-07, + "loss": 0.2427, + "step": 23240 + }, + { + "epoch": 80.73, + "learning_rate": 7.860070671378092e-07, + "loss": 0.2629, + "step": 23250 + }, + { + "epoch": 80.76, + "learning_rate": 7.845936395759717e-07, + "loss": 0.248, + "step": 23260 + }, + { + "epoch": 80.8, + "learning_rate": 7.831802120141342e-07, + "loss": 0.2413, + "step": 23270 + }, + { + "epoch": 80.83, + "learning_rate": 7.817667844522968e-07, + "loss": 0.2675, + "step": 23280 + }, + { + "epoch": 80.87, + "learning_rate": 7.803533568904593e-07, + "loss": 0.263, + "step": 23290 + }, + { + "epoch": 80.9, + "learning_rate": 7.789399293286219e-07, + "loss": 0.2674, + "step": 23300 + }, + { + "epoch": 80.94, + "learning_rate": 7.775265017667845e-07, + "loss": 0.2567, + "step": 23310 + }, + { + "epoch": 80.97, + "learning_rate": 7.76113074204947e-07, + "loss": 0.2508, + "step": 23320 + }, + { + "epoch": 81.0, + "eval_loss": 0.5157809853553772, + "eval_runtime": 134.6235, + "eval_samples_per_second": 3.952, + "eval_steps_per_second": 0.988, + "eval_wer": 0.19605322362923444, + "step": 23328 + }, + { + "epoch": 81.01, + "learning_rate": 7.746996466431095e-07, + "loss": 0.289, + "step": 23330 + }, + { + "epoch": 81.04, + "learning_rate": 7.73286219081272e-07, + "loss": 0.2503, + "step": 23340 + }, + { + "epoch": 81.08, + "learning_rate": 7.718727915194346e-07, + "loss": 0.2387, + "step": 23350 + }, + { + "epoch": 81.11, + "learning_rate": 7.704593639575972e-07, + "loss": 0.2675, + "step": 23360 + }, + { + "epoch": 81.15, + "learning_rate": 7.690459363957597e-07, + "loss": 0.2534, + "step": 23370 + }, + { + "epoch": 81.18, + "learning_rate": 7.676325088339223e-07, + "loss": 0.2603, + "step": 23380 + }, + { + "epoch": 81.21, + "learning_rate": 7.662190812720848e-07, + "loss": 0.2545, + "step": 23390 + }, + { + "epoch": 81.25, + "learning_rate": 7.648056537102473e-07, + "loss": 0.2617, + "step": 23400 + }, + { + "epoch": 81.28, + "learning_rate": 7.633922261484098e-07, + "loss": 0.2495, + "step": 23410 + }, + { + "epoch": 81.32, + "learning_rate": 7.619787985865725e-07, + "loss": 0.2608, + "step": 23420 + }, + { + "epoch": 81.35, + "learning_rate": 7.60565371024735e-07, + "loss": 0.2561, + "step": 23430 + }, + { + "epoch": 81.39, + "learning_rate": 7.591519434628975e-07, + "loss": 0.2487, + "step": 23440 + }, + { + "epoch": 81.42, + "learning_rate": 7.577385159010601e-07, + "loss": 0.2522, + "step": 23450 + }, + { + "epoch": 81.46, + "learning_rate": 7.563250883392226e-07, + "loss": 0.2796, + "step": 23460 + }, + { + "epoch": 81.49, + "learning_rate": 7.549116607773851e-07, + "loss": 0.2516, + "step": 23470 + }, + { + "epoch": 81.53, + "learning_rate": 7.534982332155477e-07, + "loss": 0.2653, + "step": 23480 + }, + { + "epoch": 81.56, + "learning_rate": 7.520848056537103e-07, + "loss": 0.2627, + "step": 23490 + }, + { + "epoch": 81.6, + "learning_rate": 7.506713780918728e-07, + "loss": 0.2524, + "step": 23500 + }, + { + "epoch": 81.63, + "learning_rate": 7.492579505300353e-07, + "loss": 0.2545, + "step": 23510 + }, + { + "epoch": 81.66, + "learning_rate": 7.478445229681979e-07, + "loss": 0.2838, + "step": 23520 + }, + { + "epoch": 81.7, + "learning_rate": 7.464310954063605e-07, + "loss": 0.25, + "step": 23530 + }, + { + "epoch": 81.73, + "learning_rate": 7.450176678445229e-07, + "loss": 0.2702, + "step": 23540 + }, + { + "epoch": 81.77, + "learning_rate": 7.436042402826854e-07, + "loss": 0.2521, + "step": 23550 + }, + { + "epoch": 81.8, + "learning_rate": 7.42190812720848e-07, + "loss": 0.2537, + "step": 23560 + }, + { + "epoch": 81.84, + "learning_rate": 7.407773851590105e-07, + "loss": 0.2731, + "step": 23570 + }, + { + "epoch": 81.87, + "learning_rate": 7.39363957597173e-07, + "loss": 0.2441, + "step": 23580 + }, + { + "epoch": 81.91, + "learning_rate": 7.379505300353357e-07, + "loss": 0.2541, + "step": 23590 + }, + { + "epoch": 81.94, + "learning_rate": 7.365371024734982e-07, + "loss": 0.2546, + "step": 23600 + }, + { + "epoch": 81.98, + "learning_rate": 7.351236749116607e-07, + "loss": 0.2499, + "step": 23610 + }, + { + "epoch": 82.0, + "eval_loss": 0.5130564570426941, + "eval_runtime": 134.0023, + "eval_samples_per_second": 3.97, + "eval_steps_per_second": 0.993, + "eval_wer": 0.19695314006556533, + "step": 23616 + }, + { + "epoch": 82.01, + "learning_rate": 7.337102473498233e-07, + "loss": 0.2829, + "step": 23620 + }, + { + "epoch": 82.05, + "learning_rate": 7.322968197879858e-07, + "loss": 0.2725, + "step": 23630 + }, + { + "epoch": 82.08, + "learning_rate": 7.308833922261483e-07, + "loss": 0.2439, + "step": 23640 + }, + { + "epoch": 82.12, + "learning_rate": 7.294699646643108e-07, + "loss": 0.2534, + "step": 23650 + }, + { + "epoch": 82.15, + "learning_rate": 7.280565371024735e-07, + "loss": 0.2644, + "step": 23660 + }, + { + "epoch": 82.19, + "learning_rate": 7.26643109540636e-07, + "loss": 0.2402, + "step": 23670 + }, + { + "epoch": 82.22, + "learning_rate": 7.252296819787985e-07, + "loss": 0.2337, + "step": 23680 + }, + { + "epoch": 82.26, + "learning_rate": 7.238162544169611e-07, + "loss": 0.2612, + "step": 23690 + }, + { + "epoch": 82.29, + "learning_rate": 7.224028268551236e-07, + "loss": 0.276, + "step": 23700 + }, + { + "epoch": 82.33, + "learning_rate": 7.209893992932862e-07, + "loss": 0.275, + "step": 23710 + }, + { + "epoch": 82.36, + "learning_rate": 7.195759717314487e-07, + "loss": 0.2353, + "step": 23720 + }, + { + "epoch": 82.39, + "learning_rate": 7.181625441696113e-07, + "loss": 0.2435, + "step": 23730 + }, + { + "epoch": 82.43, + "learning_rate": 7.167491166077738e-07, + "loss": 0.2574, + "step": 23740 + }, + { + "epoch": 82.46, + "learning_rate": 7.153356890459363e-07, + "loss": 0.2834, + "step": 23750 + }, + { + "epoch": 82.5, + "learning_rate": 7.139222614840989e-07, + "loss": 0.2714, + "step": 23760 + }, + { + "epoch": 82.53, + "learning_rate": 7.125088339222615e-07, + "loss": 0.2523, + "step": 23770 + }, + { + "epoch": 82.57, + "learning_rate": 7.11095406360424e-07, + "loss": 0.2729, + "step": 23780 + }, + { + "epoch": 82.6, + "learning_rate": 7.096819787985865e-07, + "loss": 0.2366, + "step": 23790 + }, + { + "epoch": 82.64, + "learning_rate": 7.082685512367491e-07, + "loss": 0.2644, + "step": 23800 + }, + { + "epoch": 82.67, + "learning_rate": 7.068551236749116e-07, + "loss": 0.2382, + "step": 23810 + }, + { + "epoch": 82.71, + "learning_rate": 7.054416961130741e-07, + "loss": 0.2489, + "step": 23820 + }, + { + "epoch": 82.74, + "learning_rate": 7.040282685512368e-07, + "loss": 0.2933, + "step": 23830 + }, + { + "epoch": 82.78, + "learning_rate": 7.026148409893993e-07, + "loss": 0.2437, + "step": 23840 + }, + { + "epoch": 82.81, + "learning_rate": 7.012014134275618e-07, + "loss": 0.2433, + "step": 23850 + }, + { + "epoch": 82.85, + "learning_rate": 6.997879858657243e-07, + "loss": 0.2602, + "step": 23860 + }, + { + "epoch": 82.88, + "learning_rate": 6.983745583038869e-07, + "loss": 0.2693, + "step": 23870 + }, + { + "epoch": 82.91, + "learning_rate": 6.969611307420494e-07, + "loss": 0.2426, + "step": 23880 + }, + { + "epoch": 82.95, + "learning_rate": 6.95547703180212e-07, + "loss": 0.242, + "step": 23890 + }, + { + "epoch": 82.98, + "learning_rate": 6.941342756183746e-07, + "loss": 0.2583, + "step": 23900 + }, + { + "epoch": 83.0, + "eval_loss": 0.5149600505828857, + "eval_runtime": 134.0167, + "eval_samples_per_second": 3.97, + "eval_steps_per_second": 0.992, + "eval_wer": 0.19746737802918302, + "step": 23904 + }, + { + "epoch": 83.02, + "learning_rate": 6.927208480565371e-07, + "loss": 0.2692, + "step": 23910 + }, + { + "epoch": 83.06, + "learning_rate": 6.913074204946996e-07, + "loss": 0.2688, + "step": 23920 + }, + { + "epoch": 83.09, + "learning_rate": 6.898939929328622e-07, + "loss": 0.2601, + "step": 23930 + }, + { + "epoch": 83.12, + "learning_rate": 6.884805653710247e-07, + "loss": 0.2784, + "step": 23940 + }, + { + "epoch": 83.16, + "learning_rate": 6.870671378091873e-07, + "loss": 0.2408, + "step": 23950 + }, + { + "epoch": 83.19, + "learning_rate": 6.856537102473498e-07, + "loss": 0.2512, + "step": 23960 + }, + { + "epoch": 83.23, + "learning_rate": 6.842402826855124e-07, + "loss": 0.2371, + "step": 23970 + }, + { + "epoch": 83.26, + "learning_rate": 6.828268551236749e-07, + "loss": 0.2627, + "step": 23980 + }, + { + "epoch": 83.3, + "learning_rate": 6.814134275618374e-07, + "loss": 0.2642, + "step": 23990 + }, + { + "epoch": 83.33, + "learning_rate": 6.800000000000001e-07, + "loss": 0.2806, + "step": 24000 + }, + { + "epoch": 83.37, + "learning_rate": 6.785865724381626e-07, + "loss": 0.2409, + "step": 24010 + }, + { + "epoch": 83.4, + "learning_rate": 6.771731448763251e-07, + "loss": 0.256, + "step": 24020 + }, + { + "epoch": 83.44, + "learning_rate": 6.757597173144876e-07, + "loss": 0.2399, + "step": 24030 + }, + { + "epoch": 83.47, + "learning_rate": 6.743462897526502e-07, + "loss": 0.2721, + "step": 24040 + }, + { + "epoch": 83.51, + "learning_rate": 6.729328621908127e-07, + "loss": 0.2702, + "step": 24050 + }, + { + "epoch": 83.54, + "learning_rate": 6.715194346289753e-07, + "loss": 0.2252, + "step": 24060 + }, + { + "epoch": 83.57, + "learning_rate": 6.701060070671379e-07, + "loss": 0.2405, + "step": 24070 + }, + { + "epoch": 83.61, + "learning_rate": 6.686925795053003e-07, + "loss": 0.2409, + "step": 24080 + }, + { + "epoch": 83.64, + "learning_rate": 6.672791519434628e-07, + "loss": 0.257, + "step": 24090 + }, + { + "epoch": 83.68, + "learning_rate": 6.658657243816253e-07, + "loss": 0.2642, + "step": 24100 + }, + { + "epoch": 83.71, + "learning_rate": 6.644522968197879e-07, + "loss": 0.2699, + "step": 24110 + }, + { + "epoch": 83.75, + "learning_rate": 6.630388692579505e-07, + "loss": 0.2487, + "step": 24120 + }, + { + "epoch": 83.78, + "learning_rate": 6.61625441696113e-07, + "loss": 0.2505, + "step": 24130 + }, + { + "epoch": 83.82, + "learning_rate": 6.602120141342756e-07, + "loss": 0.2627, + "step": 24140 + }, + { + "epoch": 83.85, + "learning_rate": 6.587985865724381e-07, + "loss": 0.2579, + "step": 24150 + }, + { + "epoch": 83.89, + "learning_rate": 6.573851590106006e-07, + "loss": 0.2434, + "step": 24160 + }, + { + "epoch": 83.92, + "learning_rate": 6.559717314487631e-07, + "loss": 0.2344, + "step": 24170 + }, + { + "epoch": 83.96, + "learning_rate": 6.545583038869258e-07, + "loss": 0.2468, + "step": 24180 + }, + { + "epoch": 83.99, + "learning_rate": 6.531448763250883e-07, + "loss": 0.246, + "step": 24190 + }, + { + "epoch": 84.0, + "eval_loss": 0.5096983909606934, + "eval_runtime": 133.3449, + "eval_samples_per_second": 3.99, + "eval_steps_per_second": 0.997, + "eval_wer": 0.19618178312013884, + "step": 24192 + }, + { + "epoch": 84.03, + "learning_rate": 6.517314487632508e-07, + "loss": 0.2808, + "step": 24200 + }, + { + "epoch": 84.06, + "learning_rate": 6.503180212014134e-07, + "loss": 0.2582, + "step": 24210 + }, + { + "epoch": 84.1, + "learning_rate": 6.490459363957597e-07, + "loss": 0.2613, + "step": 24220 + }, + { + "epoch": 84.13, + "learning_rate": 6.476325088339223e-07, + "loss": 0.2637, + "step": 24230 + }, + { + "epoch": 84.17, + "learning_rate": 6.462190812720848e-07, + "loss": 0.2765, + "step": 24240 + }, + { + "epoch": 84.2, + "learning_rate": 6.448056537102473e-07, + "loss": 0.2515, + "step": 24250 + }, + { + "epoch": 84.24, + "learning_rate": 6.433922261484098e-07, + "loss": 0.2331, + "step": 24260 + }, + { + "epoch": 84.27, + "learning_rate": 6.419787985865724e-07, + "loss": 0.2408, + "step": 24270 + }, + { + "epoch": 84.3, + "learning_rate": 6.40565371024735e-07, + "loss": 0.2706, + "step": 24280 + }, + { + "epoch": 84.34, + "learning_rate": 6.391519434628975e-07, + "loss": 0.2605, + "step": 24290 + }, + { + "epoch": 84.37, + "learning_rate": 6.377385159010601e-07, + "loss": 0.2403, + "step": 24300 + }, + { + "epoch": 84.41, + "learning_rate": 6.363250883392226e-07, + "loss": 0.2646, + "step": 24310 + }, + { + "epoch": 84.44, + "learning_rate": 6.349116607773851e-07, + "loss": 0.262, + "step": 24320 + }, + { + "epoch": 84.48, + "learning_rate": 6.334982332155476e-07, + "loss": 0.2664, + "step": 24330 + }, + { + "epoch": 84.51, + "learning_rate": 6.320848056537103e-07, + "loss": 0.2633, + "step": 24340 + }, + { + "epoch": 84.55, + "learning_rate": 6.306713780918728e-07, + "loss": 0.2278, + "step": 24350 + }, + { + "epoch": 84.58, + "learning_rate": 6.292579505300353e-07, + "loss": 0.2645, + "step": 24360 + }, + { + "epoch": 84.62, + "learning_rate": 6.278445229681979e-07, + "loss": 0.2249, + "step": 24370 + }, + { + "epoch": 84.65, + "learning_rate": 6.264310954063604e-07, + "loss": 0.2587, + "step": 24380 + }, + { + "epoch": 84.69, + "learning_rate": 6.25017667844523e-07, + "loss": 0.2471, + "step": 24390 + }, + { + "epoch": 84.72, + "learning_rate": 6.236042402826855e-07, + "loss": 0.258, + "step": 24400 + }, + { + "epoch": 84.75, + "learning_rate": 6.221908127208481e-07, + "loss": 0.2394, + "step": 24410 + }, + { + "epoch": 84.79, + "learning_rate": 6.207773851590106e-07, + "loss": 0.252, + "step": 24420 + }, + { + "epoch": 84.82, + "learning_rate": 6.193639575971731e-07, + "loss": 0.2727, + "step": 24430 + }, + { + "epoch": 84.86, + "learning_rate": 6.179505300353357e-07, + "loss": 0.2699, + "step": 24440 + }, + { + "epoch": 84.89, + "learning_rate": 6.165371024734983e-07, + "loss": 0.2309, + "step": 24450 + }, + { + "epoch": 84.93, + "learning_rate": 6.151236749116608e-07, + "loss": 0.2637, + "step": 24460 + }, + { + "epoch": 84.96, + "learning_rate": 6.13851590106007e-07, + "loss": 0.245, + "step": 24470 + }, + { + "epoch": 85.0, + "learning_rate": 6.124381625441695e-07, + "loss": 0.272, + "step": 24480 + }, + { + "epoch": 85.0, + "eval_loss": 0.504280149936676, + "eval_runtime": 134.0604, + "eval_samples_per_second": 3.968, + "eval_steps_per_second": 0.992, + "eval_wer": 0.1949604679565469, + "step": 24480 + }, + { + "epoch": 85.03, + "learning_rate": 6.110247349823321e-07, + "loss": 0.2629, + "step": 24490 + }, + { + "epoch": 85.07, + "learning_rate": 6.096113074204947e-07, + "loss": 0.2312, + "step": 24500 + }, + { + "epoch": 85.1, + "learning_rate": 6.081978798586572e-07, + "loss": 0.265, + "step": 24510 + }, + { + "epoch": 85.14, + "learning_rate": 6.067844522968197e-07, + "loss": 0.258, + "step": 24520 + }, + { + "epoch": 85.17, + "learning_rate": 6.053710247349822e-07, + "loss": 0.244, + "step": 24530 + }, + { + "epoch": 85.21, + "learning_rate": 6.039575971731448e-07, + "loss": 0.2407, + "step": 24540 + }, + { + "epoch": 85.24, + "learning_rate": 6.025441696113074e-07, + "loss": 0.2632, + "step": 24550 + }, + { + "epoch": 85.28, + "learning_rate": 6.011307420494699e-07, + "loss": 0.2678, + "step": 24560 + }, + { + "epoch": 85.31, + "learning_rate": 5.997173144876325e-07, + "loss": 0.2483, + "step": 24570 + }, + { + "epoch": 85.35, + "learning_rate": 5.98303886925795e-07, + "loss": 0.2801, + "step": 24580 + }, + { + "epoch": 85.38, + "learning_rate": 5.968904593639575e-07, + "loss": 0.251, + "step": 24590 + }, + { + "epoch": 85.42, + "learning_rate": 5.954770318021201e-07, + "loss": 0.2588, + "step": 24600 + }, + { + "epoch": 85.45, + "learning_rate": 5.940636042402827e-07, + "loss": 0.2543, + "step": 24610 + }, + { + "epoch": 85.48, + "learning_rate": 5.926501766784452e-07, + "loss": 0.2755, + "step": 24620 + }, + { + "epoch": 85.52, + "learning_rate": 5.912367491166077e-07, + "loss": 0.2388, + "step": 24630 + }, + { + "epoch": 85.55, + "learning_rate": 5.898233215547703e-07, + "loss": 0.2517, + "step": 24640 + }, + { + "epoch": 85.59, + "learning_rate": 5.884098939929328e-07, + "loss": 0.2513, + "step": 24650 + }, + { + "epoch": 85.62, + "learning_rate": 5.869964664310953e-07, + "loss": 0.2467, + "step": 24660 + }, + { + "epoch": 85.66, + "learning_rate": 5.85583038869258e-07, + "loss": 0.2617, + "step": 24670 + }, + { + "epoch": 85.69, + "learning_rate": 5.841696113074205e-07, + "loss": 0.2484, + "step": 24680 + }, + { + "epoch": 85.73, + "learning_rate": 5.82756183745583e-07, + "loss": 0.2481, + "step": 24690 + }, + { + "epoch": 85.76, + "learning_rate": 5.813427561837455e-07, + "loss": 0.2393, + "step": 24700 + }, + { + "epoch": 85.8, + "learning_rate": 5.799293286219081e-07, + "loss": 0.2372, + "step": 24710 + }, + { + "epoch": 85.83, + "learning_rate": 5.785159010600707e-07, + "loss": 0.2828, + "step": 24720 + }, + { + "epoch": 85.87, + "learning_rate": 5.771024734982332e-07, + "loss": 0.2796, + "step": 24730 + }, + { + "epoch": 85.9, + "learning_rate": 5.756890459363958e-07, + "loss": 0.2604, + "step": 24740 + }, + { + "epoch": 85.94, + "learning_rate": 5.742756183745583e-07, + "loss": 0.2143, + "step": 24750 + }, + { + "epoch": 85.97, + "learning_rate": 5.728621908127208e-07, + "loss": 0.2601, + "step": 24760 + }, + { + "epoch": 86.0, + "eval_loss": 0.5090940594673157, + "eval_runtime": 134.139, + "eval_samples_per_second": 3.966, + "eval_steps_per_second": 0.992, + "eval_wer": 0.19605322362923444, + "step": 24768 + }, + { + "epoch": 86.01, + "learning_rate": 5.714487632508833e-07, + "loss": 0.2614, + "step": 24770 + }, + { + "epoch": 86.04, + "learning_rate": 5.70035335689046e-07, + "loss": 0.2556, + "step": 24780 + }, + { + "epoch": 86.08, + "learning_rate": 5.686219081272085e-07, + "loss": 0.2451, + "step": 24790 + }, + { + "epoch": 86.11, + "learning_rate": 5.67208480565371e-07, + "loss": 0.2619, + "step": 24800 + }, + { + "epoch": 86.15, + "learning_rate": 5.657950530035336e-07, + "loss": 0.263, + "step": 24810 + }, + { + "epoch": 86.18, + "learning_rate": 5.643816254416961e-07, + "loss": 0.2718, + "step": 24820 + }, + { + "epoch": 86.21, + "learning_rate": 5.629681978798586e-07, + "loss": 0.2349, + "step": 24830 + }, + { + "epoch": 86.25, + "learning_rate": 5.615547703180213e-07, + "loss": 0.2553, + "step": 24840 + }, + { + "epoch": 86.28, + "learning_rate": 5.601413427561838e-07, + "loss": 0.2492, + "step": 24850 + }, + { + "epoch": 86.32, + "learning_rate": 5.587279151943463e-07, + "loss": 0.2549, + "step": 24860 + }, + { + "epoch": 86.35, + "learning_rate": 5.573144876325088e-07, + "loss": 0.2416, + "step": 24870 + }, + { + "epoch": 86.39, + "learning_rate": 5.559010600706714e-07, + "loss": 0.2552, + "step": 24880 + }, + { + "epoch": 86.42, + "learning_rate": 5.544876325088339e-07, + "loss": 0.2318, + "step": 24890 + }, + { + "epoch": 86.46, + "learning_rate": 5.530742049469965e-07, + "loss": 0.2538, + "step": 24900 + }, + { + "epoch": 86.49, + "learning_rate": 5.516607773851591e-07, + "loss": 0.2483, + "step": 24910 + }, + { + "epoch": 86.53, + "learning_rate": 5.502473498233216e-07, + "loss": 0.2677, + "step": 24920 + }, + { + "epoch": 86.56, + "learning_rate": 5.488339222614841e-07, + "loss": 0.2506, + "step": 24930 + }, + { + "epoch": 86.6, + "learning_rate": 5.474204946996465e-07, + "loss": 0.2563, + "step": 24940 + }, + { + "epoch": 86.63, + "learning_rate": 5.460070671378092e-07, + "loss": 0.2429, + "step": 24950 + }, + { + "epoch": 86.66, + "learning_rate": 5.445936395759717e-07, + "loss": 0.259, + "step": 24960 + }, + { + "epoch": 86.7, + "learning_rate": 5.431802120141342e-07, + "loss": 0.2554, + "step": 24970 + }, + { + "epoch": 86.73, + "learning_rate": 5.417667844522968e-07, + "loss": 0.2534, + "step": 24980 + }, + { + "epoch": 86.77, + "learning_rate": 5.403533568904593e-07, + "loss": 0.2392, + "step": 24990 + }, + { + "epoch": 86.8, + "learning_rate": 5.389399293286218e-07, + "loss": 0.27, + "step": 25000 + }, + { + "epoch": 86.84, + "learning_rate": 5.375265017667843e-07, + "loss": 0.2516, + "step": 25010 + }, + { + "epoch": 86.87, + "learning_rate": 5.36113074204947e-07, + "loss": 0.2701, + "step": 25020 + }, + { + "epoch": 86.91, + "learning_rate": 5.346996466431095e-07, + "loss": 0.2528, + "step": 25030 + }, + { + "epoch": 86.94, + "learning_rate": 5.33286219081272e-07, + "loss": 0.2286, + "step": 25040 + }, + { + "epoch": 86.98, + "learning_rate": 5.318727915194346e-07, + "loss": 0.2719, + "step": 25050 + }, + { + "epoch": 87.0, + "eval_loss": 0.5086585283279419, + "eval_runtime": 134.1212, + "eval_samples_per_second": 3.967, + "eval_steps_per_second": 0.992, + "eval_wer": 0.19753165777463522, + "step": 25056 + }, + { + "epoch": 87.01, + "learning_rate": 5.304593639575971e-07, + "loss": 0.2532, + "step": 25060 + }, + { + "epoch": 87.05, + "learning_rate": 5.290459363957596e-07, + "loss": 0.2514, + "step": 25070 + }, + { + "epoch": 87.08, + "learning_rate": 5.276325088339222e-07, + "loss": 0.2552, + "step": 25080 + }, + { + "epoch": 87.12, + "learning_rate": 5.262190812720848e-07, + "loss": 0.265, + "step": 25090 + }, + { + "epoch": 87.15, + "learning_rate": 5.248056537102473e-07, + "loss": 0.2704, + "step": 25100 + }, + { + "epoch": 87.19, + "learning_rate": 5.233922261484098e-07, + "loss": 0.2557, + "step": 25110 + }, + { + "epoch": 87.22, + "learning_rate": 5.219787985865724e-07, + "loss": 0.2781, + "step": 25120 + }, + { + "epoch": 87.26, + "learning_rate": 5.20565371024735e-07, + "loss": 0.2355, + "step": 25130 + }, + { + "epoch": 87.29, + "learning_rate": 5.191519434628975e-07, + "loss": 0.2728, + "step": 25140 + }, + { + "epoch": 87.33, + "learning_rate": 5.177385159010601e-07, + "loss": 0.2635, + "step": 25150 + }, + { + "epoch": 87.36, + "learning_rate": 5.163250883392226e-07, + "loss": 0.2442, + "step": 25160 + }, + { + "epoch": 87.39, + "learning_rate": 5.149116607773851e-07, + "loss": 0.2409, + "step": 25170 + }, + { + "epoch": 87.43, + "learning_rate": 5.134982332155476e-07, + "loss": 0.2497, + "step": 25180 + }, + { + "epoch": 87.46, + "learning_rate": 5.120848056537103e-07, + "loss": 0.263, + "step": 25190 + }, + { + "epoch": 87.5, + "learning_rate": 5.106713780918728e-07, + "loss": 0.2511, + "step": 25200 + }, + { + "epoch": 87.53, + "learning_rate": 5.092579505300353e-07, + "loss": 0.2522, + "step": 25210 + }, + { + "epoch": 87.57, + "learning_rate": 5.078445229681979e-07, + "loss": 0.2686, + "step": 25220 + }, + { + "epoch": 87.6, + "learning_rate": 5.064310954063604e-07, + "loss": 0.2407, + "step": 25230 + }, + { + "epoch": 87.64, + "learning_rate": 5.050176678445229e-07, + "loss": 0.228, + "step": 25240 + }, + { + "epoch": 87.67, + "learning_rate": 5.036042402826855e-07, + "loss": 0.2763, + "step": 25250 + }, + { + "epoch": 87.71, + "learning_rate": 5.021908127208481e-07, + "loss": 0.2378, + "step": 25260 + }, + { + "epoch": 87.74, + "learning_rate": 5.007773851590106e-07, + "loss": 0.2532, + "step": 25270 + }, + { + "epoch": 87.78, + "learning_rate": 4.993639575971731e-07, + "loss": 0.2431, + "step": 25280 + }, + { + "epoch": 87.81, + "learning_rate": 4.979505300353356e-07, + "loss": 0.2216, + "step": 25290 + }, + { + "epoch": 87.85, + "learning_rate": 4.965371024734982e-07, + "loss": 0.2579, + "step": 25300 + }, + { + "epoch": 87.88, + "learning_rate": 4.951236749116608e-07, + "loss": 0.2501, + "step": 25310 + }, + { + "epoch": 87.91, + "learning_rate": 4.937102473498233e-07, + "loss": 0.2612, + "step": 25320 + }, + { + "epoch": 87.95, + "learning_rate": 4.922968197879858e-07, + "loss": 0.2665, + "step": 25330 + }, + { + "epoch": 87.98, + "learning_rate": 4.908833922261484e-07, + "loss": 0.269, + "step": 25340 + }, + { + "epoch": 88.0, + "eval_loss": 0.5126340389251709, + "eval_runtime": 134.1929, + "eval_samples_per_second": 3.964, + "eval_steps_per_second": 0.991, + "eval_wer": 0.1965674615928521, + "step": 25344 + }, + { + "epoch": 88.02, + "learning_rate": 4.894699646643109e-07, + "loss": 0.2832, + "step": 25350 + }, + { + "epoch": 88.06, + "learning_rate": 4.880565371024734e-07, + "loss": 0.2522, + "step": 25360 + }, + { + "epoch": 88.09, + "learning_rate": 4.866431095406361e-07, + "loss": 0.232, + "step": 25370 + }, + { + "epoch": 88.12, + "learning_rate": 4.852296819787986e-07, + "loss": 0.2669, + "step": 25380 + }, + { + "epoch": 88.16, + "learning_rate": 4.838162544169611e-07, + "loss": 0.2461, + "step": 25390 + }, + { + "epoch": 88.19, + "learning_rate": 4.824028268551237e-07, + "loss": 0.2498, + "step": 25400 + }, + { + "epoch": 88.23, + "learning_rate": 4.809893992932862e-07, + "loss": 0.2525, + "step": 25410 + }, + { + "epoch": 88.26, + "learning_rate": 4.795759717314487e-07, + "loss": 0.2603, + "step": 25420 + }, + { + "epoch": 88.3, + "learning_rate": 4.781625441696113e-07, + "loss": 0.2594, + "step": 25430 + }, + { + "epoch": 88.33, + "learning_rate": 4.7674911660777383e-07, + "loss": 0.2422, + "step": 25440 + }, + { + "epoch": 88.37, + "learning_rate": 4.7533568904593634e-07, + "loss": 0.2493, + "step": 25450 + }, + { + "epoch": 88.4, + "learning_rate": 4.739222614840989e-07, + "loss": 0.2786, + "step": 25460 + }, + { + "epoch": 88.44, + "learning_rate": 4.725088339222615e-07, + "loss": 0.2218, + "step": 25470 + }, + { + "epoch": 88.47, + "learning_rate": 4.71095406360424e-07, + "loss": 0.2634, + "step": 25480 + }, + { + "epoch": 88.51, + "learning_rate": 4.6968197879858656e-07, + "loss": 0.2572, + "step": 25490 + }, + { + "epoch": 88.54, + "learning_rate": 4.682685512367491e-07, + "loss": 0.249, + "step": 25500 + }, + { + "epoch": 88.57, + "learning_rate": 4.6685512367491165e-07, + "loss": 0.2547, + "step": 25510 + }, + { + "epoch": 88.61, + "learning_rate": 4.654416961130742e-07, + "loss": 0.2611, + "step": 25520 + }, + { + "epoch": 88.64, + "learning_rate": 4.6402826855123673e-07, + "loss": 0.2664, + "step": 25530 + }, + { + "epoch": 88.68, + "learning_rate": 4.626148409893993e-07, + "loss": 0.2758, + "step": 25540 + }, + { + "epoch": 88.71, + "learning_rate": 4.612014134275618e-07, + "loss": 0.2488, + "step": 25550 + }, + { + "epoch": 88.75, + "learning_rate": 4.597879858657244e-07, + "loss": 0.253, + "step": 25560 + }, + { + "epoch": 88.78, + "learning_rate": 4.583745583038869e-07, + "loss": 0.2381, + "step": 25570 + }, + { + "epoch": 88.82, + "learning_rate": 4.5696113074204947e-07, + "loss": 0.2643, + "step": 25580 + }, + { + "epoch": 88.85, + "learning_rate": 4.5554770318021204e-07, + "loss": 0.2523, + "step": 25590 + }, + { + "epoch": 88.89, + "learning_rate": 4.5413427561837455e-07, + "loss": 0.2507, + "step": 25600 + }, + { + "epoch": 88.92, + "learning_rate": 4.527208480565371e-07, + "loss": 0.2359, + "step": 25610 + }, + { + "epoch": 88.96, + "learning_rate": 4.5130742049469963e-07, + "loss": 0.2561, + "step": 25620 + }, + { + "epoch": 88.99, + "learning_rate": 4.498939929328622e-07, + "loss": 0.2863, + "step": 25630 + }, + { + "epoch": 89.0, + "eval_loss": 0.5174065232276917, + "eval_runtime": 135.3515, + "eval_samples_per_second": 3.931, + "eval_steps_per_second": 0.983, + "eval_wer": 0.1965674615928521, + "step": 25632 + }, + { + "epoch": 89.03, + "learning_rate": 4.4848056537102467e-07, + "loss": 0.2527, + "step": 25640 + }, + { + "epoch": 89.06, + "learning_rate": 4.4706713780918723e-07, + "loss": 0.2613, + "step": 25650 + }, + { + "epoch": 89.1, + "learning_rate": 4.456537102473498e-07, + "loss": 0.2368, + "step": 25660 + }, + { + "epoch": 89.13, + "learning_rate": 4.442402826855123e-07, + "loss": 0.2653, + "step": 25670 + }, + { + "epoch": 89.17, + "learning_rate": 4.428268551236749e-07, + "loss": 0.2636, + "step": 25680 + }, + { + "epoch": 89.2, + "learning_rate": 4.414134275618374e-07, + "loss": 0.2154, + "step": 25690 + }, + { + "epoch": 89.24, + "learning_rate": 4.3999999999999997e-07, + "loss": 0.2606, + "step": 25700 + }, + { + "epoch": 89.27, + "learning_rate": 4.3858657243816254e-07, + "loss": 0.2416, + "step": 25710 + }, + { + "epoch": 89.3, + "learning_rate": 4.3717314487632505e-07, + "loss": 0.2521, + "step": 25720 + }, + { + "epoch": 89.34, + "learning_rate": 4.357597173144876e-07, + "loss": 0.2642, + "step": 25730 + }, + { + "epoch": 89.37, + "learning_rate": 4.3434628975265014e-07, + "loss": 0.247, + "step": 25740 + }, + { + "epoch": 89.41, + "learning_rate": 4.329328621908127e-07, + "loss": 0.2563, + "step": 25750 + }, + { + "epoch": 89.44, + "learning_rate": 4.315194346289752e-07, + "loss": 0.2376, + "step": 25760 + }, + { + "epoch": 89.48, + "learning_rate": 4.301060070671378e-07, + "loss": 0.2545, + "step": 25770 + }, + { + "epoch": 89.51, + "learning_rate": 4.2869257950530036e-07, + "loss": 0.2652, + "step": 25780 + }, + { + "epoch": 89.55, + "learning_rate": 4.2727915194346287e-07, + "loss": 0.2539, + "step": 25790 + }, + { + "epoch": 89.58, + "learning_rate": 4.2586572438162544e-07, + "loss": 0.2437, + "step": 25800 + }, + { + "epoch": 89.62, + "learning_rate": 4.2445229681978796e-07, + "loss": 0.2495, + "step": 25810 + }, + { + "epoch": 89.65, + "learning_rate": 4.230388692579505e-07, + "loss": 0.2779, + "step": 25820 + }, + { + "epoch": 89.69, + "learning_rate": 4.216254416961131e-07, + "loss": 0.271, + "step": 25830 + }, + { + "epoch": 89.72, + "learning_rate": 4.202120141342756e-07, + "loss": 0.2341, + "step": 25840 + }, + { + "epoch": 89.75, + "learning_rate": 4.187985865724382e-07, + "loss": 0.2561, + "step": 25850 + }, + { + "epoch": 89.79, + "learning_rate": 4.173851590106007e-07, + "loss": 0.2337, + "step": 25860 + }, + { + "epoch": 89.82, + "learning_rate": 4.1597173144876326e-07, + "loss": 0.277, + "step": 25870 + }, + { + "epoch": 89.86, + "learning_rate": 4.145583038869258e-07, + "loss": 0.2535, + "step": 25880 + }, + { + "epoch": 89.89, + "learning_rate": 4.1314487632508834e-07, + "loss": 0.2577, + "step": 25890 + }, + { + "epoch": 89.93, + "learning_rate": 4.117314487632509e-07, + "loss": 0.232, + "step": 25900 + }, + { + "epoch": 89.96, + "learning_rate": 4.103180212014134e-07, + "loss": 0.2724, + "step": 25910 + }, + { + "epoch": 90.0, + "learning_rate": 4.0890459363957594e-07, + "loss": 0.2581, + "step": 25920 + }, + { + "epoch": 90.0, + "eval_loss": 0.5159129500389099, + "eval_runtime": 134.2388, + "eval_samples_per_second": 3.963, + "eval_steps_per_second": 0.991, + "eval_wer": 0.19688886032011313, + "step": 25920 + }, + { + "epoch": 90.03, + "learning_rate": 4.0749116607773846e-07, + "loss": 0.2464, + "step": 25930 + }, + { + "epoch": 90.07, + "learning_rate": 4.0607773851590103e-07, + "loss": 0.2409, + "step": 25940 + }, + { + "epoch": 90.1, + "learning_rate": 4.0466431095406354e-07, + "loss": 0.2413, + "step": 25950 + }, + { + "epoch": 90.14, + "learning_rate": 4.032508833922261e-07, + "loss": 0.271, + "step": 25960 + }, + { + "epoch": 90.17, + "learning_rate": 4.018374558303887e-07, + "loss": 0.2487, + "step": 25970 + }, + { + "epoch": 90.21, + "learning_rate": 4.004240282685512e-07, + "loss": 0.2356, + "step": 25980 + }, + { + "epoch": 90.24, + "learning_rate": 3.9901060070671376e-07, + "loss": 0.2434, + "step": 25990 + }, + { + "epoch": 90.28, + "learning_rate": 3.975971731448763e-07, + "loss": 0.2607, + "step": 26000 + }, + { + "epoch": 90.31, + "learning_rate": 3.9618374558303885e-07, + "loss": 0.2515, + "step": 26010 + }, + { + "epoch": 90.35, + "learning_rate": 3.947703180212014e-07, + "loss": 0.2596, + "step": 26020 + }, + { + "epoch": 90.38, + "learning_rate": 3.9335689045936393e-07, + "loss": 0.2541, + "step": 26030 + }, + { + "epoch": 90.42, + "learning_rate": 3.919434628975265e-07, + "loss": 0.2471, + "step": 26040 + }, + { + "epoch": 90.45, + "learning_rate": 3.90530035335689e-07, + "loss": 0.2417, + "step": 26050 + }, + { + "epoch": 90.48, + "learning_rate": 3.891166077738516e-07, + "loss": 0.2659, + "step": 26060 + }, + { + "epoch": 90.52, + "learning_rate": 3.877031802120141e-07, + "loss": 0.2496, + "step": 26070 + }, + { + "epoch": 90.55, + "learning_rate": 3.8628975265017667e-07, + "loss": 0.2371, + "step": 26080 + }, + { + "epoch": 90.59, + "learning_rate": 3.8487632508833924e-07, + "loss": 0.2709, + "step": 26090 + }, + { + "epoch": 90.62, + "learning_rate": 3.8346289752650175e-07, + "loss": 0.238, + "step": 26100 + }, + { + "epoch": 90.66, + "learning_rate": 3.820494699646643e-07, + "loss": 0.2642, + "step": 26110 + }, + { + "epoch": 90.69, + "learning_rate": 3.8063604240282683e-07, + "loss": 0.2699, + "step": 26120 + }, + { + "epoch": 90.73, + "learning_rate": 3.792226148409894e-07, + "loss": 0.2729, + "step": 26130 + }, + { + "epoch": 90.76, + "learning_rate": 3.7780918727915197e-07, + "loss": 0.2473, + "step": 26140 + }, + { + "epoch": 90.8, + "learning_rate": 3.763957597173145e-07, + "loss": 0.27, + "step": 26150 + }, + { + "epoch": 90.83, + "learning_rate": 3.7498233215547706e-07, + "loss": 0.267, + "step": 26160 + }, + { + "epoch": 90.87, + "learning_rate": 3.7356890459363957e-07, + "loss": 0.2617, + "step": 26170 + }, + { + "epoch": 90.9, + "learning_rate": 3.721554770318021e-07, + "loss": 0.2436, + "step": 26180 + }, + { + "epoch": 90.94, + "learning_rate": 3.707420494699646e-07, + "loss": 0.2425, + "step": 26190 + }, + { + "epoch": 90.97, + "learning_rate": 3.6932862190812717e-07, + "loss": 0.26, + "step": 26200 + }, + { + "epoch": 91.0, + "eval_loss": 0.514625608921051, + "eval_runtime": 135.1986, + "eval_samples_per_second": 3.935, + "eval_steps_per_second": 0.984, + "eval_wer": 0.19688886032011313, + "step": 26208 + }, + { + "epoch": 91.01, + "learning_rate": 3.6791519434628974e-07, + "loss": 0.2532, + "step": 26210 + }, + { + "epoch": 91.04, + "learning_rate": 3.6650176678445225e-07, + "loss": 0.2408, + "step": 26220 + }, + { + "epoch": 91.08, + "learning_rate": 3.650883392226148e-07, + "loss": 0.2654, + "step": 26230 + }, + { + "epoch": 91.11, + "learning_rate": 3.6367491166077734e-07, + "loss": 0.2836, + "step": 26240 + }, + { + "epoch": 91.15, + "learning_rate": 3.622614840989399e-07, + "loss": 0.2472, + "step": 26250 + }, + { + "epoch": 91.18, + "learning_rate": 3.608480565371024e-07, + "loss": 0.2489, + "step": 26260 + }, + { + "epoch": 91.21, + "learning_rate": 3.59434628975265e-07, + "loss": 0.2713, + "step": 26270 + }, + { + "epoch": 91.25, + "learning_rate": 3.5802120141342756e-07, + "loss": 0.2338, + "step": 26280 + }, + { + "epoch": 91.28, + "learning_rate": 3.566077738515901e-07, + "loss": 0.2466, + "step": 26290 + }, + { + "epoch": 91.32, + "learning_rate": 3.5519434628975264e-07, + "loss": 0.2362, + "step": 26300 + }, + { + "epoch": 91.35, + "learning_rate": 3.5378091872791516e-07, + "loss": 0.2476, + "step": 26310 + }, + { + "epoch": 91.39, + "learning_rate": 3.523674911660777e-07, + "loss": 0.2393, + "step": 26320 + }, + { + "epoch": 91.42, + "learning_rate": 3.509540636042403e-07, + "loss": 0.2541, + "step": 26330 + }, + { + "epoch": 91.46, + "learning_rate": 3.495406360424028e-07, + "loss": 0.2439, + "step": 26340 + }, + { + "epoch": 91.49, + "learning_rate": 3.481272084805654e-07, + "loss": 0.2573, + "step": 26350 + }, + { + "epoch": 91.53, + "learning_rate": 3.467137809187279e-07, + "loss": 0.2586, + "step": 26360 + }, + { + "epoch": 91.56, + "learning_rate": 3.4530035335689046e-07, + "loss": 0.2369, + "step": 26370 + }, + { + "epoch": 91.6, + "learning_rate": 3.43886925795053e-07, + "loss": 0.2543, + "step": 26380 + }, + { + "epoch": 91.63, + "learning_rate": 3.4247349823321555e-07, + "loss": 0.2695, + "step": 26390 + }, + { + "epoch": 91.66, + "learning_rate": 3.410600706713781e-07, + "loss": 0.2457, + "step": 26400 + }, + { + "epoch": 91.7, + "learning_rate": 3.3964664310954063e-07, + "loss": 0.2456, + "step": 26410 + }, + { + "epoch": 91.73, + "learning_rate": 3.382332155477032e-07, + "loss": 0.2432, + "step": 26420 + }, + { + "epoch": 91.77, + "learning_rate": 3.368197879858657e-07, + "loss": 0.2264, + "step": 26430 + }, + { + "epoch": 91.8, + "learning_rate": 3.354063604240283e-07, + "loss": 0.242, + "step": 26440 + }, + { + "epoch": 91.84, + "learning_rate": 3.3399293286219085e-07, + "loss": 0.2651, + "step": 26450 + }, + { + "epoch": 91.87, + "learning_rate": 3.325795053003533e-07, + "loss": 0.2717, + "step": 26460 + }, + { + "epoch": 91.91, + "learning_rate": 3.311660777385159e-07, + "loss": 0.2417, + "step": 26470 + }, + { + "epoch": 91.94, + "learning_rate": 3.297526501766784e-07, + "loss": 0.2447, + "step": 26480 + }, + { + "epoch": 91.98, + "learning_rate": 3.2833922261484096e-07, + "loss": 0.2796, + "step": 26490 + }, + { + "epoch": 92.0, + "eval_loss": 0.5150091648101807, + "eval_runtime": 134.13, + "eval_samples_per_second": 3.966, + "eval_steps_per_second": 0.992, + "eval_wer": 0.1965674615928521, + "step": 26496 + }, + { + "epoch": 92.01, + "learning_rate": 3.269257950530035e-07, + "loss": 0.2811, + "step": 26500 + }, + { + "epoch": 92.05, + "learning_rate": 3.2551236749116605e-07, + "loss": 0.2589, + "step": 26510 + }, + { + "epoch": 92.08, + "learning_rate": 3.240989399293286e-07, + "loss": 0.2453, + "step": 26520 + }, + { + "epoch": 92.12, + "learning_rate": 3.2268551236749113e-07, + "loss": 0.2482, + "step": 26530 + }, + { + "epoch": 92.15, + "learning_rate": 3.212720848056537e-07, + "loss": 0.2619, + "step": 26540 + }, + { + "epoch": 92.19, + "learning_rate": 3.198586572438162e-07, + "loss": 0.2415, + "step": 26550 + }, + { + "epoch": 92.22, + "learning_rate": 3.184452296819788e-07, + "loss": 0.2459, + "step": 26560 + }, + { + "epoch": 92.26, + "learning_rate": 3.170318021201413e-07, + "loss": 0.253, + "step": 26570 + }, + { + "epoch": 92.29, + "learning_rate": 3.1561837455830387e-07, + "loss": 0.2728, + "step": 26580 + }, + { + "epoch": 92.33, + "learning_rate": 3.1420494699646644e-07, + "loss": 0.255, + "step": 26590 + }, + { + "epoch": 92.36, + "learning_rate": 3.1279151943462895e-07, + "loss": 0.2464, + "step": 26600 + }, + { + "epoch": 92.39, + "learning_rate": 3.113780918727915e-07, + "loss": 0.24, + "step": 26610 + }, + { + "epoch": 92.43, + "learning_rate": 3.0996466431095404e-07, + "loss": 0.2343, + "step": 26620 + }, + { + "epoch": 92.46, + "learning_rate": 3.085512367491166e-07, + "loss": 0.245, + "step": 26630 + }, + { + "epoch": 92.5, + "learning_rate": 3.0713780918727917e-07, + "loss": 0.2556, + "step": 26640 + }, + { + "epoch": 92.53, + "learning_rate": 3.057243816254417e-07, + "loss": 0.2431, + "step": 26650 + }, + { + "epoch": 92.57, + "learning_rate": 3.0431095406360426e-07, + "loss": 0.2274, + "step": 26660 + }, + { + "epoch": 92.6, + "learning_rate": 3.0289752650176677e-07, + "loss": 0.254, + "step": 26670 + }, + { + "epoch": 92.64, + "learning_rate": 3.0148409893992934e-07, + "loss": 0.2559, + "step": 26680 + }, + { + "epoch": 92.67, + "learning_rate": 3.0007067137809186e-07, + "loss": 0.2563, + "step": 26690 + }, + { + "epoch": 92.71, + "learning_rate": 2.986572438162544e-07, + "loss": 0.2375, + "step": 26700 + }, + { + "epoch": 92.74, + "learning_rate": 2.97243816254417e-07, + "loss": 0.2797, + "step": 26710 + }, + { + "epoch": 92.78, + "learning_rate": 2.9583038869257945e-07, + "loss": 0.2366, + "step": 26720 + }, + { + "epoch": 92.81, + "learning_rate": 2.94416961130742e-07, + "loss": 0.2638, + "step": 26730 + }, + { + "epoch": 92.85, + "learning_rate": 2.9300353356890454e-07, + "loss": 0.2595, + "step": 26740 + }, + { + "epoch": 92.88, + "learning_rate": 2.915901060070671e-07, + "loss": 0.2488, + "step": 26750 + }, + { + "epoch": 92.91, + "learning_rate": 2.901766784452297e-07, + "loss": 0.2517, + "step": 26760 + }, + { + "epoch": 92.95, + "learning_rate": 2.887632508833922e-07, + "loss": 0.2589, + "step": 26770 + }, + { + "epoch": 92.98, + "learning_rate": 2.8734982332155476e-07, + "loss": 0.2723, + "step": 26780 + }, + { + "epoch": 93.0, + "eval_loss": 0.5132827758789062, + "eval_runtime": 134.2687, + "eval_samples_per_second": 3.962, + "eval_steps_per_second": 0.991, + "eval_wer": 0.19708169955646976, + "step": 26784 + }, + { + "epoch": 93.02, + "learning_rate": 2.859363957597173e-07, + "loss": 0.2599, + "step": 26790 + }, + { + "epoch": 93.06, + "learning_rate": 2.8452296819787984e-07, + "loss": 0.2383, + "step": 26800 + }, + { + "epoch": 93.09, + "learning_rate": 2.8310954063604236e-07, + "loss": 0.2709, + "step": 26810 + }, + { + "epoch": 93.12, + "learning_rate": 2.816961130742049e-07, + "loss": 0.2514, + "step": 26820 + }, + { + "epoch": 93.16, + "learning_rate": 2.802826855123675e-07, + "loss": 0.2503, + "step": 26830 + }, + { + "epoch": 93.19, + "learning_rate": 2.7886925795053e-07, + "loss": 0.2455, + "step": 26840 + }, + { + "epoch": 93.23, + "learning_rate": 2.774558303886926e-07, + "loss": 0.2576, + "step": 26850 + }, + { + "epoch": 93.26, + "learning_rate": 2.760424028268551e-07, + "loss": 0.2415, + "step": 26860 + }, + { + "epoch": 93.3, + "learning_rate": 2.7462897526501766e-07, + "loss": 0.2765, + "step": 26870 + }, + { + "epoch": 93.33, + "learning_rate": 2.7321554770318023e-07, + "loss": 0.2527, + "step": 26880 + }, + { + "epoch": 93.37, + "learning_rate": 2.7180212014134275e-07, + "loss": 0.2404, + "step": 26890 + }, + { + "epoch": 93.4, + "learning_rate": 2.703886925795053e-07, + "loss": 0.2534, + "step": 26900 + }, + { + "epoch": 93.44, + "learning_rate": 2.6897526501766783e-07, + "loss": 0.2223, + "step": 26910 + }, + { + "epoch": 93.47, + "learning_rate": 2.675618374558304e-07, + "loss": 0.2735, + "step": 26920 + }, + { + "epoch": 93.51, + "learning_rate": 2.661484098939929e-07, + "loss": 0.2666, + "step": 26930 + }, + { + "epoch": 93.54, + "learning_rate": 2.647349823321555e-07, + "loss": 0.2513, + "step": 26940 + }, + { + "epoch": 93.57, + "learning_rate": 2.6332155477031805e-07, + "loss": 0.2531, + "step": 26950 + }, + { + "epoch": 93.61, + "learning_rate": 2.6190812720848057e-07, + "loss": 0.2438, + "step": 26960 + }, + { + "epoch": 93.64, + "learning_rate": 2.6049469964664313e-07, + "loss": 0.2672, + "step": 26970 + }, + { + "epoch": 93.68, + "learning_rate": 2.5908127208480565e-07, + "loss": 0.2743, + "step": 26980 + }, + { + "epoch": 93.71, + "learning_rate": 2.576678445229682e-07, + "loss": 0.2549, + "step": 26990 + }, + { + "epoch": 93.75, + "learning_rate": 2.562544169611307e-07, + "loss": 0.2564, + "step": 27000 + }, + { + "epoch": 93.78, + "learning_rate": 2.5484098939929325e-07, + "loss": 0.2593, + "step": 27010 + }, + { + "epoch": 93.82, + "learning_rate": 2.534275618374558e-07, + "loss": 0.2585, + "step": 27020 + }, + { + "epoch": 93.85, + "learning_rate": 2.5201413427561833e-07, + "loss": 0.2472, + "step": 27030 + }, + { + "epoch": 93.89, + "learning_rate": 2.506007067137809e-07, + "loss": 0.2225, + "step": 27040 + }, + { + "epoch": 93.92, + "learning_rate": 2.4918727915194347e-07, + "loss": 0.2766, + "step": 27050 + }, + { + "epoch": 93.96, + "learning_rate": 2.47773851590106e-07, + "loss": 0.2493, + "step": 27060 + }, + { + "epoch": 93.99, + "learning_rate": 2.4636042402826855e-07, + "loss": 0.249, + "step": 27070 + }, + { + "epoch": 94.0, + "eval_loss": 0.509568452835083, + "eval_runtime": 135.0584, + "eval_samples_per_second": 3.939, + "eval_steps_per_second": 0.985, + "eval_wer": 0.19605322362923444, + "step": 27072 + }, + { + "epoch": 94.03, + "learning_rate": 2.4494699646643107e-07, + "loss": 0.2773, + "step": 27080 + }, + { + "epoch": 94.06, + "learning_rate": 2.4353356890459364e-07, + "loss": 0.2497, + "step": 27090 + }, + { + "epoch": 94.1, + "learning_rate": 2.421201413427562e-07, + "loss": 0.2476, + "step": 27100 + }, + { + "epoch": 94.13, + "learning_rate": 2.407067137809187e-07, + "loss": 0.268, + "step": 27110 + }, + { + "epoch": 94.17, + "learning_rate": 2.392932862190813e-07, + "loss": 0.2523, + "step": 27120 + }, + { + "epoch": 94.2, + "learning_rate": 2.378798586572438e-07, + "loss": 0.2356, + "step": 27130 + }, + { + "epoch": 94.24, + "learning_rate": 2.3646643109540635e-07, + "loss": 0.2633, + "step": 27140 + }, + { + "epoch": 94.27, + "learning_rate": 2.350530035335689e-07, + "loss": 0.2345, + "step": 27150 + }, + { + "epoch": 94.3, + "learning_rate": 2.3363957597173146e-07, + "loss": 0.2828, + "step": 27160 + }, + { + "epoch": 94.34, + "learning_rate": 2.32226148409894e-07, + "loss": 0.259, + "step": 27170 + }, + { + "epoch": 94.37, + "learning_rate": 2.3081272084805654e-07, + "loss": 0.2528, + "step": 27180 + }, + { + "epoch": 94.41, + "learning_rate": 2.2939929328621908e-07, + "loss": 0.2359, + "step": 27190 + }, + { + "epoch": 94.44, + "learning_rate": 2.279858657243816e-07, + "loss": 0.2267, + "step": 27200 + }, + { + "epoch": 94.48, + "learning_rate": 2.2657243816254414e-07, + "loss": 0.2596, + "step": 27210 + }, + { + "epoch": 94.51, + "learning_rate": 2.251590106007067e-07, + "loss": 0.259, + "step": 27220 + }, + { + "epoch": 94.55, + "learning_rate": 2.2374558303886925e-07, + "loss": 0.2455, + "step": 27230 + }, + { + "epoch": 94.58, + "learning_rate": 2.223321554770318e-07, + "loss": 0.268, + "step": 27240 + }, + { + "epoch": 94.62, + "learning_rate": 2.2091872791519433e-07, + "loss": 0.2472, + "step": 27250 + }, + { + "epoch": 94.65, + "learning_rate": 2.1950530035335688e-07, + "loss": 0.2573, + "step": 27260 + }, + { + "epoch": 94.69, + "learning_rate": 2.1809187279151942e-07, + "loss": 0.2845, + "step": 27270 + }, + { + "epoch": 94.72, + "learning_rate": 2.1667844522968196e-07, + "loss": 0.2401, + "step": 27280 + }, + { + "epoch": 94.75, + "learning_rate": 2.1526501766784453e-07, + "loss": 0.2497, + "step": 27290 + }, + { + "epoch": 94.79, + "learning_rate": 2.1385159010600707e-07, + "loss": 0.2693, + "step": 27300 + }, + { + "epoch": 94.82, + "learning_rate": 2.124381625441696e-07, + "loss": 0.2634, + "step": 27310 + }, + { + "epoch": 94.86, + "learning_rate": 2.1102473498233215e-07, + "loss": 0.2539, + "step": 27320 + }, + { + "epoch": 94.89, + "learning_rate": 2.0961130742049467e-07, + "loss": 0.2747, + "step": 27330 + }, + { + "epoch": 94.93, + "learning_rate": 2.081978798586572e-07, + "loss": 0.2487, + "step": 27340 + }, + { + "epoch": 94.96, + "learning_rate": 2.0678445229681978e-07, + "loss": 0.2491, + "step": 27350 + }, + { + "epoch": 95.0, + "learning_rate": 2.0537102473498232e-07, + "loss": 0.266, + "step": 27360 + }, + { + "epoch": 95.0, + "eval_loss": 0.5116358399391174, + "eval_runtime": 134.7906, + "eval_samples_per_second": 3.947, + "eval_steps_per_second": 0.987, + "eval_wer": 0.19637462235649547, + "step": 27360 + }, + { + "epoch": 95.03, + "learning_rate": 2.0395759717314486e-07, + "loss": 0.2359, + "step": 27370 + }, + { + "epoch": 95.07, + "learning_rate": 2.025441696113074e-07, + "loss": 0.2421, + "step": 27380 + }, + { + "epoch": 95.1, + "learning_rate": 2.0113074204946995e-07, + "loss": 0.2358, + "step": 27390 + }, + { + "epoch": 95.14, + "learning_rate": 1.997173144876325e-07, + "loss": 0.2741, + "step": 27400 + }, + { + "epoch": 95.17, + "learning_rate": 1.9830388692579506e-07, + "loss": 0.2423, + "step": 27410 + }, + { + "epoch": 95.21, + "learning_rate": 1.968904593639576e-07, + "loss": 0.2617, + "step": 27420 + }, + { + "epoch": 95.24, + "learning_rate": 1.9547703180212014e-07, + "loss": 0.2387, + "step": 27430 + }, + { + "epoch": 95.28, + "learning_rate": 1.9406360424028268e-07, + "loss": 0.2223, + "step": 27440 + }, + { + "epoch": 95.31, + "learning_rate": 1.9265017667844522e-07, + "loss": 0.2613, + "step": 27450 + }, + { + "epoch": 95.35, + "learning_rate": 1.9123674911660777e-07, + "loss": 0.2723, + "step": 27460 + }, + { + "epoch": 95.38, + "learning_rate": 1.898233215547703e-07, + "loss": 0.2495, + "step": 27470 + }, + { + "epoch": 95.42, + "learning_rate": 1.8840989399293285e-07, + "loss": 0.2446, + "step": 27480 + }, + { + "epoch": 95.45, + "learning_rate": 1.869964664310954e-07, + "loss": 0.2454, + "step": 27490 + }, + { + "epoch": 95.48, + "learning_rate": 1.8558303886925793e-07, + "loss": 0.2713, + "step": 27500 + }, + { + "epoch": 95.52, + "learning_rate": 1.8416961130742048e-07, + "loss": 0.2616, + "step": 27510 + }, + { + "epoch": 95.55, + "learning_rate": 1.8275618374558302e-07, + "loss": 0.2538, + "step": 27520 + }, + { + "epoch": 95.59, + "learning_rate": 1.8134275618374559e-07, + "loss": 0.2452, + "step": 27530 + }, + { + "epoch": 95.62, + "learning_rate": 1.7992932862190813e-07, + "loss": 0.2413, + "step": 27540 + }, + { + "epoch": 95.66, + "learning_rate": 1.7851590106007067e-07, + "loss": 0.2753, + "step": 27550 + }, + { + "epoch": 95.69, + "learning_rate": 1.771024734982332e-07, + "loss": 0.2428, + "step": 27560 + }, + { + "epoch": 95.73, + "learning_rate": 1.7568904593639575e-07, + "loss": 0.2359, + "step": 27570 + }, + { + "epoch": 95.76, + "learning_rate": 1.742756183745583e-07, + "loss": 0.2472, + "step": 27580 + }, + { + "epoch": 95.8, + "learning_rate": 1.7286219081272086e-07, + "loss": 0.2241, + "step": 27590 + }, + { + "epoch": 95.83, + "learning_rate": 1.714487632508834e-07, + "loss": 0.2494, + "step": 27600 + }, + { + "epoch": 95.87, + "learning_rate": 1.7003533568904592e-07, + "loss": 0.2686, + "step": 27610 + }, + { + "epoch": 95.9, + "learning_rate": 1.6862190812720846e-07, + "loss": 0.2426, + "step": 27620 + }, + { + "epoch": 95.94, + "learning_rate": 1.67208480565371e-07, + "loss": 0.2698, + "step": 27630 + }, + { + "epoch": 95.97, + "learning_rate": 1.6579505300353355e-07, + "loss": 0.2683, + "step": 27640 + }, + { + "epoch": 96.0, + "eval_loss": 0.5132885575294495, + "eval_runtime": 135.195, + "eval_samples_per_second": 3.935, + "eval_steps_per_second": 0.984, + "eval_wer": 0.1966960210837565, + "step": 27648 + }, + { + "epoch": 96.01, + "learning_rate": 1.643816254416961e-07, + "loss": 0.2756, + "step": 27650 + }, + { + "epoch": 96.04, + "learning_rate": 1.6296819787985866e-07, + "loss": 0.264, + "step": 27660 + }, + { + "epoch": 96.08, + "learning_rate": 1.615547703180212e-07, + "loss": 0.2275, + "step": 27670 + }, + { + "epoch": 96.11, + "learning_rate": 1.6014134275618374e-07, + "loss": 0.2498, + "step": 27680 + }, + { + "epoch": 96.15, + "learning_rate": 1.5872791519434628e-07, + "loss": 0.2453, + "step": 27690 + }, + { + "epoch": 96.18, + "learning_rate": 1.5731448763250883e-07, + "loss": 0.2527, + "step": 27700 + }, + { + "epoch": 96.21, + "learning_rate": 1.5590106007067137e-07, + "loss": 0.2548, + "step": 27710 + }, + { + "epoch": 96.25, + "learning_rate": 1.5448763250883394e-07, + "loss": 0.2589, + "step": 27720 + }, + { + "epoch": 96.28, + "learning_rate": 1.5307420494699648e-07, + "loss": 0.2361, + "step": 27730 + }, + { + "epoch": 96.32, + "learning_rate": 1.51660777385159e-07, + "loss": 0.2798, + "step": 27740 + }, + { + "epoch": 96.35, + "learning_rate": 1.5024734982332153e-07, + "loss": 0.2742, + "step": 27750 + }, + { + "epoch": 96.39, + "learning_rate": 1.4883392226148408e-07, + "loss": 0.2475, + "step": 27760 + }, + { + "epoch": 96.42, + "learning_rate": 1.4742049469964662e-07, + "loss": 0.237, + "step": 27770 + }, + { + "epoch": 96.46, + "learning_rate": 1.4600706713780919e-07, + "loss": 0.2548, + "step": 27780 + }, + { + "epoch": 96.49, + "learning_rate": 1.4459363957597173e-07, + "loss": 0.2458, + "step": 27790 + }, + { + "epoch": 96.53, + "learning_rate": 1.4318021201413427e-07, + "loss": 0.2448, + "step": 27800 + }, + { + "epoch": 96.56, + "learning_rate": 1.417667844522968e-07, + "loss": 0.2604, + "step": 27810 + }, + { + "epoch": 96.6, + "learning_rate": 1.4035335689045935e-07, + "loss": 0.252, + "step": 27820 + }, + { + "epoch": 96.63, + "learning_rate": 1.389399293286219e-07, + "loss": 0.2356, + "step": 27830 + }, + { + "epoch": 96.66, + "learning_rate": 1.3752650176678446e-07, + "loss": 0.2531, + "step": 27840 + }, + { + "epoch": 96.7, + "learning_rate": 1.36113074204947e-07, + "loss": 0.2657, + "step": 27850 + }, + { + "epoch": 96.73, + "learning_rate": 1.3469964664310955e-07, + "loss": 0.2601, + "step": 27860 + }, + { + "epoch": 96.77, + "learning_rate": 1.332862190812721e-07, + "loss": 0.2507, + "step": 27870 + }, + { + "epoch": 96.8, + "learning_rate": 1.318727915194346e-07, + "loss": 0.2657, + "step": 27880 + }, + { + "epoch": 96.84, + "learning_rate": 1.3045936395759715e-07, + "loss": 0.2588, + "step": 27890 + }, + { + "epoch": 96.87, + "learning_rate": 1.2904593639575972e-07, + "loss": 0.2474, + "step": 27900 + }, + { + "epoch": 96.91, + "learning_rate": 1.2763250883392226e-07, + "loss": 0.2616, + "step": 27910 + }, + { + "epoch": 96.94, + "learning_rate": 1.262190812720848e-07, + "loss": 0.2405, + "step": 27920 + }, + { + "epoch": 96.98, + "learning_rate": 1.2480565371024734e-07, + "loss": 0.2451, + "step": 27930 + }, + { + "epoch": 97.0, + "eval_loss": 0.5141022205352783, + "eval_runtime": 134.2101, + "eval_samples_per_second": 3.964, + "eval_steps_per_second": 0.991, + "eval_wer": 0.19650318184739987, + "step": 27936 + }, + { + "epoch": 97.01, + "learning_rate": 1.2339222614840988e-07, + "loss": 0.2512, + "step": 27940 + }, + { + "epoch": 97.05, + "learning_rate": 1.2197879858657243e-07, + "loss": 0.2491, + "step": 27950 + }, + { + "epoch": 97.08, + "learning_rate": 1.2056537102473497e-07, + "loss": 0.2663, + "step": 27960 + }, + { + "epoch": 97.12, + "learning_rate": 1.1915194346289752e-07, + "loss": 0.2532, + "step": 27970 + }, + { + "epoch": 97.15, + "learning_rate": 1.1773851590106006e-07, + "loss": 0.263, + "step": 27980 + }, + { + "epoch": 97.19, + "learning_rate": 1.163250883392226e-07, + "loss": 0.2544, + "step": 27990 + }, + { + "epoch": 97.22, + "learning_rate": 1.1491166077738515e-07, + "loss": 0.2543, + "step": 28000 + }, + { + "epoch": 97.26, + "learning_rate": 1.134982332155477e-07, + "loss": 0.2582, + "step": 28010 + }, + { + "epoch": 97.29, + "learning_rate": 1.1208480565371025e-07, + "loss": 0.2577, + "step": 28020 + }, + { + "epoch": 97.33, + "learning_rate": 1.1067137809187279e-07, + "loss": 0.2445, + "step": 28030 + }, + { + "epoch": 97.36, + "learning_rate": 1.0925795053003534e-07, + "loss": 0.2692, + "step": 28040 + }, + { + "epoch": 97.39, + "learning_rate": 1.0784452296819787e-07, + "loss": 0.2461, + "step": 28050 + }, + { + "epoch": 97.43, + "learning_rate": 1.0643109540636041e-07, + "loss": 0.2136, + "step": 28060 + }, + { + "epoch": 97.46, + "learning_rate": 1.0501766784452297e-07, + "loss": 0.2604, + "step": 28070 + }, + { + "epoch": 97.5, + "learning_rate": 1.0360424028268551e-07, + "loss": 0.2517, + "step": 28080 + }, + { + "epoch": 97.53, + "learning_rate": 1.0219081272084805e-07, + "loss": 0.247, + "step": 28090 + }, + { + "epoch": 97.57, + "learning_rate": 1.0077738515901061e-07, + "loss": 0.2481, + "step": 28100 + }, + { + "epoch": 97.6, + "learning_rate": 9.936395759717315e-08, + "loss": 0.2215, + "step": 28110 + }, + { + "epoch": 97.64, + "learning_rate": 9.795053003533568e-08, + "loss": 0.2549, + "step": 28120 + }, + { + "epoch": 97.67, + "learning_rate": 9.653710247349822e-08, + "loss": 0.2656, + "step": 28130 + }, + { + "epoch": 97.71, + "learning_rate": 9.512367491166077e-08, + "loss": 0.2415, + "step": 28140 + }, + { + "epoch": 97.74, + "learning_rate": 9.371024734982332e-08, + "loss": 0.2388, + "step": 28150 + }, + { + "epoch": 97.78, + "learning_rate": 9.229681978798586e-08, + "loss": 0.2437, + "step": 28160 + }, + { + "epoch": 97.81, + "learning_rate": 9.088339222614841e-08, + "loss": 0.2621, + "step": 28170 + }, + { + "epoch": 97.85, + "learning_rate": 8.946996466431094e-08, + "loss": 0.2629, + "step": 28180 + }, + { + "epoch": 97.88, + "learning_rate": 8.805653710247348e-08, + "loss": 0.2346, + "step": 28190 + }, + { + "epoch": 97.91, + "learning_rate": 8.664310954063604e-08, + "loss": 0.2638, + "step": 28200 + }, + { + "epoch": 97.95, + "learning_rate": 8.522968197879858e-08, + "loss": 0.2465, + "step": 28210 + }, + { + "epoch": 97.98, + "learning_rate": 8.381625441696112e-08, + "loss": 0.2723, + "step": 28220 + }, + { + "epoch": 98.0, + "eval_loss": 0.5122572779655457, + "eval_runtime": 135.6766, + "eval_samples_per_second": 3.921, + "eval_steps_per_second": 0.98, + "eval_wer": 0.19624606286559104, + "step": 28224 + }, + { + "epoch": 98.02, + "learning_rate": 8.240282685512368e-08, + "loss": 0.2508, + "step": 28230 + }, + { + "epoch": 98.06, + "learning_rate": 8.098939929328622e-08, + "loss": 0.2573, + "step": 28240 + }, + { + "epoch": 98.09, + "learning_rate": 7.957597173144875e-08, + "loss": 0.2363, + "step": 28250 + }, + { + "epoch": 98.12, + "learning_rate": 7.81625441696113e-08, + "loss": 0.2677, + "step": 28260 + }, + { + "epoch": 98.16, + "learning_rate": 7.674911660777385e-08, + "loss": 0.2611, + "step": 28270 + }, + { + "epoch": 98.19, + "learning_rate": 7.533568904593639e-08, + "loss": 0.2331, + "step": 28280 + }, + { + "epoch": 98.23, + "learning_rate": 7.392226148409894e-08, + "loss": 0.2688, + "step": 28290 + }, + { + "epoch": 98.26, + "learning_rate": 7.250883392226148e-08, + "loss": 0.2321, + "step": 28300 + }, + { + "epoch": 98.3, + "learning_rate": 7.109540636042403e-08, + "loss": 0.278, + "step": 28310 + }, + { + "epoch": 98.33, + "learning_rate": 6.968197879858657e-08, + "loss": 0.2502, + "step": 28320 + }, + { + "epoch": 98.37, + "learning_rate": 6.826855123674911e-08, + "loss": 0.2497, + "step": 28330 + }, + { + "epoch": 98.4, + "learning_rate": 6.685512367491165e-08, + "loss": 0.2593, + "step": 28340 + }, + { + "epoch": 98.44, + "learning_rate": 6.544169611307421e-08, + "loss": 0.25, + "step": 28350 + }, + { + "epoch": 98.47, + "learning_rate": 6.402826855123675e-08, + "loss": 0.2518, + "step": 28360 + }, + { + "epoch": 98.51, + "learning_rate": 6.261484098939929e-08, + "loss": 0.2586, + "step": 28370 + }, + { + "epoch": 98.54, + "learning_rate": 6.120141342756183e-08, + "loss": 0.2632, + "step": 28380 + }, + { + "epoch": 98.57, + "learning_rate": 5.978798586572437e-08, + "loss": 0.2588, + "step": 28390 + }, + { + "epoch": 98.61, + "learning_rate": 5.837455830388692e-08, + "loss": 0.2575, + "step": 28400 + }, + { + "epoch": 98.64, + "learning_rate": 5.6961130742049465e-08, + "loss": 0.2669, + "step": 28410 + }, + { + "epoch": 98.68, + "learning_rate": 5.5547703180212014e-08, + "loss": 0.2753, + "step": 28420 + }, + { + "epoch": 98.71, + "learning_rate": 5.4134275618374555e-08, + "loss": 0.2383, + "step": 28430 + }, + { + "epoch": 98.75, + "learning_rate": 5.27208480565371e-08, + "loss": 0.2534, + "step": 28440 + }, + { + "epoch": 98.78, + "learning_rate": 5.1307420494699646e-08, + "loss": 0.2444, + "step": 28450 + }, + { + "epoch": 98.82, + "learning_rate": 4.989399293286219e-08, + "loss": 0.2627, + "step": 28460 + }, + { + "epoch": 98.85, + "learning_rate": 4.848056537102473e-08, + "loss": 0.2374, + "step": 28470 + }, + { + "epoch": 98.89, + "learning_rate": 4.706713780918728e-08, + "loss": 0.2649, + "step": 28480 + }, + { + "epoch": 98.92, + "learning_rate": 4.565371024734982e-08, + "loss": 0.2567, + "step": 28490 + }, + { + "epoch": 98.96, + "learning_rate": 4.424028268551237e-08, + "loss": 0.251, + "step": 28500 + }, + { + "epoch": 98.99, + "learning_rate": 4.282685512367491e-08, + "loss": 0.2527, + "step": 28510 + }, + { + "epoch": 99.0, + "eval_loss": 0.5119685530662537, + "eval_runtime": 134.8373, + "eval_samples_per_second": 3.945, + "eval_steps_per_second": 0.986, + "eval_wer": 0.1965674615928521, + "step": 28512 + }, + { + "epoch": 99.03, + "learning_rate": 4.141342756183745e-08, + "loss": 0.2849, + "step": 28520 + }, + { + "epoch": 99.06, + "learning_rate": 4e-08, + "loss": 0.2756, + "step": 28530 + }, + { + "epoch": 99.1, + "learning_rate": 3.858657243816254e-08, + "loss": 0.2378, + "step": 28540 + }, + { + "epoch": 99.13, + "learning_rate": 3.7173144876325085e-08, + "loss": 0.2709, + "step": 28550 + }, + { + "epoch": 99.17, + "learning_rate": 3.575971731448763e-08, + "loss": 0.2569, + "step": 28560 + }, + { + "epoch": 99.2, + "learning_rate": 3.4346289752650175e-08, + "loss": 0.2597, + "step": 28570 + }, + { + "epoch": 99.24, + "learning_rate": 3.293286219081272e-08, + "loss": 0.2418, + "step": 28580 + }, + { + "epoch": 99.27, + "learning_rate": 3.1519434628975265e-08, + "loss": 0.239, + "step": 28590 + }, + { + "epoch": 99.3, + "learning_rate": 3.010600706713781e-08, + "loss": 0.2535, + "step": 28600 + }, + { + "epoch": 99.34, + "learning_rate": 2.8692579505300353e-08, + "loss": 0.2642, + "step": 28610 + }, + { + "epoch": 99.37, + "learning_rate": 2.7279151943462894e-08, + "loss": 0.2302, + "step": 28620 + }, + { + "epoch": 99.41, + "learning_rate": 2.5865724381625443e-08, + "loss": 0.2619, + "step": 28630 + }, + { + "epoch": 99.44, + "learning_rate": 2.4452296819787985e-08, + "loss": 0.232, + "step": 28640 + }, + { + "epoch": 99.48, + "learning_rate": 2.3038869257950527e-08, + "loss": 0.2763, + "step": 28650 + }, + { + "epoch": 99.51, + "learning_rate": 2.1625441696113075e-08, + "loss": 0.2569, + "step": 28660 + }, + { + "epoch": 99.55, + "learning_rate": 2.0212014134275617e-08, + "loss": 0.2466, + "step": 28670 + }, + { + "epoch": 99.58, + "learning_rate": 1.8798586572438162e-08, + "loss": 0.2511, + "step": 28680 + }, + { + "epoch": 99.62, + "learning_rate": 1.7385159010600704e-08, + "loss": 0.2401, + "step": 28690 + }, + { + "epoch": 99.65, + "learning_rate": 1.597173144876325e-08, + "loss": 0.2573, + "step": 28700 + }, + { + "epoch": 99.69, + "learning_rate": 1.4558303886925795e-08, + "loss": 0.2663, + "step": 28710 + }, + { + "epoch": 99.72, + "learning_rate": 1.314487632508834e-08, + "loss": 0.2237, + "step": 28720 + }, + { + "epoch": 99.75, + "learning_rate": 1.1731448763250882e-08, + "loss": 0.2567, + "step": 28730 + }, + { + "epoch": 99.79, + "learning_rate": 1.0318021201413427e-08, + "loss": 0.2448, + "step": 28740 + }, + { + "epoch": 99.82, + "learning_rate": 8.90459363957597e-09, + "loss": 0.2673, + "step": 28750 + }, + { + "epoch": 99.86, + "learning_rate": 7.491166077738516e-09, + "loss": 0.2539, + "step": 28760 + }, + { + "epoch": 99.89, + "learning_rate": 6.077738515901059e-09, + "loss": 0.2329, + "step": 28770 + }, + { + "epoch": 99.93, + "learning_rate": 4.6643109540636045e-09, + "loss": 0.24, + "step": 28780 + }, + { + "epoch": 99.96, + "learning_rate": 3.250883392226148e-09, + "loss": 0.2402, + "step": 28790 + }, + { + "epoch": 100.0, + "learning_rate": 1.8374558303886924e-09, + "loss": 0.2604, + "step": 28800 + }, + { + "epoch": 100.0, + "eval_loss": 0.5110756158828735, + "eval_runtime": 135.2128, + "eval_samples_per_second": 3.935, + "eval_steps_per_second": 0.984, + "eval_wer": 0.19605322362923444, + "step": 28800 + }, { "epoch": 100.0, - "step": 7200, - "total_flos": 2.7202925310621965e+20, - "train_loss": 0.2786852648191982, - "train_runtime": 194751.2153, - "train_samples_per_second": 2.371, - "train_steps_per_second": 0.037 + "step": 28800, + "total_flos": 2.718335465990856e+20, + "train_loss": 0.26551002427107756, + "train_runtime": 210411.5326, + "train_samples_per_second": 2.194, + "train_steps_per_second": 0.137 } ], - "max_steps": 7200, + "max_steps": 28800, "num_train_epochs": 100, - "total_flos": 2.7202925310621965e+20, + "total_flos": 2.718335465990856e+20, "trial_name": null, "trial_params": null }