{ "best_metric": 0.4693412184715271, "best_model_checkpoint": "ai-light-dance_singing3_ft_wav2vec2-large-xlsr-53-v1-5gram/checkpoint-288", "epoch": 99.9974025974026, "global_step": 28800, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.03, "learning_rate": 8e-08, "loss": 0.3037, "step": 10 }, { "epoch": 0.07, "learning_rate": 1.6e-07, "loss": 0.3044, "step": 20 }, { "epoch": 0.1, "learning_rate": 2.32e-07, "loss": 0.2922, "step": 30 }, { "epoch": 0.14, "learning_rate": 3.12e-07, "loss": 0.3287, "step": 40 }, { "epoch": 0.17, "learning_rate": 3.92e-07, "loss": 0.3189, "step": 50 }, { "epoch": 0.21, "learning_rate": 4.64e-07, "loss": 0.2791, "step": 60 }, { "epoch": 0.24, "learning_rate": 5.44e-07, "loss": 0.2892, "step": 70 }, { "epoch": 0.28, "learning_rate": 6.24e-07, "loss": 0.3011, "step": 80 }, { "epoch": 0.31, "learning_rate": 7.04e-07, "loss": 0.3154, "step": 90 }, { "epoch": 0.35, "learning_rate": 7.84e-07, "loss": 0.3242, "step": 100 }, { "epoch": 0.38, "learning_rate": 8.639999999999999e-07, "loss": 0.2931, "step": 110 }, { "epoch": 0.42, "learning_rate": 9.439999999999999e-07, "loss": 0.2822, "step": 120 }, { "epoch": 0.45, "learning_rate": 1.024e-06, "loss": 0.3186, "step": 130 }, { "epoch": 0.48, "learning_rate": 1.1040000000000001e-06, "loss": 0.3111, "step": 140 }, { "epoch": 0.52, "learning_rate": 1.1839999999999998e-06, "loss": 0.2909, "step": 150 }, { "epoch": 0.55, "learning_rate": 1.2639999999999999e-06, "loss": 0.299, "step": 160 }, { "epoch": 0.59, "learning_rate": 1.344e-06, "loss": 0.3338, "step": 170 }, { "epoch": 0.62, "learning_rate": 1.4239999999999998e-06, "loss": 0.2607, "step": 180 }, { "epoch": 0.66, "learning_rate": 1.504e-06, "loss": 0.2763, "step": 190 }, { "epoch": 0.69, "learning_rate": 1.584e-06, "loss": 0.296, "step": 200 }, { "epoch": 0.73, "learning_rate": 1.6639999999999999e-06, "loss": 0.2896, "step": 210 }, { "epoch": 0.76, "learning_rate": 1.744e-06, "loss": 0.2852, "step": 220 }, { "epoch": 0.8, "learning_rate": 1.824e-06, "loss": 0.2691, "step": 230 }, { "epoch": 0.83, "learning_rate": 1.904e-06, "loss": 0.3116, "step": 240 }, { "epoch": 0.87, "learning_rate": 1.976e-06, "loss": 0.3348, "step": 250 }, { "epoch": 0.9, "learning_rate": 2.056e-06, "loss": 0.2831, "step": 260 }, { "epoch": 0.94, "learning_rate": 2.136e-06, "loss": 0.2814, "step": 270 }, { "epoch": 0.97, "learning_rate": 2.216e-06, "loss": 0.3028, "step": 280 }, { "epoch": 1.0, "eval_loss": 0.4693412184715271, "eval_runtime": 130.2494, "eval_samples_per_second": 4.084, "eval_steps_per_second": 1.021, "eval_wer": 0.2046024297743781, "step": 288 }, { "epoch": 1.01, "learning_rate": 2.2959999999999997e-06, "loss": 0.3338, "step": 290 }, { "epoch": 1.04, "learning_rate": 2.3759999999999998e-06, "loss": 0.2803, "step": 300 }, { "epoch": 1.08, "learning_rate": 2.456e-06, "loss": 0.2859, "step": 310 }, { "epoch": 1.11, "learning_rate": 2.536e-06, "loss": 0.282, "step": 320 }, { "epoch": 1.15, "learning_rate": 2.616e-06, "loss": 0.2971, "step": 330 }, { "epoch": 1.18, "learning_rate": 2.696e-06, "loss": 0.2832, "step": 340 }, { "epoch": 1.21, "learning_rate": 2.7759999999999998e-06, "loss": 0.2776, "step": 350 }, { "epoch": 1.25, "learning_rate": 2.856e-06, "loss": 0.2812, "step": 360 }, { "epoch": 1.28, "learning_rate": 2.936e-06, "loss": 0.2765, "step": 370 }, { "epoch": 1.32, "learning_rate": 3.016e-06, "loss": 0.2905, "step": 380 }, { "epoch": 1.35, "learning_rate": 3.096e-06, "loss": 0.2992, "step": 390 }, { "epoch": 1.39, "learning_rate": 3.176e-06, "loss": 0.2972, "step": 400 }, { "epoch": 1.42, "learning_rate": 3.256e-06, "loss": 0.2884, "step": 410 }, { "epoch": 1.46, "learning_rate": 3.336e-06, "loss": 0.2667, "step": 420 }, { "epoch": 1.49, "learning_rate": 3.4159999999999996e-06, "loss": 0.3059, "step": 430 }, { "epoch": 1.53, "learning_rate": 3.4959999999999996e-06, "loss": 0.2853, "step": 440 }, { "epoch": 1.56, "learning_rate": 3.5759999999999997e-06, "loss": 0.2775, "step": 450 }, { "epoch": 1.6, "learning_rate": 3.656e-06, "loss": 0.2873, "step": 460 }, { "epoch": 1.63, "learning_rate": 3.736e-06, "loss": 0.2874, "step": 470 }, { "epoch": 1.66, "learning_rate": 3.8159999999999995e-06, "loss": 0.2988, "step": 480 }, { "epoch": 1.7, "learning_rate": 3.896e-06, "loss": 0.2957, "step": 490 }, { "epoch": 1.73, "learning_rate": 3.976e-06, "loss": 0.3037, "step": 500 }, { "epoch": 1.77, "learning_rate": 3.999010600706714e-06, "loss": 0.2873, "step": 510 }, { "epoch": 1.8, "learning_rate": 3.997597173144876e-06, "loss": 0.2904, "step": 520 }, { "epoch": 1.84, "learning_rate": 3.996183745583039e-06, "loss": 0.3108, "step": 530 }, { "epoch": 1.87, "learning_rate": 3.994770318021201e-06, "loss": 0.3071, "step": 540 }, { "epoch": 1.91, "learning_rate": 3.993356890459364e-06, "loss": 0.2944, "step": 550 }, { "epoch": 1.94, "learning_rate": 3.9919434628975264e-06, "loss": 0.2848, "step": 560 }, { "epoch": 1.98, "learning_rate": 3.990530035335689e-06, "loss": 0.2986, "step": 570 }, { "epoch": 2.0, "eval_loss": 0.48284950852394104, "eval_runtime": 130.0663, "eval_samples_per_second": 4.09, "eval_steps_per_second": 1.023, "eval_wer": 0.20575946519251784, "step": 576 }, { "epoch": 2.01, "learning_rate": 3.989116607773851e-06, "loss": 0.3048, "step": 580 }, { "epoch": 2.05, "learning_rate": 3.987703180212014e-06, "loss": 0.2977, "step": 590 }, { "epoch": 2.08, "learning_rate": 3.986289752650176e-06, "loss": 0.2796, "step": 600 }, { "epoch": 2.12, "learning_rate": 3.984876325088339e-06, "loss": 0.2934, "step": 610 }, { "epoch": 2.15, "learning_rate": 3.983462897526502e-06, "loss": 0.3091, "step": 620 }, { "epoch": 2.19, "learning_rate": 3.982049469964665e-06, "loss": 0.2864, "step": 630 }, { "epoch": 2.22, "learning_rate": 3.9806360424028266e-06, "loss": 0.2948, "step": 640 }, { "epoch": 2.26, "learning_rate": 3.979222614840989e-06, "loss": 0.3012, "step": 650 }, { "epoch": 2.29, "learning_rate": 3.977809187279151e-06, "loss": 0.2824, "step": 660 }, { "epoch": 2.33, "learning_rate": 3.976395759717314e-06, "loss": 0.3008, "step": 670 }, { "epoch": 2.36, "learning_rate": 3.974982332155477e-06, "loss": 0.3, "step": 680 }, { "epoch": 2.39, "learning_rate": 3.97356890459364e-06, "loss": 0.2641, "step": 690 }, { "epoch": 2.43, "learning_rate": 3.972155477031802e-06, "loss": 0.2677, "step": 700 }, { "epoch": 2.46, "learning_rate": 3.970742049469965e-06, "loss": 0.2851, "step": 710 }, { "epoch": 2.5, "learning_rate": 3.969328621908127e-06, "loss": 0.2923, "step": 720 }, { "epoch": 2.53, "learning_rate": 3.9679151943462895e-06, "loss": 0.2957, "step": 730 }, { "epoch": 2.57, "learning_rate": 3.966501766784452e-06, "loss": 0.2915, "step": 740 }, { "epoch": 2.6, "learning_rate": 3.965088339222615e-06, "loss": 0.2786, "step": 750 }, { "epoch": 2.64, "learning_rate": 3.963674911660777e-06, "loss": 0.3032, "step": 760 }, { "epoch": 2.67, "learning_rate": 3.96226148409894e-06, "loss": 0.3004, "step": 770 }, { "epoch": 2.71, "learning_rate": 3.960848056537102e-06, "loss": 0.2904, "step": 780 }, { "epoch": 2.74, "learning_rate": 3.959434628975265e-06, "loss": 0.2702, "step": 790 }, { "epoch": 2.78, "learning_rate": 3.958021201413428e-06, "loss": 0.2831, "step": 800 }, { "epoch": 2.81, "learning_rate": 3.95660777385159e-06, "loss": 0.2874, "step": 810 }, { "epoch": 2.85, "learning_rate": 3.9551943462897525e-06, "loss": 0.2791, "step": 820 }, { "epoch": 2.88, "learning_rate": 3.953780918727915e-06, "loss": 0.2896, "step": 830 }, { "epoch": 2.91, "learning_rate": 3.952367491166077e-06, "loss": 0.2694, "step": 840 }, { "epoch": 2.95, "learning_rate": 3.95095406360424e-06, "loss": 0.277, "step": 850 }, { "epoch": 2.98, "learning_rate": 3.949540636042403e-06, "loss": 0.297, "step": 860 }, { "epoch": 3.0, "eval_loss": 0.5019953846931458, "eval_runtime": 130.2566, "eval_samples_per_second": 4.084, "eval_steps_per_second": 1.021, "eval_wer": 0.2038310728289516, "step": 864 }, { "epoch": 3.02, "learning_rate": 3.948127208480565e-06, "loss": 0.2977, "step": 870 }, { "epoch": 3.06, "learning_rate": 3.946713780918728e-06, "loss": 0.3039, "step": 880 }, { "epoch": 3.09, "learning_rate": 3.945300353356891e-06, "loss": 0.2913, "step": 890 }, { "epoch": 3.12, "learning_rate": 3.943886925795053e-06, "loss": 0.307, "step": 900 }, { "epoch": 3.16, "learning_rate": 3.9424734982332154e-06, "loss": 0.3053, "step": 910 }, { "epoch": 3.19, "learning_rate": 3.941060070671378e-06, "loss": 0.2781, "step": 920 }, { "epoch": 3.23, "learning_rate": 3.93964664310954e-06, "loss": 0.2978, "step": 930 }, { "epoch": 3.26, "learning_rate": 3.938233215547703e-06, "loss": 0.2859, "step": 940 }, { "epoch": 3.3, "learning_rate": 3.936819787985866e-06, "loss": 0.3001, "step": 950 }, { "epoch": 3.33, "learning_rate": 3.935406360424028e-06, "loss": 0.3167, "step": 960 }, { "epoch": 3.37, "learning_rate": 3.933992932862191e-06, "loss": 0.307, "step": 970 }, { "epoch": 3.4, "learning_rate": 3.932579505300353e-06, "loss": 0.3129, "step": 980 }, { "epoch": 3.44, "learning_rate": 3.9311660777385156e-06, "loss": 0.2694, "step": 990 }, { "epoch": 3.47, "learning_rate": 3.929752650176678e-06, "loss": 0.3088, "step": 1000 }, { "epoch": 3.51, "learning_rate": 3.928339222614841e-06, "loss": 0.2849, "step": 1010 }, { "epoch": 3.54, "learning_rate": 3.926925795053003e-06, "loss": 0.3203, "step": 1020 }, { "epoch": 3.57, "learning_rate": 3.925512367491166e-06, "loss": 0.3022, "step": 1030 }, { "epoch": 3.61, "learning_rate": 3.924098939929328e-06, "loss": 0.2711, "step": 1040 }, { "epoch": 3.64, "learning_rate": 3.922685512367491e-06, "loss": 0.2765, "step": 1050 }, { "epoch": 3.68, "learning_rate": 3.921272084805654e-06, "loss": 0.2897, "step": 1060 }, { "epoch": 3.71, "learning_rate": 3.9198586572438165e-06, "loss": 0.2561, "step": 1070 }, { "epoch": 3.75, "learning_rate": 3.9184452296819785e-06, "loss": 0.2596, "step": 1080 }, { "epoch": 3.78, "learning_rate": 3.917031802120141e-06, "loss": 0.2759, "step": 1090 }, { "epoch": 3.82, "learning_rate": 3.915618374558303e-06, "loss": 0.3017, "step": 1100 }, { "epoch": 3.85, "learning_rate": 3.914204946996466e-06, "loss": 0.2668, "step": 1110 }, { "epoch": 3.89, "learning_rate": 3.912791519434629e-06, "loss": 0.284, "step": 1120 }, { "epoch": 3.92, "learning_rate": 3.911378091872792e-06, "loss": 0.2808, "step": 1130 }, { "epoch": 3.96, "learning_rate": 3.909964664310954e-06, "loss": 0.2801, "step": 1140 }, { "epoch": 3.99, "learning_rate": 3.908551236749117e-06, "loss": 0.2863, "step": 1150 }, { "epoch": 4.0, "eval_loss": 0.5215898752212524, "eval_runtime": 130.8056, "eval_samples_per_second": 4.067, "eval_steps_per_second": 1.017, "eval_wer": 0.20203123995628977, "step": 1152 }, { "epoch": 4.03, "learning_rate": 3.907137809187279e-06, "loss": 0.2845, "step": 1160 }, { "epoch": 4.06, "learning_rate": 3.9057243816254415e-06, "loss": 0.2787, "step": 1170 }, { "epoch": 4.1, "learning_rate": 3.904310954063604e-06, "loss": 0.2562, "step": 1180 }, { "epoch": 4.13, "learning_rate": 3.902897526501767e-06, "loss": 0.2833, "step": 1190 }, { "epoch": 4.17, "learning_rate": 3.901484098939929e-06, "loss": 0.2655, "step": 1200 }, { "epoch": 4.2, "learning_rate": 3.900070671378092e-06, "loss": 0.2865, "step": 1210 }, { "epoch": 4.24, "learning_rate": 3.898657243816254e-06, "loss": 0.2702, "step": 1220 }, { "epoch": 4.27, "learning_rate": 3.897243816254417e-06, "loss": 0.2733, "step": 1230 }, { "epoch": 4.3, "learning_rate": 3.89583038869258e-06, "loss": 0.3136, "step": 1240 }, { "epoch": 4.34, "learning_rate": 3.8944169611307424e-06, "loss": 0.2846, "step": 1250 }, { "epoch": 4.37, "learning_rate": 3.8930035335689044e-06, "loss": 0.2756, "step": 1260 }, { "epoch": 4.41, "learning_rate": 3.891590106007066e-06, "loss": 0.2934, "step": 1270 }, { "epoch": 4.44, "learning_rate": 3.890176678445229e-06, "loss": 0.2851, "step": 1280 }, { "epoch": 4.48, "learning_rate": 3.888763250883392e-06, "loss": 0.2979, "step": 1290 }, { "epoch": 4.51, "learning_rate": 3.887349823321555e-06, "loss": 0.2944, "step": 1300 }, { "epoch": 4.55, "learning_rate": 3.885936395759717e-06, "loss": 0.2839, "step": 1310 }, { "epoch": 4.58, "learning_rate": 3.88452296819788e-06, "loss": 0.287, "step": 1320 }, { "epoch": 4.62, "learning_rate": 3.883109540636042e-06, "loss": 0.2757, "step": 1330 }, { "epoch": 4.65, "learning_rate": 3.8816961130742046e-06, "loss": 0.3039, "step": 1340 }, { "epoch": 4.69, "learning_rate": 3.880282685512367e-06, "loss": 0.2852, "step": 1350 }, { "epoch": 4.72, "learning_rate": 3.87886925795053e-06, "loss": 0.2655, "step": 1360 }, { "epoch": 4.75, "learning_rate": 3.877455830388692e-06, "loss": 0.2777, "step": 1370 }, { "epoch": 4.79, "learning_rate": 3.876042402826855e-06, "loss": 0.2714, "step": 1380 }, { "epoch": 4.82, "learning_rate": 3.874628975265017e-06, "loss": 0.2803, "step": 1390 }, { "epoch": 4.86, "learning_rate": 3.87321554770318e-06, "loss": 0.3032, "step": 1400 }, { "epoch": 4.89, "learning_rate": 3.871802120141343e-06, "loss": 0.2808, "step": 1410 }, { "epoch": 4.93, "learning_rate": 3.8703886925795055e-06, "loss": 0.2795, "step": 1420 }, { "epoch": 4.96, "learning_rate": 3.8689752650176675e-06, "loss": 0.2664, "step": 1430 }, { "epoch": 5.0, "learning_rate": 3.86756183745583e-06, "loss": 0.3036, "step": 1440 }, { "epoch": 5.0, "eval_loss": 0.49630099534988403, "eval_runtime": 131.2377, "eval_samples_per_second": 4.054, "eval_steps_per_second": 1.013, "eval_wer": 0.20080992479269782, "step": 1440 }, { "epoch": 5.03, "learning_rate": 3.866148409893992e-06, "loss": 0.2955, "step": 1450 }, { "epoch": 5.07, "learning_rate": 3.864734982332155e-06, "loss": 0.2806, "step": 1460 }, { "epoch": 5.1, "learning_rate": 3.863321554770318e-06, "loss": 0.2625, "step": 1470 }, { "epoch": 5.14, "learning_rate": 3.861908127208481e-06, "loss": 0.2775, "step": 1480 }, { "epoch": 5.17, "learning_rate": 3.860494699646643e-06, "loss": 0.2916, "step": 1490 }, { "epoch": 5.21, "learning_rate": 3.859081272084806e-06, "loss": 0.2783, "step": 1500 }, { "epoch": 5.24, "learning_rate": 3.857667844522968e-06, "loss": 0.2728, "step": 1510 }, { "epoch": 5.28, "learning_rate": 3.8562544169611305e-06, "loss": 0.2706, "step": 1520 }, { "epoch": 5.31, "learning_rate": 3.854840989399293e-06, "loss": 0.2857, "step": 1530 }, { "epoch": 5.35, "learning_rate": 3.853427561837456e-06, "loss": 0.2956, "step": 1540 }, { "epoch": 5.38, "learning_rate": 3.852014134275618e-06, "loss": 0.2629, "step": 1550 }, { "epoch": 5.42, "learning_rate": 3.850600706713781e-06, "loss": 0.2656, "step": 1560 }, { "epoch": 5.45, "learning_rate": 3.849187279151943e-06, "loss": 0.2842, "step": 1570 }, { "epoch": 5.48, "learning_rate": 3.847773851590106e-06, "loss": 0.3061, "step": 1580 }, { "epoch": 5.52, "learning_rate": 3.846360424028269e-06, "loss": 0.2755, "step": 1590 }, { "epoch": 5.55, "learning_rate": 3.844946996466431e-06, "loss": 0.2695, "step": 1600 }, { "epoch": 5.59, "learning_rate": 3.843533568904593e-06, "loss": 0.2636, "step": 1610 }, { "epoch": 5.62, "learning_rate": 3.842120141342756e-06, "loss": 0.2822, "step": 1620 }, { "epoch": 5.66, "learning_rate": 3.840706713780918e-06, "loss": 0.2815, "step": 1630 }, { "epoch": 5.69, "learning_rate": 3.839293286219081e-06, "loss": 0.3095, "step": 1640 }, { "epoch": 5.73, "learning_rate": 3.837879858657244e-06, "loss": 0.2825, "step": 1650 }, { "epoch": 5.76, "learning_rate": 3.836466431095406e-06, "loss": 0.2883, "step": 1660 }, { "epoch": 5.8, "learning_rate": 3.835053003533569e-06, "loss": 0.2781, "step": 1670 }, { "epoch": 5.83, "learning_rate": 3.8336395759717316e-06, "loss": 0.3046, "step": 1680 }, { "epoch": 5.87, "learning_rate": 3.8322261484098935e-06, "loss": 0.2752, "step": 1690 }, { "epoch": 5.9, "learning_rate": 3.830812720848056e-06, "loss": 0.2571, "step": 1700 }, { "epoch": 5.94, "learning_rate": 3.829399293286218e-06, "loss": 0.2836, "step": 1710 }, { "epoch": 5.97, "learning_rate": 3.827985865724381e-06, "loss": 0.3141, "step": 1720 }, { "epoch": 6.0, "eval_loss": 0.5004593729972839, "eval_runtime": 130.6889, "eval_samples_per_second": 4.071, "eval_steps_per_second": 1.018, "eval_wer": 0.20203123995628977, "step": 1728 }, { "epoch": 6.01, "learning_rate": 3.826572438162544e-06, "loss": 0.299, "step": 1730 }, { "epoch": 6.04, "learning_rate": 3.825159010600707e-06, "loss": 0.3013, "step": 1740 }, { "epoch": 6.08, "learning_rate": 3.823745583038869e-06, "loss": 0.2818, "step": 1750 }, { "epoch": 6.11, "learning_rate": 3.822332155477032e-06, "loss": 0.2743, "step": 1760 }, { "epoch": 6.15, "learning_rate": 3.820918727915194e-06, "loss": 0.2774, "step": 1770 }, { "epoch": 6.18, "learning_rate": 3.8195053003533565e-06, "loss": 0.2833, "step": 1780 }, { "epoch": 6.21, "learning_rate": 3.818091872791519e-06, "loss": 0.2895, "step": 1790 }, { "epoch": 6.25, "learning_rate": 3.816678445229682e-06, "loss": 0.2511, "step": 1800 }, { "epoch": 6.28, "learning_rate": 3.815265017667844e-06, "loss": 0.2567, "step": 1810 }, { "epoch": 6.32, "learning_rate": 3.813851590106007e-06, "loss": 0.3127, "step": 1820 }, { "epoch": 6.35, "learning_rate": 3.8124381625441694e-06, "loss": 0.3125, "step": 1830 }, { "epoch": 6.39, "learning_rate": 3.811024734982332e-06, "loss": 0.2699, "step": 1840 }, { "epoch": 6.42, "learning_rate": 3.8096113074204946e-06, "loss": 0.2896, "step": 1850 }, { "epoch": 6.46, "learning_rate": 3.808197879858657e-06, "loss": 0.3067, "step": 1860 }, { "epoch": 6.49, "learning_rate": 3.80678445229682e-06, "loss": 0.2647, "step": 1870 }, { "epoch": 6.53, "learning_rate": 3.805371024734982e-06, "loss": 0.2916, "step": 1880 }, { "epoch": 6.56, "learning_rate": 3.8039575971731447e-06, "loss": 0.2825, "step": 1890 }, { "epoch": 6.6, "learning_rate": 3.802544169611307e-06, "loss": 0.283, "step": 1900 }, { "epoch": 6.63, "learning_rate": 3.80113074204947e-06, "loss": 0.2913, "step": 1910 }, { "epoch": 6.66, "learning_rate": 3.7997173144876324e-06, "loss": 0.2937, "step": 1920 }, { "epoch": 6.7, "learning_rate": 3.798303886925795e-06, "loss": 0.2815, "step": 1930 }, { "epoch": 6.73, "learning_rate": 3.796890459363957e-06, "loss": 0.261, "step": 1940 }, { "epoch": 6.77, "learning_rate": 3.79547703180212e-06, "loss": 0.2883, "step": 1950 }, { "epoch": 6.8, "learning_rate": 3.7940636042402824e-06, "loss": 0.2678, "step": 1960 }, { "epoch": 6.84, "learning_rate": 3.7926501766784452e-06, "loss": 0.2959, "step": 1970 }, { "epoch": 6.87, "learning_rate": 3.7912367491166077e-06, "loss": 0.2933, "step": 1980 }, { "epoch": 6.91, "learning_rate": 3.7898233215547705e-06, "loss": 0.2634, "step": 1990 }, { "epoch": 6.94, "learning_rate": 3.7884098939929325e-06, "loss": 0.2767, "step": 2000 }, { "epoch": 6.98, "learning_rate": 3.7869964664310953e-06, "loss": 0.2898, "step": 2010 }, { "epoch": 7.0, "eval_loss": 0.4961535334587097, "eval_runtime": 131.6974, "eval_samples_per_second": 4.04, "eval_steps_per_second": 1.01, "eval_wer": 0.2029311563926207, "step": 2016 }, { "epoch": 7.01, "learning_rate": 3.7855830388692577e-06, "loss": 0.295, "step": 2020 }, { "epoch": 7.05, "learning_rate": 3.7841696113074206e-06, "loss": 0.2862, "step": 2030 }, { "epoch": 7.08, "learning_rate": 3.782756183745583e-06, "loss": 0.2683, "step": 2040 }, { "epoch": 7.12, "learning_rate": 3.7813427561837454e-06, "loss": 0.2845, "step": 2050 }, { "epoch": 7.15, "learning_rate": 3.7799293286219078e-06, "loss": 0.2863, "step": 2060 }, { "epoch": 7.19, "learning_rate": 3.7785159010600706e-06, "loss": 0.2889, "step": 2070 }, { "epoch": 7.22, "learning_rate": 3.777102473498233e-06, "loss": 0.2837, "step": 2080 }, { "epoch": 7.26, "learning_rate": 3.775689045936396e-06, "loss": 0.2816, "step": 2090 }, { "epoch": 7.29, "learning_rate": 3.7742756183745583e-06, "loss": 0.2938, "step": 2100 }, { "epoch": 7.33, "learning_rate": 3.7728621908127207e-06, "loss": 0.3051, "step": 2110 }, { "epoch": 7.36, "learning_rate": 3.771448763250883e-06, "loss": 0.2662, "step": 2120 }, { "epoch": 7.39, "learning_rate": 3.770035335689046e-06, "loss": 0.26, "step": 2130 }, { "epoch": 7.43, "learning_rate": 3.7686219081272083e-06, "loss": 0.2823, "step": 2140 }, { "epoch": 7.46, "learning_rate": 3.767208480565371e-06, "loss": 0.2766, "step": 2150 }, { "epoch": 7.5, "learning_rate": 3.7657950530035336e-06, "loss": 0.275, "step": 2160 }, { "epoch": 7.53, "learning_rate": 3.764381625441696e-06, "loss": 0.2968, "step": 2170 }, { "epoch": 7.57, "learning_rate": 3.7629681978798584e-06, "loss": 0.2965, "step": 2180 }, { "epoch": 7.6, "learning_rate": 3.7615547703180212e-06, "loss": 0.2724, "step": 2190 }, { "epoch": 7.64, "learning_rate": 3.7601413427561836e-06, "loss": 0.2829, "step": 2200 }, { "epoch": 7.67, "learning_rate": 3.7587279151943465e-06, "loss": 0.2952, "step": 2210 }, { "epoch": 7.71, "learning_rate": 3.7573144876325085e-06, "loss": 0.2675, "step": 2220 }, { "epoch": 7.74, "learning_rate": 3.7559010600706713e-06, "loss": 0.2608, "step": 2230 }, { "epoch": 7.78, "learning_rate": 3.7544876325088337e-06, "loss": 0.2701, "step": 2240 }, { "epoch": 7.81, "learning_rate": 3.7530742049469965e-06, "loss": 0.2797, "step": 2250 }, { "epoch": 7.85, "learning_rate": 3.7518021201413426e-06, "loss": 0.2733, "step": 2260 }, { "epoch": 7.88, "learning_rate": 3.750388692579505e-06, "loss": 0.3008, "step": 2270 }, { "epoch": 7.91, "learning_rate": 3.748975265017668e-06, "loss": 0.2855, "step": 2280 }, { "epoch": 7.95, "learning_rate": 3.7475618374558306e-06, "loss": 0.2587, "step": 2290 }, { "epoch": 7.98, "learning_rate": 3.7461484098939926e-06, "loss": 0.2922, "step": 2300 }, { "epoch": 8.0, "eval_loss": 0.507337212562561, "eval_runtime": 130.1898, "eval_samples_per_second": 4.086, "eval_steps_per_second": 1.022, "eval_wer": 0.2030597158835251, "step": 2304 }, { "epoch": 8.02, "learning_rate": 3.744734982332155e-06, "loss": 0.2721, "step": 2310 }, { "epoch": 8.06, "learning_rate": 3.743321554770318e-06, "loss": 0.305, "step": 2320 }, { "epoch": 8.09, "learning_rate": 3.7419081272084803e-06, "loss": 0.2736, "step": 2330 }, { "epoch": 8.12, "learning_rate": 3.740494699646643e-06, "loss": 0.2865, "step": 2340 }, { "epoch": 8.16, "learning_rate": 3.739081272084805e-06, "loss": 0.2774, "step": 2350 }, { "epoch": 8.19, "learning_rate": 3.737667844522968e-06, "loss": 0.2621, "step": 2360 }, { "epoch": 8.23, "learning_rate": 3.7362544169611303e-06, "loss": 0.2849, "step": 2370 }, { "epoch": 8.26, "learning_rate": 3.734840989399293e-06, "loss": 0.2744, "step": 2380 }, { "epoch": 8.3, "learning_rate": 3.7334275618374556e-06, "loss": 0.3042, "step": 2390 }, { "epoch": 8.33, "learning_rate": 3.7320141342756184e-06, "loss": 0.2861, "step": 2400 }, { "epoch": 8.37, "learning_rate": 3.7306007067137804e-06, "loss": 0.2774, "step": 2410 }, { "epoch": 8.4, "learning_rate": 3.7291872791519432e-06, "loss": 0.2846, "step": 2420 }, { "epoch": 8.44, "learning_rate": 3.7277738515901056e-06, "loss": 0.2448, "step": 2430 }, { "epoch": 8.47, "learning_rate": 3.7263604240282685e-06, "loss": 0.2937, "step": 2440 }, { "epoch": 8.51, "learning_rate": 3.724946996466431e-06, "loss": 0.2963, "step": 2450 }, { "epoch": 8.54, "learning_rate": 3.7235335689045937e-06, "loss": 0.2583, "step": 2460 }, { "epoch": 8.57, "learning_rate": 3.7221201413427557e-06, "loss": 0.2691, "step": 2470 }, { "epoch": 8.61, "learning_rate": 3.7207067137809185e-06, "loss": 0.2798, "step": 2480 }, { "epoch": 8.64, "learning_rate": 3.719293286219081e-06, "loss": 0.2915, "step": 2490 }, { "epoch": 8.68, "learning_rate": 3.7178798586572438e-06, "loss": 0.2906, "step": 2500 }, { "epoch": 8.71, "learning_rate": 3.716466431095406e-06, "loss": 0.2885, "step": 2510 }, { "epoch": 8.75, "learning_rate": 3.7150530035335686e-06, "loss": 0.2899, "step": 2520 }, { "epoch": 8.78, "learning_rate": 3.713639575971731e-06, "loss": 0.2726, "step": 2530 }, { "epoch": 8.82, "learning_rate": 3.712226148409894e-06, "loss": 0.2824, "step": 2540 }, { "epoch": 8.85, "learning_rate": 3.7108127208480563e-06, "loss": 0.2846, "step": 2550 }, { "epoch": 8.89, "learning_rate": 3.709399293286219e-06, "loss": 0.2734, "step": 2560 }, { "epoch": 8.92, "learning_rate": 3.7079858657243815e-06, "loss": 0.2696, "step": 2570 }, { "epoch": 8.96, "learning_rate": 3.706572438162544e-06, "loss": 0.2703, "step": 2580 }, { "epoch": 8.99, "learning_rate": 3.7051590106007063e-06, "loss": 0.266, "step": 2590 }, { "epoch": 9.0, "eval_loss": 0.5159009695053101, "eval_runtime": 130.5433, "eval_samples_per_second": 4.075, "eval_steps_per_second": 1.019, "eval_wer": 0.2023526386835508, "step": 2592 }, { "epoch": 9.03, "learning_rate": 3.703745583038869e-06, "loss": 0.2807, "step": 2600 }, { "epoch": 9.06, "learning_rate": 3.7023321554770316e-06, "loss": 0.2772, "step": 2610 }, { "epoch": 9.1, "learning_rate": 3.7009187279151944e-06, "loss": 0.2813, "step": 2620 }, { "epoch": 9.13, "learning_rate": 3.6995053003533564e-06, "loss": 0.2878, "step": 2630 }, { "epoch": 9.17, "learning_rate": 3.6980918727915192e-06, "loss": 0.2934, "step": 2640 }, { "epoch": 9.2, "learning_rate": 3.6966784452296816e-06, "loss": 0.2755, "step": 2650 }, { "epoch": 9.24, "learning_rate": 3.6952650176678445e-06, "loss": 0.2921, "step": 2660 }, { "epoch": 9.27, "learning_rate": 3.693851590106007e-06, "loss": 0.2499, "step": 2670 }, { "epoch": 9.3, "learning_rate": 3.6924381625441697e-06, "loss": 0.2904, "step": 2680 }, { "epoch": 9.34, "learning_rate": 3.6910247349823317e-06, "loss": 0.2853, "step": 2690 }, { "epoch": 9.37, "learning_rate": 3.6896113074204945e-06, "loss": 0.2855, "step": 2700 }, { "epoch": 9.41, "learning_rate": 3.688197879858657e-06, "loss": 0.2839, "step": 2710 }, { "epoch": 9.44, "learning_rate": 3.6867844522968198e-06, "loss": 0.2615, "step": 2720 }, { "epoch": 9.48, "learning_rate": 3.685371024734982e-06, "loss": 0.3092, "step": 2730 }, { "epoch": 9.51, "learning_rate": 3.683957597173145e-06, "loss": 0.2576, "step": 2740 }, { "epoch": 9.55, "learning_rate": 3.682544169611307e-06, "loss": 0.2947, "step": 2750 }, { "epoch": 9.58, "learning_rate": 3.68113074204947e-06, "loss": 0.2769, "step": 2760 }, { "epoch": 9.62, "learning_rate": 3.6797173144876322e-06, "loss": 0.2569, "step": 2770 }, { "epoch": 9.65, "learning_rate": 3.678303886925795e-06, "loss": 0.2908, "step": 2780 }, { "epoch": 9.69, "learning_rate": 3.6768904593639575e-06, "loss": 0.2975, "step": 2790 }, { "epoch": 9.72, "learning_rate": 3.67547703180212e-06, "loss": 0.26, "step": 2800 }, { "epoch": 9.75, "learning_rate": 3.6740636042402823e-06, "loss": 0.2551, "step": 2810 }, { "epoch": 9.79, "learning_rate": 3.672650176678445e-06, "loss": 0.2701, "step": 2820 }, { "epoch": 9.82, "learning_rate": 3.6712367491166075e-06, "loss": 0.2922, "step": 2830 }, { "epoch": 9.86, "learning_rate": 3.6698233215547704e-06, "loss": 0.2951, "step": 2840 }, { "epoch": 9.89, "learning_rate": 3.6684098939929328e-06, "loss": 0.2508, "step": 2850 }, { "epoch": 9.93, "learning_rate": 3.666996466431095e-06, "loss": 0.2844, "step": 2860 }, { "epoch": 9.96, "learning_rate": 3.6655830388692576e-06, "loss": 0.2914, "step": 2870 }, { "epoch": 10.0, "learning_rate": 3.6641696113074204e-06, "loss": 0.2817, "step": 2880 }, { "epoch": 10.0, "eval_loss": 0.523847222328186, "eval_runtime": 131.2872, "eval_samples_per_second": 4.052, "eval_steps_per_second": 1.013, "eval_wer": 0.20106704377450665, "step": 2880 }, { "epoch": 10.03, "learning_rate": 3.662756183745583e-06, "loss": 0.2805, "step": 2890 }, { "epoch": 10.07, "learning_rate": 3.6613427561837457e-06, "loss": 0.2565, "step": 2900 }, { "epoch": 10.1, "learning_rate": 3.659929328621908e-06, "loss": 0.2575, "step": 2910 }, { "epoch": 10.14, "learning_rate": 3.6585159010600705e-06, "loss": 0.2875, "step": 2920 }, { "epoch": 10.17, "learning_rate": 3.657102473498233e-06, "loss": 0.2961, "step": 2930 }, { "epoch": 10.21, "learning_rate": 3.6556890459363957e-06, "loss": 0.2588, "step": 2940 }, { "epoch": 10.24, "learning_rate": 3.654275618374558e-06, "loss": 0.2574, "step": 2950 }, { "epoch": 10.28, "learning_rate": 3.652862190812721e-06, "loss": 0.269, "step": 2960 }, { "epoch": 10.31, "learning_rate": 3.651448763250883e-06, "loss": 0.281, "step": 2970 }, { "epoch": 10.35, "learning_rate": 3.650035335689046e-06, "loss": 0.2859, "step": 2980 }, { "epoch": 10.38, "learning_rate": 3.648621908127208e-06, "loss": 0.2844, "step": 2990 }, { "epoch": 10.42, "learning_rate": 3.647208480565371e-06, "loss": 0.3113, "step": 3000 }, { "epoch": 10.45, "learning_rate": 3.6457950530035334e-06, "loss": 0.2806, "step": 3010 }, { "epoch": 10.48, "learning_rate": 3.6443816254416963e-06, "loss": 0.2926, "step": 3020 }, { "epoch": 10.52, "learning_rate": 3.6429681978798583e-06, "loss": 0.3066, "step": 3030 }, { "epoch": 10.55, "learning_rate": 3.641554770318021e-06, "loss": 0.278, "step": 3040 }, { "epoch": 10.59, "learning_rate": 3.6401413427561835e-06, "loss": 0.276, "step": 3050 }, { "epoch": 10.62, "learning_rate": 3.6387279151943463e-06, "loss": 0.2589, "step": 3060 }, { "epoch": 10.66, "learning_rate": 3.6373144876325088e-06, "loss": 0.2792, "step": 3070 }, { "epoch": 10.69, "learning_rate": 3.6359010600706716e-06, "loss": 0.2706, "step": 3080 }, { "epoch": 10.73, "learning_rate": 3.6344876325088336e-06, "loss": 0.2702, "step": 3090 }, { "epoch": 10.76, "learning_rate": 3.6330742049469964e-06, "loss": 0.2818, "step": 3100 }, { "epoch": 10.8, "learning_rate": 3.631660777385159e-06, "loss": 0.2898, "step": 3110 }, { "epoch": 10.83, "learning_rate": 3.6302473498233216e-06, "loss": 0.2893, "step": 3120 }, { "epoch": 10.87, "learning_rate": 3.628833922261484e-06, "loss": 0.275, "step": 3130 }, { "epoch": 10.9, "learning_rate": 3.6274204946996465e-06, "loss": 0.283, "step": 3140 }, { "epoch": 10.94, "learning_rate": 3.626007067137809e-06, "loss": 0.2606, "step": 3150 }, { "epoch": 10.97, "learning_rate": 3.6245936395759717e-06, "loss": 0.2922, "step": 3160 }, { "epoch": 11.0, "eval_loss": 0.508041262626648, "eval_runtime": 130.0766, "eval_samples_per_second": 4.09, "eval_steps_per_second": 1.022, "eval_wer": 0.20113132351995885, "step": 3168 }, { "epoch": 11.01, "learning_rate": 3.623180212014134e-06, "loss": 0.3119, "step": 3170 }, { "epoch": 11.04, "learning_rate": 3.621766784452297e-06, "loss": 0.2549, "step": 3180 }, { "epoch": 11.08, "learning_rate": 3.6203533568904594e-06, "loss": 0.2656, "step": 3190 }, { "epoch": 11.11, "learning_rate": 3.6189399293286218e-06, "loss": 0.2914, "step": 3200 }, { "epoch": 11.15, "learning_rate": 3.617526501766784e-06, "loss": 0.2861, "step": 3210 }, { "epoch": 11.18, "learning_rate": 3.616113074204947e-06, "loss": 0.2998, "step": 3220 }, { "epoch": 11.21, "learning_rate": 3.6146996466431094e-06, "loss": 0.2821, "step": 3230 }, { "epoch": 11.25, "learning_rate": 3.6132862190812723e-06, "loss": 0.3008, "step": 3240 }, { "epoch": 11.28, "learning_rate": 3.6118727915194342e-06, "loss": 0.26, "step": 3250 }, { "epoch": 11.32, "learning_rate": 3.610459363957597e-06, "loss": 0.2877, "step": 3260 }, { "epoch": 11.35, "learning_rate": 3.6090459363957595e-06, "loss": 0.3065, "step": 3270 }, { "epoch": 11.39, "learning_rate": 3.6076325088339223e-06, "loss": 0.2815, "step": 3280 }, { "epoch": 11.42, "learning_rate": 3.6062190812720847e-06, "loss": 0.2649, "step": 3290 }, { "epoch": 11.46, "learning_rate": 3.6048056537102476e-06, "loss": 0.2859, "step": 3300 }, { "epoch": 11.49, "learning_rate": 3.6033922261484095e-06, "loss": 0.2826, "step": 3310 }, { "epoch": 11.53, "learning_rate": 3.601978798586572e-06, "loss": 0.2882, "step": 3320 }, { "epoch": 11.56, "learning_rate": 3.600565371024735e-06, "loss": 0.2772, "step": 3330 }, { "epoch": 11.6, "learning_rate": 3.5991519434628976e-06, "loss": 0.2678, "step": 3340 }, { "epoch": 11.63, "learning_rate": 3.59773851590106e-06, "loss": 0.2841, "step": 3350 }, { "epoch": 11.66, "learning_rate": 3.596325088339223e-06, "loss": 0.2982, "step": 3360 }, { "epoch": 11.7, "learning_rate": 3.594911660777385e-06, "loss": 0.2904, "step": 3370 }, { "epoch": 11.73, "learning_rate": 3.5934982332155473e-06, "loss": 0.2908, "step": 3380 }, { "epoch": 11.77, "learning_rate": 3.59208480565371e-06, "loss": 0.2629, "step": 3390 }, { "epoch": 11.8, "learning_rate": 3.5906713780918725e-06, "loss": 0.2953, "step": 3400 }, { "epoch": 11.84, "learning_rate": 3.5892579505300353e-06, "loss": 0.2857, "step": 3410 }, { "epoch": 11.87, "learning_rate": 3.5878445229681973e-06, "loss": 0.2671, "step": 3420 }, { "epoch": 11.91, "learning_rate": 3.58643109540636e-06, "loss": 0.2685, "step": 3430 }, { "epoch": 11.94, "learning_rate": 3.5850176678445226e-06, "loss": 0.287, "step": 3440 }, { "epoch": 11.98, "learning_rate": 3.5836042402826854e-06, "loss": 0.2869, "step": 3450 }, { "epoch": 12.0, "eval_loss": 0.4973689019680023, "eval_runtime": 129.1272, "eval_samples_per_second": 4.12, "eval_steps_per_second": 1.03, "eval_wer": 0.20267403741081186, "step": 3456 }, { "epoch": 12.01, "learning_rate": 3.582190812720848e-06, "loss": 0.2896, "step": 3460 }, { "epoch": 12.05, "learning_rate": 3.5807773851590106e-06, "loss": 0.2994, "step": 3470 }, { "epoch": 12.08, "learning_rate": 3.5793639575971726e-06, "loss": 0.2556, "step": 3480 }, { "epoch": 12.12, "learning_rate": 3.5779505300353355e-06, "loss": 0.2681, "step": 3490 }, { "epoch": 12.15, "learning_rate": 3.576537102473498e-06, "loss": 0.2913, "step": 3500 }, { "epoch": 12.19, "learning_rate": 3.5751236749116607e-06, "loss": 0.2544, "step": 3510 }, { "epoch": 12.22, "learning_rate": 3.573710247349823e-06, "loss": 0.2785, "step": 3520 }, { "epoch": 12.26, "learning_rate": 3.572296819787986e-06, "loss": 0.2865, "step": 3530 }, { "epoch": 12.29, "learning_rate": 3.570883392226148e-06, "loss": 0.3012, "step": 3540 }, { "epoch": 12.33, "learning_rate": 3.5694699646643108e-06, "loss": 0.2854, "step": 3550 }, { "epoch": 12.36, "learning_rate": 3.568056537102473e-06, "loss": 0.3029, "step": 3560 }, { "epoch": 12.39, "learning_rate": 3.566643109540636e-06, "loss": 0.2927, "step": 3570 }, { "epoch": 12.43, "learning_rate": 3.5652296819787984e-06, "loss": 0.2681, "step": 3580 }, { "epoch": 12.46, "learning_rate": 3.563816254416961e-06, "loss": 0.2767, "step": 3590 }, { "epoch": 12.5, "learning_rate": 3.5624028268551232e-06, "loss": 0.2824, "step": 3600 }, { "epoch": 12.53, "learning_rate": 3.5611307420494697e-06, "loss": 0.2764, "step": 3610 }, { "epoch": 12.57, "learning_rate": 3.559717314487632e-06, "loss": 0.2487, "step": 3620 }, { "epoch": 12.6, "learning_rate": 3.558303886925795e-06, "loss": 0.2881, "step": 3630 }, { "epoch": 12.64, "learning_rate": 3.5568904593639574e-06, "loss": 0.2865, "step": 3640 }, { "epoch": 12.67, "learning_rate": 3.55547703180212e-06, "loss": 0.2817, "step": 3650 }, { "epoch": 12.71, "learning_rate": 3.5540636042402826e-06, "loss": 0.2677, "step": 3660 }, { "epoch": 12.74, "learning_rate": 3.552650176678445e-06, "loss": 0.3031, "step": 3670 }, { "epoch": 12.78, "learning_rate": 3.5512367491166074e-06, "loss": 0.2787, "step": 3680 }, { "epoch": 12.81, "learning_rate": 3.5498233215547702e-06, "loss": 0.2761, "step": 3690 }, { "epoch": 12.85, "learning_rate": 3.5484098939929327e-06, "loss": 0.2749, "step": 3700 }, { "epoch": 12.88, "learning_rate": 3.5469964664310955e-06, "loss": 0.2977, "step": 3710 }, { "epoch": 12.91, "learning_rate": 3.5455830388692575e-06, "loss": 0.2686, "step": 3720 }, { "epoch": 12.95, "learning_rate": 3.5441696113074203e-06, "loss": 0.2724, "step": 3730 }, { "epoch": 12.98, "learning_rate": 3.5427561837455827e-06, "loss": 0.284, "step": 3740 }, { "epoch": 13.0, "eval_loss": 0.5104484558105469, "eval_runtime": 128.6455, "eval_samples_per_second": 4.135, "eval_steps_per_second": 1.034, "eval_wer": 0.200552805810889, "step": 3744 }, { "epoch": 13.02, "learning_rate": 3.5413427561837456e-06, "loss": 0.2975, "step": 3750 }, { "epoch": 13.06, "learning_rate": 3.539929328621908e-06, "loss": 0.2805, "step": 3760 }, { "epoch": 13.09, "learning_rate": 3.538515901060071e-06, "loss": 0.2694, "step": 3770 }, { "epoch": 13.12, "learning_rate": 3.5371024734982328e-06, "loss": 0.2523, "step": 3780 }, { "epoch": 13.16, "learning_rate": 3.5356890459363956e-06, "loss": 0.2933, "step": 3790 }, { "epoch": 13.19, "learning_rate": 3.534275618374558e-06, "loss": 0.2829, "step": 3800 }, { "epoch": 13.23, "learning_rate": 3.532862190812721e-06, "loss": 0.261, "step": 3810 }, { "epoch": 13.26, "learning_rate": 3.5314487632508833e-06, "loss": 0.2829, "step": 3820 }, { "epoch": 13.3, "learning_rate": 3.530035335689046e-06, "loss": 0.2911, "step": 3830 }, { "epoch": 13.33, "learning_rate": 3.528621908127208e-06, "loss": 0.2769, "step": 3840 }, { "epoch": 13.37, "learning_rate": 3.527208480565371e-06, "loss": 0.2595, "step": 3850 }, { "epoch": 13.4, "learning_rate": 3.5257950530035333e-06, "loss": 0.2858, "step": 3860 }, { "epoch": 13.44, "learning_rate": 3.524381625441696e-06, "loss": 0.2498, "step": 3870 }, { "epoch": 13.47, "learning_rate": 3.5229681978798586e-06, "loss": 0.2919, "step": 3880 }, { "epoch": 13.51, "learning_rate": 3.521554770318021e-06, "loss": 0.3099, "step": 3890 }, { "epoch": 13.54, "learning_rate": 3.5201413427561834e-06, "loss": 0.2785, "step": 3900 }, { "epoch": 13.57, "learning_rate": 3.5187279151943462e-06, "loss": 0.2562, "step": 3910 }, { "epoch": 13.61, "learning_rate": 3.5173144876325086e-06, "loss": 0.2876, "step": 3920 }, { "epoch": 13.64, "learning_rate": 3.5159010600706715e-06, "loss": 0.2982, "step": 3930 }, { "epoch": 13.68, "learning_rate": 3.514487632508834e-06, "loss": 0.2774, "step": 3940 }, { "epoch": 13.71, "learning_rate": 3.5130742049469963e-06, "loss": 0.2651, "step": 3950 }, { "epoch": 13.75, "learning_rate": 3.5116607773851587e-06, "loss": 0.2769, "step": 3960 }, { "epoch": 13.78, "learning_rate": 3.5102473498233215e-06, "loss": 0.2744, "step": 3970 }, { "epoch": 13.82, "learning_rate": 3.508833922261484e-06, "loss": 0.2922, "step": 3980 }, { "epoch": 13.85, "learning_rate": 3.5074204946996468e-06, "loss": 0.2784, "step": 3990 }, { "epoch": 13.89, "learning_rate": 3.506007067137809e-06, "loss": 0.2871, "step": 4000 }, { "epoch": 13.92, "learning_rate": 3.5045936395759716e-06, "loss": 0.2628, "step": 4010 }, { "epoch": 13.96, "learning_rate": 3.503180212014134e-06, "loss": 0.2794, "step": 4020 }, { "epoch": 13.99, "learning_rate": 3.501766784452297e-06, "loss": 0.2911, "step": 4030 }, { "epoch": 14.0, "eval_loss": 0.5025652050971985, "eval_runtime": 129.3001, "eval_samples_per_second": 4.114, "eval_steps_per_second": 1.029, "eval_wer": 0.20170984122902874, "step": 4032 }, { "epoch": 14.03, "learning_rate": 3.5003533568904592e-06, "loss": 0.2873, "step": 4040 }, { "epoch": 14.06, "learning_rate": 3.498939929328622e-06, "loss": 0.2802, "step": 4050 }, { "epoch": 14.1, "learning_rate": 3.497526501766784e-06, "loss": 0.2649, "step": 4060 }, { "epoch": 14.13, "learning_rate": 3.496113074204947e-06, "loss": 0.2909, "step": 4070 }, { "epoch": 14.17, "learning_rate": 3.4946996466431093e-06, "loss": 0.2844, "step": 4080 }, { "epoch": 14.2, "learning_rate": 3.493286219081272e-06, "loss": 0.2669, "step": 4090 }, { "epoch": 14.24, "learning_rate": 3.4918727915194345e-06, "loss": 0.2757, "step": 4100 }, { "epoch": 14.27, "learning_rate": 3.4904593639575974e-06, "loss": 0.2774, "step": 4110 }, { "epoch": 14.3, "learning_rate": 3.4890459363957594e-06, "loss": 0.2773, "step": 4120 }, { "epoch": 14.34, "learning_rate": 3.487632508833922e-06, "loss": 0.2743, "step": 4130 }, { "epoch": 14.37, "learning_rate": 3.4862190812720846e-06, "loss": 0.2583, "step": 4140 }, { "epoch": 14.41, "learning_rate": 3.4848056537102474e-06, "loss": 0.2636, "step": 4150 }, { "epoch": 14.44, "learning_rate": 3.48339222614841e-06, "loss": 0.2344, "step": 4160 }, { "epoch": 14.48, "learning_rate": 3.4819787985865723e-06, "loss": 0.2904, "step": 4170 }, { "epoch": 14.51, "learning_rate": 3.4805653710247347e-06, "loss": 0.2892, "step": 4180 }, { "epoch": 14.55, "learning_rate": 3.4791519434628975e-06, "loss": 0.2607, "step": 4190 }, { "epoch": 14.58, "learning_rate": 3.47773851590106e-06, "loss": 0.2952, "step": 4200 }, { "epoch": 14.62, "learning_rate": 3.4763250883392227e-06, "loss": 0.2731, "step": 4210 }, { "epoch": 14.65, "learning_rate": 3.474911660777385e-06, "loss": 0.2973, "step": 4220 }, { "epoch": 14.69, "learning_rate": 3.4734982332155476e-06, "loss": 0.2897, "step": 4230 }, { "epoch": 14.72, "learning_rate": 3.47208480565371e-06, "loss": 0.2761, "step": 4240 }, { "epoch": 14.75, "learning_rate": 3.470671378091873e-06, "loss": 0.2716, "step": 4250 }, { "epoch": 14.79, "learning_rate": 3.4692579505300352e-06, "loss": 0.2473, "step": 4260 }, { "epoch": 14.82, "learning_rate": 3.467844522968198e-06, "loss": 0.3024, "step": 4270 }, { "epoch": 14.86, "learning_rate": 3.4664310954063605e-06, "loss": 0.2873, "step": 4280 }, { "epoch": 14.89, "learning_rate": 3.4650176678445224e-06, "loss": 0.278, "step": 4290 }, { "epoch": 14.93, "learning_rate": 3.4636042402826853e-06, "loss": 0.2486, "step": 4300 }, { "epoch": 14.96, "learning_rate": 3.462190812720848e-06, "loss": 0.2668, "step": 4310 }, { "epoch": 15.0, "learning_rate": 3.4607773851590105e-06, "loss": 0.2864, "step": 4320 }, { "epoch": 15.0, "eval_loss": 0.5064656138420105, "eval_runtime": 129.204, "eval_samples_per_second": 4.118, "eval_steps_per_second": 1.029, "eval_wer": 0.20023140708362794, "step": 4320 }, { "epoch": 15.03, "learning_rate": 3.4593639575971734e-06, "loss": 0.2883, "step": 4330 }, { "epoch": 15.07, "learning_rate": 3.4579505300353353e-06, "loss": 0.2741, "step": 4340 }, { "epoch": 15.1, "learning_rate": 3.4565371024734977e-06, "loss": 0.2775, "step": 4350 }, { "epoch": 15.14, "learning_rate": 3.4551236749116606e-06, "loss": 0.287, "step": 4360 }, { "epoch": 15.17, "learning_rate": 3.453710247349823e-06, "loss": 0.2964, "step": 4370 }, { "epoch": 15.21, "learning_rate": 3.452296819787986e-06, "loss": 0.2907, "step": 4380 }, { "epoch": 15.24, "learning_rate": 3.4508833922261482e-06, "loss": 0.282, "step": 4390 }, { "epoch": 15.28, "learning_rate": 3.4494699646643106e-06, "loss": 0.2511, "step": 4400 }, { "epoch": 15.31, "learning_rate": 3.448056537102473e-06, "loss": 0.284, "step": 4410 }, { "epoch": 15.35, "learning_rate": 3.446643109540636e-06, "loss": 0.2856, "step": 4420 }, { "epoch": 15.38, "learning_rate": 3.4452296819787983e-06, "loss": 0.2694, "step": 4430 }, { "epoch": 15.42, "learning_rate": 3.443816254416961e-06, "loss": 0.2572, "step": 4440 }, { "epoch": 15.45, "learning_rate": 3.4424028268551235e-06, "loss": 0.2929, "step": 4450 }, { "epoch": 15.48, "learning_rate": 3.440989399293286e-06, "loss": 0.2973, "step": 4460 }, { "epoch": 15.52, "learning_rate": 3.4395759717314484e-06, "loss": 0.2767, "step": 4470 }, { "epoch": 15.55, "learning_rate": 3.438162544169611e-06, "loss": 0.26, "step": 4480 }, { "epoch": 15.59, "learning_rate": 3.4367491166077736e-06, "loss": 0.2813, "step": 4490 }, { "epoch": 15.62, "learning_rate": 3.4353356890459364e-06, "loss": 0.2703, "step": 4500 }, { "epoch": 15.66, "learning_rate": 3.4339222614840984e-06, "loss": 0.2875, "step": 4510 }, { "epoch": 15.69, "learning_rate": 3.4325088339222613e-06, "loss": 0.2561, "step": 4520 }, { "epoch": 15.73, "learning_rate": 3.4310954063604237e-06, "loss": 0.271, "step": 4530 }, { "epoch": 15.76, "learning_rate": 3.4296819787985865e-06, "loss": 0.2934, "step": 4540 }, { "epoch": 15.8, "learning_rate": 3.428268551236749e-06, "loss": 0.2791, "step": 4550 }, { "epoch": 15.83, "learning_rate": 3.4268551236749117e-06, "loss": 0.2896, "step": 4560 }, { "epoch": 15.87, "learning_rate": 3.4254416961130737e-06, "loss": 0.3179, "step": 4570 }, { "epoch": 15.9, "learning_rate": 3.4240282685512366e-06, "loss": 0.2716, "step": 4580 }, { "epoch": 15.94, "learning_rate": 3.422614840989399e-06, "loss": 0.3019, "step": 4590 }, { "epoch": 15.97, "learning_rate": 3.421201413427562e-06, "loss": 0.2779, "step": 4600 }, { "epoch": 16.0, "eval_loss": 0.5024499297142029, "eval_runtime": 129.1181, "eval_samples_per_second": 4.12, "eval_steps_per_second": 1.03, "eval_wer": 0.20100276402905445, "step": 4608 }, { "epoch": 16.01, "learning_rate": 3.419787985865724e-06, "loss": 0.3, "step": 4610 }, { "epoch": 16.04, "learning_rate": 3.418374558303887e-06, "loss": 0.2691, "step": 4620 }, { "epoch": 16.08, "learning_rate": 3.416961130742049e-06, "loss": 0.2599, "step": 4630 }, { "epoch": 16.11, "learning_rate": 3.415547703180212e-06, "loss": 0.2636, "step": 4640 }, { "epoch": 16.15, "learning_rate": 3.4141342756183743e-06, "loss": 0.2902, "step": 4650 }, { "epoch": 16.18, "learning_rate": 3.412720848056537e-06, "loss": 0.2577, "step": 4660 }, { "epoch": 16.21, "learning_rate": 3.4113074204946995e-06, "loss": 0.2813, "step": 4670 }, { "epoch": 16.25, "learning_rate": 3.409893992932862e-06, "loss": 0.2619, "step": 4680 }, { "epoch": 16.28, "learning_rate": 3.4084805653710243e-06, "loss": 0.2685, "step": 4690 }, { "epoch": 16.32, "learning_rate": 3.407067137809187e-06, "loss": 0.2886, "step": 4700 }, { "epoch": 16.35, "learning_rate": 3.4056537102473496e-06, "loss": 0.2828, "step": 4710 }, { "epoch": 16.39, "learning_rate": 3.4042402826855124e-06, "loss": 0.2643, "step": 4720 }, { "epoch": 16.42, "learning_rate": 3.402826855123675e-06, "loss": 0.2722, "step": 4730 }, { "epoch": 16.46, "learning_rate": 3.4014134275618372e-06, "loss": 0.2868, "step": 4740 }, { "epoch": 16.49, "learning_rate": 3.3999999999999996e-06, "loss": 0.2736, "step": 4750 }, { "epoch": 16.53, "learning_rate": 3.3985865724381625e-06, "loss": 0.2888, "step": 4760 }, { "epoch": 16.56, "learning_rate": 3.397173144876325e-06, "loss": 0.2616, "step": 4770 }, { "epoch": 16.6, "learning_rate": 3.3957597173144877e-06, "loss": 0.2736, "step": 4780 }, { "epoch": 16.63, "learning_rate": 3.3943462897526497e-06, "loss": 0.2678, "step": 4790 }, { "epoch": 16.66, "learning_rate": 3.3929328621908125e-06, "loss": 0.2739, "step": 4800 }, { "epoch": 16.7, "learning_rate": 3.391519434628975e-06, "loss": 0.252, "step": 4810 }, { "epoch": 16.73, "learning_rate": 3.3901060070671378e-06, "loss": 0.2913, "step": 4820 }, { "epoch": 16.77, "learning_rate": 3.3886925795053e-06, "loss": 0.2935, "step": 4830 }, { "epoch": 16.8, "learning_rate": 3.387279151943463e-06, "loss": 0.2672, "step": 4840 }, { "epoch": 16.84, "learning_rate": 3.385865724381625e-06, "loss": 0.2693, "step": 4850 }, { "epoch": 16.87, "learning_rate": 3.384452296819788e-06, "loss": 0.2723, "step": 4860 }, { "epoch": 16.91, "learning_rate": 3.3830388692579502e-06, "loss": 0.2571, "step": 4870 }, { "epoch": 16.94, "learning_rate": 3.381625441696113e-06, "loss": 0.2511, "step": 4880 }, { "epoch": 16.98, "learning_rate": 3.3802120141342755e-06, "loss": 0.2766, "step": 4890 }, { "epoch": 17.0, "eval_loss": 0.5078305006027222, "eval_runtime": 129.3828, "eval_samples_per_second": 4.112, "eval_steps_per_second": 1.028, "eval_wer": 0.1998457286109147, "step": 4896 }, { "epoch": 17.01, "learning_rate": 3.3787985865724383e-06, "loss": 0.2968, "step": 4900 }, { "epoch": 17.05, "learning_rate": 3.3773851590106003e-06, "loss": 0.2869, "step": 4910 }, { "epoch": 17.08, "learning_rate": 3.375971731448763e-06, "loss": 0.2671, "step": 4920 }, { "epoch": 17.12, "learning_rate": 3.3745583038869255e-06, "loss": 0.2651, "step": 4930 }, { "epoch": 17.15, "learning_rate": 3.3731448763250884e-06, "loss": 0.262, "step": 4940 }, { "epoch": 17.19, "learning_rate": 3.371731448763251e-06, "loss": 0.2579, "step": 4950 }, { "epoch": 17.22, "learning_rate": 3.370318021201413e-06, "loss": 0.2801, "step": 4960 }, { "epoch": 17.26, "learning_rate": 3.3689045936395756e-06, "loss": 0.2667, "step": 4970 }, { "epoch": 17.29, "learning_rate": 3.3674911660777384e-06, "loss": 0.2852, "step": 4980 }, { "epoch": 17.33, "learning_rate": 3.366077738515901e-06, "loss": 0.2515, "step": 4990 }, { "epoch": 17.36, "learning_rate": 3.3646643109540637e-06, "loss": 0.2632, "step": 5000 }, { "epoch": 17.39, "learning_rate": 3.363250883392226e-06, "loss": 0.2756, "step": 5010 }, { "epoch": 17.43, "learning_rate": 3.3618374558303885e-06, "loss": 0.2703, "step": 5020 }, { "epoch": 17.46, "learning_rate": 3.360424028268551e-06, "loss": 0.2706, "step": 5030 }, { "epoch": 17.5, "learning_rate": 3.3590106007067137e-06, "loss": 0.3145, "step": 5040 }, { "epoch": 17.53, "learning_rate": 3.357597173144876e-06, "loss": 0.2588, "step": 5050 }, { "epoch": 17.57, "learning_rate": 3.356183745583039e-06, "loss": 0.278, "step": 5060 }, { "epoch": 17.6, "learning_rate": 3.3547703180212014e-06, "loss": 0.2612, "step": 5070 }, { "epoch": 17.64, "learning_rate": 3.353356890459364e-06, "loss": 0.2747, "step": 5080 }, { "epoch": 17.67, "learning_rate": 3.3519434628975262e-06, "loss": 0.2839, "step": 5090 }, { "epoch": 17.71, "learning_rate": 3.350530035335689e-06, "loss": 0.3041, "step": 5100 }, { "epoch": 17.74, "learning_rate": 3.3491166077738515e-06, "loss": 0.28, "step": 5110 }, { "epoch": 17.78, "learning_rate": 3.3477031802120143e-06, "loss": 0.2479, "step": 5120 }, { "epoch": 17.81, "learning_rate": 3.3462897526501763e-06, "loss": 0.2859, "step": 5130 }, { "epoch": 17.85, "learning_rate": 3.344876325088339e-06, "loss": 0.2879, "step": 5140 }, { "epoch": 17.88, "learning_rate": 3.3434628975265015e-06, "loss": 0.2668, "step": 5150 }, { "epoch": 17.91, "learning_rate": 3.3420494699646644e-06, "loss": 0.2703, "step": 5160 }, { "epoch": 17.95, "learning_rate": 3.3406360424028268e-06, "loss": 0.2949, "step": 5170 }, { "epoch": 17.98, "learning_rate": 3.3392226148409896e-06, "loss": 0.2872, "step": 5180 }, { "epoch": 18.0, "eval_loss": 0.5114011764526367, "eval_runtime": 129.1607, "eval_samples_per_second": 4.119, "eval_steps_per_second": 1.03, "eval_wer": 0.19811017548370508, "step": 5184 }, { "epoch": 18.02, "learning_rate": 3.3378091872791516e-06, "loss": 0.2889, "step": 5190 }, { "epoch": 18.06, "learning_rate": 3.3363957597173144e-06, "loss": 0.2601, "step": 5200 }, { "epoch": 18.09, "learning_rate": 3.334982332155477e-06, "loss": 0.2864, "step": 5210 }, { "epoch": 18.12, "learning_rate": 3.3335689045936397e-06, "loss": 0.2753, "step": 5220 }, { "epoch": 18.16, "learning_rate": 3.332155477031802e-06, "loss": 0.298, "step": 5230 }, { "epoch": 18.19, "learning_rate": 3.330742049469965e-06, "loss": 0.2637, "step": 5240 }, { "epoch": 18.23, "learning_rate": 3.329328621908127e-06, "loss": 0.2674, "step": 5250 }, { "epoch": 18.26, "learning_rate": 3.3279151943462897e-06, "loss": 0.2606, "step": 5260 }, { "epoch": 18.3, "learning_rate": 3.326501766784452e-06, "loss": 0.2987, "step": 5270 }, { "epoch": 18.33, "learning_rate": 3.325088339222615e-06, "loss": 0.2924, "step": 5280 }, { "epoch": 18.37, "learning_rate": 3.3236749116607774e-06, "loss": 0.3043, "step": 5290 }, { "epoch": 18.4, "learning_rate": 3.3222614840989398e-06, "loss": 0.2727, "step": 5300 }, { "epoch": 18.44, "learning_rate": 3.320848056537102e-06, "loss": 0.2463, "step": 5310 }, { "epoch": 18.47, "learning_rate": 3.319434628975265e-06, "loss": 0.3037, "step": 5320 }, { "epoch": 18.51, "learning_rate": 3.3180212014134274e-06, "loss": 0.2611, "step": 5330 }, { "epoch": 18.54, "learning_rate": 3.3166077738515903e-06, "loss": 0.2597, "step": 5340 }, { "epoch": 18.57, "learning_rate": 3.3151943462897527e-06, "loss": 0.2875, "step": 5350 }, { "epoch": 18.61, "learning_rate": 3.313780918727915e-06, "loss": 0.2847, "step": 5360 }, { "epoch": 18.64, "learning_rate": 3.3123674911660775e-06, "loss": 0.2741, "step": 5370 }, { "epoch": 18.68, "learning_rate": 3.3109540636042403e-06, "loss": 0.2683, "step": 5380 }, { "epoch": 18.71, "learning_rate": 3.3095406360424027e-06, "loss": 0.2637, "step": 5390 }, { "epoch": 18.75, "learning_rate": 3.3081272084805656e-06, "loss": 0.2755, "step": 5400 }, { "epoch": 18.78, "learning_rate": 3.3067137809187276e-06, "loss": 0.2604, "step": 5410 }, { "epoch": 18.82, "learning_rate": 3.30530035335689e-06, "loss": 0.3166, "step": 5420 }, { "epoch": 18.85, "learning_rate": 3.303886925795053e-06, "loss": 0.2882, "step": 5430 }, { "epoch": 18.89, "learning_rate": 3.302473498233215e-06, "loss": 0.2685, "step": 5440 }, { "epoch": 18.92, "learning_rate": 3.301060070671378e-06, "loss": 0.2697, "step": 5450 }, { "epoch": 18.96, "learning_rate": 3.2996466431095405e-06, "loss": 0.2673, "step": 5460 }, { "epoch": 18.99, "learning_rate": 3.298233215547703e-06, "loss": 0.268, "step": 5470 }, { "epoch": 19.0, "eval_loss": 0.5078134536743164, "eval_runtime": 128.8142, "eval_samples_per_second": 4.13, "eval_steps_per_second": 1.032, "eval_wer": 0.19798161599280067, "step": 5472 }, { "epoch": 19.03, "learning_rate": 3.2968197879858653e-06, "loss": 0.2845, "step": 5480 }, { "epoch": 19.06, "learning_rate": 3.295406360424028e-06, "loss": 0.2673, "step": 5490 }, { "epoch": 19.1, "learning_rate": 3.2939929328621905e-06, "loss": 0.2458, "step": 5500 }, { "epoch": 19.13, "learning_rate": 3.2925795053003533e-06, "loss": 0.288, "step": 5510 }, { "epoch": 19.17, "learning_rate": 3.2911660777385158e-06, "loss": 0.2833, "step": 5520 }, { "epoch": 19.2, "learning_rate": 3.289752650176678e-06, "loss": 0.264, "step": 5530 }, { "epoch": 19.24, "learning_rate": 3.2883392226148406e-06, "loss": 0.2782, "step": 5540 }, { "epoch": 19.27, "learning_rate": 3.2869257950530034e-06, "loss": 0.2702, "step": 5550 }, { "epoch": 19.3, "learning_rate": 3.285512367491166e-06, "loss": 0.2908, "step": 5560 }, { "epoch": 19.34, "learning_rate": 3.2840989399293287e-06, "loss": 0.2852, "step": 5570 }, { "epoch": 19.37, "learning_rate": 3.2826855123674906e-06, "loss": 0.2657, "step": 5580 }, { "epoch": 19.41, "learning_rate": 3.2812720848056535e-06, "loss": 0.2553, "step": 5590 }, { "epoch": 19.44, "learning_rate": 3.279858657243816e-06, "loss": 0.2556, "step": 5600 }, { "epoch": 19.48, "learning_rate": 3.2784452296819787e-06, "loss": 0.2677, "step": 5610 }, { "epoch": 19.51, "learning_rate": 3.277031802120141e-06, "loss": 0.276, "step": 5620 }, { "epoch": 19.55, "learning_rate": 3.275618374558304e-06, "loss": 0.2622, "step": 5630 }, { "epoch": 19.58, "learning_rate": 3.274204946996466e-06, "loss": 0.2778, "step": 5640 }, { "epoch": 19.62, "learning_rate": 3.2727915194346288e-06, "loss": 0.2744, "step": 5650 }, { "epoch": 19.65, "learning_rate": 3.271378091872791e-06, "loss": 0.287, "step": 5660 }, { "epoch": 19.69, "learning_rate": 3.269964664310954e-06, "loss": 0.2831, "step": 5670 }, { "epoch": 19.72, "learning_rate": 3.2685512367491164e-06, "loss": 0.256, "step": 5680 }, { "epoch": 19.75, "learning_rate": 3.2671378091872793e-06, "loss": 0.2609, "step": 5690 }, { "epoch": 19.79, "learning_rate": 3.2657243816254412e-06, "loss": 0.2601, "step": 5700 }, { "epoch": 19.82, "learning_rate": 3.264310954063604e-06, "loss": 0.2834, "step": 5710 }, { "epoch": 19.86, "learning_rate": 3.2628975265017665e-06, "loss": 0.2889, "step": 5720 }, { "epoch": 19.89, "learning_rate": 3.2614840989399293e-06, "loss": 0.2617, "step": 5730 }, { "epoch": 19.93, "learning_rate": 3.2600706713780917e-06, "loss": 0.2747, "step": 5740 }, { "epoch": 19.96, "learning_rate": 3.258657243816254e-06, "loss": 0.2867, "step": 5750 }, { "epoch": 20.0, "learning_rate": 3.2572438162544166e-06, "loss": 0.2631, "step": 5760 }, { "epoch": 20.0, "eval_loss": 0.5262243747711182, "eval_runtime": 129.2103, "eval_samples_per_second": 4.117, "eval_steps_per_second": 1.029, "eval_wer": 0.20209551970174197, "step": 5760 }, { "epoch": 20.03, "learning_rate": 3.2558303886925794e-06, "loss": 0.2689, "step": 5770 }, { "epoch": 20.07, "learning_rate": 3.254416961130742e-06, "loss": 0.2906, "step": 5780 }, { "epoch": 20.1, "learning_rate": 3.2530035335689046e-06, "loss": 0.2586, "step": 5790 }, { "epoch": 20.14, "learning_rate": 3.251590106007067e-06, "loss": 0.2732, "step": 5800 }, { "epoch": 20.17, "learning_rate": 3.2501766784452294e-06, "loss": 0.2528, "step": 5810 }, { "epoch": 20.21, "learning_rate": 3.248763250883392e-06, "loss": 0.26, "step": 5820 }, { "epoch": 20.24, "learning_rate": 3.2473498233215547e-06, "loss": 0.279, "step": 5830 }, { "epoch": 20.28, "learning_rate": 3.245936395759717e-06, "loss": 0.2506, "step": 5840 }, { "epoch": 20.31, "learning_rate": 3.24452296819788e-06, "loss": 0.2886, "step": 5850 }, { "epoch": 20.35, "learning_rate": 3.2431095406360423e-06, "loss": 0.2779, "step": 5860 }, { "epoch": 20.38, "learning_rate": 3.2416961130742048e-06, "loss": 0.2731, "step": 5870 }, { "epoch": 20.42, "learning_rate": 3.240282685512367e-06, "loss": 0.2575, "step": 5880 }, { "epoch": 20.45, "learning_rate": 3.23886925795053e-06, "loss": 0.2671, "step": 5890 }, { "epoch": 20.48, "learning_rate": 3.2374558303886924e-06, "loss": 0.2901, "step": 5900 }, { "epoch": 20.52, "learning_rate": 3.2360424028268552e-06, "loss": 0.2778, "step": 5910 }, { "epoch": 20.55, "learning_rate": 3.2346289752650172e-06, "loss": 0.2629, "step": 5920 }, { "epoch": 20.59, "learning_rate": 3.23321554770318e-06, "loss": 0.2539, "step": 5930 }, { "epoch": 20.62, "learning_rate": 3.2318021201413425e-06, "loss": 0.2697, "step": 5940 }, { "epoch": 20.66, "learning_rate": 3.2303886925795053e-06, "loss": 0.279, "step": 5950 }, { "epoch": 20.69, "learning_rate": 3.2289752650176677e-06, "loss": 0.2869, "step": 5960 }, { "epoch": 20.73, "learning_rate": 3.2275618374558305e-06, "loss": 0.2761, "step": 5970 }, { "epoch": 20.76, "learning_rate": 3.2261484098939925e-06, "loss": 0.2775, "step": 5980 }, { "epoch": 20.8, "learning_rate": 3.2247349823321554e-06, "loss": 0.2639, "step": 5990 }, { "epoch": 20.83, "learning_rate": 3.2233215547703178e-06, "loss": 0.2925, "step": 6000 }, { "epoch": 20.87, "learning_rate": 3.2219081272084806e-06, "loss": 0.2851, "step": 6010 }, { "epoch": 20.9, "learning_rate": 3.220494699646643e-06, "loss": 0.2682, "step": 6020 }, { "epoch": 20.94, "learning_rate": 3.2190812720848054e-06, "loss": 0.2541, "step": 6030 }, { "epoch": 20.97, "learning_rate": 3.217667844522968e-06, "loss": 0.2753, "step": 6040 }, { "epoch": 21.0, "eval_loss": 0.5161154866218567, "eval_runtime": 128.857, "eval_samples_per_second": 4.129, "eval_steps_per_second": 1.032, "eval_wer": 0.19913865141094042, "step": 6048 }, { "epoch": 21.01, "learning_rate": 3.2162544169611307e-06, "loss": 0.296, "step": 6050 }, { "epoch": 21.04, "learning_rate": 3.214840989399293e-06, "loss": 0.2774, "step": 6060 }, { "epoch": 21.08, "learning_rate": 3.213427561837456e-06, "loss": 0.2601, "step": 6070 }, { "epoch": 21.11, "learning_rate": 3.2120141342756183e-06, "loss": 0.2738, "step": 6080 }, { "epoch": 21.15, "learning_rate": 3.2106007067137807e-06, "loss": 0.2756, "step": 6090 }, { "epoch": 21.18, "learning_rate": 3.209187279151943e-06, "loss": 0.2851, "step": 6100 }, { "epoch": 21.21, "learning_rate": 3.207773851590106e-06, "loss": 0.2786, "step": 6110 }, { "epoch": 21.25, "learning_rate": 3.2063604240282684e-06, "loss": 0.2685, "step": 6120 }, { "epoch": 21.28, "learning_rate": 3.204946996466431e-06, "loss": 0.2652, "step": 6130 }, { "epoch": 21.32, "learning_rate": 3.2035335689045936e-06, "loss": 0.278, "step": 6140 }, { "epoch": 21.35, "learning_rate": 3.202120141342756e-06, "loss": 0.2855, "step": 6150 }, { "epoch": 21.39, "learning_rate": 3.2007067137809184e-06, "loss": 0.2757, "step": 6160 }, { "epoch": 21.42, "learning_rate": 3.1992932862190813e-06, "loss": 0.2702, "step": 6170 }, { "epoch": 21.46, "learning_rate": 3.1978798586572437e-06, "loss": 0.2765, "step": 6180 }, { "epoch": 21.49, "learning_rate": 3.1964664310954065e-06, "loss": 0.2616, "step": 6190 }, { "epoch": 21.53, "learning_rate": 3.1950530035335685e-06, "loss": 0.2795, "step": 6200 }, { "epoch": 21.56, "learning_rate": 3.1936395759717313e-06, "loss": 0.2716, "step": 6210 }, { "epoch": 21.6, "learning_rate": 3.1922261484098937e-06, "loss": 0.2697, "step": 6220 }, { "epoch": 21.63, "learning_rate": 3.1908127208480566e-06, "loss": 0.2416, "step": 6230 }, { "epoch": 21.66, "learning_rate": 3.189399293286219e-06, "loss": 0.2782, "step": 6240 }, { "epoch": 21.7, "learning_rate": 3.187985865724382e-06, "loss": 0.2617, "step": 6250 }, { "epoch": 21.73, "learning_rate": 3.186572438162544e-06, "loss": 0.2701, "step": 6260 }, { "epoch": 21.77, "learning_rate": 3.1851590106007066e-06, "loss": 0.2894, "step": 6270 }, { "epoch": 21.8, "learning_rate": 3.183745583038869e-06, "loss": 0.2634, "step": 6280 }, { "epoch": 21.84, "learning_rate": 3.182332155477032e-06, "loss": 0.2928, "step": 6290 }, { "epoch": 21.87, "learning_rate": 3.1809187279151943e-06, "loss": 0.2425, "step": 6300 }, { "epoch": 21.91, "learning_rate": 3.179505300353357e-06, "loss": 0.272, "step": 6310 }, { "epoch": 21.94, "learning_rate": 3.178091872791519e-06, "loss": 0.2818, "step": 6320 }, { "epoch": 21.98, "learning_rate": 3.176678445229682e-06, "loss": 0.2797, "step": 6330 }, { "epoch": 22.0, "eval_loss": 0.5096527338027954, "eval_runtime": 129.6264, "eval_samples_per_second": 4.104, "eval_steps_per_second": 1.026, "eval_wer": 0.20093848428360223, "step": 6336 }, { "epoch": 22.01, "learning_rate": 3.1752650176678444e-06, "loss": 0.3083, "step": 6340 }, { "epoch": 22.05, "learning_rate": 3.173851590106007e-06, "loss": 0.2683, "step": 6350 }, { "epoch": 22.08, "learning_rate": 3.1724381625441696e-06, "loss": 0.2614, "step": 6360 }, { "epoch": 22.12, "learning_rate": 3.171024734982332e-06, "loss": 0.2664, "step": 6370 }, { "epoch": 22.15, "learning_rate": 3.1696113074204944e-06, "loss": 0.2813, "step": 6380 }, { "epoch": 22.19, "learning_rate": 3.1681978798586572e-06, "loss": 0.2609, "step": 6390 }, { "epoch": 22.22, "learning_rate": 3.1667844522968197e-06, "loss": 0.2811, "step": 6400 }, { "epoch": 22.26, "learning_rate": 3.1653710247349825e-06, "loss": 0.2664, "step": 6410 }, { "epoch": 22.29, "learning_rate": 3.163957597173145e-06, "loss": 0.3003, "step": 6420 }, { "epoch": 22.33, "learning_rate": 3.1625441696113073e-06, "loss": 0.2665, "step": 6430 }, { "epoch": 22.36, "learning_rate": 3.1611307420494697e-06, "loss": 0.2603, "step": 6440 }, { "epoch": 22.39, "learning_rate": 3.1597173144876326e-06, "loss": 0.2702, "step": 6450 }, { "epoch": 22.43, "learning_rate": 3.158303886925795e-06, "loss": 0.2403, "step": 6460 }, { "epoch": 22.46, "learning_rate": 3.156890459363958e-06, "loss": 0.272, "step": 6470 }, { "epoch": 22.5, "learning_rate": 3.15547703180212e-06, "loss": 0.308, "step": 6480 }, { "epoch": 22.53, "learning_rate": 3.154063604240282e-06, "loss": 0.275, "step": 6490 }, { "epoch": 22.57, "learning_rate": 3.152650176678445e-06, "loss": 0.2824, "step": 6500 }, { "epoch": 22.6, "learning_rate": 3.1512367491166074e-06, "loss": 0.2734, "step": 6510 }, { "epoch": 22.64, "learning_rate": 3.1498233215547703e-06, "loss": 0.2686, "step": 6520 }, { "epoch": 22.67, "learning_rate": 3.148409893992933e-06, "loss": 0.2826, "step": 6530 }, { "epoch": 22.71, "learning_rate": 3.146996466431095e-06, "loss": 0.2878, "step": 6540 }, { "epoch": 22.74, "learning_rate": 3.1455830388692575e-06, "loss": 0.2793, "step": 6550 }, { "epoch": 22.78, "learning_rate": 3.1441696113074203e-06, "loss": 0.2574, "step": 6560 }, { "epoch": 22.81, "learning_rate": 3.1427561837455827e-06, "loss": 0.2733, "step": 6570 }, { "epoch": 22.85, "learning_rate": 3.1413427561837456e-06, "loss": 0.2887, "step": 6580 }, { "epoch": 22.88, "learning_rate": 3.139929328621908e-06, "loss": 0.2801, "step": 6590 }, { "epoch": 22.91, "learning_rate": 3.1385159010600704e-06, "loss": 0.2739, "step": 6600 }, { "epoch": 22.95, "learning_rate": 3.137102473498233e-06, "loss": 0.2622, "step": 6610 }, { "epoch": 22.98, "learning_rate": 3.1356890459363956e-06, "loss": 0.2667, "step": 6620 }, { "epoch": 23.0, "eval_loss": 0.5130947828292847, "eval_runtime": 130.2324, "eval_samples_per_second": 4.085, "eval_steps_per_second": 1.021, "eval_wer": 0.19952432988365365, "step": 6624 }, { "epoch": 23.02, "learning_rate": 3.134275618374558e-06, "loss": 0.2649, "step": 6630 }, { "epoch": 23.06, "learning_rate": 3.132862190812721e-06, "loss": 0.2847, "step": 6640 }, { "epoch": 23.09, "learning_rate": 3.131448763250883e-06, "loss": 0.2679, "step": 6650 }, { "epoch": 23.12, "learning_rate": 3.1300353356890457e-06, "loss": 0.284, "step": 6660 }, { "epoch": 23.16, "learning_rate": 3.128621908127208e-06, "loss": 0.2729, "step": 6670 }, { "epoch": 23.19, "learning_rate": 3.127208480565371e-06, "loss": 0.2708, "step": 6680 }, { "epoch": 23.23, "learning_rate": 3.1257950530035333e-06, "loss": 0.2851, "step": 6690 }, { "epoch": 23.26, "learning_rate": 3.124381625441696e-06, "loss": 0.262, "step": 6700 }, { "epoch": 23.3, "learning_rate": 3.122968197879858e-06, "loss": 0.2997, "step": 6710 }, { "epoch": 23.33, "learning_rate": 3.121554770318021e-06, "loss": 0.2653, "step": 6720 }, { "epoch": 23.37, "learning_rate": 3.1201413427561834e-06, "loss": 0.2544, "step": 6730 }, { "epoch": 23.4, "learning_rate": 3.1187279151943462e-06, "loss": 0.2888, "step": 6740 }, { "epoch": 23.44, "learning_rate": 3.1173144876325086e-06, "loss": 0.2837, "step": 6750 }, { "epoch": 23.47, "learning_rate": 3.1159010600706715e-06, "loss": 0.2824, "step": 6760 }, { "epoch": 23.51, "learning_rate": 3.1144876325088335e-06, "loss": 0.3101, "step": 6770 }, { "epoch": 23.54, "learning_rate": 3.1130742049469963e-06, "loss": 0.2965, "step": 6780 }, { "epoch": 23.57, "learning_rate": 3.1116607773851587e-06, "loss": 0.2739, "step": 6790 }, { "epoch": 23.61, "learning_rate": 3.1102473498233215e-06, "loss": 0.2697, "step": 6800 }, { "epoch": 23.64, "learning_rate": 3.108833922261484e-06, "loss": 0.2837, "step": 6810 }, { "epoch": 23.68, "learning_rate": 3.1074204946996464e-06, "loss": 0.277, "step": 6820 }, { "epoch": 23.71, "learning_rate": 3.1060070671378088e-06, "loss": 0.2887, "step": 6830 }, { "epoch": 23.75, "learning_rate": 3.1045936395759716e-06, "loss": 0.2765, "step": 6840 }, { "epoch": 23.78, "learning_rate": 3.103180212014134e-06, "loss": 0.2468, "step": 6850 }, { "epoch": 23.82, "learning_rate": 3.101766784452297e-06, "loss": 0.2786, "step": 6860 }, { "epoch": 23.85, "learning_rate": 3.1003533568904593e-06, "loss": 0.2561, "step": 6870 }, { "epoch": 23.89, "learning_rate": 3.0989399293286217e-06, "loss": 0.2494, "step": 6880 }, { "epoch": 23.92, "learning_rate": 3.097526501766784e-06, "loss": 0.2619, "step": 6890 }, { "epoch": 23.96, "learning_rate": 3.096113074204947e-06, "loss": 0.2629, "step": 6900 }, { "epoch": 23.99, "learning_rate": 3.0946996466431093e-06, "loss": 0.2722, "step": 6910 }, { "epoch": 24.0, "eval_loss": 0.5097522735595703, "eval_runtime": 129.544, "eval_samples_per_second": 4.107, "eval_steps_per_second": 1.027, "eval_wer": 0.199010091920036, "step": 6912 }, { "epoch": 24.03, "learning_rate": 3.093286219081272e-06, "loss": 0.2714, "step": 6920 }, { "epoch": 24.06, "learning_rate": 3.0918727915194346e-06, "loss": 0.2682, "step": 6930 }, { "epoch": 24.1, "learning_rate": 3.090459363957597e-06, "loss": 0.2623, "step": 6940 }, { "epoch": 24.13, "learning_rate": 3.0890459363957594e-06, "loss": 0.279, "step": 6950 }, { "epoch": 24.17, "learning_rate": 3.0876325088339222e-06, "loss": 0.2612, "step": 6960 }, { "epoch": 24.2, "learning_rate": 3.0862190812720846e-06, "loss": 0.2505, "step": 6970 }, { "epoch": 24.24, "learning_rate": 3.0848056537102475e-06, "loss": 0.281, "step": 6980 }, { "epoch": 24.27, "learning_rate": 3.0833922261484094e-06, "loss": 0.2653, "step": 6990 }, { "epoch": 24.3, "learning_rate": 3.0819787985865723e-06, "loss": 0.2881, "step": 7000 }, { "epoch": 24.34, "learning_rate": 3.0805653710247347e-06, "loss": 0.2596, "step": 7010 }, { "epoch": 24.37, "learning_rate": 3.0791519434628975e-06, "loss": 0.2459, "step": 7020 }, { "epoch": 24.41, "learning_rate": 3.07773851590106e-06, "loss": 0.2838, "step": 7030 }, { "epoch": 24.44, "learning_rate": 3.0763250883392228e-06, "loss": 0.2497, "step": 7040 }, { "epoch": 24.48, "learning_rate": 3.0749116607773847e-06, "loss": 0.2907, "step": 7050 }, { "epoch": 24.51, "learning_rate": 3.0734982332155476e-06, "loss": 0.2954, "step": 7060 }, { "epoch": 24.55, "learning_rate": 3.07208480565371e-06, "loss": 0.2536, "step": 7070 }, { "epoch": 24.58, "learning_rate": 3.070671378091873e-06, "loss": 0.2554, "step": 7080 }, { "epoch": 24.62, "learning_rate": 3.0692579505300352e-06, "loss": 0.2779, "step": 7090 }, { "epoch": 24.65, "learning_rate": 3.067844522968198e-06, "loss": 0.2681, "step": 7100 }, { "epoch": 24.69, "learning_rate": 3.06643109540636e-06, "loss": 0.2715, "step": 7110 }, { "epoch": 24.72, "learning_rate": 3.065017667844523e-06, "loss": 0.2692, "step": 7120 }, { "epoch": 24.75, "learning_rate": 3.0636042402826853e-06, "loss": 0.2646, "step": 7130 }, { "epoch": 24.79, "learning_rate": 3.062190812720848e-06, "loss": 0.2585, "step": 7140 }, { "epoch": 24.82, "learning_rate": 3.0607773851590105e-06, "loss": 0.2706, "step": 7150 }, { "epoch": 24.86, "learning_rate": 3.059363957597173e-06, "loss": 0.2796, "step": 7160 }, { "epoch": 24.89, "learning_rate": 3.0579505300353354e-06, "loss": 0.2645, "step": 7170 }, { "epoch": 24.93, "learning_rate": 3.056537102473498e-06, "loss": 0.2374, "step": 7180 }, { "epoch": 24.96, "learning_rate": 3.0551236749116606e-06, "loss": 0.285, "step": 7190 }, { "epoch": 25.0, "learning_rate": 3.0537102473498234e-06, "loss": 0.3026, "step": 7200 }, { "epoch": 25.0, "eval_loss": 0.5193008780479431, "eval_runtime": 129.4939, "eval_samples_per_second": 4.108, "eval_steps_per_second": 1.027, "eval_wer": 0.200552805810889, "step": 7200 }, { "epoch": 25.03, "learning_rate": 3.052296819787986e-06, "loss": 0.3016, "step": 7210 }, { "epoch": 25.07, "learning_rate": 3.0508833922261483e-06, "loss": 0.2787, "step": 7220 }, { "epoch": 25.1, "learning_rate": 3.0494699646643107e-06, "loss": 0.2695, "step": 7230 }, { "epoch": 25.14, "learning_rate": 3.048197879858657e-06, "loss": 0.2666, "step": 7240 }, { "epoch": 25.17, "learning_rate": 3.0467844522968195e-06, "loss": 0.2892, "step": 7250 }, { "epoch": 25.21, "learning_rate": 3.0453710247349824e-06, "loss": 0.262, "step": 7260 }, { "epoch": 25.24, "learning_rate": 3.0439575971731448e-06, "loss": 0.2557, "step": 7270 }, { "epoch": 25.28, "learning_rate": 3.0425441696113076e-06, "loss": 0.255, "step": 7280 }, { "epoch": 25.31, "learning_rate": 3.0411307420494696e-06, "loss": 0.2848, "step": 7290 }, { "epoch": 25.35, "learning_rate": 3.0397173144876324e-06, "loss": 0.2734, "step": 7300 }, { "epoch": 25.38, "learning_rate": 3.038303886925795e-06, "loss": 0.2719, "step": 7310 }, { "epoch": 25.42, "learning_rate": 3.0368904593639577e-06, "loss": 0.2672, "step": 7320 }, { "epoch": 25.45, "learning_rate": 3.03547703180212e-06, "loss": 0.266, "step": 7330 }, { "epoch": 25.48, "learning_rate": 3.034063604240283e-06, "loss": 0.3005, "step": 7340 }, { "epoch": 25.52, "learning_rate": 3.032650176678445e-06, "loss": 0.2512, "step": 7350 }, { "epoch": 25.55, "learning_rate": 3.0312367491166077e-06, "loss": 0.2525, "step": 7360 }, { "epoch": 25.59, "learning_rate": 3.02982332155477e-06, "loss": 0.2543, "step": 7370 }, { "epoch": 25.62, "learning_rate": 3.028409893992933e-06, "loss": 0.2881, "step": 7380 }, { "epoch": 25.66, "learning_rate": 3.0269964664310954e-06, "loss": 0.2569, "step": 7390 }, { "epoch": 25.69, "learning_rate": 3.0255830388692582e-06, "loss": 0.2721, "step": 7400 }, { "epoch": 25.73, "learning_rate": 3.02416961130742e-06, "loss": 0.2717, "step": 7410 }, { "epoch": 25.76, "learning_rate": 3.022756183745583e-06, "loss": 0.2897, "step": 7420 }, { "epoch": 25.8, "learning_rate": 3.0213427561837454e-06, "loss": 0.2652, "step": 7430 }, { "epoch": 25.83, "learning_rate": 3.0199293286219083e-06, "loss": 0.2545, "step": 7440 }, { "epoch": 25.87, "learning_rate": 3.0185159010600707e-06, "loss": 0.2826, "step": 7450 }, { "epoch": 25.9, "learning_rate": 3.0171024734982327e-06, "loss": 0.2638, "step": 7460 }, { "epoch": 25.94, "learning_rate": 3.0156890459363955e-06, "loss": 0.2592, "step": 7470 }, { "epoch": 25.97, "learning_rate": 3.014275618374558e-06, "loss": 0.2888, "step": 7480 }, { "epoch": 26.0, "eval_loss": 0.49870219826698303, "eval_runtime": 130.4803, "eval_samples_per_second": 4.077, "eval_steps_per_second": 1.019, "eval_wer": 0.19856013370187053, "step": 7488 }, { "epoch": 26.01, "learning_rate": 3.0128621908127208e-06, "loss": 0.2858, "step": 7490 }, { "epoch": 26.04, "learning_rate": 3.011448763250883e-06, "loss": 0.28, "step": 7500 }, { "epoch": 26.08, "learning_rate": 3.010035335689046e-06, "loss": 0.2725, "step": 7510 }, { "epoch": 26.11, "learning_rate": 3.008621908127208e-06, "loss": 0.271, "step": 7520 }, { "epoch": 26.15, "learning_rate": 3.007208480565371e-06, "loss": 0.2829, "step": 7530 }, { "epoch": 26.18, "learning_rate": 3.0057950530035332e-06, "loss": 0.2639, "step": 7540 }, { "epoch": 26.21, "learning_rate": 3.004381625441696e-06, "loss": 0.256, "step": 7550 }, { "epoch": 26.25, "learning_rate": 3.0029681978798585e-06, "loss": 0.2738, "step": 7560 }, { "epoch": 26.28, "learning_rate": 3.001554770318021e-06, "loss": 0.2642, "step": 7570 }, { "epoch": 26.32, "learning_rate": 3.0001413427561833e-06, "loss": 0.2953, "step": 7580 }, { "epoch": 26.35, "learning_rate": 2.998727915194346e-06, "loss": 0.2696, "step": 7590 }, { "epoch": 26.39, "learning_rate": 2.9973144876325085e-06, "loss": 0.2801, "step": 7600 }, { "epoch": 26.42, "learning_rate": 2.9959010600706714e-06, "loss": 0.2846, "step": 7610 }, { "epoch": 26.46, "learning_rate": 2.9944876325088338e-06, "loss": 0.2726, "step": 7620 }, { "epoch": 26.49, "learning_rate": 2.993074204946996e-06, "loss": 0.2773, "step": 7630 }, { "epoch": 26.53, "learning_rate": 2.9916607773851586e-06, "loss": 0.2555, "step": 7640 }, { "epoch": 26.56, "learning_rate": 2.9902473498233214e-06, "loss": 0.2797, "step": 7650 }, { "epoch": 26.6, "learning_rate": 2.988833922261484e-06, "loss": 0.2519, "step": 7660 }, { "epoch": 26.63, "learning_rate": 2.9874204946996467e-06, "loss": 0.2665, "step": 7670 }, { "epoch": 26.66, "learning_rate": 2.986007067137809e-06, "loss": 0.2618, "step": 7680 }, { "epoch": 26.7, "learning_rate": 2.9845936395759715e-06, "loss": 0.2807, "step": 7690 }, { "epoch": 26.73, "learning_rate": 2.983180212014134e-06, "loss": 0.2786, "step": 7700 }, { "epoch": 26.77, "learning_rate": 2.9817667844522967e-06, "loss": 0.2579, "step": 7710 }, { "epoch": 26.8, "learning_rate": 2.980353356890459e-06, "loss": 0.2748, "step": 7720 }, { "epoch": 26.84, "learning_rate": 2.978939929328622e-06, "loss": 0.2755, "step": 7730 }, { "epoch": 26.87, "learning_rate": 2.977526501766784e-06, "loss": 0.2483, "step": 7740 }, { "epoch": 26.91, "learning_rate": 2.9761130742049468e-06, "loss": 0.2753, "step": 7750 }, { "epoch": 26.94, "learning_rate": 2.974699646643109e-06, "loss": 0.2455, "step": 7760 }, { "epoch": 26.98, "learning_rate": 2.973286219081272e-06, "loss": 0.2732, "step": 7770 }, { "epoch": 27.0, "eval_loss": 0.5063392519950867, "eval_runtime": 129.9156, "eval_samples_per_second": 4.095, "eval_steps_per_second": 1.024, "eval_wer": 0.20074564504724562, "step": 7776 }, { "epoch": 27.01, "learning_rate": 2.9718727915194344e-06, "loss": 0.2939, "step": 7780 }, { "epoch": 27.05, "learning_rate": 2.9704593639575973e-06, "loss": 0.2713, "step": 7790 }, { "epoch": 27.08, "learning_rate": 2.9690459363957593e-06, "loss": 0.2683, "step": 7800 }, { "epoch": 27.12, "learning_rate": 2.967632508833922e-06, "loss": 0.2905, "step": 7810 }, { "epoch": 27.15, "learning_rate": 2.9662190812720845e-06, "loss": 0.2755, "step": 7820 }, { "epoch": 27.19, "learning_rate": 2.9648056537102473e-06, "loss": 0.2745, "step": 7830 }, { "epoch": 27.22, "learning_rate": 2.9633922261484097e-06, "loss": 0.2813, "step": 7840 }, { "epoch": 27.26, "learning_rate": 2.9619787985865726e-06, "loss": 0.2405, "step": 7850 }, { "epoch": 27.29, "learning_rate": 2.9605653710247346e-06, "loss": 0.2778, "step": 7860 }, { "epoch": 27.33, "learning_rate": 2.9591519434628974e-06, "loss": 0.2785, "step": 7870 }, { "epoch": 27.36, "learning_rate": 2.95773851590106e-06, "loss": 0.2665, "step": 7880 }, { "epoch": 27.39, "learning_rate": 2.9563250883392226e-06, "loss": 0.2905, "step": 7890 }, { "epoch": 27.43, "learning_rate": 2.954911660777385e-06, "loss": 0.2611, "step": 7900 }, { "epoch": 27.46, "learning_rate": 2.9534982332155475e-06, "loss": 0.2633, "step": 7910 }, { "epoch": 27.5, "learning_rate": 2.95208480565371e-06, "loss": 0.2525, "step": 7920 }, { "epoch": 27.53, "learning_rate": 2.9506713780918727e-06, "loss": 0.2627, "step": 7930 }, { "epoch": 27.57, "learning_rate": 2.949257950530035e-06, "loss": 0.2834, "step": 7940 }, { "epoch": 27.6, "learning_rate": 2.947844522968198e-06, "loss": 0.2709, "step": 7950 }, { "epoch": 27.64, "learning_rate": 2.9464310954063604e-06, "loss": 0.2637, "step": 7960 }, { "epoch": 27.67, "learning_rate": 2.9450176678445228e-06, "loss": 0.304, "step": 7970 }, { "epoch": 27.71, "learning_rate": 2.943604240282685e-06, "loss": 0.2664, "step": 7980 }, { "epoch": 27.74, "learning_rate": 2.942190812720848e-06, "loss": 0.2684, "step": 7990 }, { "epoch": 27.78, "learning_rate": 2.9407773851590104e-06, "loss": 0.2641, "step": 8000 }, { "epoch": 27.81, "learning_rate": 2.9393639575971732e-06, "loss": 0.2767, "step": 8010 }, { "epoch": 27.85, "learning_rate": 2.9379505300353357e-06, "loss": 0.2825, "step": 8020 }, { "epoch": 27.88, "learning_rate": 2.936537102473498e-06, "loss": 0.2747, "step": 8030 }, { "epoch": 27.91, "learning_rate": 2.9351236749116605e-06, "loss": 0.2877, "step": 8040 }, { "epoch": 27.95, "learning_rate": 2.9337102473498233e-06, "loss": 0.2703, "step": 8050 }, { "epoch": 27.98, "learning_rate": 2.9322968197879857e-06, "loss": 0.2567, "step": 8060 }, { "epoch": 28.0, "eval_loss": 0.5102671980857849, "eval_runtime": 130.0784, "eval_samples_per_second": 4.09, "eval_steps_per_second": 1.022, "eval_wer": 0.2015170019926721, "step": 8064 }, { "epoch": 28.02, "learning_rate": 2.9308833922261486e-06, "loss": 0.2758, "step": 8070 }, { "epoch": 28.06, "learning_rate": 2.9294699646643105e-06, "loss": 0.2866, "step": 8080 }, { "epoch": 28.09, "learning_rate": 2.9280565371024734e-06, "loss": 0.2397, "step": 8090 }, { "epoch": 28.12, "learning_rate": 2.9266431095406358e-06, "loss": 0.2718, "step": 8100 }, { "epoch": 28.16, "learning_rate": 2.9252296819787986e-06, "loss": 0.2795, "step": 8110 }, { "epoch": 28.19, "learning_rate": 2.923816254416961e-06, "loss": 0.258, "step": 8120 }, { "epoch": 28.23, "learning_rate": 2.922402826855124e-06, "loss": 0.2651, "step": 8130 }, { "epoch": 28.26, "learning_rate": 2.920989399293286e-06, "loss": 0.2741, "step": 8140 }, { "epoch": 28.3, "learning_rate": 2.9195759717314487e-06, "loss": 0.286, "step": 8150 }, { "epoch": 28.33, "learning_rate": 2.918162544169611e-06, "loss": 0.2716, "step": 8160 }, { "epoch": 28.37, "learning_rate": 2.916749116607774e-06, "loss": 0.2594, "step": 8170 }, { "epoch": 28.4, "learning_rate": 2.9153356890459363e-06, "loss": 0.2958, "step": 8180 }, { "epoch": 28.44, "learning_rate": 2.9139222614840987e-06, "loss": 0.2742, "step": 8190 }, { "epoch": 28.47, "learning_rate": 2.912508833922261e-06, "loss": 0.2678, "step": 8200 }, { "epoch": 28.51, "learning_rate": 2.911095406360424e-06, "loss": 0.2961, "step": 8210 }, { "epoch": 28.54, "learning_rate": 2.9096819787985864e-06, "loss": 0.2675, "step": 8220 }, { "epoch": 28.57, "learning_rate": 2.9082685512367492e-06, "loss": 0.2722, "step": 8230 }, { "epoch": 28.61, "learning_rate": 2.9068551236749116e-06, "loss": 0.257, "step": 8240 }, { "epoch": 28.64, "learning_rate": 2.905441696113074e-06, "loss": 0.3073, "step": 8250 }, { "epoch": 28.68, "learning_rate": 2.9040282685512365e-06, "loss": 0.2852, "step": 8260 }, { "epoch": 28.71, "learning_rate": 2.9026148409893993e-06, "loss": 0.275, "step": 8270 }, { "epoch": 28.75, "learning_rate": 2.9012014134275617e-06, "loss": 0.272, "step": 8280 }, { "epoch": 28.78, "learning_rate": 2.8997879858657245e-06, "loss": 0.2732, "step": 8290 }, { "epoch": 28.82, "learning_rate": 2.898374558303887e-06, "loss": 0.2734, "step": 8300 }, { "epoch": 28.85, "learning_rate": 2.8969611307420493e-06, "loss": 0.2581, "step": 8310 }, { "epoch": 28.89, "learning_rate": 2.8955477031802118e-06, "loss": 0.2689, "step": 8320 }, { "epoch": 28.92, "learning_rate": 2.8941342756183746e-06, "loss": 0.2592, "step": 8330 }, { "epoch": 28.96, "learning_rate": 2.892720848056537e-06, "loss": 0.261, "step": 8340 }, { "epoch": 28.99, "learning_rate": 2.8913074204947e-06, "loss": 0.2845, "step": 8350 }, { "epoch": 29.0, "eval_loss": 0.5084418058395386, "eval_runtime": 129.7694, "eval_samples_per_second": 4.1, "eval_steps_per_second": 1.025, "eval_wer": 0.20203123995628977, "step": 8352 }, { "epoch": 29.03, "learning_rate": 2.889893992932862e-06, "loss": 0.2541, "step": 8360 }, { "epoch": 29.06, "learning_rate": 2.8884805653710247e-06, "loss": 0.2822, "step": 8370 }, { "epoch": 29.1, "learning_rate": 2.887067137809187e-06, "loss": 0.2498, "step": 8380 }, { "epoch": 29.13, "learning_rate": 2.88565371024735e-06, "loss": 0.2908, "step": 8390 }, { "epoch": 29.17, "learning_rate": 2.8842402826855123e-06, "loss": 0.2679, "step": 8400 }, { "epoch": 29.2, "learning_rate": 2.882826855123675e-06, "loss": 0.2352, "step": 8410 }, { "epoch": 29.24, "learning_rate": 2.881413427561837e-06, "loss": 0.2733, "step": 8420 }, { "epoch": 29.27, "learning_rate": 2.88e-06, "loss": 0.2427, "step": 8430 }, { "epoch": 29.3, "learning_rate": 2.8785865724381624e-06, "loss": 0.2692, "step": 8440 }, { "epoch": 29.34, "learning_rate": 2.877173144876325e-06, "loss": 0.27, "step": 8450 }, { "epoch": 29.37, "learning_rate": 2.8757597173144876e-06, "loss": 0.2465, "step": 8460 }, { "epoch": 29.41, "learning_rate": 2.8743462897526504e-06, "loss": 0.2853, "step": 8470 }, { "epoch": 29.44, "learning_rate": 2.8729328621908124e-06, "loss": 0.2536, "step": 8480 }, { "epoch": 29.48, "learning_rate": 2.8715194346289753e-06, "loss": 0.2824, "step": 8490 }, { "epoch": 29.51, "learning_rate": 2.8701060070671377e-06, "loss": 0.2749, "step": 8500 }, { "epoch": 29.55, "learning_rate": 2.8686925795053005e-06, "loss": 0.2399, "step": 8510 }, { "epoch": 29.58, "learning_rate": 2.867279151943463e-06, "loss": 0.2557, "step": 8520 }, { "epoch": 29.62, "learning_rate": 2.865865724381625e-06, "loss": 0.2561, "step": 8530 }, { "epoch": 29.65, "learning_rate": 2.8644522968197877e-06, "loss": 0.2758, "step": 8540 }, { "epoch": 29.69, "learning_rate": 2.86303886925795e-06, "loss": 0.2755, "step": 8550 }, { "epoch": 29.72, "learning_rate": 2.861625441696113e-06, "loss": 0.2732, "step": 8560 }, { "epoch": 29.75, "learning_rate": 2.860212014134276e-06, "loss": 0.282, "step": 8570 }, { "epoch": 29.79, "learning_rate": 2.8587985865724382e-06, "loss": 0.2516, "step": 8580 }, { "epoch": 29.82, "learning_rate": 2.8573851590106e-06, "loss": 0.2953, "step": 8590 }, { "epoch": 29.86, "learning_rate": 2.855971731448763e-06, "loss": 0.3114, "step": 8600 }, { "epoch": 29.89, "learning_rate": 2.8545583038869254e-06, "loss": 0.2853, "step": 8610 }, { "epoch": 29.93, "learning_rate": 2.8531448763250883e-06, "loss": 0.2648, "step": 8620 }, { "epoch": 29.96, "learning_rate": 2.8517314487632507e-06, "loss": 0.2812, "step": 8630 }, { "epoch": 30.0, "learning_rate": 2.8503180212014135e-06, "loss": 0.2591, "step": 8640 }, { "epoch": 30.0, "eval_loss": 0.5109365582466125, "eval_runtime": 129.6483, "eval_samples_per_second": 4.103, "eval_steps_per_second": 1.026, "eval_wer": 0.1989458121745838, "step": 8640 }, { "epoch": 30.03, "learning_rate": 2.8489045936395755e-06, "loss": 0.272, "step": 8650 }, { "epoch": 30.07, "learning_rate": 2.8474911660777383e-06, "loss": 0.2787, "step": 8660 }, { "epoch": 30.1, "learning_rate": 2.8460777385159007e-06, "loss": 0.2711, "step": 8670 }, { "epoch": 30.14, "learning_rate": 2.8446643109540636e-06, "loss": 0.2828, "step": 8680 }, { "epoch": 30.17, "learning_rate": 2.843250883392226e-06, "loss": 0.2688, "step": 8690 }, { "epoch": 30.21, "learning_rate": 2.8418374558303884e-06, "loss": 0.2588, "step": 8700 }, { "epoch": 30.24, "learning_rate": 2.840424028268551e-06, "loss": 0.2539, "step": 8710 }, { "epoch": 30.28, "learning_rate": 2.8390106007067136e-06, "loss": 0.2443, "step": 8720 }, { "epoch": 30.31, "learning_rate": 2.837597173144876e-06, "loss": 0.2713, "step": 8730 }, { "epoch": 30.35, "learning_rate": 2.836183745583039e-06, "loss": 0.2811, "step": 8740 }, { "epoch": 30.38, "learning_rate": 2.8347703180212013e-06, "loss": 0.2653, "step": 8750 }, { "epoch": 30.42, "learning_rate": 2.8333568904593637e-06, "loss": 0.276, "step": 8760 }, { "epoch": 30.45, "learning_rate": 2.831943462897526e-06, "loss": 0.2519, "step": 8770 }, { "epoch": 30.48, "learning_rate": 2.830530035335689e-06, "loss": 0.2805, "step": 8780 }, { "epoch": 30.52, "learning_rate": 2.8291166077738514e-06, "loss": 0.2823, "step": 8790 }, { "epoch": 30.55, "learning_rate": 2.827703180212014e-06, "loss": 0.2714, "step": 8800 }, { "epoch": 30.59, "learning_rate": 2.826289752650176e-06, "loss": 0.2786, "step": 8810 }, { "epoch": 30.62, "learning_rate": 2.824876325088339e-06, "loss": 0.2636, "step": 8820 }, { "epoch": 30.66, "learning_rate": 2.8234628975265014e-06, "loss": 0.2723, "step": 8830 }, { "epoch": 30.69, "learning_rate": 2.8220494699646643e-06, "loss": 0.2795, "step": 8840 }, { "epoch": 30.73, "learning_rate": 2.8206360424028267e-06, "loss": 0.2547, "step": 8850 }, { "epoch": 30.76, "learning_rate": 2.8192226148409895e-06, "loss": 0.256, "step": 8860 }, { "epoch": 30.8, "learning_rate": 2.8178091872791515e-06, "loss": 0.2494, "step": 8870 }, { "epoch": 30.83, "learning_rate": 2.8163957597173143e-06, "loss": 0.2634, "step": 8880 }, { "epoch": 30.87, "learning_rate": 2.8149823321554767e-06, "loss": 0.2868, "step": 8890 }, { "epoch": 30.9, "learning_rate": 2.8135689045936396e-06, "loss": 0.247, "step": 8900 }, { "epoch": 30.94, "learning_rate": 2.812155477031802e-06, "loss": 0.2527, "step": 8910 }, { "epoch": 30.97, "learning_rate": 2.810742049469965e-06, "loss": 0.2777, "step": 8920 }, { "epoch": 31.0, "eval_loss": 0.5179172158241272, "eval_runtime": 129.9918, "eval_samples_per_second": 4.093, "eval_steps_per_second": 1.023, "eval_wer": 0.19939577039274925, "step": 8928 }, { "epoch": 31.01, "learning_rate": 2.8093286219081268e-06, "loss": 0.2692, "step": 8930 }, { "epoch": 31.04, "learning_rate": 2.8079151943462896e-06, "loss": 0.2848, "step": 8940 }, { "epoch": 31.08, "learning_rate": 2.806501766784452e-06, "loss": 0.2704, "step": 8950 }, { "epoch": 31.11, "learning_rate": 2.805088339222615e-06, "loss": 0.253, "step": 8960 }, { "epoch": 31.15, "learning_rate": 2.8036749116607773e-06, "loss": 0.3008, "step": 8970 }, { "epoch": 31.18, "learning_rate": 2.8022614840989397e-06, "loss": 0.2674, "step": 8980 }, { "epoch": 31.21, "learning_rate": 2.800848056537102e-06, "loss": 0.2581, "step": 8990 }, { "epoch": 31.25, "learning_rate": 2.799434628975265e-06, "loss": 0.2539, "step": 9000 }, { "epoch": 31.28, "learning_rate": 2.7980212014134273e-06, "loss": 0.2625, "step": 9010 }, { "epoch": 31.32, "learning_rate": 2.79660777385159e-06, "loss": 0.2533, "step": 9020 }, { "epoch": 31.35, "learning_rate": 2.7951943462897526e-06, "loss": 0.2822, "step": 9030 }, { "epoch": 31.39, "learning_rate": 2.793780918727915e-06, "loss": 0.2678, "step": 9040 }, { "epoch": 31.42, "learning_rate": 2.7923674911660774e-06, "loss": 0.26, "step": 9050 }, { "epoch": 31.46, "learning_rate": 2.7909540636042402e-06, "loss": 0.2568, "step": 9060 }, { "epoch": 31.49, "learning_rate": 2.7895406360424026e-06, "loss": 0.2713, "step": 9070 }, { "epoch": 31.53, "learning_rate": 2.7881272084805655e-06, "loss": 0.2664, "step": 9080 }, { "epoch": 31.56, "learning_rate": 2.786713780918728e-06, "loss": 0.2682, "step": 9090 }, { "epoch": 31.6, "learning_rate": 2.7853003533568903e-06, "loss": 0.2739, "step": 9100 }, { "epoch": 31.63, "learning_rate": 2.7838869257950527e-06, "loss": 0.2553, "step": 9110 }, { "epoch": 31.66, "learning_rate": 2.7824734982332155e-06, "loss": 0.2882, "step": 9120 }, { "epoch": 31.7, "learning_rate": 2.781060070671378e-06, "loss": 0.252, "step": 9130 }, { "epoch": 31.73, "learning_rate": 2.7796466431095408e-06, "loss": 0.257, "step": 9140 }, { "epoch": 31.77, "learning_rate": 2.7782332155477028e-06, "loss": 0.271, "step": 9150 }, { "epoch": 31.8, "learning_rate": 2.7768197879858656e-06, "loss": 0.263, "step": 9160 }, { "epoch": 31.84, "learning_rate": 2.775406360424028e-06, "loss": 0.2663, "step": 9170 }, { "epoch": 31.87, "learning_rate": 2.773992932862191e-06, "loss": 0.274, "step": 9180 }, { "epoch": 31.91, "learning_rate": 2.7725795053003532e-06, "loss": 0.2567, "step": 9190 }, { "epoch": 31.94, "learning_rate": 2.771166077738516e-06, "loss": 0.2676, "step": 9200 }, { "epoch": 31.98, "learning_rate": 2.769752650176678e-06, "loss": 0.2784, "step": 9210 }, { "epoch": 32.0, "eval_loss": 0.518265962600708, "eval_runtime": 129.4613, "eval_samples_per_second": 4.109, "eval_steps_per_second": 1.027, "eval_wer": 0.1989458121745838, "step": 9216 }, { "epoch": 32.01, "learning_rate": 2.768339222614841e-06, "loss": 0.2617, "step": 9220 }, { "epoch": 32.05, "learning_rate": 2.7669257950530033e-06, "loss": 0.2787, "step": 9230 }, { "epoch": 32.08, "learning_rate": 2.765512367491166e-06, "loss": 0.2495, "step": 9240 }, { "epoch": 32.12, "learning_rate": 2.7640989399293285e-06, "loss": 0.249, "step": 9250 }, { "epoch": 32.15, "learning_rate": 2.7626855123674914e-06, "loss": 0.2824, "step": 9260 }, { "epoch": 32.19, "learning_rate": 2.7612720848056534e-06, "loss": 0.2872, "step": 9270 }, { "epoch": 32.22, "learning_rate": 2.759858657243816e-06, "loss": 0.2743, "step": 9280 }, { "epoch": 32.26, "learning_rate": 2.7585865724381622e-06, "loss": 0.2752, "step": 9290 }, { "epoch": 32.29, "learning_rate": 2.757173144876325e-06, "loss": 0.2671, "step": 9300 }, { "epoch": 32.33, "learning_rate": 2.7557597173144875e-06, "loss": 0.2559, "step": 9310 }, { "epoch": 32.36, "learning_rate": 2.7543462897526503e-06, "loss": 0.2762, "step": 9320 }, { "epoch": 32.39, "learning_rate": 2.7529328621908127e-06, "loss": 0.2633, "step": 9330 }, { "epoch": 32.43, "learning_rate": 2.751519434628975e-06, "loss": 0.2554, "step": 9340 }, { "epoch": 32.46, "learning_rate": 2.7501060070671375e-06, "loss": 0.2922, "step": 9350 }, { "epoch": 32.5, "learning_rate": 2.7486925795053004e-06, "loss": 0.2827, "step": 9360 }, { "epoch": 32.53, "learning_rate": 2.747279151943463e-06, "loss": 0.2491, "step": 9370 }, { "epoch": 32.57, "learning_rate": 2.7458657243816256e-06, "loss": 0.2386, "step": 9380 }, { "epoch": 32.6, "learning_rate": 2.744452296819788e-06, "loss": 0.2375, "step": 9390 }, { "epoch": 32.64, "learning_rate": 2.7430388692579504e-06, "loss": 0.2663, "step": 9400 }, { "epoch": 32.67, "learning_rate": 2.741625441696113e-06, "loss": 0.2674, "step": 9410 }, { "epoch": 32.71, "learning_rate": 2.7402120141342757e-06, "loss": 0.2609, "step": 9420 }, { "epoch": 32.74, "learning_rate": 2.738798586572438e-06, "loss": 0.2538, "step": 9430 }, { "epoch": 32.78, "learning_rate": 2.737385159010601e-06, "loss": 0.268, "step": 9440 }, { "epoch": 32.81, "learning_rate": 2.735971731448763e-06, "loss": 0.2698, "step": 9450 }, { "epoch": 32.85, "learning_rate": 2.7345583038869257e-06, "loss": 0.2826, "step": 9460 }, { "epoch": 32.88, "learning_rate": 2.733144876325088e-06, "loss": 0.249, "step": 9470 }, { "epoch": 32.91, "learning_rate": 2.731731448763251e-06, "loss": 0.2555, "step": 9480 }, { "epoch": 32.95, "learning_rate": 2.7303180212014134e-06, "loss": 0.243, "step": 9490 }, { "epoch": 32.98, "learning_rate": 2.7289045936395762e-06, "loss": 0.2801, "step": 9500 }, { "epoch": 33.0, "eval_loss": 0.5222018957138062, "eval_runtime": 129.2645, "eval_samples_per_second": 4.116, "eval_steps_per_second": 1.029, "eval_wer": 0.20029568682908017, "step": 9504 }, { "epoch": 33.02, "learning_rate": 2.7274911660777382e-06, "loss": 0.2721, "step": 9510 }, { "epoch": 33.06, "learning_rate": 2.7260777385159006e-06, "loss": 0.2799, "step": 9520 }, { "epoch": 33.09, "learning_rate": 2.7246643109540635e-06, "loss": 0.2719, "step": 9530 }, { "epoch": 33.12, "learning_rate": 2.7232508833922263e-06, "loss": 0.2716, "step": 9540 }, { "epoch": 33.16, "learning_rate": 2.7218374558303887e-06, "loss": 0.2768, "step": 9550 }, { "epoch": 33.19, "learning_rate": 2.7204240282685515e-06, "loss": 0.2619, "step": 9560 }, { "epoch": 33.23, "learning_rate": 2.7190106007067135e-06, "loss": 0.2864, "step": 9570 }, { "epoch": 33.26, "learning_rate": 2.717597173144876e-06, "loss": 0.2651, "step": 9580 }, { "epoch": 33.3, "learning_rate": 2.7161837455830388e-06, "loss": 0.2799, "step": 9590 }, { "epoch": 33.33, "learning_rate": 2.714770318021201e-06, "loss": 0.2821, "step": 9600 }, { "epoch": 33.37, "learning_rate": 2.713356890459364e-06, "loss": 0.2742, "step": 9610 }, { "epoch": 33.4, "learning_rate": 2.711943462897526e-06, "loss": 0.267, "step": 9620 }, { "epoch": 33.44, "learning_rate": 2.710530035335689e-06, "loss": 0.2676, "step": 9630 }, { "epoch": 33.47, "learning_rate": 2.7091166077738512e-06, "loss": 0.2992, "step": 9640 }, { "epoch": 33.51, "learning_rate": 2.707703180212014e-06, "loss": 0.3028, "step": 9650 }, { "epoch": 33.54, "learning_rate": 2.7062897526501765e-06, "loss": 0.2624, "step": 9660 }, { "epoch": 33.57, "learning_rate": 2.7048763250883393e-06, "loss": 0.2673, "step": 9670 }, { "epoch": 33.61, "learning_rate": 2.7034628975265013e-06, "loss": 0.2599, "step": 9680 }, { "epoch": 33.64, "learning_rate": 2.702049469964664e-06, "loss": 0.2548, "step": 9690 }, { "epoch": 33.68, "learning_rate": 2.7006360424028265e-06, "loss": 0.2647, "step": 9700 }, { "epoch": 33.71, "learning_rate": 2.6992226148409894e-06, "loss": 0.264, "step": 9710 }, { "epoch": 33.75, "learning_rate": 2.6978091872791518e-06, "loss": 0.2615, "step": 9720 }, { "epoch": 33.78, "learning_rate": 2.696395759717314e-06, "loss": 0.2579, "step": 9730 }, { "epoch": 33.82, "learning_rate": 2.6949823321554766e-06, "loss": 0.2806, "step": 9740 }, { "epoch": 33.85, "learning_rate": 2.6935689045936394e-06, "loss": 0.2679, "step": 9750 }, { "epoch": 33.89, "learning_rate": 2.692155477031802e-06, "loss": 0.2415, "step": 9760 }, { "epoch": 33.92, "learning_rate": 2.6907420494699647e-06, "loss": 0.2645, "step": 9770 }, { "epoch": 33.96, "learning_rate": 2.689328621908127e-06, "loss": 0.2602, "step": 9780 }, { "epoch": 33.99, "learning_rate": 2.6879151943462895e-06, "loss": 0.2554, "step": 9790 }, { "epoch": 34.0, "eval_loss": 0.5137259364128113, "eval_runtime": 129.6969, "eval_samples_per_second": 4.102, "eval_steps_per_second": 1.025, "eval_wer": 0.199010091920036, "step": 9792 }, { "epoch": 34.03, "learning_rate": 2.686501766784452e-06, "loss": 0.2962, "step": 9800 }, { "epoch": 34.06, "learning_rate": 2.6850883392226147e-06, "loss": 0.2692, "step": 9810 }, { "epoch": 34.1, "learning_rate": 2.683674911660777e-06, "loss": 0.2522, "step": 9820 }, { "epoch": 34.13, "learning_rate": 2.68226148409894e-06, "loss": 0.2894, "step": 9830 }, { "epoch": 34.17, "learning_rate": 2.6808480565371024e-06, "loss": 0.2864, "step": 9840 }, { "epoch": 34.2, "learning_rate": 2.679434628975265e-06, "loss": 0.2564, "step": 9850 }, { "epoch": 34.24, "learning_rate": 2.678021201413427e-06, "loss": 0.2632, "step": 9860 }, { "epoch": 34.27, "learning_rate": 2.67660777385159e-06, "loss": 0.2442, "step": 9870 }, { "epoch": 34.3, "learning_rate": 2.6751943462897525e-06, "loss": 0.2923, "step": 9880 }, { "epoch": 34.34, "learning_rate": 2.6737809187279153e-06, "loss": 0.2789, "step": 9890 }, { "epoch": 34.37, "learning_rate": 2.6723674911660773e-06, "loss": 0.2835, "step": 9900 }, { "epoch": 34.41, "learning_rate": 2.67095406360424e-06, "loss": 0.2634, "step": 9910 }, { "epoch": 34.44, "learning_rate": 2.6695406360424025e-06, "loss": 0.2771, "step": 9920 }, { "epoch": 34.48, "learning_rate": 2.6681272084805653e-06, "loss": 0.2659, "step": 9930 }, { "epoch": 34.51, "learning_rate": 2.6667137809187278e-06, "loss": 0.2556, "step": 9940 }, { "epoch": 34.55, "learning_rate": 2.6653003533568906e-06, "loss": 0.2524, "step": 9950 }, { "epoch": 34.58, "learning_rate": 2.6638869257950526e-06, "loss": 0.2783, "step": 9960 }, { "epoch": 34.62, "learning_rate": 2.6624734982332154e-06, "loss": 0.245, "step": 9970 }, { "epoch": 34.65, "learning_rate": 2.661060070671378e-06, "loss": 0.2642, "step": 9980 }, { "epoch": 34.69, "learning_rate": 2.6596466431095407e-06, "loss": 0.2945, "step": 9990 }, { "epoch": 34.72, "learning_rate": 2.658233215547703e-06, "loss": 0.25, "step": 10000 }, { "epoch": 34.75, "learning_rate": 2.656819787985866e-06, "loss": 0.2635, "step": 10010 }, { "epoch": 34.79, "learning_rate": 2.655406360424028e-06, "loss": 0.2492, "step": 10020 }, { "epoch": 34.82, "learning_rate": 2.6539929328621907e-06, "loss": 0.2789, "step": 10030 }, { "epoch": 34.86, "learning_rate": 2.652579505300353e-06, "loss": 0.2797, "step": 10040 }, { "epoch": 34.89, "learning_rate": 2.651166077738516e-06, "loss": 0.2378, "step": 10050 }, { "epoch": 34.93, "learning_rate": 2.6497526501766784e-06, "loss": 0.2545, "step": 10060 }, { "epoch": 34.96, "learning_rate": 2.6483392226148408e-06, "loss": 0.2677, "step": 10070 }, { "epoch": 35.0, "learning_rate": 2.646925795053003e-06, "loss": 0.2708, "step": 10080 }, { "epoch": 35.0, "eval_loss": 0.5093948841094971, "eval_runtime": 129.527, "eval_samples_per_second": 4.107, "eval_steps_per_second": 1.027, "eval_wer": 0.19643890210194767, "step": 10080 }, { "epoch": 35.03, "learning_rate": 2.645512367491166e-06, "loss": 0.2628, "step": 10090 }, { "epoch": 35.07, "learning_rate": 2.6440989399293284e-06, "loss": 0.263, "step": 10100 }, { "epoch": 35.1, "learning_rate": 2.6426855123674913e-06, "loss": 0.241, "step": 10110 }, { "epoch": 35.14, "learning_rate": 2.6412720848056537e-06, "loss": 0.2802, "step": 10120 }, { "epoch": 35.17, "learning_rate": 2.639858657243816e-06, "loss": 0.2675, "step": 10130 }, { "epoch": 35.21, "learning_rate": 2.6384452296819785e-06, "loss": 0.2626, "step": 10140 }, { "epoch": 35.24, "learning_rate": 2.6370318021201413e-06, "loss": 0.2853, "step": 10150 }, { "epoch": 35.28, "learning_rate": 2.6356183745583037e-06, "loss": 0.2683, "step": 10160 }, { "epoch": 35.31, "learning_rate": 2.6342049469964666e-06, "loss": 0.269, "step": 10170 }, { "epoch": 35.35, "learning_rate": 2.632791519434629e-06, "loss": 0.2872, "step": 10180 }, { "epoch": 35.38, "learning_rate": 2.6313780918727914e-06, "loss": 0.2519, "step": 10190 }, { "epoch": 35.42, "learning_rate": 2.629964664310954e-06, "loss": 0.2554, "step": 10200 }, { "epoch": 35.45, "learning_rate": 2.6285512367491166e-06, "loss": 0.2548, "step": 10210 }, { "epoch": 35.48, "learning_rate": 2.627137809187279e-06, "loss": 0.291, "step": 10220 }, { "epoch": 35.52, "learning_rate": 2.625724381625442e-06, "loss": 0.2507, "step": 10230 }, { "epoch": 35.55, "learning_rate": 2.624310954063604e-06, "loss": 0.2681, "step": 10240 }, { "epoch": 35.59, "learning_rate": 2.6228975265017667e-06, "loss": 0.2637, "step": 10250 }, { "epoch": 35.62, "learning_rate": 2.621484098939929e-06, "loss": 0.2707, "step": 10260 }, { "epoch": 35.66, "learning_rate": 2.620070671378092e-06, "loss": 0.2784, "step": 10270 }, { "epoch": 35.69, "learning_rate": 2.6186572438162543e-06, "loss": 0.28, "step": 10280 }, { "epoch": 35.73, "learning_rate": 2.617243816254417e-06, "loss": 0.2459, "step": 10290 }, { "epoch": 35.76, "learning_rate": 2.615830388692579e-06, "loss": 0.2663, "step": 10300 }, { "epoch": 35.8, "learning_rate": 2.614416961130742e-06, "loss": 0.2546, "step": 10310 }, { "epoch": 35.83, "learning_rate": 2.6130035335689044e-06, "loss": 0.2632, "step": 10320 }, { "epoch": 35.87, "learning_rate": 2.6115901060070672e-06, "loss": 0.2692, "step": 10330 }, { "epoch": 35.9, "learning_rate": 2.6101766784452296e-06, "loss": 0.292, "step": 10340 }, { "epoch": 35.94, "learning_rate": 2.608763250883392e-06, "loss": 0.2487, "step": 10350 }, { "epoch": 35.97, "learning_rate": 2.6073498233215545e-06, "loss": 0.27, "step": 10360 }, { "epoch": 36.0, "eval_loss": 0.5076168775558472, "eval_runtime": 129.8583, "eval_samples_per_second": 4.097, "eval_steps_per_second": 1.024, "eval_wer": 0.19798161599280067, "step": 10368 }, { "epoch": 36.01, "learning_rate": 2.6059363957597173e-06, "loss": 0.2559, "step": 10370 }, { "epoch": 36.04, "learning_rate": 2.6045229681978797e-06, "loss": 0.2505, "step": 10380 }, { "epoch": 36.08, "learning_rate": 2.6031095406360425e-06, "loss": 0.279, "step": 10390 }, { "epoch": 36.11, "learning_rate": 2.601696113074205e-06, "loss": 0.2585, "step": 10400 }, { "epoch": 36.15, "learning_rate": 2.6002826855123674e-06, "loss": 0.2484, "step": 10410 }, { "epoch": 36.18, "learning_rate": 2.5988692579505298e-06, "loss": 0.2734, "step": 10420 }, { "epoch": 36.21, "learning_rate": 2.5974558303886926e-06, "loss": 0.2707, "step": 10430 }, { "epoch": 36.25, "learning_rate": 2.596042402826855e-06, "loss": 0.2594, "step": 10440 }, { "epoch": 36.28, "learning_rate": 2.594628975265018e-06, "loss": 0.248, "step": 10450 }, { "epoch": 36.32, "learning_rate": 2.5932155477031803e-06, "loss": 0.2647, "step": 10460 }, { "epoch": 36.35, "learning_rate": 2.5918021201413427e-06, "loss": 0.2599, "step": 10470 }, { "epoch": 36.39, "learning_rate": 2.590388692579505e-06, "loss": 0.267, "step": 10480 }, { "epoch": 36.42, "learning_rate": 2.588975265017668e-06, "loss": 0.2639, "step": 10490 }, { "epoch": 36.46, "learning_rate": 2.5875618374558303e-06, "loss": 0.2715, "step": 10500 }, { "epoch": 36.49, "learning_rate": 2.586148409893993e-06, "loss": 0.3031, "step": 10510 }, { "epoch": 36.53, "learning_rate": 2.584734982332155e-06, "loss": 0.2996, "step": 10520 }, { "epoch": 36.56, "learning_rate": 2.583321554770318e-06, "loss": 0.2586, "step": 10530 }, { "epoch": 36.6, "learning_rate": 2.5819081272084804e-06, "loss": 0.2514, "step": 10540 }, { "epoch": 36.63, "learning_rate": 2.580494699646643e-06, "loss": 0.255, "step": 10550 }, { "epoch": 36.66, "learning_rate": 2.5790812720848056e-06, "loss": 0.2765, "step": 10560 }, { "epoch": 36.7, "learning_rate": 2.5776678445229685e-06, "loss": 0.2721, "step": 10570 }, { "epoch": 36.73, "learning_rate": 2.5762544169611304e-06, "loss": 0.2704, "step": 10580 }, { "epoch": 36.77, "learning_rate": 2.5748409893992933e-06, "loss": 0.2613, "step": 10590 }, { "epoch": 36.8, "learning_rate": 2.5734275618374557e-06, "loss": 0.2711, "step": 10600 }, { "epoch": 36.84, "learning_rate": 2.5720141342756185e-06, "loss": 0.2769, "step": 10610 }, { "epoch": 36.87, "learning_rate": 2.570600706713781e-06, "loss": 0.2635, "step": 10620 }, { "epoch": 36.91, "learning_rate": 2.5691872791519438e-06, "loss": 0.2655, "step": 10630 }, { "epoch": 36.94, "learning_rate": 2.5677738515901057e-06, "loss": 0.2689, "step": 10640 }, { "epoch": 36.98, "learning_rate": 2.566360424028268e-06, "loss": 0.2706, "step": 10650 }, { "epoch": 37.0, "eval_loss": 0.5178768038749695, "eval_runtime": 130.9202, "eval_samples_per_second": 4.064, "eval_steps_per_second": 1.016, "eval_wer": 0.1983030147200617, "step": 10656 }, { "epoch": 37.01, "learning_rate": 2.564946996466431e-06, "loss": 0.2868, "step": 10660 }, { "epoch": 37.05, "learning_rate": 2.5635335689045934e-06, "loss": 0.2749, "step": 10670 }, { "epoch": 37.08, "learning_rate": 2.5621201413427562e-06, "loss": 0.2454, "step": 10680 }, { "epoch": 37.12, "learning_rate": 2.5607067137809182e-06, "loss": 0.283, "step": 10690 }, { "epoch": 37.15, "learning_rate": 2.559293286219081e-06, "loss": 0.2709, "step": 10700 }, { "epoch": 37.19, "learning_rate": 2.5578798586572435e-06, "loss": 0.2623, "step": 10710 }, { "epoch": 37.22, "learning_rate": 2.5564664310954063e-06, "loss": 0.2742, "step": 10720 }, { "epoch": 37.26, "learning_rate": 2.5550530035335687e-06, "loss": 0.2683, "step": 10730 }, { "epoch": 37.29, "learning_rate": 2.5536395759717315e-06, "loss": 0.251, "step": 10740 }, { "epoch": 37.33, "learning_rate": 2.5522261484098935e-06, "loss": 0.2613, "step": 10750 }, { "epoch": 37.36, "learning_rate": 2.5508127208480564e-06, "loss": 0.2655, "step": 10760 }, { "epoch": 37.39, "learning_rate": 2.5493992932862188e-06, "loss": 0.2723, "step": 10770 }, { "epoch": 37.43, "learning_rate": 2.5479858657243816e-06, "loss": 0.2675, "step": 10780 }, { "epoch": 37.46, "learning_rate": 2.546572438162544e-06, "loss": 0.2732, "step": 10790 }, { "epoch": 37.5, "learning_rate": 2.545159010600707e-06, "loss": 0.2773, "step": 10800 }, { "epoch": 37.53, "learning_rate": 2.543745583038869e-06, "loss": 0.2536, "step": 10810 }, { "epoch": 37.57, "learning_rate": 2.5423321554770317e-06, "loss": 0.2693, "step": 10820 }, { "epoch": 37.6, "learning_rate": 2.540918727915194e-06, "loss": 0.2498, "step": 10830 }, { "epoch": 37.64, "learning_rate": 2.539505300353357e-06, "loss": 0.2603, "step": 10840 }, { "epoch": 37.67, "learning_rate": 2.5380918727915193e-06, "loss": 0.2798, "step": 10850 }, { "epoch": 37.71, "learning_rate": 2.5366784452296817e-06, "loss": 0.2911, "step": 10860 }, { "epoch": 37.74, "learning_rate": 2.535265017667844e-06, "loss": 0.2625, "step": 10870 }, { "epoch": 37.78, "learning_rate": 2.533851590106007e-06, "loss": 0.2744, "step": 10880 }, { "epoch": 37.81, "learning_rate": 2.5324381625441694e-06, "loss": 0.2753, "step": 10890 }, { "epoch": 37.85, "learning_rate": 2.531024734982332e-06, "loss": 0.267, "step": 10900 }, { "epoch": 37.88, "learning_rate": 2.5296113074204946e-06, "loss": 0.2572, "step": 10910 }, { "epoch": 37.91, "learning_rate": 2.528197879858657e-06, "loss": 0.2551, "step": 10920 }, { "epoch": 37.95, "learning_rate": 2.5267844522968194e-06, "loss": 0.2469, "step": 10930 }, { "epoch": 37.98, "learning_rate": 2.5253710247349823e-06, "loss": 0.2791, "step": 10940 }, { "epoch": 38.0, "eval_loss": 0.515429675579071, "eval_runtime": 130.0554, "eval_samples_per_second": 4.091, "eval_steps_per_second": 1.023, "eval_wer": 0.19759593752008742, "step": 10944 }, { "epoch": 38.02, "learning_rate": 2.5239575971731447e-06, "loss": 0.2944, "step": 10950 }, { "epoch": 38.06, "learning_rate": 2.5225441696113075e-06, "loss": 0.264, "step": 10960 }, { "epoch": 38.09, "learning_rate": 2.52113074204947e-06, "loss": 0.2722, "step": 10970 }, { "epoch": 38.12, "learning_rate": 2.5197173144876323e-06, "loss": 0.2692, "step": 10980 }, { "epoch": 38.16, "learning_rate": 2.5183038869257947e-06, "loss": 0.2607, "step": 10990 }, { "epoch": 38.19, "learning_rate": 2.5168904593639576e-06, "loss": 0.2412, "step": 11000 }, { "epoch": 38.23, "learning_rate": 2.51547703180212e-06, "loss": 0.2621, "step": 11010 }, { "epoch": 38.26, "learning_rate": 2.514063604240283e-06, "loss": 0.2383, "step": 11020 }, { "epoch": 38.3, "learning_rate": 2.512650176678445e-06, "loss": 0.2608, "step": 11030 }, { "epoch": 38.33, "learning_rate": 2.5112367491166076e-06, "loss": 0.2865, "step": 11040 }, { "epoch": 38.37, "learning_rate": 2.50982332155477e-06, "loss": 0.2529, "step": 11050 }, { "epoch": 38.4, "learning_rate": 2.508409893992933e-06, "loss": 0.2468, "step": 11060 }, { "epoch": 38.44, "learning_rate": 2.5069964664310953e-06, "loss": 0.2767, "step": 11070 }, { "epoch": 38.47, "learning_rate": 2.505583038869258e-06, "loss": 0.2832, "step": 11080 }, { "epoch": 38.51, "learning_rate": 2.50416961130742e-06, "loss": 0.2732, "step": 11090 }, { "epoch": 38.54, "learning_rate": 2.502756183745583e-06, "loss": 0.2604, "step": 11100 }, { "epoch": 38.57, "learning_rate": 2.5013427561837453e-06, "loss": 0.2797, "step": 11110 }, { "epoch": 38.61, "learning_rate": 2.499929328621908e-06, "loss": 0.2548, "step": 11120 }, { "epoch": 38.64, "learning_rate": 2.4985159010600706e-06, "loss": 0.2735, "step": 11130 }, { "epoch": 38.68, "learning_rate": 2.497102473498233e-06, "loss": 0.2544, "step": 11140 }, { "epoch": 38.71, "learning_rate": 2.4956890459363954e-06, "loss": 0.2744, "step": 11150 }, { "epoch": 38.75, "learning_rate": 2.4942756183745582e-06, "loss": 0.2696, "step": 11160 }, { "epoch": 38.78, "learning_rate": 2.4928621908127206e-06, "loss": 0.2339, "step": 11170 }, { "epoch": 38.82, "learning_rate": 2.4914487632508835e-06, "loss": 0.2658, "step": 11180 }, { "epoch": 38.85, "learning_rate": 2.490035335689046e-06, "loss": 0.2626, "step": 11190 }, { "epoch": 38.89, "learning_rate": 2.4886219081272083e-06, "loss": 0.2592, "step": 11200 }, { "epoch": 38.92, "learning_rate": 2.4872084805653707e-06, "loss": 0.2644, "step": 11210 }, { "epoch": 38.96, "learning_rate": 2.4857950530035335e-06, "loss": 0.2661, "step": 11220 }, { "epoch": 38.99, "learning_rate": 2.484381625441696e-06, "loss": 0.3148, "step": 11230 }, { "epoch": 39.0, "eval_loss": 0.5082433223724365, "eval_runtime": 132.6404, "eval_samples_per_second": 4.011, "eval_steps_per_second": 1.003, "eval_wer": 0.199010091920036, "step": 11232 }, { "epoch": 39.03, "learning_rate": 2.4829681978798588e-06, "loss": 0.261, "step": 11240 }, { "epoch": 39.06, "learning_rate": 2.481554770318021e-06, "loss": 0.2706, "step": 11250 }, { "epoch": 39.1, "learning_rate": 2.4801413427561836e-06, "loss": 0.2532, "step": 11260 }, { "epoch": 39.13, "learning_rate": 2.478727915194346e-06, "loss": 0.2841, "step": 11270 }, { "epoch": 39.17, "learning_rate": 2.477314487632509e-06, "loss": 0.2502, "step": 11280 }, { "epoch": 39.2, "learning_rate": 2.4759010600706713e-06, "loss": 0.2579, "step": 11290 }, { "epoch": 39.24, "learning_rate": 2.474487632508834e-06, "loss": 0.2768, "step": 11300 }, { "epoch": 39.27, "learning_rate": 2.473074204946996e-06, "loss": 0.2351, "step": 11310 }, { "epoch": 39.3, "learning_rate": 2.471660777385159e-06, "loss": 0.2888, "step": 11320 }, { "epoch": 39.34, "learning_rate": 2.4702473498233213e-06, "loss": 0.2852, "step": 11330 }, { "epoch": 39.37, "learning_rate": 2.468833922261484e-06, "loss": 0.2604, "step": 11340 }, { "epoch": 39.41, "learning_rate": 2.4674204946996466e-06, "loss": 0.2629, "step": 11350 }, { "epoch": 39.44, "learning_rate": 2.4660070671378094e-06, "loss": 0.2291, "step": 11360 }, { "epoch": 39.48, "learning_rate": 2.4645936395759714e-06, "loss": 0.2684, "step": 11370 }, { "epoch": 39.51, "learning_rate": 2.4631802120141342e-06, "loss": 0.2635, "step": 11380 }, { "epoch": 39.55, "learning_rate": 2.4617667844522966e-06, "loss": 0.2524, "step": 11390 }, { "epoch": 39.58, "learning_rate": 2.4603533568904595e-06, "loss": 0.2813, "step": 11400 }, { "epoch": 39.62, "learning_rate": 2.458939929328622e-06, "loss": 0.2778, "step": 11410 }, { "epoch": 39.65, "learning_rate": 2.4575265017667847e-06, "loss": 0.2845, "step": 11420 }, { "epoch": 39.69, "learning_rate": 2.4561130742049467e-06, "loss": 0.2779, "step": 11430 }, { "epoch": 39.72, "learning_rate": 2.4546996466431095e-06, "loss": 0.2418, "step": 11440 }, { "epoch": 39.75, "learning_rate": 2.453286219081272e-06, "loss": 0.2493, "step": 11450 }, { "epoch": 39.79, "learning_rate": 2.4518727915194348e-06, "loss": 0.2677, "step": 11460 }, { "epoch": 39.82, "learning_rate": 2.450459363957597e-06, "loss": 0.2747, "step": 11470 }, { "epoch": 39.86, "learning_rate": 2.4490459363957596e-06, "loss": 0.2768, "step": 11480 }, { "epoch": 39.89, "learning_rate": 2.447632508833922e-06, "loss": 0.2705, "step": 11490 }, { "epoch": 39.93, "learning_rate": 2.446219081272085e-06, "loss": 0.2486, "step": 11500 }, { "epoch": 39.96, "learning_rate": 2.4448056537102472e-06, "loss": 0.2852, "step": 11510 }, { "epoch": 40.0, "learning_rate": 2.44339222614841e-06, "loss": 0.2834, "step": 11520 }, { "epoch": 40.0, "eval_loss": 0.5106706023216248, "eval_runtime": 132.6333, "eval_samples_per_second": 4.011, "eval_steps_per_second": 1.003, "eval_wer": 0.19804589573825288, "step": 11520 }, { "epoch": 40.03, "learning_rate": 2.4419787985865725e-06, "loss": 0.2684, "step": 11530 }, { "epoch": 40.07, "learning_rate": 2.440565371024735e-06, "loss": 0.2851, "step": 11540 }, { "epoch": 40.1, "learning_rate": 2.4391519434628973e-06, "loss": 0.2619, "step": 11550 }, { "epoch": 40.14, "learning_rate": 2.43773851590106e-06, "loss": 0.2778, "step": 11560 }, { "epoch": 40.17, "learning_rate": 2.4363250883392225e-06, "loss": 0.2822, "step": 11570 }, { "epoch": 40.21, "learning_rate": 2.4349116607773854e-06, "loss": 0.2447, "step": 11580 }, { "epoch": 40.24, "learning_rate": 2.4334982332155478e-06, "loss": 0.2741, "step": 11590 }, { "epoch": 40.28, "learning_rate": 2.43208480565371e-06, "loss": 0.2678, "step": 11600 }, { "epoch": 40.31, "learning_rate": 2.4306713780918726e-06, "loss": 0.2677, "step": 11610 }, { "epoch": 40.35, "learning_rate": 2.4292579505300354e-06, "loss": 0.2553, "step": 11620 }, { "epoch": 40.38, "learning_rate": 2.427844522968198e-06, "loss": 0.262, "step": 11630 }, { "epoch": 40.42, "learning_rate": 2.4264310954063607e-06, "loss": 0.2346, "step": 11640 }, { "epoch": 40.45, "learning_rate": 2.4250176678445227e-06, "loss": 0.2454, "step": 11650 }, { "epoch": 40.48, "learning_rate": 2.4236042402826855e-06, "loss": 0.2916, "step": 11660 }, { "epoch": 40.52, "learning_rate": 2.422190812720848e-06, "loss": 0.2796, "step": 11670 }, { "epoch": 40.55, "learning_rate": 2.4207773851590107e-06, "loss": 0.2665, "step": 11680 }, { "epoch": 40.59, "learning_rate": 2.419363957597173e-06, "loss": 0.2589, "step": 11690 }, { "epoch": 40.62, "learning_rate": 2.417950530035336e-06, "loss": 0.2391, "step": 11700 }, { "epoch": 40.66, "learning_rate": 2.416537102473498e-06, "loss": 0.2641, "step": 11710 }, { "epoch": 40.69, "learning_rate": 2.4151236749116604e-06, "loss": 0.2821, "step": 11720 }, { "epoch": 40.73, "learning_rate": 2.413710247349823e-06, "loss": 0.2595, "step": 11730 }, { "epoch": 40.76, "learning_rate": 2.4122968197879856e-06, "loss": 0.2632, "step": 11740 }, { "epoch": 40.8, "learning_rate": 2.4108833922261484e-06, "loss": 0.2707, "step": 11750 }, { "epoch": 40.83, "learning_rate": 2.4094699646643104e-06, "loss": 0.2821, "step": 11760 }, { "epoch": 40.87, "learning_rate": 2.4080565371024733e-06, "loss": 0.27, "step": 11770 }, { "epoch": 40.9, "learning_rate": 2.4066431095406357e-06, "loss": 0.2556, "step": 11780 }, { "epoch": 40.94, "learning_rate": 2.4052296819787985e-06, "loss": 0.2552, "step": 11790 }, { "epoch": 40.97, "learning_rate": 2.403816254416961e-06, "loss": 0.2739, "step": 11800 }, { "epoch": 41.0, "eval_loss": 0.5009294152259827, "eval_runtime": 134.0218, "eval_samples_per_second": 3.97, "eval_steps_per_second": 0.992, "eval_wer": 0.199010091920036, "step": 11808 }, { "epoch": 41.01, "learning_rate": 2.4024028268551238e-06, "loss": 0.2686, "step": 11810 }, { "epoch": 41.04, "learning_rate": 2.4009893992932857e-06, "loss": 0.2519, "step": 11820 }, { "epoch": 41.08, "learning_rate": 2.3995759717314486e-06, "loss": 0.2594, "step": 11830 }, { "epoch": 41.11, "learning_rate": 2.398162544169611e-06, "loss": 0.2581, "step": 11840 }, { "epoch": 41.15, "learning_rate": 2.396749116607774e-06, "loss": 0.2805, "step": 11850 }, { "epoch": 41.18, "learning_rate": 2.3953356890459362e-06, "loss": 0.2676, "step": 11860 }, { "epoch": 41.21, "learning_rate": 2.393922261484099e-06, "loss": 0.266, "step": 11870 }, { "epoch": 41.25, "learning_rate": 2.392508833922261e-06, "loss": 0.2659, "step": 11880 }, { "epoch": 41.28, "learning_rate": 2.391095406360424e-06, "loss": 0.2744, "step": 11890 }, { "epoch": 41.32, "learning_rate": 2.3896819787985863e-06, "loss": 0.2645, "step": 11900 }, { "epoch": 41.35, "learning_rate": 2.388268551236749e-06, "loss": 0.2566, "step": 11910 }, { "epoch": 41.39, "learning_rate": 2.3868551236749115e-06, "loss": 0.2739, "step": 11920 }, { "epoch": 41.42, "learning_rate": 2.385441696113074e-06, "loss": 0.2716, "step": 11930 }, { "epoch": 41.46, "learning_rate": 2.3840282685512363e-06, "loss": 0.2489, "step": 11940 }, { "epoch": 41.49, "learning_rate": 2.382614840989399e-06, "loss": 0.2852, "step": 11950 }, { "epoch": 41.53, "learning_rate": 2.3812014134275616e-06, "loss": 0.2709, "step": 11960 }, { "epoch": 41.56, "learning_rate": 2.3797879858657244e-06, "loss": 0.274, "step": 11970 }, { "epoch": 41.6, "learning_rate": 2.378374558303887e-06, "loss": 0.2656, "step": 11980 }, { "epoch": 41.63, "learning_rate": 2.3769611307420492e-06, "loss": 0.2745, "step": 11990 }, { "epoch": 41.66, "learning_rate": 2.3755477031802117e-06, "loss": 0.2757, "step": 12000 }, { "epoch": 41.7, "learning_rate": 2.3741342756183745e-06, "loss": 0.2799, "step": 12010 }, { "epoch": 41.73, "learning_rate": 2.372720848056537e-06, "loss": 0.2521, "step": 12020 }, { "epoch": 41.77, "learning_rate": 2.3713074204946997e-06, "loss": 0.2568, "step": 12030 }, { "epoch": 41.8, "learning_rate": 2.369893992932862e-06, "loss": 0.2557, "step": 12040 }, { "epoch": 41.84, "learning_rate": 2.3684805653710245e-06, "loss": 0.2617, "step": 12050 }, { "epoch": 41.87, "learning_rate": 2.367067137809187e-06, "loss": 0.2595, "step": 12060 }, { "epoch": 41.91, "learning_rate": 2.36565371024735e-06, "loss": 0.2647, "step": 12070 }, { "epoch": 41.94, "learning_rate": 2.364240282685512e-06, "loss": 0.2544, "step": 12080 }, { "epoch": 41.98, "learning_rate": 2.362826855123675e-06, "loss": 0.2687, "step": 12090 }, { "epoch": 42.0, "eval_loss": 0.5231707692146301, "eval_runtime": 133.0554, "eval_samples_per_second": 3.998, "eval_steps_per_second": 1.0, "eval_wer": 0.20113132351995885, "step": 12096 }, { "epoch": 42.01, "learning_rate": 2.361413427561837e-06, "loss": 0.288, "step": 12100 }, { "epoch": 42.05, "learning_rate": 2.36e-06, "loss": 0.2828, "step": 12110 }, { "epoch": 42.08, "learning_rate": 2.3585865724381623e-06, "loss": 0.267, "step": 12120 }, { "epoch": 42.12, "learning_rate": 2.357173144876325e-06, "loss": 0.2614, "step": 12130 }, { "epoch": 42.15, "learning_rate": 2.3557597173144875e-06, "loss": 0.2614, "step": 12140 }, { "epoch": 42.19, "learning_rate": 2.3543462897526503e-06, "loss": 0.2936, "step": 12150 }, { "epoch": 42.22, "learning_rate": 2.3529328621908123e-06, "loss": 0.2661, "step": 12160 }, { "epoch": 42.26, "learning_rate": 2.351519434628975e-06, "loss": 0.2655, "step": 12170 }, { "epoch": 42.29, "learning_rate": 2.3501060070671376e-06, "loss": 0.2874, "step": 12180 }, { "epoch": 42.33, "learning_rate": 2.3486925795053004e-06, "loss": 0.2629, "step": 12190 }, { "epoch": 42.36, "learning_rate": 2.347279151943463e-06, "loss": 0.2498, "step": 12200 }, { "epoch": 42.39, "learning_rate": 2.3458657243816256e-06, "loss": 0.2821, "step": 12210 }, { "epoch": 42.43, "learning_rate": 2.3444522968197876e-06, "loss": 0.2461, "step": 12220 }, { "epoch": 42.46, "learning_rate": 2.3430388692579505e-06, "loss": 0.2809, "step": 12230 }, { "epoch": 42.5, "learning_rate": 2.341625441696113e-06, "loss": 0.2653, "step": 12240 }, { "epoch": 42.53, "learning_rate": 2.3402120141342757e-06, "loss": 0.2616, "step": 12250 }, { "epoch": 42.57, "learning_rate": 2.338798586572438e-06, "loss": 0.261, "step": 12260 }, { "epoch": 42.6, "learning_rate": 2.3373851590106005e-06, "loss": 0.2511, "step": 12270 }, { "epoch": 42.64, "learning_rate": 2.335971731448763e-06, "loss": 0.2572, "step": 12280 }, { "epoch": 42.67, "learning_rate": 2.3345583038869258e-06, "loss": 0.2928, "step": 12290 }, { "epoch": 42.71, "learning_rate": 2.333144876325088e-06, "loss": 0.2539, "step": 12300 }, { "epoch": 42.74, "learning_rate": 2.331731448763251e-06, "loss": 0.2707, "step": 12310 }, { "epoch": 42.78, "learning_rate": 2.3303180212014134e-06, "loss": 0.2607, "step": 12320 }, { "epoch": 42.81, "learning_rate": 2.328904593639576e-06, "loss": 0.2695, "step": 12330 }, { "epoch": 42.85, "learning_rate": 2.3274911660777382e-06, "loss": 0.2836, "step": 12340 }, { "epoch": 42.88, "learning_rate": 2.326077738515901e-06, "loss": 0.2677, "step": 12350 }, { "epoch": 42.91, "learning_rate": 2.3246643109540635e-06, "loss": 0.2583, "step": 12360 }, { "epoch": 42.95, "learning_rate": 2.3232508833922263e-06, "loss": 0.2554, "step": 12370 }, { "epoch": 42.98, "learning_rate": 2.3218374558303883e-06, "loss": 0.2696, "step": 12380 }, { "epoch": 43.0, "eval_loss": 0.5108169913291931, "eval_runtime": 133.4619, "eval_samples_per_second": 3.986, "eval_steps_per_second": 0.997, "eval_wer": 0.19862441344732276, "step": 12384 }, { "epoch": 43.02, "learning_rate": 2.320424028268551e-06, "loss": 0.2739, "step": 12390 }, { "epoch": 43.06, "learning_rate": 2.3190106007067135e-06, "loss": 0.2612, "step": 12400 }, { "epoch": 43.09, "learning_rate": 2.3175971731448764e-06, "loss": 0.2596, "step": 12410 }, { "epoch": 43.12, "learning_rate": 2.3161837455830388e-06, "loss": 0.2777, "step": 12420 }, { "epoch": 43.16, "learning_rate": 2.3147703180212016e-06, "loss": 0.2487, "step": 12430 }, { "epoch": 43.19, "learning_rate": 2.3133568904593636e-06, "loss": 0.2452, "step": 12440 }, { "epoch": 43.23, "learning_rate": 2.3119434628975264e-06, "loss": 0.2495, "step": 12450 }, { "epoch": 43.26, "learning_rate": 2.310530035335689e-06, "loss": 0.2412, "step": 12460 }, { "epoch": 43.3, "learning_rate": 2.3091166077738517e-06, "loss": 0.2515, "step": 12470 }, { "epoch": 43.33, "learning_rate": 2.307703180212014e-06, "loss": 0.2955, "step": 12480 }, { "epoch": 43.37, "learning_rate": 2.306289752650177e-06, "loss": 0.2725, "step": 12490 }, { "epoch": 43.4, "learning_rate": 2.304876325088339e-06, "loss": 0.2414, "step": 12500 }, { "epoch": 43.44, "learning_rate": 2.3034628975265017e-06, "loss": 0.251, "step": 12510 }, { "epoch": 43.47, "learning_rate": 2.302049469964664e-06, "loss": 0.2579, "step": 12520 }, { "epoch": 43.51, "learning_rate": 2.300636042402827e-06, "loss": 0.2531, "step": 12530 }, { "epoch": 43.54, "learning_rate": 2.2992226148409894e-06, "loss": 0.247, "step": 12540 }, { "epoch": 43.57, "learning_rate": 2.297809187279152e-06, "loss": 0.278, "step": 12550 }, { "epoch": 43.61, "learning_rate": 2.296395759717314e-06, "loss": 0.2435, "step": 12560 }, { "epoch": 43.64, "learning_rate": 2.294982332155477e-06, "loss": 0.258, "step": 12570 }, { "epoch": 43.68, "learning_rate": 2.2935689045936395e-06, "loss": 0.2659, "step": 12580 }, { "epoch": 43.71, "learning_rate": 2.2921554770318023e-06, "loss": 0.2554, "step": 12590 }, { "epoch": 43.75, "learning_rate": 2.2907420494699647e-06, "loss": 0.2671, "step": 12600 }, { "epoch": 43.78, "learning_rate": 2.289328621908127e-06, "loss": 0.26, "step": 12610 }, { "epoch": 43.82, "learning_rate": 2.2879151943462895e-06, "loss": 0.2791, "step": 12620 }, { "epoch": 43.85, "learning_rate": 2.2865017667844523e-06, "loss": 0.2532, "step": 12630 }, { "epoch": 43.89, "learning_rate": 2.2850883392226148e-06, "loss": 0.2759, "step": 12640 }, { "epoch": 43.92, "learning_rate": 2.2836749116607776e-06, "loss": 0.2659, "step": 12650 }, { "epoch": 43.96, "learning_rate": 2.28226148409894e-06, "loss": 0.2672, "step": 12660 }, { "epoch": 43.99, "learning_rate": 2.2808480565371024e-06, "loss": 0.2729, "step": 12670 }, { "epoch": 44.0, "eval_loss": 0.5158911943435669, "eval_runtime": 133.2183, "eval_samples_per_second": 3.993, "eval_steps_per_second": 0.998, "eval_wer": 0.1990743716654882, "step": 12672 }, { "epoch": 44.03, "learning_rate": 2.279434628975265e-06, "loss": 0.2755, "step": 12680 }, { "epoch": 44.06, "learning_rate": 2.2780212014134277e-06, "loss": 0.2787, "step": 12690 }, { "epoch": 44.1, "learning_rate": 2.27660777385159e-06, "loss": 0.2539, "step": 12700 }, { "epoch": 44.13, "learning_rate": 2.275194346289753e-06, "loss": 0.2686, "step": 12710 }, { "epoch": 44.17, "learning_rate": 2.273780918727915e-06, "loss": 0.2883, "step": 12720 }, { "epoch": 44.2, "learning_rate": 2.2723674911660777e-06, "loss": 0.2573, "step": 12730 }, { "epoch": 44.24, "learning_rate": 2.27095406360424e-06, "loss": 0.2739, "step": 12740 }, { "epoch": 44.27, "learning_rate": 2.269540636042403e-06, "loss": 0.2749, "step": 12750 }, { "epoch": 44.3, "learning_rate": 2.2681272084805654e-06, "loss": 0.275, "step": 12760 }, { "epoch": 44.34, "learning_rate": 2.266713780918728e-06, "loss": 0.2766, "step": 12770 }, { "epoch": 44.37, "learning_rate": 2.26530035335689e-06, "loss": 0.2475, "step": 12780 }, { "epoch": 44.41, "learning_rate": 2.2638869257950526e-06, "loss": 0.2739, "step": 12790 }, { "epoch": 44.44, "learning_rate": 2.2624734982332154e-06, "loss": 0.2448, "step": 12800 }, { "epoch": 44.48, "learning_rate": 2.2610600706713783e-06, "loss": 0.2801, "step": 12810 }, { "epoch": 44.51, "learning_rate": 2.2596466431095407e-06, "loss": 0.2575, "step": 12820 }, { "epoch": 44.55, "learning_rate": 2.2582332155477035e-06, "loss": 0.249, "step": 12830 }, { "epoch": 44.58, "learning_rate": 2.2568197879858655e-06, "loss": 0.2546, "step": 12840 }, { "epoch": 44.62, "learning_rate": 2.255406360424028e-06, "loss": 0.2462, "step": 12850 }, { "epoch": 44.65, "learning_rate": 2.2539929328621907e-06, "loss": 0.2588, "step": 12860 }, { "epoch": 44.69, "learning_rate": 2.252579505300353e-06, "loss": 0.2569, "step": 12870 }, { "epoch": 44.72, "learning_rate": 2.251166077738516e-06, "loss": 0.2515, "step": 12880 }, { "epoch": 44.75, "learning_rate": 2.249752650176678e-06, "loss": 0.2564, "step": 12890 }, { "epoch": 44.79, "learning_rate": 2.248339222614841e-06, "loss": 0.2579, "step": 12900 }, { "epoch": 44.82, "learning_rate": 2.246925795053003e-06, "loss": 0.2831, "step": 12910 }, { "epoch": 44.86, "learning_rate": 2.245512367491166e-06, "loss": 0.2546, "step": 12920 }, { "epoch": 44.89, "learning_rate": 2.2440989399293284e-06, "loss": 0.2653, "step": 12930 }, { "epoch": 44.93, "learning_rate": 2.2426855123674913e-06, "loss": 0.2527, "step": 12940 }, { "epoch": 44.96, "learning_rate": 2.2412720848056533e-06, "loss": 0.2692, "step": 12950 }, { "epoch": 45.0, "learning_rate": 2.239858657243816e-06, "loss": 0.2579, "step": 12960 }, { "epoch": 45.0, "eval_loss": 0.516213059425354, "eval_runtime": 133.2787, "eval_samples_per_second": 3.992, "eval_steps_per_second": 0.998, "eval_wer": 0.19913865141094042, "step": 12960 }, { "epoch": 45.03, "learning_rate": 2.2384452296819785e-06, "loss": 0.273, "step": 12970 }, { "epoch": 45.07, "learning_rate": 2.2370318021201413e-06, "loss": 0.2757, "step": 12980 }, { "epoch": 45.1, "learning_rate": 2.2356183745583037e-06, "loss": 0.2461, "step": 12990 }, { "epoch": 45.14, "learning_rate": 2.234204946996466e-06, "loss": 0.2693, "step": 13000 }, { "epoch": 45.17, "learning_rate": 2.2327915194346286e-06, "loss": 0.2596, "step": 13010 }, { "epoch": 45.21, "learning_rate": 2.2313780918727914e-06, "loss": 0.2436, "step": 13020 }, { "epoch": 45.24, "learning_rate": 2.229964664310954e-06, "loss": 0.2484, "step": 13030 }, { "epoch": 45.28, "learning_rate": 2.2285512367491166e-06, "loss": 0.2378, "step": 13040 }, { "epoch": 45.31, "learning_rate": 2.227137809187279e-06, "loss": 0.2688, "step": 13050 }, { "epoch": 45.35, "learning_rate": 2.2257243816254415e-06, "loss": 0.2768, "step": 13060 }, { "epoch": 45.38, "learning_rate": 2.224310954063604e-06, "loss": 0.2626, "step": 13070 }, { "epoch": 45.42, "learning_rate": 2.2228975265017667e-06, "loss": 0.2602, "step": 13080 }, { "epoch": 45.45, "learning_rate": 2.221484098939929e-06, "loss": 0.2623, "step": 13090 }, { "epoch": 45.48, "learning_rate": 2.220070671378092e-06, "loss": 0.2782, "step": 13100 }, { "epoch": 45.52, "learning_rate": 2.2186572438162544e-06, "loss": 0.2689, "step": 13110 }, { "epoch": 45.55, "learning_rate": 2.2172438162544168e-06, "loss": 0.2642, "step": 13120 }, { "epoch": 45.59, "learning_rate": 2.215830388692579e-06, "loss": 0.2557, "step": 13130 }, { "epoch": 45.62, "learning_rate": 2.214416961130742e-06, "loss": 0.2737, "step": 13140 }, { "epoch": 45.66, "learning_rate": 2.2130035335689044e-06, "loss": 0.2703, "step": 13150 }, { "epoch": 45.69, "learning_rate": 2.2115901060070673e-06, "loss": 0.2737, "step": 13160 }, { "epoch": 45.73, "learning_rate": 2.2101766784452292e-06, "loss": 0.264, "step": 13170 }, { "epoch": 45.76, "learning_rate": 2.208763250883392e-06, "loss": 0.2595, "step": 13180 }, { "epoch": 45.8, "learning_rate": 2.2073498233215545e-06, "loss": 0.2488, "step": 13190 }, { "epoch": 45.83, "learning_rate": 2.2059363957597173e-06, "loss": 0.2766, "step": 13200 }, { "epoch": 45.87, "learning_rate": 2.2045229681978797e-06, "loss": 0.253, "step": 13210 }, { "epoch": 45.9, "learning_rate": 2.2031095406360426e-06, "loss": 0.2589, "step": 13220 }, { "epoch": 45.94, "learning_rate": 2.2016961130742045e-06, "loss": 0.2794, "step": 13230 }, { "epoch": 45.97, "learning_rate": 2.2002826855123674e-06, "loss": 0.283, "step": 13240 }, { "epoch": 46.0, "eval_loss": 0.5031996369361877, "eval_runtime": 133.0395, "eval_samples_per_second": 3.999, "eval_steps_per_second": 1.0, "eval_wer": 0.1981744552291573, "step": 13248 }, { "epoch": 46.01, "learning_rate": 2.1988692579505298e-06, "loss": 0.2882, "step": 13250 }, { "epoch": 46.04, "learning_rate": 2.1974558303886926e-06, "loss": 0.2563, "step": 13260 }, { "epoch": 46.08, "learning_rate": 2.196042402826855e-06, "loss": 0.2821, "step": 13270 }, { "epoch": 46.11, "learning_rate": 2.194628975265018e-06, "loss": 0.2555, "step": 13280 }, { "epoch": 46.15, "learning_rate": 2.19321554770318e-06, "loss": 0.2765, "step": 13290 }, { "epoch": 46.18, "learning_rate": 2.1918021201413427e-06, "loss": 0.2745, "step": 13300 }, { "epoch": 46.21, "learning_rate": 2.190388692579505e-06, "loss": 0.2667, "step": 13310 }, { "epoch": 46.25, "learning_rate": 2.188975265017668e-06, "loss": 0.2759, "step": 13320 }, { "epoch": 46.28, "learning_rate": 2.1875618374558303e-06, "loss": 0.2642, "step": 13330 }, { "epoch": 46.32, "learning_rate": 2.1861484098939927e-06, "loss": 0.2702, "step": 13340 }, { "epoch": 46.35, "learning_rate": 2.184734982332155e-06, "loss": 0.2689, "step": 13350 }, { "epoch": 46.39, "learning_rate": 2.183321554770318e-06, "loss": 0.2657, "step": 13360 }, { "epoch": 46.42, "learning_rate": 2.1819081272084804e-06, "loss": 0.2431, "step": 13370 }, { "epoch": 46.46, "learning_rate": 2.1804946996466432e-06, "loss": 0.2472, "step": 13380 }, { "epoch": 46.49, "learning_rate": 2.1790812720848056e-06, "loss": 0.2774, "step": 13390 }, { "epoch": 46.53, "learning_rate": 2.177667844522968e-06, "loss": 0.2459, "step": 13400 }, { "epoch": 46.56, "learning_rate": 2.1762544169611305e-06, "loss": 0.269, "step": 13410 }, { "epoch": 46.6, "learning_rate": 2.1748409893992933e-06, "loss": 0.2489, "step": 13420 }, { "epoch": 46.63, "learning_rate": 2.1734275618374557e-06, "loss": 0.2567, "step": 13430 }, { "epoch": 46.66, "learning_rate": 2.1720141342756185e-06, "loss": 0.2636, "step": 13440 }, { "epoch": 46.7, "learning_rate": 2.170600706713781e-06, "loss": 0.2421, "step": 13450 }, { "epoch": 46.73, "learning_rate": 2.1691872791519434e-06, "loss": 0.2446, "step": 13460 }, { "epoch": 46.77, "learning_rate": 2.1677738515901058e-06, "loss": 0.2593, "step": 13470 }, { "epoch": 46.8, "learning_rate": 2.1663604240282686e-06, "loss": 0.2525, "step": 13480 }, { "epoch": 46.84, "learning_rate": 2.164946996466431e-06, "loss": 0.2719, "step": 13490 }, { "epoch": 46.87, "learning_rate": 2.163533568904594e-06, "loss": 0.2601, "step": 13500 }, { "epoch": 46.91, "learning_rate": 2.162120141342756e-06, "loss": 0.2798, "step": 13510 }, { "epoch": 46.94, "learning_rate": 2.1608480565371027e-06, "loss": 0.2435, "step": 13520 }, { "epoch": 46.98, "learning_rate": 2.1594346289752647e-06, "loss": 0.282, "step": 13530 }, { "epoch": 47.0, "eval_loss": 0.5107125639915466, "eval_runtime": 133.7168, "eval_samples_per_second": 3.979, "eval_steps_per_second": 0.995, "eval_wer": 0.19804589573825288, "step": 13536 }, { "epoch": 47.01, "learning_rate": 2.1580212014134275e-06, "loss": 0.2783, "step": 13540 }, { "epoch": 47.05, "learning_rate": 2.15660777385159e-06, "loss": 0.2695, "step": 13550 }, { "epoch": 47.08, "learning_rate": 2.1551943462897528e-06, "loss": 0.2469, "step": 13560 }, { "epoch": 47.12, "learning_rate": 2.153780918727915e-06, "loss": 0.2757, "step": 13570 }, { "epoch": 47.15, "learning_rate": 2.152367491166078e-06, "loss": 0.2721, "step": 13580 }, { "epoch": 47.19, "learning_rate": 2.15095406360424e-06, "loss": 0.2529, "step": 13590 }, { "epoch": 47.22, "learning_rate": 2.149540636042403e-06, "loss": 0.2562, "step": 13600 }, { "epoch": 47.26, "learning_rate": 2.1481272084805652e-06, "loss": 0.2712, "step": 13610 }, { "epoch": 47.29, "learning_rate": 2.146713780918728e-06, "loss": 0.2696, "step": 13620 }, { "epoch": 47.33, "learning_rate": 2.1453003533568905e-06, "loss": 0.2698, "step": 13630 }, { "epoch": 47.36, "learning_rate": 2.143886925795053e-06, "loss": 0.2528, "step": 13640 }, { "epoch": 47.39, "learning_rate": 2.1424734982332153e-06, "loss": 0.2671, "step": 13650 }, { "epoch": 47.43, "learning_rate": 2.141060070671378e-06, "loss": 0.2542, "step": 13660 }, { "epoch": 47.46, "learning_rate": 2.1396466431095405e-06, "loss": 0.2696, "step": 13670 }, { "epoch": 47.5, "learning_rate": 2.1382332155477034e-06, "loss": 0.2652, "step": 13680 }, { "epoch": 47.53, "learning_rate": 2.136819787985866e-06, "loss": 0.2518, "step": 13690 }, { "epoch": 47.57, "learning_rate": 2.135406360424028e-06, "loss": 0.2353, "step": 13700 }, { "epoch": 47.6, "learning_rate": 2.1339929328621906e-06, "loss": 0.2568, "step": 13710 }, { "epoch": 47.64, "learning_rate": 2.1325795053003534e-06, "loss": 0.2935, "step": 13720 }, { "epoch": 47.67, "learning_rate": 2.131166077738516e-06, "loss": 0.2511, "step": 13730 }, { "epoch": 47.71, "learning_rate": 2.1297526501766787e-06, "loss": 0.2768, "step": 13740 }, { "epoch": 47.74, "learning_rate": 2.128339222614841e-06, "loss": 0.2525, "step": 13750 }, { "epoch": 47.78, "learning_rate": 2.126925795053003e-06, "loss": 0.2236, "step": 13760 }, { "epoch": 47.81, "learning_rate": 2.125512367491166e-06, "loss": 0.2719, "step": 13770 }, { "epoch": 47.85, "learning_rate": 2.1240989399293287e-06, "loss": 0.2772, "step": 13780 }, { "epoch": 47.88, "learning_rate": 2.122685512367491e-06, "loss": 0.2682, "step": 13790 }, { "epoch": 47.91, "learning_rate": 2.121272084805654e-06, "loss": 0.2631, "step": 13800 }, { "epoch": 47.95, "learning_rate": 2.119858657243816e-06, "loss": 0.2571, "step": 13810 }, { "epoch": 47.98, "learning_rate": 2.1184452296819784e-06, "loss": 0.2708, "step": 13820 }, { "epoch": 48.0, "eval_loss": 0.5127933025360107, "eval_runtime": 133.2709, "eval_samples_per_second": 3.992, "eval_steps_per_second": 0.998, "eval_wer": 0.1982387349746095, "step": 13824 }, { "epoch": 48.02, "learning_rate": 2.1170318021201412e-06, "loss": 0.2812, "step": 13830 }, { "epoch": 48.06, "learning_rate": 2.1156183745583036e-06, "loss": 0.2673, "step": 13840 }, { "epoch": 48.09, "learning_rate": 2.1142049469964665e-06, "loss": 0.2529, "step": 13850 }, { "epoch": 48.12, "learning_rate": 2.112791519434629e-06, "loss": 0.2602, "step": 13860 }, { "epoch": 48.16, "learning_rate": 2.1113780918727913e-06, "loss": 0.2634, "step": 13870 }, { "epoch": 48.19, "learning_rate": 2.1099646643109537e-06, "loss": 0.2439, "step": 13880 }, { "epoch": 48.23, "learning_rate": 2.1085512367491165e-06, "loss": 0.2744, "step": 13890 }, { "epoch": 48.26, "learning_rate": 2.107137809187279e-06, "loss": 0.2572, "step": 13900 }, { "epoch": 48.3, "learning_rate": 2.1057243816254418e-06, "loss": 0.2838, "step": 13910 }, { "epoch": 48.33, "learning_rate": 2.1043109540636038e-06, "loss": 0.2746, "step": 13920 }, { "epoch": 48.37, "learning_rate": 2.1028975265017666e-06, "loss": 0.2663, "step": 13930 }, { "epoch": 48.4, "learning_rate": 2.101484098939929e-06, "loss": 0.2817, "step": 13940 }, { "epoch": 48.44, "learning_rate": 2.100070671378092e-06, "loss": 0.2583, "step": 13950 }, { "epoch": 48.47, "learning_rate": 2.0986572438162542e-06, "loss": 0.2796, "step": 13960 }, { "epoch": 48.51, "learning_rate": 2.097243816254417e-06, "loss": 0.266, "step": 13970 }, { "epoch": 48.54, "learning_rate": 2.095830388692579e-06, "loss": 0.2757, "step": 13980 }, { "epoch": 48.57, "learning_rate": 2.094416961130742e-06, "loss": 0.262, "step": 13990 }, { "epoch": 48.61, "learning_rate": 2.0930035335689043e-06, "loss": 0.2463, "step": 14000 }, { "epoch": 48.64, "learning_rate": 2.091590106007067e-06, "loss": 0.2763, "step": 14010 }, { "epoch": 48.68, "learning_rate": 2.0901766784452295e-06, "loss": 0.2746, "step": 14020 }, { "epoch": 48.71, "learning_rate": 2.0887632508833924e-06, "loss": 0.2459, "step": 14030 }, { "epoch": 48.75, "learning_rate": 2.0873498233215544e-06, "loss": 0.2657, "step": 14040 }, { "epoch": 48.78, "learning_rate": 2.085936395759717e-06, "loss": 0.2599, "step": 14050 }, { "epoch": 48.82, "learning_rate": 2.0845229681978796e-06, "loss": 0.2634, "step": 14060 }, { "epoch": 48.85, "learning_rate": 2.0831095406360424e-06, "loss": 0.2551, "step": 14070 }, { "epoch": 48.89, "learning_rate": 2.081696113074205e-06, "loss": 0.2322, "step": 14080 }, { "epoch": 48.92, "learning_rate": 2.0802826855123673e-06, "loss": 0.2524, "step": 14090 }, { "epoch": 48.96, "learning_rate": 2.0788692579505297e-06, "loss": 0.2667, "step": 14100 }, { "epoch": 48.99, "learning_rate": 2.0774558303886925e-06, "loss": 0.2562, "step": 14110 }, { "epoch": 49.0, "eval_loss": 0.5162803530693054, "eval_runtime": 133.3898, "eval_samples_per_second": 3.988, "eval_steps_per_second": 0.997, "eval_wer": 0.1990743716654882, "step": 14112 }, { "epoch": 49.03, "learning_rate": 2.076042402826855e-06, "loss": 0.2776, "step": 14120 }, { "epoch": 49.06, "learning_rate": 2.0746289752650177e-06, "loss": 0.2473, "step": 14130 }, { "epoch": 49.1, "learning_rate": 2.07321554770318e-06, "loss": 0.2626, "step": 14140 }, { "epoch": 49.13, "learning_rate": 2.0718021201413426e-06, "loss": 0.2602, "step": 14150 }, { "epoch": 49.17, "learning_rate": 2.070388692579505e-06, "loss": 0.2707, "step": 14160 }, { "epoch": 49.2, "learning_rate": 2.068975265017668e-06, "loss": 0.2423, "step": 14170 }, { "epoch": 49.24, "learning_rate": 2.06756183745583e-06, "loss": 0.2965, "step": 14180 }, { "epoch": 49.27, "learning_rate": 2.066148409893993e-06, "loss": 0.2602, "step": 14190 }, { "epoch": 49.3, "learning_rate": 2.0647349823321555e-06, "loss": 0.2547, "step": 14200 }, { "epoch": 49.34, "learning_rate": 2.063321554770318e-06, "loss": 0.2702, "step": 14210 }, { "epoch": 49.37, "learning_rate": 2.0619081272084803e-06, "loss": 0.2806, "step": 14220 }, { "epoch": 49.41, "learning_rate": 2.060494699646643e-06, "loss": 0.2648, "step": 14230 }, { "epoch": 49.44, "learning_rate": 2.0590812720848055e-06, "loss": 0.2396, "step": 14240 }, { "epoch": 49.48, "learning_rate": 2.0576678445229683e-06, "loss": 0.2837, "step": 14250 }, { "epoch": 49.51, "learning_rate": 2.0562544169611303e-06, "loss": 0.281, "step": 14260 }, { "epoch": 49.55, "learning_rate": 2.054840989399293e-06, "loss": 0.235, "step": 14270 }, { "epoch": 49.58, "learning_rate": 2.0534275618374556e-06, "loss": 0.2556, "step": 14280 }, { "epoch": 49.62, "learning_rate": 2.0520141342756184e-06, "loss": 0.2675, "step": 14290 }, { "epoch": 49.65, "learning_rate": 2.050600706713781e-06, "loss": 0.2774, "step": 14300 }, { "epoch": 49.69, "learning_rate": 2.0491872791519437e-06, "loss": 0.2742, "step": 14310 }, { "epoch": 49.72, "learning_rate": 2.0477738515901056e-06, "loss": 0.2665, "step": 14320 }, { "epoch": 49.75, "learning_rate": 2.0463604240282685e-06, "loss": 0.2664, "step": 14330 }, { "epoch": 49.79, "learning_rate": 2.044946996466431e-06, "loss": 0.2496, "step": 14340 }, { "epoch": 49.82, "learning_rate": 2.0435335689045937e-06, "loss": 0.2725, "step": 14350 }, { "epoch": 49.86, "learning_rate": 2.042120141342756e-06, "loss": 0.2581, "step": 14360 }, { "epoch": 49.89, "learning_rate": 2.040706713780919e-06, "loss": 0.2582, "step": 14370 }, { "epoch": 49.93, "learning_rate": 2.039293286219081e-06, "loss": 0.2514, "step": 14380 }, { "epoch": 49.96, "learning_rate": 2.0378798586572438e-06, "loss": 0.2765, "step": 14390 }, { "epoch": 50.0, "learning_rate": 2.036466431095406e-06, "loss": 0.2675, "step": 14400 }, { "epoch": 50.0, "eval_loss": 0.5062453150749207, "eval_runtime": 133.1193, "eval_samples_per_second": 3.996, "eval_steps_per_second": 0.999, "eval_wer": 0.19939577039274925, "step": 14400 }, { "epoch": 50.03, "learning_rate": 2.035053003533569e-06, "loss": 0.2766, "step": 14410 }, { "epoch": 50.07, "learning_rate": 2.0336395759717314e-06, "loss": 0.2511, "step": 14420 }, { "epoch": 50.1, "learning_rate": 2.032226148409894e-06, "loss": 0.2459, "step": 14430 }, { "epoch": 50.14, "learning_rate": 2.0308127208480562e-06, "loss": 0.2715, "step": 14440 }, { "epoch": 50.17, "learning_rate": 2.029399293286219e-06, "loss": 0.2912, "step": 14450 }, { "epoch": 50.21, "learning_rate": 2.0279858657243815e-06, "loss": 0.2606, "step": 14460 }, { "epoch": 50.24, "learning_rate": 2.0265724381625443e-06, "loss": 0.2685, "step": 14470 }, { "epoch": 50.28, "learning_rate": 2.0251590106007067e-06, "loss": 0.2354, "step": 14480 }, { "epoch": 50.31, "learning_rate": 2.023745583038869e-06, "loss": 0.2725, "step": 14490 }, { "epoch": 50.35, "learning_rate": 2.0223321554770316e-06, "loss": 0.2681, "step": 14500 }, { "epoch": 50.38, "learning_rate": 2.0209187279151944e-06, "loss": 0.242, "step": 14510 }, { "epoch": 50.42, "learning_rate": 2.019505300353357e-06, "loss": 0.2646, "step": 14520 }, { "epoch": 50.45, "learning_rate": 2.0180918727915196e-06, "loss": 0.2415, "step": 14530 }, { "epoch": 50.48, "learning_rate": 2.0166784452296816e-06, "loss": 0.2905, "step": 14540 }, { "epoch": 50.52, "learning_rate": 2.0152650176678444e-06, "loss": 0.2674, "step": 14550 }, { "epoch": 50.55, "learning_rate": 2.013851590106007e-06, "loss": 0.2427, "step": 14560 }, { "epoch": 50.59, "learning_rate": 2.0124381625441697e-06, "loss": 0.2535, "step": 14570 }, { "epoch": 50.62, "learning_rate": 2.011024734982332e-06, "loss": 0.252, "step": 14580 }, { "epoch": 50.66, "learning_rate": 2.009611307420495e-06, "loss": 0.2764, "step": 14590 }, { "epoch": 50.69, "learning_rate": 2.008197879858657e-06, "loss": 0.2632, "step": 14600 }, { "epoch": 50.73, "learning_rate": 2.0067844522968198e-06, "loss": 0.2551, "step": 14610 }, { "epoch": 50.76, "learning_rate": 2.005371024734982e-06, "loss": 0.2657, "step": 14620 }, { "epoch": 50.8, "learning_rate": 2.003957597173145e-06, "loss": 0.2655, "step": 14630 }, { "epoch": 50.83, "learning_rate": 2.0025441696113074e-06, "loss": 0.2512, "step": 14640 }, { "epoch": 50.87, "learning_rate": 2.0011307420494702e-06, "loss": 0.2607, "step": 14650 }, { "epoch": 50.9, "learning_rate": 1.9997173144876326e-06, "loss": 0.2681, "step": 14660 }, { "epoch": 50.94, "learning_rate": 1.998303886925795e-06, "loss": 0.2625, "step": 14670 }, { "epoch": 50.97, "learning_rate": 1.9968904593639575e-06, "loss": 0.285, "step": 14680 }, { "epoch": 51.0, "eval_loss": 0.4999462068080902, "eval_runtime": 133.4245, "eval_samples_per_second": 3.987, "eval_steps_per_second": 0.997, "eval_wer": 0.19875297293822716, "step": 14688 }, { "epoch": 51.01, "learning_rate": 1.9954770318021203e-06, "loss": 0.2801, "step": 14690 }, { "epoch": 51.04, "learning_rate": 1.9940636042402827e-06, "loss": 0.2528, "step": 14700 }, { "epoch": 51.08, "learning_rate": 1.992650176678445e-06, "loss": 0.2613, "step": 14710 }, { "epoch": 51.11, "learning_rate": 1.991236749116608e-06, "loss": 0.2647, "step": 14720 }, { "epoch": 51.15, "learning_rate": 1.9898233215547704e-06, "loss": 0.2629, "step": 14730 }, { "epoch": 51.18, "learning_rate": 1.9884098939929328e-06, "loss": 0.2848, "step": 14740 }, { "epoch": 51.21, "learning_rate": 1.9869964664310956e-06, "loss": 0.25, "step": 14750 }, { "epoch": 51.25, "learning_rate": 1.985583038869258e-06, "loss": 0.2707, "step": 14760 }, { "epoch": 51.28, "learning_rate": 1.9841696113074204e-06, "loss": 0.2287, "step": 14770 }, { "epoch": 51.32, "learning_rate": 1.982756183745583e-06, "loss": 0.2822, "step": 14780 }, { "epoch": 51.35, "learning_rate": 1.9813427561837457e-06, "loss": 0.2816, "step": 14790 }, { "epoch": 51.39, "learning_rate": 1.979929328621908e-06, "loss": 0.2655, "step": 14800 }, { "epoch": 51.42, "learning_rate": 1.9785159010600705e-06, "loss": 0.2573, "step": 14810 }, { "epoch": 51.46, "learning_rate": 1.9771024734982333e-06, "loss": 0.2674, "step": 14820 }, { "epoch": 51.49, "learning_rate": 1.9756890459363957e-06, "loss": 0.2745, "step": 14830 }, { "epoch": 51.53, "learning_rate": 1.974275618374558e-06, "loss": 0.2586, "step": 14840 }, { "epoch": 51.56, "learning_rate": 1.972862190812721e-06, "loss": 0.2439, "step": 14850 }, { "epoch": 51.6, "learning_rate": 1.9714487632508834e-06, "loss": 0.2376, "step": 14860 }, { "epoch": 51.63, "learning_rate": 1.9700353356890458e-06, "loss": 0.248, "step": 14870 }, { "epoch": 51.66, "learning_rate": 1.968621908127208e-06, "loss": 0.2522, "step": 14880 }, { "epoch": 51.7, "learning_rate": 1.967208480565371e-06, "loss": 0.2599, "step": 14890 }, { "epoch": 51.73, "learning_rate": 1.9657950530035334e-06, "loss": 0.2678, "step": 14900 }, { "epoch": 51.77, "learning_rate": 1.964381625441696e-06, "loss": 0.2662, "step": 14910 }, { "epoch": 51.8, "learning_rate": 1.9629681978798587e-06, "loss": 0.2576, "step": 14920 }, { "epoch": 51.84, "learning_rate": 1.961554770318021e-06, "loss": 0.2788, "step": 14930 }, { "epoch": 51.87, "learning_rate": 1.9601413427561835e-06, "loss": 0.2517, "step": 14940 }, { "epoch": 51.91, "learning_rate": 1.958727915194346e-06, "loss": 0.2728, "step": 14950 }, { "epoch": 51.94, "learning_rate": 1.9573144876325087e-06, "loss": 0.2538, "step": 14960 }, { "epoch": 51.98, "learning_rate": 1.955901060070671e-06, "loss": 0.2756, "step": 14970 }, { "epoch": 52.0, "eval_loss": 0.5029511451721191, "eval_runtime": 133.7467, "eval_samples_per_second": 3.978, "eval_steps_per_second": 0.994, "eval_wer": 0.19862441344732276, "step": 14976 }, { "epoch": 52.01, "learning_rate": 1.9544876325088336e-06, "loss": 0.2558, "step": 14980 }, { "epoch": 52.05, "learning_rate": 1.9530742049469964e-06, "loss": 0.2658, "step": 14990 }, { "epoch": 52.08, "learning_rate": 1.951660777385159e-06, "loss": 0.255, "step": 15000 }, { "epoch": 52.12, "learning_rate": 1.9503886925795053e-06, "loss": 0.2528, "step": 15010 }, { "epoch": 52.15, "learning_rate": 1.9489752650176677e-06, "loss": 0.2853, "step": 15020 }, { "epoch": 52.19, "learning_rate": 1.94756183745583e-06, "loss": 0.2631, "step": 15030 }, { "epoch": 52.22, "learning_rate": 1.946148409893993e-06, "loss": 0.2424, "step": 15040 }, { "epoch": 52.26, "learning_rate": 1.9447349823321553e-06, "loss": 0.2537, "step": 15050 }, { "epoch": 52.29, "learning_rate": 1.9433215547703177e-06, "loss": 0.2686, "step": 15060 }, { "epoch": 52.33, "learning_rate": 1.9419081272084806e-06, "loss": 0.259, "step": 15070 }, { "epoch": 52.36, "learning_rate": 1.940494699646643e-06, "loss": 0.2609, "step": 15080 }, { "epoch": 52.39, "learning_rate": 1.9390812720848054e-06, "loss": 0.2807, "step": 15090 }, { "epoch": 52.43, "learning_rate": 1.9376678445229682e-06, "loss": 0.2633, "step": 15100 }, { "epoch": 52.46, "learning_rate": 1.9362544169611306e-06, "loss": 0.2583, "step": 15110 }, { "epoch": 52.5, "learning_rate": 1.934840989399293e-06, "loss": 0.2656, "step": 15120 }, { "epoch": 52.53, "learning_rate": 1.933427561837456e-06, "loss": 0.2534, "step": 15130 }, { "epoch": 52.57, "learning_rate": 1.9320141342756183e-06, "loss": 0.2639, "step": 15140 }, { "epoch": 52.6, "learning_rate": 1.9306007067137807e-06, "loss": 0.2408, "step": 15150 }, { "epoch": 52.64, "learning_rate": 1.9291872791519435e-06, "loss": 0.2493, "step": 15160 }, { "epoch": 52.67, "learning_rate": 1.927773851590106e-06, "loss": 0.2729, "step": 15170 }, { "epoch": 52.71, "learning_rate": 1.9263604240282684e-06, "loss": 0.2708, "step": 15180 }, { "epoch": 52.74, "learning_rate": 1.924946996466431e-06, "loss": 0.2759, "step": 15190 }, { "epoch": 52.78, "learning_rate": 1.9235335689045936e-06, "loss": 0.254, "step": 15200 }, { "epoch": 52.81, "learning_rate": 1.922120141342756e-06, "loss": 0.2598, "step": 15210 }, { "epoch": 52.85, "learning_rate": 1.9207067137809184e-06, "loss": 0.2672, "step": 15220 }, { "epoch": 52.88, "learning_rate": 1.9192932862190812e-06, "loss": 0.2436, "step": 15230 }, { "epoch": 52.91, "learning_rate": 1.9178798586572437e-06, "loss": 0.2741, "step": 15240 }, { "epoch": 52.95, "learning_rate": 1.916466431095406e-06, "loss": 0.2601, "step": 15250 }, { "epoch": 52.98, "learning_rate": 1.915053003533569e-06, "loss": 0.2888, "step": 15260 }, { "epoch": 53.0, "eval_loss": 0.5042588114738464, "eval_runtime": 133.2498, "eval_samples_per_second": 3.993, "eval_steps_per_second": 0.998, "eval_wer": 0.19746737802918302, "step": 15264 }, { "epoch": 53.02, "learning_rate": 1.9136395759717313e-06, "loss": 0.2853, "step": 15270 }, { "epoch": 53.06, "learning_rate": 1.9122261484098937e-06, "loss": 0.2504, "step": 15280 }, { "epoch": 53.09, "learning_rate": 1.9108127208480565e-06, "loss": 0.2608, "step": 15290 }, { "epoch": 53.12, "learning_rate": 1.909399293286219e-06, "loss": 0.2486, "step": 15300 }, { "epoch": 53.16, "learning_rate": 1.9079858657243814e-06, "loss": 0.2576, "step": 15310 }, { "epoch": 53.19, "learning_rate": 1.906572438162544e-06, "loss": 0.2678, "step": 15320 }, { "epoch": 53.23, "learning_rate": 1.9051590106007068e-06, "loss": 0.271, "step": 15330 }, { "epoch": 53.26, "learning_rate": 1.903745583038869e-06, "loss": 0.2528, "step": 15340 }, { "epoch": 53.3, "learning_rate": 1.9023321554770316e-06, "loss": 0.2786, "step": 15350 }, { "epoch": 53.33, "learning_rate": 1.9009187279151943e-06, "loss": 0.2634, "step": 15360 }, { "epoch": 53.37, "learning_rate": 1.8995053003533567e-06, "loss": 0.2764, "step": 15370 }, { "epoch": 53.4, "learning_rate": 1.8980918727915193e-06, "loss": 0.2592, "step": 15380 }, { "epoch": 53.44, "learning_rate": 1.8966784452296817e-06, "loss": 0.2503, "step": 15390 }, { "epoch": 53.47, "learning_rate": 1.8952650176678443e-06, "loss": 0.2712, "step": 15400 }, { "epoch": 53.51, "learning_rate": 1.893851590106007e-06, "loss": 0.2914, "step": 15410 }, { "epoch": 53.54, "learning_rate": 1.8924381625441694e-06, "loss": 0.2474, "step": 15420 }, { "epoch": 53.57, "learning_rate": 1.891024734982332e-06, "loss": 0.2733, "step": 15430 }, { "epoch": 53.61, "learning_rate": 1.8896113074204946e-06, "loss": 0.2511, "step": 15440 }, { "epoch": 53.64, "learning_rate": 1.888197879858657e-06, "loss": 0.2564, "step": 15450 }, { "epoch": 53.68, "learning_rate": 1.8867844522968196e-06, "loss": 0.2475, "step": 15460 }, { "epoch": 53.71, "learning_rate": 1.8853710247349823e-06, "loss": 0.2616, "step": 15470 }, { "epoch": 53.75, "learning_rate": 1.8839575971731447e-06, "loss": 0.2788, "step": 15480 }, { "epoch": 53.78, "learning_rate": 1.8825441696113073e-06, "loss": 0.2476, "step": 15490 }, { "epoch": 53.82, "learning_rate": 1.88113074204947e-06, "loss": 0.2713, "step": 15500 }, { "epoch": 53.85, "learning_rate": 1.8797173144876323e-06, "loss": 0.2638, "step": 15510 }, { "epoch": 53.89, "learning_rate": 1.878303886925795e-06, "loss": 0.2478, "step": 15520 }, { "epoch": 53.92, "learning_rate": 1.8768904593639573e-06, "loss": 0.2535, "step": 15530 }, { "epoch": 53.96, "learning_rate": 1.87547703180212e-06, "loss": 0.2804, "step": 15540 }, { "epoch": 53.99, "learning_rate": 1.8740636042402826e-06, "loss": 0.2778, "step": 15550 }, { "epoch": 54.0, "eval_loss": 0.5110978484153748, "eval_runtime": 133.5788, "eval_samples_per_second": 3.983, "eval_steps_per_second": 0.996, "eval_wer": 0.19804589573825288, "step": 15552 }, { "epoch": 54.03, "learning_rate": 1.872650176678445e-06, "loss": 0.2538, "step": 15560 }, { "epoch": 54.06, "learning_rate": 1.8712367491166076e-06, "loss": 0.2607, "step": 15570 }, { "epoch": 54.1, "learning_rate": 1.8698233215547702e-06, "loss": 0.2557, "step": 15580 }, { "epoch": 54.13, "learning_rate": 1.8684098939929326e-06, "loss": 0.2918, "step": 15590 }, { "epoch": 54.17, "learning_rate": 1.8669964664310953e-06, "loss": 0.3063, "step": 15600 }, { "epoch": 54.2, "learning_rate": 1.8655830388692579e-06, "loss": 0.2604, "step": 15610 }, { "epoch": 54.24, "learning_rate": 1.8641696113074203e-06, "loss": 0.263, "step": 15620 }, { "epoch": 54.27, "learning_rate": 1.862756183745583e-06, "loss": 0.2506, "step": 15630 }, { "epoch": 54.3, "learning_rate": 1.8613427561837455e-06, "loss": 0.271, "step": 15640 }, { "epoch": 54.34, "learning_rate": 1.859929328621908e-06, "loss": 0.2591, "step": 15650 }, { "epoch": 54.37, "learning_rate": 1.8585159010600706e-06, "loss": 0.2762, "step": 15660 }, { "epoch": 54.41, "learning_rate": 1.8571024734982332e-06, "loss": 0.2877, "step": 15670 }, { "epoch": 54.44, "learning_rate": 1.8556890459363956e-06, "loss": 0.2491, "step": 15680 }, { "epoch": 54.48, "learning_rate": 1.8542756183745582e-06, "loss": 0.2738, "step": 15690 }, { "epoch": 54.51, "learning_rate": 1.8528621908127206e-06, "loss": 0.2679, "step": 15700 }, { "epoch": 54.55, "learning_rate": 1.8514487632508833e-06, "loss": 0.2627, "step": 15710 }, { "epoch": 54.58, "learning_rate": 1.8500353356890459e-06, "loss": 0.2609, "step": 15720 }, { "epoch": 54.62, "learning_rate": 1.8486219081272083e-06, "loss": 0.2451, "step": 15730 }, { "epoch": 54.65, "learning_rate": 1.847208480565371e-06, "loss": 0.2622, "step": 15740 }, { "epoch": 54.69, "learning_rate": 1.8457950530035335e-06, "loss": 0.2716, "step": 15750 }, { "epoch": 54.72, "learning_rate": 1.844381625441696e-06, "loss": 0.2604, "step": 15760 }, { "epoch": 54.75, "learning_rate": 1.8429681978798586e-06, "loss": 0.2488, "step": 15770 }, { "epoch": 54.79, "learning_rate": 1.8415547703180212e-06, "loss": 0.2716, "step": 15780 }, { "epoch": 54.82, "learning_rate": 1.8401413427561836e-06, "loss": 0.2795, "step": 15790 }, { "epoch": 54.86, "learning_rate": 1.8387279151943462e-06, "loss": 0.2662, "step": 15800 }, { "epoch": 54.89, "learning_rate": 1.8373144876325088e-06, "loss": 0.2475, "step": 15810 }, { "epoch": 54.93, "learning_rate": 1.8359010600706712e-06, "loss": 0.2695, "step": 15820 }, { "epoch": 54.96, "learning_rate": 1.8344876325088339e-06, "loss": 0.2605, "step": 15830 }, { "epoch": 55.0, "learning_rate": 1.8330742049469965e-06, "loss": 0.2707, "step": 15840 }, { "epoch": 55.0, "eval_loss": 0.5116538405418396, "eval_runtime": 133.5286, "eval_samples_per_second": 3.984, "eval_steps_per_second": 0.996, "eval_wer": 0.19946005013820145, "step": 15840 }, { "epoch": 55.03, "learning_rate": 1.831660777385159e-06, "loss": 0.2439, "step": 15850 }, { "epoch": 55.07, "learning_rate": 1.8302473498233215e-06, "loss": 0.2534, "step": 15860 }, { "epoch": 55.1, "learning_rate": 1.828833922261484e-06, "loss": 0.2465, "step": 15870 }, { "epoch": 55.14, "learning_rate": 1.8274204946996465e-06, "loss": 0.2705, "step": 15880 }, { "epoch": 55.17, "learning_rate": 1.8260070671378092e-06, "loss": 0.2686, "step": 15890 }, { "epoch": 55.21, "learning_rate": 1.8245936395759716e-06, "loss": 0.2646, "step": 15900 }, { "epoch": 55.24, "learning_rate": 1.8231802120141342e-06, "loss": 0.2688, "step": 15910 }, { "epoch": 55.28, "learning_rate": 1.8217667844522968e-06, "loss": 0.2504, "step": 15920 }, { "epoch": 55.31, "learning_rate": 1.8203533568904592e-06, "loss": 0.2696, "step": 15930 }, { "epoch": 55.35, "learning_rate": 1.8189399293286219e-06, "loss": 0.2634, "step": 15940 }, { "epoch": 55.38, "learning_rate": 1.8175265017667845e-06, "loss": 0.281, "step": 15950 }, { "epoch": 55.42, "learning_rate": 1.8161130742049469e-06, "loss": 0.2617, "step": 15960 }, { "epoch": 55.45, "learning_rate": 1.8146996466431095e-06, "loss": 0.2631, "step": 15970 }, { "epoch": 55.48, "learning_rate": 1.8132862190812721e-06, "loss": 0.2646, "step": 15980 }, { "epoch": 55.52, "learning_rate": 1.8118727915194345e-06, "loss": 0.2597, "step": 15990 }, { "epoch": 55.55, "learning_rate": 1.8104593639575972e-06, "loss": 0.2723, "step": 16000 }, { "epoch": 55.59, "learning_rate": 1.8090459363957596e-06, "loss": 0.2507, "step": 16010 }, { "epoch": 55.62, "learning_rate": 1.8076325088339222e-06, "loss": 0.2457, "step": 16020 }, { "epoch": 55.66, "learning_rate": 1.8062190812720848e-06, "loss": 0.2963, "step": 16030 }, { "epoch": 55.69, "learning_rate": 1.8048056537102472e-06, "loss": 0.2469, "step": 16040 }, { "epoch": 55.73, "learning_rate": 1.8033922261484098e-06, "loss": 0.2333, "step": 16050 }, { "epoch": 55.76, "learning_rate": 1.8019787985865725e-06, "loss": 0.2694, "step": 16060 }, { "epoch": 55.8, "learning_rate": 1.8005653710247349e-06, "loss": 0.2568, "step": 16070 }, { "epoch": 55.83, "learning_rate": 1.7991519434628975e-06, "loss": 0.277, "step": 16080 }, { "epoch": 55.87, "learning_rate": 1.7977385159010601e-06, "loss": 0.2871, "step": 16090 }, { "epoch": 55.9, "learning_rate": 1.7963250883392225e-06, "loss": 0.2669, "step": 16100 }, { "epoch": 55.94, "learning_rate": 1.7949116607773851e-06, "loss": 0.2684, "step": 16110 }, { "epoch": 55.97, "learning_rate": 1.7934982332155478e-06, "loss": 0.2566, "step": 16120 }, { "epoch": 56.0, "eval_loss": 0.5196597576141357, "eval_runtime": 133.3522, "eval_samples_per_second": 3.989, "eval_steps_per_second": 0.997, "eval_wer": 0.20023140708362794, "step": 16128 }, { "epoch": 56.01, "learning_rate": 1.7920848056537102e-06, "loss": 0.2742, "step": 16130 }, { "epoch": 56.04, "learning_rate": 1.7906713780918728e-06, "loss": 0.2635, "step": 16140 }, { "epoch": 56.08, "learning_rate": 1.7892579505300354e-06, "loss": 0.263, "step": 16150 }, { "epoch": 56.11, "learning_rate": 1.7878445229681978e-06, "loss": 0.2578, "step": 16160 }, { "epoch": 56.15, "learning_rate": 1.7864310954063604e-06, "loss": 0.26, "step": 16170 }, { "epoch": 56.18, "learning_rate": 1.7850176678445229e-06, "loss": 0.2523, "step": 16180 }, { "epoch": 56.21, "learning_rate": 1.7836042402826855e-06, "loss": 0.2663, "step": 16190 }, { "epoch": 56.25, "learning_rate": 1.782190812720848e-06, "loss": 0.2493, "step": 16200 }, { "epoch": 56.28, "learning_rate": 1.7807773851590105e-06, "loss": 0.2407, "step": 16210 }, { "epoch": 56.32, "learning_rate": 1.7793639575971731e-06, "loss": 0.2565, "step": 16220 }, { "epoch": 56.35, "learning_rate": 1.7779505300353358e-06, "loss": 0.2673, "step": 16230 }, { "epoch": 56.39, "learning_rate": 1.7765371024734982e-06, "loss": 0.2487, "step": 16240 }, { "epoch": 56.42, "learning_rate": 1.7751236749116608e-06, "loss": 0.2539, "step": 16250 }, { "epoch": 56.46, "learning_rate": 1.7737102473498234e-06, "loss": 0.267, "step": 16260 }, { "epoch": 56.49, "learning_rate": 1.7722968197879858e-06, "loss": 0.2649, "step": 16270 }, { "epoch": 56.53, "learning_rate": 1.7708833922261484e-06, "loss": 0.2514, "step": 16280 }, { "epoch": 56.56, "learning_rate": 1.769469964664311e-06, "loss": 0.2652, "step": 16290 }, { "epoch": 56.6, "learning_rate": 1.7680565371024735e-06, "loss": 0.2702, "step": 16300 }, { "epoch": 56.63, "learning_rate": 1.766643109540636e-06, "loss": 0.2674, "step": 16310 }, { "epoch": 56.66, "learning_rate": 1.7652296819787985e-06, "loss": 0.3018, "step": 16320 }, { "epoch": 56.7, "learning_rate": 1.7638162544169611e-06, "loss": 0.2583, "step": 16330 }, { "epoch": 56.73, "learning_rate": 1.7624028268551237e-06, "loss": 0.262, "step": 16340 }, { "epoch": 56.77, "learning_rate": 1.7609893992932861e-06, "loss": 0.2863, "step": 16350 }, { "epoch": 56.8, "learning_rate": 1.7595759717314488e-06, "loss": 0.2632, "step": 16360 }, { "epoch": 56.84, "learning_rate": 1.7581625441696114e-06, "loss": 0.2861, "step": 16370 }, { "epoch": 56.87, "learning_rate": 1.7567491166077738e-06, "loss": 0.2588, "step": 16380 }, { "epoch": 56.91, "learning_rate": 1.7553356890459364e-06, "loss": 0.2594, "step": 16390 }, { "epoch": 56.94, "learning_rate": 1.753922261484099e-06, "loss": 0.2593, "step": 16400 }, { "epoch": 56.98, "learning_rate": 1.7525088339222612e-06, "loss": 0.2517, "step": 16410 }, { "epoch": 57.0, "eval_loss": 0.5210915803909302, "eval_runtime": 133.6955, "eval_samples_per_second": 3.979, "eval_steps_per_second": 0.995, "eval_wer": 0.19766021726553962, "step": 16416 }, { "epoch": 57.01, "learning_rate": 1.7510954063604239e-06, "loss": 0.2697, "step": 16420 }, { "epoch": 57.05, "learning_rate": 1.7496819787985865e-06, "loss": 0.2594, "step": 16430 }, { "epoch": 57.08, "learning_rate": 1.7482685512367489e-06, "loss": 0.255, "step": 16440 }, { "epoch": 57.12, "learning_rate": 1.7468551236749115e-06, "loss": 0.2831, "step": 16450 }, { "epoch": 57.15, "learning_rate": 1.7454416961130741e-06, "loss": 0.2727, "step": 16460 }, { "epoch": 57.19, "learning_rate": 1.7440282685512365e-06, "loss": 0.2516, "step": 16470 }, { "epoch": 57.22, "learning_rate": 1.7426148409893992e-06, "loss": 0.2602, "step": 16480 }, { "epoch": 57.26, "learning_rate": 1.7412014134275616e-06, "loss": 0.2567, "step": 16490 }, { "epoch": 57.29, "learning_rate": 1.7397879858657242e-06, "loss": 0.2625, "step": 16500 }, { "epoch": 57.33, "learning_rate": 1.7383745583038868e-06, "loss": 0.2711, "step": 16510 }, { "epoch": 57.36, "learning_rate": 1.7369611307420492e-06, "loss": 0.2688, "step": 16520 }, { "epoch": 57.39, "learning_rate": 1.7355477031802119e-06, "loss": 0.2677, "step": 16530 }, { "epoch": 57.43, "learning_rate": 1.7341342756183745e-06, "loss": 0.2636, "step": 16540 }, { "epoch": 57.46, "learning_rate": 1.7327208480565369e-06, "loss": 0.2531, "step": 16550 }, { "epoch": 57.5, "learning_rate": 1.7313074204946995e-06, "loss": 0.2769, "step": 16560 }, { "epoch": 57.53, "learning_rate": 1.7298939929328621e-06, "loss": 0.2666, "step": 16570 }, { "epoch": 57.57, "learning_rate": 1.7284805653710245e-06, "loss": 0.2544, "step": 16580 }, { "epoch": 57.6, "learning_rate": 1.7270671378091872e-06, "loss": 0.2544, "step": 16590 }, { "epoch": 57.64, "learning_rate": 1.7256537102473498e-06, "loss": 0.2738, "step": 16600 }, { "epoch": 57.67, "learning_rate": 1.7242402826855122e-06, "loss": 0.274, "step": 16610 }, { "epoch": 57.71, "learning_rate": 1.7228268551236748e-06, "loss": 0.2501, "step": 16620 }, { "epoch": 57.74, "learning_rate": 1.7214134275618372e-06, "loss": 0.2516, "step": 16630 }, { "epoch": 57.78, "learning_rate": 1.7199999999999998e-06, "loss": 0.2444, "step": 16640 }, { "epoch": 57.81, "learning_rate": 1.7185865724381625e-06, "loss": 0.2728, "step": 16650 }, { "epoch": 57.85, "learning_rate": 1.7171731448763249e-06, "loss": 0.2628, "step": 16660 }, { "epoch": 57.88, "learning_rate": 1.7157597173144875e-06, "loss": 0.2577, "step": 16670 }, { "epoch": 57.91, "learning_rate": 1.7143462897526501e-06, "loss": 0.2769, "step": 16680 }, { "epoch": 57.95, "learning_rate": 1.7129328621908125e-06, "loss": 0.2379, "step": 16690 }, { "epoch": 57.98, "learning_rate": 1.7115194346289751e-06, "loss": 0.2629, "step": 16700 }, { "epoch": 58.0, "eval_loss": 0.5079585313796997, "eval_runtime": 133.0035, "eval_samples_per_second": 4.0, "eval_steps_per_second": 1.0, "eval_wer": 0.19856013370187053, "step": 16704 }, { "epoch": 58.02, "learning_rate": 1.7101060070671378e-06, "loss": 0.2771, "step": 16710 }, { "epoch": 58.06, "learning_rate": 1.7086925795053002e-06, "loss": 0.2628, "step": 16720 }, { "epoch": 58.09, "learning_rate": 1.7072791519434628e-06, "loss": 0.278, "step": 16730 }, { "epoch": 58.12, "learning_rate": 1.7058657243816254e-06, "loss": 0.2515, "step": 16740 }, { "epoch": 58.16, "learning_rate": 1.7044522968197878e-06, "loss": 0.2736, "step": 16750 }, { "epoch": 58.19, "learning_rate": 1.7030388692579504e-06, "loss": 0.263, "step": 16760 }, { "epoch": 58.23, "learning_rate": 1.701625441696113e-06, "loss": 0.2649, "step": 16770 }, { "epoch": 58.26, "learning_rate": 1.7002120141342755e-06, "loss": 0.2387, "step": 16780 }, { "epoch": 58.3, "learning_rate": 1.698798586572438e-06, "loss": 0.2654, "step": 16790 }, { "epoch": 58.33, "learning_rate": 1.6973851590106005e-06, "loss": 0.2658, "step": 16800 }, { "epoch": 58.37, "learning_rate": 1.6959717314487631e-06, "loss": 0.2685, "step": 16810 }, { "epoch": 58.4, "learning_rate": 1.6945583038869258e-06, "loss": 0.2531, "step": 16820 }, { "epoch": 58.44, "learning_rate": 1.6931448763250882e-06, "loss": 0.2577, "step": 16830 }, { "epoch": 58.47, "learning_rate": 1.6917314487632508e-06, "loss": 0.2636, "step": 16840 }, { "epoch": 58.51, "learning_rate": 1.6903180212014134e-06, "loss": 0.2856, "step": 16850 }, { "epoch": 58.54, "learning_rate": 1.6889045936395758e-06, "loss": 0.2475, "step": 16860 }, { "epoch": 58.57, "learning_rate": 1.6874911660777384e-06, "loss": 0.2671, "step": 16870 }, { "epoch": 58.61, "learning_rate": 1.686077738515901e-06, "loss": 0.2512, "step": 16880 }, { "epoch": 58.64, "learning_rate": 1.6846643109540635e-06, "loss": 0.2786, "step": 16890 }, { "epoch": 58.68, "learning_rate": 1.683250883392226e-06, "loss": 0.2816, "step": 16900 }, { "epoch": 58.71, "learning_rate": 1.6818374558303887e-06, "loss": 0.2577, "step": 16910 }, { "epoch": 58.75, "learning_rate": 1.6804240282685511e-06, "loss": 0.2604, "step": 16920 }, { "epoch": 58.78, "learning_rate": 1.6790106007067137e-06, "loss": 0.2746, "step": 16930 }, { "epoch": 58.82, "learning_rate": 1.6775971731448761e-06, "loss": 0.269, "step": 16940 }, { "epoch": 58.85, "learning_rate": 1.6761837455830388e-06, "loss": 0.2399, "step": 16950 }, { "epoch": 58.89, "learning_rate": 1.6747703180212014e-06, "loss": 0.275, "step": 16960 }, { "epoch": 58.92, "learning_rate": 1.6733568904593638e-06, "loss": 0.2616, "step": 16970 }, { "epoch": 58.96, "learning_rate": 1.6719434628975264e-06, "loss": 0.2533, "step": 16980 }, { "epoch": 58.99, "learning_rate": 1.670530035335689e-06, "loss": 0.2787, "step": 16990 }, { "epoch": 59.0, "eval_loss": 0.5133015513420105, "eval_runtime": 133.197, "eval_samples_per_second": 3.994, "eval_steps_per_second": 0.999, "eval_wer": 0.19798161599280067, "step": 16992 }, { "epoch": 59.03, "learning_rate": 1.6691166077738515e-06, "loss": 0.2536, "step": 17000 }, { "epoch": 59.06, "learning_rate": 1.667703180212014e-06, "loss": 0.2524, "step": 17010 }, { "epoch": 59.1, "learning_rate": 1.6662897526501767e-06, "loss": 0.2374, "step": 17020 }, { "epoch": 59.13, "learning_rate": 1.664876325088339e-06, "loss": 0.2744, "step": 17030 }, { "epoch": 59.17, "learning_rate": 1.6634628975265017e-06, "loss": 0.2803, "step": 17040 }, { "epoch": 59.2, "learning_rate": 1.6620494699646643e-06, "loss": 0.2857, "step": 17050 }, { "epoch": 59.24, "learning_rate": 1.6606360424028268e-06, "loss": 0.2656, "step": 17060 }, { "epoch": 59.27, "learning_rate": 1.6592226148409894e-06, "loss": 0.2608, "step": 17070 }, { "epoch": 59.3, "learning_rate": 1.657809187279152e-06, "loss": 0.2826, "step": 17080 }, { "epoch": 59.34, "learning_rate": 1.6563957597173144e-06, "loss": 0.2972, "step": 17090 }, { "epoch": 59.37, "learning_rate": 1.654982332155477e-06, "loss": 0.2681, "step": 17100 }, { "epoch": 59.41, "learning_rate": 1.6535689045936394e-06, "loss": 0.2643, "step": 17110 }, { "epoch": 59.44, "learning_rate": 1.652155477031802e-06, "loss": 0.255, "step": 17120 }, { "epoch": 59.48, "learning_rate": 1.6507420494699647e-06, "loss": 0.2737, "step": 17130 }, { "epoch": 59.51, "learning_rate": 1.649328621908127e-06, "loss": 0.2642, "step": 17140 }, { "epoch": 59.55, "learning_rate": 1.6479151943462897e-06, "loss": 0.2459, "step": 17150 }, { "epoch": 59.58, "learning_rate": 1.6465017667844523e-06, "loss": 0.2693, "step": 17160 }, { "epoch": 59.62, "learning_rate": 1.6450883392226147e-06, "loss": 0.2648, "step": 17170 }, { "epoch": 59.65, "learning_rate": 1.6436749116607774e-06, "loss": 0.2467, "step": 17180 }, { "epoch": 59.69, "learning_rate": 1.64226148409894e-06, "loss": 0.2732, "step": 17190 }, { "epoch": 59.72, "learning_rate": 1.6408480565371024e-06, "loss": 0.2362, "step": 17200 }, { "epoch": 59.75, "learning_rate": 1.639434628975265e-06, "loss": 0.2591, "step": 17210 }, { "epoch": 59.79, "learning_rate": 1.6380212014134276e-06, "loss": 0.2481, "step": 17220 }, { "epoch": 59.82, "learning_rate": 1.63660777385159e-06, "loss": 0.2918, "step": 17230 }, { "epoch": 59.86, "learning_rate": 1.6351943462897527e-06, "loss": 0.2633, "step": 17240 }, { "epoch": 59.89, "learning_rate": 1.633780918727915e-06, "loss": 0.2691, "step": 17250 }, { "epoch": 59.93, "learning_rate": 1.6323674911660777e-06, "loss": 0.2457, "step": 17260 }, { "epoch": 59.96, "learning_rate": 1.6309540636042403e-06, "loss": 0.2563, "step": 17270 }, { "epoch": 60.0, "learning_rate": 1.6295406360424027e-06, "loss": 0.269, "step": 17280 }, { "epoch": 60.0, "eval_loss": 0.5155569314956665, "eval_runtime": 133.7176, "eval_samples_per_second": 3.979, "eval_steps_per_second": 0.995, "eval_wer": 0.1972745387928264, "step": 17280 }, { "epoch": 60.03, "learning_rate": 1.6281272084805654e-06, "loss": 0.2982, "step": 17290 }, { "epoch": 60.07, "learning_rate": 1.626713780918728e-06, "loss": 0.2651, "step": 17300 }, { "epoch": 60.1, "learning_rate": 1.6253003533568904e-06, "loss": 0.2533, "step": 17310 }, { "epoch": 60.14, "learning_rate": 1.623886925795053e-06, "loss": 0.2531, "step": 17320 }, { "epoch": 60.17, "learning_rate": 1.6224734982332156e-06, "loss": 0.2584, "step": 17330 }, { "epoch": 60.21, "learning_rate": 1.621060070671378e-06, "loss": 0.2649, "step": 17340 }, { "epoch": 60.24, "learning_rate": 1.6196466431095407e-06, "loss": 0.2601, "step": 17350 }, { "epoch": 60.28, "learning_rate": 1.6182332155477033e-06, "loss": 0.2509, "step": 17360 }, { "epoch": 60.31, "learning_rate": 1.6168197879858657e-06, "loss": 0.2647, "step": 17370 }, { "epoch": 60.35, "learning_rate": 1.6154063604240283e-06, "loss": 0.259, "step": 17380 }, { "epoch": 60.38, "learning_rate": 1.613992932862191e-06, "loss": 0.2466, "step": 17390 }, { "epoch": 60.42, "learning_rate": 1.6125795053003533e-06, "loss": 0.2568, "step": 17400 }, { "epoch": 60.45, "learning_rate": 1.611166077738516e-06, "loss": 0.2427, "step": 17410 }, { "epoch": 60.48, "learning_rate": 1.6097526501766784e-06, "loss": 0.265, "step": 17420 }, { "epoch": 60.52, "learning_rate": 1.608339222614841e-06, "loss": 0.2602, "step": 17430 }, { "epoch": 60.55, "learning_rate": 1.6069257950530036e-06, "loss": 0.2419, "step": 17440 }, { "epoch": 60.59, "learning_rate": 1.605512367491166e-06, "loss": 0.2363, "step": 17450 }, { "epoch": 60.62, "learning_rate": 1.6040989399293286e-06, "loss": 0.2614, "step": 17460 }, { "epoch": 60.66, "learning_rate": 1.6026855123674913e-06, "loss": 0.288, "step": 17470 }, { "epoch": 60.69, "learning_rate": 1.6012720848056535e-06, "loss": 0.2746, "step": 17480 }, { "epoch": 60.73, "learning_rate": 1.5998586572438163e-06, "loss": 0.2442, "step": 17490 }, { "epoch": 60.76, "learning_rate": 1.598445229681979e-06, "loss": 0.2789, "step": 17500 }, { "epoch": 60.8, "learning_rate": 1.5970318021201411e-06, "loss": 0.2478, "step": 17510 }, { "epoch": 60.83, "learning_rate": 1.5956183745583037e-06, "loss": 0.2833, "step": 17520 }, { "epoch": 60.87, "learning_rate": 1.5942049469964664e-06, "loss": 0.2829, "step": 17530 }, { "epoch": 60.9, "learning_rate": 1.5927915194346288e-06, "loss": 0.2482, "step": 17540 }, { "epoch": 60.94, "learning_rate": 1.5913780918727914e-06, "loss": 0.2772, "step": 17550 }, { "epoch": 60.97, "learning_rate": 1.5899646643109538e-06, "loss": 0.2664, "step": 17560 }, { "epoch": 61.0, "eval_loss": 0.5191646814346313, "eval_runtime": 133.5584, "eval_samples_per_second": 3.983, "eval_steps_per_second": 0.996, "eval_wer": 0.1948961882110947, "step": 17568 }, { "epoch": 61.01, "learning_rate": 1.5885512367491164e-06, "loss": 0.2819, "step": 17570 }, { "epoch": 61.04, "learning_rate": 1.587137809187279e-06, "loss": 0.2615, "step": 17580 }, { "epoch": 61.08, "learning_rate": 1.5857243816254414e-06, "loss": 0.2556, "step": 17590 }, { "epoch": 61.11, "learning_rate": 1.584310954063604e-06, "loss": 0.2771, "step": 17600 }, { "epoch": 61.15, "learning_rate": 1.5828975265017667e-06, "loss": 0.2854, "step": 17610 }, { "epoch": 61.18, "learning_rate": 1.581484098939929e-06, "loss": 0.2554, "step": 17620 }, { "epoch": 61.21, "learning_rate": 1.5800706713780917e-06, "loss": 0.2597, "step": 17630 }, { "epoch": 61.25, "learning_rate": 1.5786572438162543e-06, "loss": 0.2422, "step": 17640 }, { "epoch": 61.28, "learning_rate": 1.5772438162544168e-06, "loss": 0.268, "step": 17650 }, { "epoch": 61.32, "learning_rate": 1.5758303886925794e-06, "loss": 0.2665, "step": 17660 }, { "epoch": 61.35, "learning_rate": 1.574416961130742e-06, "loss": 0.2504, "step": 17670 }, { "epoch": 61.39, "learning_rate": 1.5730035335689044e-06, "loss": 0.256, "step": 17680 }, { "epoch": 61.42, "learning_rate": 1.571590106007067e-06, "loss": 0.2634, "step": 17690 }, { "epoch": 61.46, "learning_rate": 1.5701766784452296e-06, "loss": 0.2538, "step": 17700 }, { "epoch": 61.49, "learning_rate": 1.568763250883392e-06, "loss": 0.2518, "step": 17710 }, { "epoch": 61.53, "learning_rate": 1.5673498233215547e-06, "loss": 0.2623, "step": 17720 }, { "epoch": 61.56, "learning_rate": 1.565936395759717e-06, "loss": 0.2741, "step": 17730 }, { "epoch": 61.6, "learning_rate": 1.5645229681978797e-06, "loss": 0.2519, "step": 17740 }, { "epoch": 61.63, "learning_rate": 1.5631095406360423e-06, "loss": 0.2381, "step": 17750 }, { "epoch": 61.66, "learning_rate": 1.5616961130742047e-06, "loss": 0.26, "step": 17760 }, { "epoch": 61.7, "learning_rate": 1.5602826855123674e-06, "loss": 0.2751, "step": 17770 }, { "epoch": 61.73, "learning_rate": 1.55886925795053e-06, "loss": 0.2536, "step": 17780 }, { "epoch": 61.77, "learning_rate": 1.5574558303886924e-06, "loss": 0.2614, "step": 17790 }, { "epoch": 61.8, "learning_rate": 1.556042402826855e-06, "loss": 0.2669, "step": 17800 }, { "epoch": 61.84, "learning_rate": 1.5546289752650176e-06, "loss": 0.2653, "step": 17810 }, { "epoch": 61.87, "learning_rate": 1.55321554770318e-06, "loss": 0.2641, "step": 17820 }, { "epoch": 61.91, "learning_rate": 1.5518021201413427e-06, "loss": 0.267, "step": 17830 }, { "epoch": 61.94, "learning_rate": 1.5503886925795053e-06, "loss": 0.2447, "step": 17840 }, { "epoch": 61.98, "learning_rate": 1.5489752650176677e-06, "loss": 0.2605, "step": 17850 }, { "epoch": 62.0, "eval_loss": 0.5094706416130066, "eval_runtime": 133.5482, "eval_samples_per_second": 3.984, "eval_steps_per_second": 0.996, "eval_wer": 0.19701741981101756, "step": 17856 }, { "epoch": 62.01, "learning_rate": 1.5475618374558303e-06, "loss": 0.2882, "step": 17860 }, { "epoch": 62.05, "learning_rate": 1.5461484098939927e-06, "loss": 0.2536, "step": 17870 }, { "epoch": 62.08, "learning_rate": 1.5447349823321554e-06, "loss": 0.2642, "step": 17880 }, { "epoch": 62.12, "learning_rate": 1.543321554770318e-06, "loss": 0.2723, "step": 17890 }, { "epoch": 62.15, "learning_rate": 1.5419081272084804e-06, "loss": 0.2688, "step": 17900 }, { "epoch": 62.19, "learning_rate": 1.540494699646643e-06, "loss": 0.2406, "step": 17910 }, { "epoch": 62.22, "learning_rate": 1.5390812720848056e-06, "loss": 0.2617, "step": 17920 }, { "epoch": 62.26, "learning_rate": 1.537667844522968e-06, "loss": 0.259, "step": 17930 }, { "epoch": 62.29, "learning_rate": 1.5362544169611307e-06, "loss": 0.25, "step": 17940 }, { "epoch": 62.33, "learning_rate": 1.5348409893992933e-06, "loss": 0.2976, "step": 17950 }, { "epoch": 62.36, "learning_rate": 1.5334275618374557e-06, "loss": 0.2654, "step": 17960 }, { "epoch": 62.39, "learning_rate": 1.5320141342756183e-06, "loss": 0.2781, "step": 17970 }, { "epoch": 62.43, "learning_rate": 1.530600706713781e-06, "loss": 0.2588, "step": 17980 }, { "epoch": 62.46, "learning_rate": 1.5291872791519433e-06, "loss": 0.2336, "step": 17990 }, { "epoch": 62.5, "learning_rate": 1.527773851590106e-06, "loss": 0.2496, "step": 18000 }, { "epoch": 62.53, "learning_rate": 1.5263604240282686e-06, "loss": 0.2469, "step": 18010 }, { "epoch": 62.57, "learning_rate": 1.524946996466431e-06, "loss": 0.2624, "step": 18020 }, { "epoch": 62.6, "learning_rate": 1.5235335689045936e-06, "loss": 0.2382, "step": 18030 }, { "epoch": 62.64, "learning_rate": 1.522120141342756e-06, "loss": 0.2812, "step": 18040 }, { "epoch": 62.67, "learning_rate": 1.5207067137809186e-06, "loss": 0.2653, "step": 18050 }, { "epoch": 62.71, "learning_rate": 1.519434628975265e-06, "loss": 0.2644, "step": 18060 }, { "epoch": 62.74, "learning_rate": 1.5180212014134275e-06, "loss": 0.2725, "step": 18070 }, { "epoch": 62.78, "learning_rate": 1.5166077738515901e-06, "loss": 0.2444, "step": 18080 }, { "epoch": 62.81, "learning_rate": 1.5151943462897525e-06, "loss": 0.276, "step": 18090 }, { "epoch": 62.85, "learning_rate": 1.5137809187279152e-06, "loss": 0.2724, "step": 18100 }, { "epoch": 62.88, "learning_rate": 1.5123674911660778e-06, "loss": 0.2495, "step": 18110 }, { "epoch": 62.91, "learning_rate": 1.5109540636042402e-06, "loss": 0.2311, "step": 18120 }, { "epoch": 62.95, "learning_rate": 1.5095406360424028e-06, "loss": 0.2443, "step": 18130 }, { "epoch": 62.98, "learning_rate": 1.5081272084805654e-06, "loss": 0.2649, "step": 18140 }, { "epoch": 63.0, "eval_loss": 0.5149233937263489, "eval_runtime": 133.9576, "eval_samples_per_second": 3.971, "eval_steps_per_second": 0.993, "eval_wer": 0.19695314006556533, "step": 18144 }, { "epoch": 63.02, "learning_rate": 1.5067137809187279e-06, "loss": 0.2642, "step": 18150 }, { "epoch": 63.06, "learning_rate": 1.5053003533568905e-06, "loss": 0.2526, "step": 18160 }, { "epoch": 63.09, "learning_rate": 1.5038869257950529e-06, "loss": 0.2483, "step": 18170 }, { "epoch": 63.12, "learning_rate": 1.5024734982332155e-06, "loss": 0.2617, "step": 18180 }, { "epoch": 63.16, "learning_rate": 1.5010600706713781e-06, "loss": 0.2942, "step": 18190 }, { "epoch": 63.19, "learning_rate": 1.4996466431095405e-06, "loss": 0.2672, "step": 18200 }, { "epoch": 63.23, "learning_rate": 1.4982332155477032e-06, "loss": 0.2541, "step": 18210 }, { "epoch": 63.26, "learning_rate": 1.4968197879858658e-06, "loss": 0.2403, "step": 18220 }, { "epoch": 63.3, "learning_rate": 1.4954063604240282e-06, "loss": 0.2749, "step": 18230 }, { "epoch": 63.33, "learning_rate": 1.4939929328621908e-06, "loss": 0.2812, "step": 18240 }, { "epoch": 63.37, "learning_rate": 1.4925795053003534e-06, "loss": 0.2279, "step": 18250 }, { "epoch": 63.4, "learning_rate": 1.4911660777385158e-06, "loss": 0.2552, "step": 18260 }, { "epoch": 63.44, "learning_rate": 1.4897526501766785e-06, "loss": 0.2594, "step": 18270 }, { "epoch": 63.47, "learning_rate": 1.488339222614841e-06, "loss": 0.2593, "step": 18280 }, { "epoch": 63.51, "learning_rate": 1.4869257950530035e-06, "loss": 0.2681, "step": 18290 }, { "epoch": 63.54, "learning_rate": 1.4855123674911661e-06, "loss": 0.239, "step": 18300 }, { "epoch": 63.57, "learning_rate": 1.4840989399293287e-06, "loss": 0.2505, "step": 18310 }, { "epoch": 63.61, "learning_rate": 1.4826855123674911e-06, "loss": 0.2526, "step": 18320 }, { "epoch": 63.64, "learning_rate": 1.4812720848056538e-06, "loss": 0.2672, "step": 18330 }, { "epoch": 63.68, "learning_rate": 1.4798586572438162e-06, "loss": 0.2715, "step": 18340 }, { "epoch": 63.71, "learning_rate": 1.4784452296819788e-06, "loss": 0.2519, "step": 18350 }, { "epoch": 63.75, "learning_rate": 1.4770318021201414e-06, "loss": 0.2712, "step": 18360 }, { "epoch": 63.78, "learning_rate": 1.4756183745583038e-06, "loss": 0.2385, "step": 18370 }, { "epoch": 63.82, "learning_rate": 1.4742049469964664e-06, "loss": 0.2732, "step": 18380 }, { "epoch": 63.85, "learning_rate": 1.472791519434629e-06, "loss": 0.2835, "step": 18390 }, { "epoch": 63.89, "learning_rate": 1.4713780918727915e-06, "loss": 0.2812, "step": 18400 }, { "epoch": 63.92, "learning_rate": 1.469964664310954e-06, "loss": 0.2488, "step": 18410 }, { "epoch": 63.96, "learning_rate": 1.4685512367491167e-06, "loss": 0.2607, "step": 18420 }, { "epoch": 63.99, "learning_rate": 1.4671378091872791e-06, "loss": 0.246, "step": 18430 }, { "epoch": 64.0, "eval_loss": 0.5164635181427002, "eval_runtime": 134.1849, "eval_samples_per_second": 3.965, "eval_steps_per_second": 0.991, "eval_wer": 0.19753165777463522, "step": 18432 }, { "epoch": 64.03, "learning_rate": 1.4657243816254418e-06, "loss": 0.2641, "step": 18440 }, { "epoch": 64.06, "learning_rate": 1.4643109540636044e-06, "loss": 0.268, "step": 18450 }, { "epoch": 64.1, "learning_rate": 1.4628975265017666e-06, "loss": 0.2544, "step": 18460 }, { "epoch": 64.13, "learning_rate": 1.4614840989399294e-06, "loss": 0.299, "step": 18470 }, { "epoch": 64.17, "learning_rate": 1.4600706713780916e-06, "loss": 0.27, "step": 18480 }, { "epoch": 64.2, "learning_rate": 1.4586572438162542e-06, "loss": 0.2475, "step": 18490 }, { "epoch": 64.24, "learning_rate": 1.4572438162544168e-06, "loss": 0.262, "step": 18500 }, { "epoch": 64.27, "learning_rate": 1.4558303886925793e-06, "loss": 0.2591, "step": 18510 }, { "epoch": 64.3, "learning_rate": 1.4544169611307419e-06, "loss": 0.2448, "step": 18520 }, { "epoch": 64.34, "learning_rate": 1.4530035335689045e-06, "loss": 0.263, "step": 18530 }, { "epoch": 64.37, "learning_rate": 1.451590106007067e-06, "loss": 0.2527, "step": 18540 }, { "epoch": 64.41, "learning_rate": 1.4501766784452295e-06, "loss": 0.2668, "step": 18550 }, { "epoch": 64.44, "learning_rate": 1.4487632508833921e-06, "loss": 0.2316, "step": 18560 }, { "epoch": 64.48, "learning_rate": 1.4473498233215546e-06, "loss": 0.2757, "step": 18570 }, { "epoch": 64.51, "learning_rate": 1.4459363957597172e-06, "loss": 0.2749, "step": 18580 }, { "epoch": 64.55, "learning_rate": 1.4445229681978798e-06, "loss": 0.2537, "step": 18590 }, { "epoch": 64.58, "learning_rate": 1.4431095406360422e-06, "loss": 0.2663, "step": 18600 }, { "epoch": 64.62, "learning_rate": 1.4416961130742048e-06, "loss": 0.2525, "step": 18610 }, { "epoch": 64.65, "learning_rate": 1.4402826855123675e-06, "loss": 0.2669, "step": 18620 }, { "epoch": 64.69, "learning_rate": 1.4388692579505299e-06, "loss": 0.2724, "step": 18630 }, { "epoch": 64.72, "learning_rate": 1.4374558303886925e-06, "loss": 0.2506, "step": 18640 }, { "epoch": 64.75, "learning_rate": 1.4360424028268549e-06, "loss": 0.2458, "step": 18650 }, { "epoch": 64.79, "learning_rate": 1.4346289752650175e-06, "loss": 0.2545, "step": 18660 }, { "epoch": 64.82, "learning_rate": 1.4332155477031801e-06, "loss": 0.2623, "step": 18670 }, { "epoch": 64.86, "learning_rate": 1.4318021201413425e-06, "loss": 0.2512, "step": 18680 }, { "epoch": 64.89, "learning_rate": 1.4303886925795052e-06, "loss": 0.2394, "step": 18690 }, { "epoch": 64.93, "learning_rate": 1.4289752650176678e-06, "loss": 0.2602, "step": 18700 }, { "epoch": 64.96, "learning_rate": 1.4275618374558302e-06, "loss": 0.2483, "step": 18710 }, { "epoch": 65.0, "learning_rate": 1.4261484098939928e-06, "loss": 0.2567, "step": 18720 }, { "epoch": 65.0, "eval_loss": 0.5072118043899536, "eval_runtime": 134.0915, "eval_samples_per_second": 3.967, "eval_steps_per_second": 0.992, "eval_wer": 0.19811017548370508, "step": 18720 }, { "epoch": 65.03, "learning_rate": 1.4247349823321554e-06, "loss": 0.2677, "step": 18730 }, { "epoch": 65.07, "learning_rate": 1.4233215547703178e-06, "loss": 0.2524, "step": 18740 }, { "epoch": 65.1, "learning_rate": 1.4219081272084805e-06, "loss": 0.2628, "step": 18750 }, { "epoch": 65.14, "learning_rate": 1.420494699646643e-06, "loss": 0.2743, "step": 18760 }, { "epoch": 65.17, "learning_rate": 1.4190812720848055e-06, "loss": 0.2692, "step": 18770 }, { "epoch": 65.21, "learning_rate": 1.4176678445229681e-06, "loss": 0.2551, "step": 18780 }, { "epoch": 65.24, "learning_rate": 1.4162544169611305e-06, "loss": 0.2416, "step": 18790 }, { "epoch": 65.28, "learning_rate": 1.4148409893992932e-06, "loss": 0.2516, "step": 18800 }, { "epoch": 65.31, "learning_rate": 1.4134275618374558e-06, "loss": 0.2842, "step": 18810 }, { "epoch": 65.35, "learning_rate": 1.4120141342756182e-06, "loss": 0.263, "step": 18820 }, { "epoch": 65.38, "learning_rate": 1.4106007067137808e-06, "loss": 0.2531, "step": 18830 }, { "epoch": 65.42, "learning_rate": 1.4091872791519434e-06, "loss": 0.2536, "step": 18840 }, { "epoch": 65.45, "learning_rate": 1.4077738515901058e-06, "loss": 0.2741, "step": 18850 }, { "epoch": 65.48, "learning_rate": 1.4063604240282685e-06, "loss": 0.2675, "step": 18860 }, { "epoch": 65.52, "learning_rate": 1.404946996466431e-06, "loss": 0.2597, "step": 18870 }, { "epoch": 65.55, "learning_rate": 1.4035335689045935e-06, "loss": 0.259, "step": 18880 }, { "epoch": 65.59, "learning_rate": 1.4021201413427561e-06, "loss": 0.2586, "step": 18890 }, { "epoch": 65.62, "learning_rate": 1.4007067137809187e-06, "loss": 0.2473, "step": 18900 }, { "epoch": 65.66, "learning_rate": 1.3992932862190811e-06, "loss": 0.2679, "step": 18910 }, { "epoch": 65.69, "learning_rate": 1.3978798586572438e-06, "loss": 0.2429, "step": 18920 }, { "epoch": 65.73, "learning_rate": 1.3964664310954064e-06, "loss": 0.2521, "step": 18930 }, { "epoch": 65.76, "learning_rate": 1.3950530035335688e-06, "loss": 0.2651, "step": 18940 }, { "epoch": 65.8, "learning_rate": 1.3936395759717314e-06, "loss": 0.243, "step": 18950 }, { "epoch": 65.83, "learning_rate": 1.3922261484098938e-06, "loss": 0.26, "step": 18960 }, { "epoch": 65.87, "learning_rate": 1.3908127208480564e-06, "loss": 0.2509, "step": 18970 }, { "epoch": 65.9, "learning_rate": 1.389399293286219e-06, "loss": 0.2528, "step": 18980 }, { "epoch": 65.94, "learning_rate": 1.3879858657243815e-06, "loss": 0.2602, "step": 18990 }, { "epoch": 65.97, "learning_rate": 1.386572438162544e-06, "loss": 0.2509, "step": 19000 }, { "epoch": 66.0, "eval_loss": 0.5061087012290955, "eval_runtime": 133.4932, "eval_samples_per_second": 3.985, "eval_steps_per_second": 0.996, "eval_wer": 0.19778877675644405, "step": 19008 }, { "epoch": 66.01, "learning_rate": 1.3851590106007067e-06, "loss": 0.2801, "step": 19010 }, { "epoch": 66.04, "learning_rate": 1.3837455830388691e-06, "loss": 0.256, "step": 19020 }, { "epoch": 66.08, "learning_rate": 1.3823321554770318e-06, "loss": 0.2356, "step": 19030 }, { "epoch": 66.11, "learning_rate": 1.3809187279151944e-06, "loss": 0.2594, "step": 19040 }, { "epoch": 66.15, "learning_rate": 1.3795053003533568e-06, "loss": 0.2468, "step": 19050 }, { "epoch": 66.18, "learning_rate": 1.3780918727915194e-06, "loss": 0.2661, "step": 19060 }, { "epoch": 66.21, "learning_rate": 1.376678445229682e-06, "loss": 0.2664, "step": 19070 }, { "epoch": 66.25, "learning_rate": 1.3752650176678444e-06, "loss": 0.266, "step": 19080 }, { "epoch": 66.28, "learning_rate": 1.373851590106007e-06, "loss": 0.2531, "step": 19090 }, { "epoch": 66.32, "learning_rate": 1.3724381625441695e-06, "loss": 0.2631, "step": 19100 }, { "epoch": 66.35, "learning_rate": 1.371024734982332e-06, "loss": 0.2732, "step": 19110 }, { "epoch": 66.39, "learning_rate": 1.3696113074204947e-06, "loss": 0.2584, "step": 19120 }, { "epoch": 66.42, "learning_rate": 1.3681978798586571e-06, "loss": 0.2374, "step": 19130 }, { "epoch": 66.46, "learning_rate": 1.3667844522968197e-06, "loss": 0.2653, "step": 19140 }, { "epoch": 66.49, "learning_rate": 1.3653710247349824e-06, "loss": 0.2614, "step": 19150 }, { "epoch": 66.53, "learning_rate": 1.3639575971731448e-06, "loss": 0.2625, "step": 19160 }, { "epoch": 66.56, "learning_rate": 1.3625441696113074e-06, "loss": 0.2558, "step": 19170 }, { "epoch": 66.6, "learning_rate": 1.36113074204947e-06, "loss": 0.2759, "step": 19180 }, { "epoch": 66.63, "learning_rate": 1.3597173144876324e-06, "loss": 0.238, "step": 19190 }, { "epoch": 66.66, "learning_rate": 1.358303886925795e-06, "loss": 0.2661, "step": 19200 }, { "epoch": 66.7, "learning_rate": 1.3568904593639577e-06, "loss": 0.2439, "step": 19210 }, { "epoch": 66.73, "learning_rate": 1.35547703180212e-06, "loss": 0.251, "step": 19220 }, { "epoch": 66.77, "learning_rate": 1.3540636042402827e-06, "loss": 0.2693, "step": 19230 }, { "epoch": 66.8, "learning_rate": 1.3526501766784453e-06, "loss": 0.2361, "step": 19240 }, { "epoch": 66.84, "learning_rate": 1.3512367491166077e-06, "loss": 0.2761, "step": 19250 }, { "epoch": 66.87, "learning_rate": 1.3498233215547703e-06, "loss": 0.2546, "step": 19260 }, { "epoch": 66.91, "learning_rate": 1.3484098939929328e-06, "loss": 0.251, "step": 19270 }, { "epoch": 66.94, "learning_rate": 1.3469964664310954e-06, "loss": 0.2381, "step": 19280 }, { "epoch": 66.98, "learning_rate": 1.345583038869258e-06, "loss": 0.289, "step": 19290 }, { "epoch": 67.0, "eval_loss": 0.5087379217147827, "eval_runtime": 134.753, "eval_samples_per_second": 3.948, "eval_steps_per_second": 0.987, "eval_wer": 0.19573182490197338, "step": 19296 }, { "epoch": 67.01, "learning_rate": 1.3441696113074204e-06, "loss": 0.255, "step": 19300 }, { "epoch": 67.05, "learning_rate": 1.342756183745583e-06, "loss": 0.2501, "step": 19310 }, { "epoch": 67.08, "learning_rate": 1.3413427561837457e-06, "loss": 0.2529, "step": 19320 }, { "epoch": 67.12, "learning_rate": 1.339929328621908e-06, "loss": 0.2559, "step": 19330 }, { "epoch": 67.15, "learning_rate": 1.3385159010600707e-06, "loss": 0.2783, "step": 19340 }, { "epoch": 67.19, "learning_rate": 1.3371024734982333e-06, "loss": 0.2495, "step": 19350 }, { "epoch": 67.22, "learning_rate": 1.3356890459363957e-06, "loss": 0.2414, "step": 19360 }, { "epoch": 67.26, "learning_rate": 1.3342756183745583e-06, "loss": 0.2584, "step": 19370 }, { "epoch": 67.29, "learning_rate": 1.332862190812721e-06, "loss": 0.2553, "step": 19380 }, { "epoch": 67.33, "learning_rate": 1.3314487632508834e-06, "loss": 0.2712, "step": 19390 }, { "epoch": 67.36, "learning_rate": 1.330035335689046e-06, "loss": 0.2593, "step": 19400 }, { "epoch": 67.39, "learning_rate": 1.3286219081272084e-06, "loss": 0.2656, "step": 19410 }, { "epoch": 67.43, "learning_rate": 1.327208480565371e-06, "loss": 0.237, "step": 19420 }, { "epoch": 67.46, "learning_rate": 1.3257950530035336e-06, "loss": 0.262, "step": 19430 }, { "epoch": 67.5, "learning_rate": 1.324381625441696e-06, "loss": 0.2545, "step": 19440 }, { "epoch": 67.53, "learning_rate": 1.3229681978798587e-06, "loss": 0.2582, "step": 19450 }, { "epoch": 67.57, "learning_rate": 1.3215547703180213e-06, "loss": 0.2508, "step": 19460 }, { "epoch": 67.6, "learning_rate": 1.3201413427561837e-06, "loss": 0.2401, "step": 19470 }, { "epoch": 67.64, "learning_rate": 1.3187279151943463e-06, "loss": 0.2543, "step": 19480 }, { "epoch": 67.67, "learning_rate": 1.317314487632509e-06, "loss": 0.2467, "step": 19490 }, { "epoch": 67.71, "learning_rate": 1.3159010600706714e-06, "loss": 0.2675, "step": 19500 }, { "epoch": 67.74, "learning_rate": 1.314487632508834e-06, "loss": 0.2792, "step": 19510 }, { "epoch": 67.78, "learning_rate": 1.3130742049469966e-06, "loss": 0.2734, "step": 19520 }, { "epoch": 67.81, "learning_rate": 1.311660777385159e-06, "loss": 0.2645, "step": 19530 }, { "epoch": 67.85, "learning_rate": 1.3102473498233216e-06, "loss": 0.284, "step": 19540 }, { "epoch": 67.88, "learning_rate": 1.3088339222614842e-06, "loss": 0.2687, "step": 19550 }, { "epoch": 67.91, "learning_rate": 1.3074204946996464e-06, "loss": 0.2661, "step": 19560 }, { "epoch": 67.95, "learning_rate": 1.306007067137809e-06, "loss": 0.2568, "step": 19570 }, { "epoch": 67.98, "learning_rate": 1.3045936395759715e-06, "loss": 0.2511, "step": 19580 }, { "epoch": 68.0, "eval_loss": 0.516753077507019, "eval_runtime": 134.5773, "eval_samples_per_second": 3.953, "eval_steps_per_second": 0.988, "eval_wer": 0.1981744552291573, "step": 19584 }, { "epoch": 68.02, "learning_rate": 1.303180212014134e-06, "loss": 0.2656, "step": 19590 }, { "epoch": 68.06, "learning_rate": 1.3017667844522967e-06, "loss": 0.2578, "step": 19600 }, { "epoch": 68.09, "learning_rate": 1.3003533568904591e-06, "loss": 0.2424, "step": 19610 }, { "epoch": 68.12, "learning_rate": 1.2989399293286217e-06, "loss": 0.264, "step": 19620 }, { "epoch": 68.16, "learning_rate": 1.2975265017667844e-06, "loss": 0.2589, "step": 19630 }, { "epoch": 68.19, "learning_rate": 1.2961130742049468e-06, "loss": 0.2536, "step": 19640 }, { "epoch": 68.23, "learning_rate": 1.2946996466431094e-06, "loss": 0.2713, "step": 19650 }, { "epoch": 68.26, "learning_rate": 1.293286219081272e-06, "loss": 0.2517, "step": 19660 }, { "epoch": 68.3, "learning_rate": 1.2918727915194344e-06, "loss": 0.271, "step": 19670 }, { "epoch": 68.33, "learning_rate": 1.290459363957597e-06, "loss": 0.2754, "step": 19680 }, { "epoch": 68.37, "learning_rate": 1.2890459363957597e-06, "loss": 0.2486, "step": 19690 }, { "epoch": 68.4, "learning_rate": 1.287632508833922e-06, "loss": 0.2627, "step": 19700 }, { "epoch": 68.44, "learning_rate": 1.2862190812720847e-06, "loss": 0.2434, "step": 19710 }, { "epoch": 68.47, "learning_rate": 1.2848056537102471e-06, "loss": 0.2685, "step": 19720 }, { "epoch": 68.51, "learning_rate": 1.2833922261484097e-06, "loss": 0.2677, "step": 19730 }, { "epoch": 68.54, "learning_rate": 1.2819787985865724e-06, "loss": 0.2783, "step": 19740 }, { "epoch": 68.57, "learning_rate": 1.2805653710247348e-06, "loss": 0.2518, "step": 19750 }, { "epoch": 68.61, "learning_rate": 1.2791519434628974e-06, "loss": 0.2521, "step": 19760 }, { "epoch": 68.64, "learning_rate": 1.27773851590106e-06, "loss": 0.2613, "step": 19770 }, { "epoch": 68.68, "learning_rate": 1.2763250883392224e-06, "loss": 0.2718, "step": 19780 }, { "epoch": 68.71, "learning_rate": 1.274911660777385e-06, "loss": 0.2337, "step": 19790 }, { "epoch": 68.75, "learning_rate": 1.2734982332155477e-06, "loss": 0.2617, "step": 19800 }, { "epoch": 68.78, "learning_rate": 1.27208480565371e-06, "loss": 0.2588, "step": 19810 }, { "epoch": 68.82, "learning_rate": 1.2706713780918727e-06, "loss": 0.254, "step": 19820 }, { "epoch": 68.85, "learning_rate": 1.2692579505300353e-06, "loss": 0.2595, "step": 19830 }, { "epoch": 68.89, "learning_rate": 1.2678445229681977e-06, "loss": 0.2418, "step": 19840 }, { "epoch": 68.92, "learning_rate": 1.2664310954063603e-06, "loss": 0.2567, "step": 19850 }, { "epoch": 68.96, "learning_rate": 1.265017667844523e-06, "loss": 0.2671, "step": 19860 }, { "epoch": 68.99, "learning_rate": 1.2636042402826854e-06, "loss": 0.2623, "step": 19870 }, { "epoch": 69.0, "eval_loss": 0.5109707117080688, "eval_runtime": 133.3708, "eval_samples_per_second": 3.989, "eval_steps_per_second": 0.997, "eval_wer": 0.1958603843928778, "step": 19872 }, { "epoch": 69.03, "learning_rate": 1.262190812720848e-06, "loss": 0.2721, "step": 19880 }, { "epoch": 69.06, "learning_rate": 1.2607773851590104e-06, "loss": 0.2508, "step": 19890 }, { "epoch": 69.1, "learning_rate": 1.259363957597173e-06, "loss": 0.2522, "step": 19900 }, { "epoch": 69.13, "learning_rate": 1.2579505300353356e-06, "loss": 0.2842, "step": 19910 }, { "epoch": 69.17, "learning_rate": 1.256537102473498e-06, "loss": 0.2641, "step": 19920 }, { "epoch": 69.2, "learning_rate": 1.2551236749116607e-06, "loss": 0.2427, "step": 19930 }, { "epoch": 69.24, "learning_rate": 1.2537102473498233e-06, "loss": 0.2805, "step": 19940 }, { "epoch": 69.27, "learning_rate": 1.2522968197879857e-06, "loss": 0.254, "step": 19950 }, { "epoch": 69.3, "learning_rate": 1.2508833922261483e-06, "loss": 0.2651, "step": 19960 }, { "epoch": 69.34, "learning_rate": 1.249469964664311e-06, "loss": 0.2748, "step": 19970 }, { "epoch": 69.37, "learning_rate": 1.2480565371024734e-06, "loss": 0.2592, "step": 19980 }, { "epoch": 69.41, "learning_rate": 1.246643109540636e-06, "loss": 0.2652, "step": 19990 }, { "epoch": 69.44, "learning_rate": 1.2452296819787986e-06, "loss": 0.2382, "step": 20000 }, { "epoch": 69.48, "learning_rate": 1.243816254416961e-06, "loss": 0.2769, "step": 20010 }, { "epoch": 69.51, "learning_rate": 1.2424028268551236e-06, "loss": 0.2448, "step": 20020 }, { "epoch": 69.55, "learning_rate": 1.240989399293286e-06, "loss": 0.2392, "step": 20030 }, { "epoch": 69.58, "learning_rate": 1.2395759717314487e-06, "loss": 0.2546, "step": 20040 }, { "epoch": 69.62, "learning_rate": 1.2381625441696113e-06, "loss": 0.2472, "step": 20050 }, { "epoch": 69.65, "learning_rate": 1.2367491166077737e-06, "loss": 0.2772, "step": 20060 }, { "epoch": 69.69, "learning_rate": 1.2353356890459363e-06, "loss": 0.2799, "step": 20070 }, { "epoch": 69.72, "learning_rate": 1.233922261484099e-06, "loss": 0.2458, "step": 20080 }, { "epoch": 69.75, "learning_rate": 1.2325088339222613e-06, "loss": 0.2776, "step": 20090 }, { "epoch": 69.79, "learning_rate": 1.231095406360424e-06, "loss": 0.2571, "step": 20100 }, { "epoch": 69.82, "learning_rate": 1.2296819787985866e-06, "loss": 0.2464, "step": 20110 }, { "epoch": 69.86, "learning_rate": 1.228268551236749e-06, "loss": 0.2765, "step": 20120 }, { "epoch": 69.89, "learning_rate": 1.2268551236749116e-06, "loss": 0.2443, "step": 20130 }, { "epoch": 69.93, "learning_rate": 1.2254416961130742e-06, "loss": 0.2432, "step": 20140 }, { "epoch": 69.96, "learning_rate": 1.2240282685512367e-06, "loss": 0.2482, "step": 20150 }, { "epoch": 70.0, "learning_rate": 1.2226148409893993e-06, "loss": 0.2762, "step": 20160 }, { "epoch": 70.0, "eval_loss": 0.5123195648193359, "eval_runtime": 133.6748, "eval_samples_per_second": 3.98, "eval_steps_per_second": 0.995, "eval_wer": 0.19592466413833, "step": 20160 }, { "epoch": 70.03, "learning_rate": 1.221201413427562e-06, "loss": 0.2698, "step": 20170 }, { "epoch": 70.07, "learning_rate": 1.2197879858657243e-06, "loss": 0.231, "step": 20180 }, { "epoch": 70.1, "learning_rate": 1.218374558303887e-06, "loss": 0.2392, "step": 20190 }, { "epoch": 70.14, "learning_rate": 1.2169611307420493e-06, "loss": 0.2549, "step": 20200 }, { "epoch": 70.17, "learning_rate": 1.215547703180212e-06, "loss": 0.2701, "step": 20210 }, { "epoch": 70.21, "learning_rate": 1.2141342756183746e-06, "loss": 0.2526, "step": 20220 }, { "epoch": 70.24, "learning_rate": 1.212720848056537e-06, "loss": 0.2654, "step": 20230 }, { "epoch": 70.28, "learning_rate": 1.2113074204946996e-06, "loss": 0.2659, "step": 20240 }, { "epoch": 70.31, "learning_rate": 1.2098939929328622e-06, "loss": 0.2583, "step": 20250 }, { "epoch": 70.35, "learning_rate": 1.2084805653710246e-06, "loss": 0.2559, "step": 20260 }, { "epoch": 70.38, "learning_rate": 1.2070671378091873e-06, "loss": 0.2498, "step": 20270 }, { "epoch": 70.42, "learning_rate": 1.2056537102473499e-06, "loss": 0.2515, "step": 20280 }, { "epoch": 70.45, "learning_rate": 1.2042402826855123e-06, "loss": 0.2389, "step": 20290 }, { "epoch": 70.48, "learning_rate": 1.202826855123675e-06, "loss": 0.2793, "step": 20300 }, { "epoch": 70.52, "learning_rate": 1.2014134275618375e-06, "loss": 0.2548, "step": 20310 }, { "epoch": 70.55, "learning_rate": 1.2e-06, "loss": 0.243, "step": 20320 }, { "epoch": 70.59, "learning_rate": 1.1985865724381626e-06, "loss": 0.2314, "step": 20330 }, { "epoch": 70.62, "learning_rate": 1.197173144876325e-06, "loss": 0.2416, "step": 20340 }, { "epoch": 70.66, "learning_rate": 1.1957597173144876e-06, "loss": 0.2705, "step": 20350 }, { "epoch": 70.69, "learning_rate": 1.1943462897526502e-06, "loss": 0.2564, "step": 20360 }, { "epoch": 70.73, "learning_rate": 1.1929328621908126e-06, "loss": 0.2683, "step": 20370 }, { "epoch": 70.76, "learning_rate": 1.1915194346289753e-06, "loss": 0.2626, "step": 20380 }, { "epoch": 70.8, "learning_rate": 1.1901060070671379e-06, "loss": 0.2484, "step": 20390 }, { "epoch": 70.83, "learning_rate": 1.1886925795053003e-06, "loss": 0.2649, "step": 20400 }, { "epoch": 70.87, "learning_rate": 1.187279151943463e-06, "loss": 0.255, "step": 20410 }, { "epoch": 70.9, "learning_rate": 1.1858657243816255e-06, "loss": 0.253, "step": 20420 }, { "epoch": 70.94, "learning_rate": 1.184452296819788e-06, "loss": 0.2373, "step": 20430 }, { "epoch": 70.97, "learning_rate": 1.1830388692579506e-06, "loss": 0.2704, "step": 20440 }, { "epoch": 71.0, "eval_loss": 0.5117577314376831, "eval_runtime": 133.058, "eval_samples_per_second": 3.998, "eval_steps_per_second": 1.0, "eval_wer": 0.1965674615928521, "step": 20448 }, { "epoch": 71.01, "learning_rate": 1.1816254416961132e-06, "loss": 0.2783, "step": 20450 }, { "epoch": 71.04, "learning_rate": 1.1802120141342756e-06, "loss": 0.2665, "step": 20460 }, { "epoch": 71.08, "learning_rate": 1.1787985865724382e-06, "loss": 0.2626, "step": 20470 }, { "epoch": 71.11, "learning_rate": 1.1773851590106008e-06, "loss": 0.2544, "step": 20480 }, { "epoch": 71.15, "learning_rate": 1.1759717314487632e-06, "loss": 0.2526, "step": 20490 }, { "epoch": 71.18, "learning_rate": 1.1745583038869259e-06, "loss": 0.2749, "step": 20500 }, { "epoch": 71.21, "learning_rate": 1.1731448763250883e-06, "loss": 0.2545, "step": 20510 }, { "epoch": 71.25, "learning_rate": 1.1717314487632509e-06, "loss": 0.2475, "step": 20520 }, { "epoch": 71.28, "learning_rate": 1.1703180212014135e-06, "loss": 0.2502, "step": 20530 }, { "epoch": 71.32, "learning_rate": 1.168904593639576e-06, "loss": 0.2452, "step": 20540 }, { "epoch": 71.35, "learning_rate": 1.1676325088339224e-06, "loss": 0.2562, "step": 20550 }, { "epoch": 71.39, "learning_rate": 1.1662190812720846e-06, "loss": 0.2364, "step": 20560 }, { "epoch": 71.42, "learning_rate": 1.1648056537102472e-06, "loss": 0.2529, "step": 20570 }, { "epoch": 71.46, "learning_rate": 1.1633922261484098e-06, "loss": 0.2561, "step": 20580 }, { "epoch": 71.49, "learning_rate": 1.1619787985865722e-06, "loss": 0.2726, "step": 20590 }, { "epoch": 71.53, "learning_rate": 1.1605653710247349e-06, "loss": 0.2774, "step": 20600 }, { "epoch": 71.56, "learning_rate": 1.1591519434628975e-06, "loss": 0.2541, "step": 20610 }, { "epoch": 71.6, "learning_rate": 1.1577385159010599e-06, "loss": 0.2512, "step": 20620 }, { "epoch": 71.63, "learning_rate": 1.1563250883392225e-06, "loss": 0.2532, "step": 20630 }, { "epoch": 71.66, "learning_rate": 1.154911660777385e-06, "loss": 0.2639, "step": 20640 }, { "epoch": 71.7, "learning_rate": 1.1534982332155475e-06, "loss": 0.2573, "step": 20650 }, { "epoch": 71.73, "learning_rate": 1.1520848056537102e-06, "loss": 0.2662, "step": 20660 }, { "epoch": 71.77, "learning_rate": 1.1506713780918726e-06, "loss": 0.2486, "step": 20670 }, { "epoch": 71.8, "learning_rate": 1.1492579505300352e-06, "loss": 0.2563, "step": 20680 }, { "epoch": 71.84, "learning_rate": 1.1478445229681978e-06, "loss": 0.2631, "step": 20690 }, { "epoch": 71.87, "learning_rate": 1.1464310954063602e-06, "loss": 0.2697, "step": 20700 }, { "epoch": 71.91, "learning_rate": 1.1450176678445228e-06, "loss": 0.2478, "step": 20710 }, { "epoch": 71.94, "learning_rate": 1.1436042402826855e-06, "loss": 0.2436, "step": 20720 }, { "epoch": 71.98, "learning_rate": 1.1421908127208479e-06, "loss": 0.2854, "step": 20730 }, { "epoch": 72.0, "eval_loss": 0.5127651691436768, "eval_runtime": 133.8804, "eval_samples_per_second": 3.974, "eval_steps_per_second": 0.993, "eval_wer": 0.1948961882110947, "step": 20736 }, { "epoch": 72.01, "learning_rate": 1.1407773851590105e-06, "loss": 0.2796, "step": 20740 }, { "epoch": 72.05, "learning_rate": 1.1393639575971731e-06, "loss": 0.2772, "step": 20750 }, { "epoch": 72.08, "learning_rate": 1.1379505300353355e-06, "loss": 0.2524, "step": 20760 }, { "epoch": 72.12, "learning_rate": 1.1365371024734981e-06, "loss": 0.2331, "step": 20770 }, { "epoch": 72.15, "learning_rate": 1.1351236749116608e-06, "loss": 0.2678, "step": 20780 }, { "epoch": 72.19, "learning_rate": 1.1337102473498232e-06, "loss": 0.2769, "step": 20790 }, { "epoch": 72.22, "learning_rate": 1.1322968197879858e-06, "loss": 0.2535, "step": 20800 }, { "epoch": 72.26, "learning_rate": 1.1308833922261482e-06, "loss": 0.2478, "step": 20810 }, { "epoch": 72.29, "learning_rate": 1.1294699646643108e-06, "loss": 0.2383, "step": 20820 }, { "epoch": 72.33, "learning_rate": 1.1280565371024735e-06, "loss": 0.2699, "step": 20830 }, { "epoch": 72.36, "learning_rate": 1.1266431095406359e-06, "loss": 0.2635, "step": 20840 }, { "epoch": 72.39, "learning_rate": 1.1252296819787985e-06, "loss": 0.2566, "step": 20850 }, { "epoch": 72.43, "learning_rate": 1.123816254416961e-06, "loss": 0.2414, "step": 20860 }, { "epoch": 72.46, "learning_rate": 1.1224028268551235e-06, "loss": 0.2522, "step": 20870 }, { "epoch": 72.5, "learning_rate": 1.1209893992932861e-06, "loss": 0.2483, "step": 20880 }, { "epoch": 72.53, "learning_rate": 1.1195759717314488e-06, "loss": 0.2597, "step": 20890 }, { "epoch": 72.57, "learning_rate": 1.1181625441696112e-06, "loss": 0.2576, "step": 20900 }, { "epoch": 72.6, "learning_rate": 1.1167491166077738e-06, "loss": 0.2525, "step": 20910 }, { "epoch": 72.64, "learning_rate": 1.1153356890459364e-06, "loss": 0.2679, "step": 20920 }, { "epoch": 72.67, "learning_rate": 1.1139222614840988e-06, "loss": 0.2634, "step": 20930 }, { "epoch": 72.71, "learning_rate": 1.1125088339222614e-06, "loss": 0.2325, "step": 20940 }, { "epoch": 72.74, "learning_rate": 1.1110954063604238e-06, "loss": 0.2625, "step": 20950 }, { "epoch": 72.78, "learning_rate": 1.1096819787985865e-06, "loss": 0.2442, "step": 20960 }, { "epoch": 72.81, "learning_rate": 1.108268551236749e-06, "loss": 0.2651, "step": 20970 }, { "epoch": 72.85, "learning_rate": 1.1068551236749115e-06, "loss": 0.2531, "step": 20980 }, { "epoch": 72.88, "learning_rate": 1.1054416961130741e-06, "loss": 0.2444, "step": 20990 }, { "epoch": 72.91, "learning_rate": 1.1040282685512367e-06, "loss": 0.2735, "step": 21000 }, { "epoch": 72.95, "learning_rate": 1.1026148409893992e-06, "loss": 0.2528, "step": 21010 }, { "epoch": 72.98, "learning_rate": 1.1012014134275618e-06, "loss": 0.2602, "step": 21020 }, { "epoch": 73.0, "eval_loss": 0.5094349384307861, "eval_runtime": 134.0533, "eval_samples_per_second": 3.969, "eval_steps_per_second": 0.992, "eval_wer": 0.1966317413383043, "step": 21024 }, { "epoch": 73.02, "learning_rate": 1.0997879858657244e-06, "loss": 0.2639, "step": 21030 }, { "epoch": 73.06, "learning_rate": 1.0983745583038868e-06, "loss": 0.2614, "step": 21040 }, { "epoch": 73.09, "learning_rate": 1.0969611307420494e-06, "loss": 0.2265, "step": 21050 }, { "epoch": 73.12, "learning_rate": 1.095547703180212e-06, "loss": 0.2721, "step": 21060 }, { "epoch": 73.16, "learning_rate": 1.0941342756183745e-06, "loss": 0.2645, "step": 21070 }, { "epoch": 73.19, "learning_rate": 1.092720848056537e-06, "loss": 0.2381, "step": 21080 }, { "epoch": 73.23, "learning_rate": 1.0913074204946997e-06, "loss": 0.2458, "step": 21090 }, { "epoch": 73.26, "learning_rate": 1.0898939929328621e-06, "loss": 0.2378, "step": 21100 }, { "epoch": 73.3, "learning_rate": 1.0884805653710247e-06, "loss": 0.2567, "step": 21110 }, { "epoch": 73.33, "learning_rate": 1.0870671378091871e-06, "loss": 0.264, "step": 21120 }, { "epoch": 73.37, "learning_rate": 1.0856537102473498e-06, "loss": 0.2563, "step": 21130 }, { "epoch": 73.4, "learning_rate": 1.0842402826855124e-06, "loss": 0.2683, "step": 21140 }, { "epoch": 73.44, "learning_rate": 1.0828268551236748e-06, "loss": 0.2692, "step": 21150 }, { "epoch": 73.47, "learning_rate": 1.0814134275618374e-06, "loss": 0.2751, "step": 21160 }, { "epoch": 73.51, "learning_rate": 1.08e-06, "loss": 0.2638, "step": 21170 }, { "epoch": 73.54, "learning_rate": 1.0785865724381624e-06, "loss": 0.2333, "step": 21180 }, { "epoch": 73.57, "learning_rate": 1.077173144876325e-06, "loss": 0.2784, "step": 21190 }, { "epoch": 73.61, "learning_rate": 1.0757597173144877e-06, "loss": 0.2539, "step": 21200 }, { "epoch": 73.64, "learning_rate": 1.07434628975265e-06, "loss": 0.2442, "step": 21210 }, { "epoch": 73.68, "learning_rate": 1.0729328621908127e-06, "loss": 0.2633, "step": 21220 }, { "epoch": 73.71, "learning_rate": 1.0715194346289753e-06, "loss": 0.2318, "step": 21230 }, { "epoch": 73.75, "learning_rate": 1.0701060070671377e-06, "loss": 0.259, "step": 21240 }, { "epoch": 73.78, "learning_rate": 1.0686925795053004e-06, "loss": 0.2351, "step": 21250 }, { "epoch": 73.82, "learning_rate": 1.0672791519434628e-06, "loss": 0.2904, "step": 21260 }, { "epoch": 73.85, "learning_rate": 1.0658657243816254e-06, "loss": 0.2636, "step": 21270 }, { "epoch": 73.89, "learning_rate": 1.064452296819788e-06, "loss": 0.2746, "step": 21280 }, { "epoch": 73.92, "learning_rate": 1.0630388692579504e-06, "loss": 0.2249, "step": 21290 }, { "epoch": 73.96, "learning_rate": 1.061625441696113e-06, "loss": 0.257, "step": 21300 }, { "epoch": 73.99, "learning_rate": 1.0602120141342757e-06, "loss": 0.2675, "step": 21310 }, { "epoch": 74.0, "eval_loss": 0.5058467388153076, "eval_runtime": 133.957, "eval_samples_per_second": 3.971, "eval_steps_per_second": 0.993, "eval_wer": 0.19605322362923444, "step": 21312 }, { "epoch": 74.03, "learning_rate": 1.058798586572438e-06, "loss": 0.2531, "step": 21320 }, { "epoch": 74.06, "learning_rate": 1.0573851590106007e-06, "loss": 0.241, "step": 21330 }, { "epoch": 74.1, "learning_rate": 1.0559717314487633e-06, "loss": 0.2388, "step": 21340 }, { "epoch": 74.13, "learning_rate": 1.0545583038869257e-06, "loss": 0.2513, "step": 21350 }, { "epoch": 74.17, "learning_rate": 1.0531448763250884e-06, "loss": 0.2672, "step": 21360 }, { "epoch": 74.2, "learning_rate": 1.051731448763251e-06, "loss": 0.2415, "step": 21370 }, { "epoch": 74.24, "learning_rate": 1.0503180212014134e-06, "loss": 0.2492, "step": 21380 }, { "epoch": 74.27, "learning_rate": 1.048904593639576e-06, "loss": 0.2421, "step": 21390 }, { "epoch": 74.3, "learning_rate": 1.0474911660777386e-06, "loss": 0.2926, "step": 21400 }, { "epoch": 74.34, "learning_rate": 1.046077738515901e-06, "loss": 0.2639, "step": 21410 }, { "epoch": 74.37, "learning_rate": 1.0446643109540637e-06, "loss": 0.2357, "step": 21420 }, { "epoch": 74.41, "learning_rate": 1.043250883392226e-06, "loss": 0.2707, "step": 21430 }, { "epoch": 74.44, "learning_rate": 1.0418374558303887e-06, "loss": 0.2426, "step": 21440 }, { "epoch": 74.48, "learning_rate": 1.0404240282685513e-06, "loss": 0.2743, "step": 21450 }, { "epoch": 74.51, "learning_rate": 1.0390106007067137e-06, "loss": 0.2739, "step": 21460 }, { "epoch": 74.55, "learning_rate": 1.0375971731448763e-06, "loss": 0.2391, "step": 21470 }, { "epoch": 74.58, "learning_rate": 1.036183745583039e-06, "loss": 0.2781, "step": 21480 }, { "epoch": 74.62, "learning_rate": 1.0347703180212014e-06, "loss": 0.2666, "step": 21490 }, { "epoch": 74.65, "learning_rate": 1.033356890459364e-06, "loss": 0.2484, "step": 21500 }, { "epoch": 74.69, "learning_rate": 1.0319434628975266e-06, "loss": 0.2529, "step": 21510 }, { "epoch": 74.72, "learning_rate": 1.030530035335689e-06, "loss": 0.2447, "step": 21520 }, { "epoch": 74.75, "learning_rate": 1.0291166077738516e-06, "loss": 0.2399, "step": 21530 }, { "epoch": 74.79, "learning_rate": 1.0277031802120143e-06, "loss": 0.2519, "step": 21540 }, { "epoch": 74.82, "learning_rate": 1.0262897526501767e-06, "loss": 0.2689, "step": 21550 }, { "epoch": 74.86, "learning_rate": 1.0248763250883393e-06, "loss": 0.2558, "step": 21560 }, { "epoch": 74.89, "learning_rate": 1.0234628975265017e-06, "loss": 0.2466, "step": 21570 }, { "epoch": 74.93, "learning_rate": 1.0220494699646643e-06, "loss": 0.2463, "step": 21580 }, { "epoch": 74.96, "learning_rate": 1.020636042402827e-06, "loss": 0.2776, "step": 21590 }, { "epoch": 75.0, "learning_rate": 1.0192226148409894e-06, "loss": 0.2519, "step": 21600 }, { "epoch": 75.0, "eval_loss": 0.5216230750083923, "eval_runtime": 133.9162, "eval_samples_per_second": 3.973, "eval_steps_per_second": 0.993, "eval_wer": 0.19875297293822716, "step": 21600 }, { "epoch": 75.03, "learning_rate": 1.017809187279152e-06, "loss": 0.2963, "step": 21610 }, { "epoch": 75.07, "learning_rate": 1.0163957597173146e-06, "loss": 0.2578, "step": 21620 }, { "epoch": 75.1, "learning_rate": 1.0149823321554768e-06, "loss": 0.2693, "step": 21630 }, { "epoch": 75.14, "learning_rate": 1.0135689045936394e-06, "loss": 0.2924, "step": 21640 }, { "epoch": 75.17, "learning_rate": 1.012155477031802e-06, "loss": 0.2423, "step": 21650 }, { "epoch": 75.21, "learning_rate": 1.0107420494699645e-06, "loss": 0.2563, "step": 21660 }, { "epoch": 75.24, "learning_rate": 1.009328621908127e-06, "loss": 0.267, "step": 21670 }, { "epoch": 75.28, "learning_rate": 1.0079151943462897e-06, "loss": 0.2634, "step": 21680 }, { "epoch": 75.31, "learning_rate": 1.0065017667844521e-06, "loss": 0.2661, "step": 21690 }, { "epoch": 75.35, "learning_rate": 1.0050883392226147e-06, "loss": 0.2425, "step": 21700 }, { "epoch": 75.38, "learning_rate": 1.0036749116607774e-06, "loss": 0.2592, "step": 21710 }, { "epoch": 75.42, "learning_rate": 1.0022614840989398e-06, "loss": 0.236, "step": 21720 }, { "epoch": 75.45, "learning_rate": 1.0008480565371024e-06, "loss": 0.2506, "step": 21730 }, { "epoch": 75.48, "learning_rate": 9.99434628975265e-07, "loss": 0.2746, "step": 21740 }, { "epoch": 75.52, "learning_rate": 9.980212014134274e-07, "loss": 0.2696, "step": 21750 }, { "epoch": 75.55, "learning_rate": 9.9660777385159e-07, "loss": 0.249, "step": 21760 }, { "epoch": 75.59, "learning_rate": 9.951943462897527e-07, "loss": 0.2845, "step": 21770 }, { "epoch": 75.62, "learning_rate": 9.93780918727915e-07, "loss": 0.2298, "step": 21780 }, { "epoch": 75.66, "learning_rate": 9.923674911660777e-07, "loss": 0.2675, "step": 21790 }, { "epoch": 75.69, "learning_rate": 9.909540636042403e-07, "loss": 0.2734, "step": 21800 }, { "epoch": 75.73, "learning_rate": 9.895406360424027e-07, "loss": 0.244, "step": 21810 }, { "epoch": 75.76, "learning_rate": 9.881272084805653e-07, "loss": 0.2333, "step": 21820 }, { "epoch": 75.8, "learning_rate": 9.86713780918728e-07, "loss": 0.226, "step": 21830 }, { "epoch": 75.83, "learning_rate": 9.853003533568904e-07, "loss": 0.2542, "step": 21840 }, { "epoch": 75.87, "learning_rate": 9.83886925795053e-07, "loss": 0.283, "step": 21850 }, { "epoch": 75.9, "learning_rate": 9.824734982332154e-07, "loss": 0.2332, "step": 21860 }, { "epoch": 75.94, "learning_rate": 9.81060070671378e-07, "loss": 0.2518, "step": 21870 }, { "epoch": 75.97, "learning_rate": 9.796466431095406e-07, "loss": 0.2666, "step": 21880 }, { "epoch": 76.0, "eval_loss": 0.5116772651672363, "eval_runtime": 134.0532, "eval_samples_per_second": 3.969, "eval_steps_per_second": 0.992, "eval_wer": 0.1958603843928778, "step": 21888 }, { "epoch": 76.01, "learning_rate": 9.78233215547703e-07, "loss": 0.2766, "step": 21890 }, { "epoch": 76.04, "learning_rate": 9.768197879858657e-07, "loss": 0.2281, "step": 21900 }, { "epoch": 76.08, "learning_rate": 9.754063604240283e-07, "loss": 0.2703, "step": 21910 }, { "epoch": 76.11, "learning_rate": 9.739929328621907e-07, "loss": 0.258, "step": 21920 }, { "epoch": 76.15, "learning_rate": 9.725795053003533e-07, "loss": 0.2614, "step": 21930 }, { "epoch": 76.18, "learning_rate": 9.71166077738516e-07, "loss": 0.2773, "step": 21940 }, { "epoch": 76.21, "learning_rate": 9.697526501766784e-07, "loss": 0.2701, "step": 21950 }, { "epoch": 76.25, "learning_rate": 9.68339222614841e-07, "loss": 0.2416, "step": 21960 }, { "epoch": 76.28, "learning_rate": 9.669257950530036e-07, "loss": 0.2547, "step": 21970 }, { "epoch": 76.32, "learning_rate": 9.65512367491166e-07, "loss": 0.2483, "step": 21980 }, { "epoch": 76.35, "learning_rate": 9.640989399293286e-07, "loss": 0.2473, "step": 21990 }, { "epoch": 76.39, "learning_rate": 9.62685512367491e-07, "loss": 0.2471, "step": 22000 }, { "epoch": 76.42, "learning_rate": 9.612720848056537e-07, "loss": 0.2323, "step": 22010 }, { "epoch": 76.46, "learning_rate": 9.598586572438163e-07, "loss": 0.276, "step": 22020 }, { "epoch": 76.49, "learning_rate": 9.584452296819787e-07, "loss": 0.2644, "step": 22030 }, { "epoch": 76.53, "learning_rate": 9.570318021201413e-07, "loss": 0.2605, "step": 22040 }, { "epoch": 76.56, "learning_rate": 9.55618374558304e-07, "loss": 0.2717, "step": 22050 }, { "epoch": 76.6, "learning_rate": 9.542049469964663e-07, "loss": 0.2534, "step": 22060 }, { "epoch": 76.63, "learning_rate": 9.52791519434629e-07, "loss": 0.2359, "step": 22070 }, { "epoch": 76.66, "learning_rate": 9.513780918727915e-07, "loss": 0.2806, "step": 22080 }, { "epoch": 76.7, "learning_rate": 9.49964664310954e-07, "loss": 0.2575, "step": 22090 }, { "epoch": 76.73, "learning_rate": 9.485512367491165e-07, "loss": 0.2439, "step": 22100 }, { "epoch": 76.77, "learning_rate": 9.471378091872791e-07, "loss": 0.2618, "step": 22110 }, { "epoch": 76.8, "learning_rate": 9.457243816254416e-07, "loss": 0.2445, "step": 22120 }, { "epoch": 76.84, "learning_rate": 9.443109540636042e-07, "loss": 0.2525, "step": 22130 }, { "epoch": 76.87, "learning_rate": 9.428975265017668e-07, "loss": 0.2441, "step": 22140 }, { "epoch": 76.91, "learning_rate": 9.414840989399293e-07, "loss": 0.259, "step": 22150 }, { "epoch": 76.94, "learning_rate": 9.400706713780918e-07, "loss": 0.2506, "step": 22160 }, { "epoch": 76.98, "learning_rate": 9.386572438162543e-07, "loss": 0.2637, "step": 22170 }, { "epoch": 77.0, "eval_loss": 0.5057582259178162, "eval_runtime": 134.4046, "eval_samples_per_second": 3.958, "eval_steps_per_second": 0.99, "eval_wer": 0.19566754515652118, "step": 22176 }, { "epoch": 77.01, "learning_rate": 9.37243816254417e-07, "loss": 0.2561, "step": 22180 }, { "epoch": 77.05, "learning_rate": 9.358303886925795e-07, "loss": 0.2573, "step": 22190 }, { "epoch": 77.08, "learning_rate": 9.34416961130742e-07, "loss": 0.2447, "step": 22200 }, { "epoch": 77.12, "learning_rate": 9.330035335689046e-07, "loss": 0.2532, "step": 22210 }, { "epoch": 77.15, "learning_rate": 9.315901060070671e-07, "loss": 0.2602, "step": 22220 }, { "epoch": 77.19, "learning_rate": 9.301766784452296e-07, "loss": 0.2541, "step": 22230 }, { "epoch": 77.22, "learning_rate": 9.287632508833922e-07, "loss": 0.2406, "step": 22240 }, { "epoch": 77.26, "learning_rate": 9.273498233215548e-07, "loss": 0.2469, "step": 22250 }, { "epoch": 77.29, "learning_rate": 9.259363957597173e-07, "loss": 0.2633, "step": 22260 }, { "epoch": 77.33, "learning_rate": 9.245229681978798e-07, "loss": 0.2607, "step": 22270 }, { "epoch": 77.36, "learning_rate": 9.231095406360424e-07, "loss": 0.2627, "step": 22280 }, { "epoch": 77.39, "learning_rate": 9.216961130742049e-07, "loss": 0.2787, "step": 22290 }, { "epoch": 77.43, "learning_rate": 9.202826855123675e-07, "loss": 0.2381, "step": 22300 }, { "epoch": 77.46, "learning_rate": 9.1886925795053e-07, "loss": 0.2736, "step": 22310 }, { "epoch": 77.5, "learning_rate": 9.174558303886926e-07, "loss": 0.2599, "step": 22320 }, { "epoch": 77.53, "learning_rate": 9.160424028268551e-07, "loss": 0.2563, "step": 22330 }, { "epoch": 77.57, "learning_rate": 9.146289752650176e-07, "loss": 0.2467, "step": 22340 }, { "epoch": 77.6, "learning_rate": 9.132155477031802e-07, "loss": 0.2582, "step": 22350 }, { "epoch": 77.64, "learning_rate": 9.118021201413428e-07, "loss": 0.2677, "step": 22360 }, { "epoch": 77.67, "learning_rate": 9.103886925795053e-07, "loss": 0.2752, "step": 22370 }, { "epoch": 77.71, "learning_rate": 9.089752650176679e-07, "loss": 0.2373, "step": 22380 }, { "epoch": 77.74, "learning_rate": 9.075618374558304e-07, "loss": 0.2476, "step": 22390 }, { "epoch": 77.78, "learning_rate": 9.061484098939929e-07, "loss": 0.2542, "step": 22400 }, { "epoch": 77.81, "learning_rate": 9.047349823321554e-07, "loss": 0.2466, "step": 22410 }, { "epoch": 77.85, "learning_rate": 9.033215547703181e-07, "loss": 0.2581, "step": 22420 }, { "epoch": 77.88, "learning_rate": 9.019081272084806e-07, "loss": 0.2594, "step": 22430 }, { "epoch": 77.91, "learning_rate": 9.00494699646643e-07, "loss": 0.2615, "step": 22440 }, { "epoch": 77.95, "learning_rate": 8.990812720848057e-07, "loss": 0.2566, "step": 22450 }, { "epoch": 77.98, "learning_rate": 8.976678445229681e-07, "loss": 0.273, "step": 22460 }, { "epoch": 78.0, "eval_loss": 0.5186824798583984, "eval_runtime": 133.6981, "eval_samples_per_second": 3.979, "eval_steps_per_second": 0.995, "eval_wer": 0.1966317413383043, "step": 22464 }, { "epoch": 78.02, "learning_rate": 8.962544169611306e-07, "loss": 0.2666, "step": 22470 }, { "epoch": 78.06, "learning_rate": 8.948409893992932e-07, "loss": 0.2591, "step": 22480 }, { "epoch": 78.09, "learning_rate": 8.934275618374558e-07, "loss": 0.2377, "step": 22490 }, { "epoch": 78.12, "learning_rate": 8.920141342756183e-07, "loss": 0.2836, "step": 22500 }, { "epoch": 78.16, "learning_rate": 8.906007067137808e-07, "loss": 0.2657, "step": 22510 }, { "epoch": 78.19, "learning_rate": 8.891872791519434e-07, "loss": 0.2613, "step": 22520 }, { "epoch": 78.23, "learning_rate": 8.877738515901059e-07, "loss": 0.2644, "step": 22530 }, { "epoch": 78.26, "learning_rate": 8.863604240282685e-07, "loss": 0.2435, "step": 22540 }, { "epoch": 78.3, "learning_rate": 8.84946996466431e-07, "loss": 0.2693, "step": 22550 }, { "epoch": 78.33, "learning_rate": 8.835335689045936e-07, "loss": 0.2531, "step": 22560 }, { "epoch": 78.37, "learning_rate": 8.821201413427561e-07, "loss": 0.2535, "step": 22570 }, { "epoch": 78.4, "learning_rate": 8.807067137809186e-07, "loss": 0.2645, "step": 22580 }, { "epoch": 78.44, "learning_rate": 8.792932862190812e-07, "loss": 0.2336, "step": 22590 }, { "epoch": 78.47, "learning_rate": 8.778798586572438e-07, "loss": 0.2474, "step": 22600 }, { "epoch": 78.51, "learning_rate": 8.764664310954063e-07, "loss": 0.2524, "step": 22610 }, { "epoch": 78.54, "learning_rate": 8.750530035335688e-07, "loss": 0.2246, "step": 22620 }, { "epoch": 78.57, "learning_rate": 8.736395759717314e-07, "loss": 0.2573, "step": 22630 }, { "epoch": 78.61, "learning_rate": 8.722261484098939e-07, "loss": 0.2482, "step": 22640 }, { "epoch": 78.64, "learning_rate": 8.708127208480564e-07, "loss": 0.272, "step": 22650 }, { "epoch": 78.68, "learning_rate": 8.693992932862191e-07, "loss": 0.266, "step": 22660 }, { "epoch": 78.71, "learning_rate": 8.679858657243816e-07, "loss": 0.262, "step": 22670 }, { "epoch": 78.75, "learning_rate": 8.665724381625441e-07, "loss": 0.2503, "step": 22680 }, { "epoch": 78.78, "learning_rate": 8.651590106007067e-07, "loss": 0.2554, "step": 22690 }, { "epoch": 78.82, "learning_rate": 8.637455830388692e-07, "loss": 0.263, "step": 22700 }, { "epoch": 78.85, "learning_rate": 8.623321554770318e-07, "loss": 0.269, "step": 22710 }, { "epoch": 78.89, "learning_rate": 8.609187279151943e-07, "loss": 0.262, "step": 22720 }, { "epoch": 78.92, "learning_rate": 8.595053003533569e-07, "loss": 0.2698, "step": 22730 }, { "epoch": 78.96, "learning_rate": 8.580918727915194e-07, "loss": 0.255, "step": 22740 }, { "epoch": 78.99, "learning_rate": 8.566784452296819e-07, "loss": 0.2666, "step": 22750 }, { "epoch": 79.0, "eval_loss": 0.5175613760948181, "eval_runtime": 134.3104, "eval_samples_per_second": 3.961, "eval_steps_per_second": 0.99, "eval_wer": 0.19579610464742558, "step": 22752 }, { "epoch": 79.03, "learning_rate": 8.552650176678445e-07, "loss": 0.2381, "step": 22760 }, { "epoch": 79.06, "learning_rate": 8.538515901060071e-07, "loss": 0.2487, "step": 22770 }, { "epoch": 79.1, "learning_rate": 8.524381625441696e-07, "loss": 0.2621, "step": 22780 }, { "epoch": 79.13, "learning_rate": 8.510247349823321e-07, "loss": 0.271, "step": 22790 }, { "epoch": 79.17, "learning_rate": 8.496113074204947e-07, "loss": 0.2689, "step": 22800 }, { "epoch": 79.2, "learning_rate": 8.481978798586572e-07, "loss": 0.2351, "step": 22810 }, { "epoch": 79.24, "learning_rate": 8.467844522968197e-07, "loss": 0.2733, "step": 22820 }, { "epoch": 79.27, "learning_rate": 8.453710247349824e-07, "loss": 0.2436, "step": 22830 }, { "epoch": 79.3, "learning_rate": 8.439575971731449e-07, "loss": 0.2628, "step": 22840 }, { "epoch": 79.34, "learning_rate": 8.425441696113074e-07, "loss": 0.251, "step": 22850 }, { "epoch": 79.37, "learning_rate": 8.411307420494699e-07, "loss": 0.258, "step": 22860 }, { "epoch": 79.41, "learning_rate": 8.397173144876325e-07, "loss": 0.242, "step": 22870 }, { "epoch": 79.44, "learning_rate": 8.38303886925795e-07, "loss": 0.2446, "step": 22880 }, { "epoch": 79.48, "learning_rate": 8.368904593639576e-07, "loss": 0.2683, "step": 22890 }, { "epoch": 79.51, "learning_rate": 8.354770318021202e-07, "loss": 0.2686, "step": 22900 }, { "epoch": 79.55, "learning_rate": 8.340636042402827e-07, "loss": 0.2717, "step": 22910 }, { "epoch": 79.58, "learning_rate": 8.326501766784452e-07, "loss": 0.2373, "step": 22920 }, { "epoch": 79.62, "learning_rate": 8.312367491166077e-07, "loss": 0.2399, "step": 22930 }, { "epoch": 79.65, "learning_rate": 8.298233215547703e-07, "loss": 0.2867, "step": 22940 }, { "epoch": 79.69, "learning_rate": 8.284098939929329e-07, "loss": 0.277, "step": 22950 }, { "epoch": 79.72, "learning_rate": 8.269964664310954e-07, "loss": 0.2399, "step": 22960 }, { "epoch": 79.75, "learning_rate": 8.25583038869258e-07, "loss": 0.2537, "step": 22970 }, { "epoch": 79.79, "learning_rate": 8.241696113074205e-07, "loss": 0.2491, "step": 22980 }, { "epoch": 79.82, "learning_rate": 8.227561837455829e-07, "loss": 0.2747, "step": 22990 }, { "epoch": 79.86, "learning_rate": 8.213427561837457e-07, "loss": 0.2612, "step": 23000 }, { "epoch": 79.89, "learning_rate": 8.199293286219081e-07, "loss": 0.2455, "step": 23010 }, { "epoch": 79.93, "learning_rate": 8.185159010600706e-07, "loss": 0.2593, "step": 23020 }, { "epoch": 79.96, "learning_rate": 8.171024734982331e-07, "loss": 0.258, "step": 23030 }, { "epoch": 80.0, "learning_rate": 8.156890459363957e-07, "loss": 0.2627, "step": 23040 }, { "epoch": 80.0, "eval_loss": 0.5141689777374268, "eval_runtime": 133.6944, "eval_samples_per_second": 3.979, "eval_steps_per_second": 0.995, "eval_wer": 0.1949604679565469, "step": 23040 }, { "epoch": 80.03, "learning_rate": 8.142756183745582e-07, "loss": 0.2598, "step": 23050 }, { "epoch": 80.07, "learning_rate": 8.128621908127207e-07, "loss": 0.2679, "step": 23060 }, { "epoch": 80.1, "learning_rate": 8.114487632508834e-07, "loss": 0.223, "step": 23070 }, { "epoch": 80.14, "learning_rate": 8.100353356890459e-07, "loss": 0.2692, "step": 23080 }, { "epoch": 80.17, "learning_rate": 8.086219081272084e-07, "loss": 0.2647, "step": 23090 }, { "epoch": 80.21, "learning_rate": 8.072084805653709e-07, "loss": 0.2544, "step": 23100 }, { "epoch": 80.24, "learning_rate": 8.057950530035335e-07, "loss": 0.2579, "step": 23110 }, { "epoch": 80.28, "learning_rate": 8.04381625441696e-07, "loss": 0.246, "step": 23120 }, { "epoch": 80.31, "learning_rate": 8.029681978798586e-07, "loss": 0.2714, "step": 23130 }, { "epoch": 80.35, "learning_rate": 8.015547703180212e-07, "loss": 0.2763, "step": 23140 }, { "epoch": 80.38, "learning_rate": 8.001413427561837e-07, "loss": 0.2489, "step": 23150 }, { "epoch": 80.42, "learning_rate": 7.987279151943462e-07, "loss": 0.2382, "step": 23160 }, { "epoch": 80.45, "learning_rate": 7.973144876325087e-07, "loss": 0.2712, "step": 23170 }, { "epoch": 80.48, "learning_rate": 7.959010600706714e-07, "loss": 0.2612, "step": 23180 }, { "epoch": 80.52, "learning_rate": 7.944876325088339e-07, "loss": 0.2573, "step": 23190 }, { "epoch": 80.55, "learning_rate": 7.930742049469964e-07, "loss": 0.2412, "step": 23200 }, { "epoch": 80.59, "learning_rate": 7.91660777385159e-07, "loss": 0.262, "step": 23210 }, { "epoch": 80.62, "learning_rate": 7.902473498233215e-07, "loss": 0.2555, "step": 23220 }, { "epoch": 80.66, "learning_rate": 7.88833922261484e-07, "loss": 0.2685, "step": 23230 }, { "epoch": 80.69, "learning_rate": 7.874204946996466e-07, "loss": 0.2427, "step": 23240 }, { "epoch": 80.73, "learning_rate": 7.860070671378092e-07, "loss": 0.2629, "step": 23250 }, { "epoch": 80.76, "learning_rate": 7.845936395759717e-07, "loss": 0.248, "step": 23260 }, { "epoch": 80.8, "learning_rate": 7.831802120141342e-07, "loss": 0.2413, "step": 23270 }, { "epoch": 80.83, "learning_rate": 7.817667844522968e-07, "loss": 0.2675, "step": 23280 }, { "epoch": 80.87, "learning_rate": 7.803533568904593e-07, "loss": 0.263, "step": 23290 }, { "epoch": 80.9, "learning_rate": 7.789399293286219e-07, "loss": 0.2674, "step": 23300 }, { "epoch": 80.94, "learning_rate": 7.775265017667845e-07, "loss": 0.2567, "step": 23310 }, { "epoch": 80.97, "learning_rate": 7.76113074204947e-07, "loss": 0.2508, "step": 23320 }, { "epoch": 81.0, "eval_loss": 0.5157809853553772, "eval_runtime": 134.6235, "eval_samples_per_second": 3.952, "eval_steps_per_second": 0.988, "eval_wer": 0.19605322362923444, "step": 23328 }, { "epoch": 81.01, "learning_rate": 7.746996466431095e-07, "loss": 0.289, "step": 23330 }, { "epoch": 81.04, "learning_rate": 7.73286219081272e-07, "loss": 0.2503, "step": 23340 }, { "epoch": 81.08, "learning_rate": 7.718727915194346e-07, "loss": 0.2387, "step": 23350 }, { "epoch": 81.11, "learning_rate": 7.704593639575972e-07, "loss": 0.2675, "step": 23360 }, { "epoch": 81.15, "learning_rate": 7.690459363957597e-07, "loss": 0.2534, "step": 23370 }, { "epoch": 81.18, "learning_rate": 7.676325088339223e-07, "loss": 0.2603, "step": 23380 }, { "epoch": 81.21, "learning_rate": 7.662190812720848e-07, "loss": 0.2545, "step": 23390 }, { "epoch": 81.25, "learning_rate": 7.648056537102473e-07, "loss": 0.2617, "step": 23400 }, { "epoch": 81.28, "learning_rate": 7.633922261484098e-07, "loss": 0.2495, "step": 23410 }, { "epoch": 81.32, "learning_rate": 7.619787985865725e-07, "loss": 0.2608, "step": 23420 }, { "epoch": 81.35, "learning_rate": 7.60565371024735e-07, "loss": 0.2561, "step": 23430 }, { "epoch": 81.39, "learning_rate": 7.591519434628975e-07, "loss": 0.2487, "step": 23440 }, { "epoch": 81.42, "learning_rate": 7.577385159010601e-07, "loss": 0.2522, "step": 23450 }, { "epoch": 81.46, "learning_rate": 7.563250883392226e-07, "loss": 0.2796, "step": 23460 }, { "epoch": 81.49, "learning_rate": 7.549116607773851e-07, "loss": 0.2516, "step": 23470 }, { "epoch": 81.53, "learning_rate": 7.534982332155477e-07, "loss": 0.2653, "step": 23480 }, { "epoch": 81.56, "learning_rate": 7.520848056537103e-07, "loss": 0.2627, "step": 23490 }, { "epoch": 81.6, "learning_rate": 7.506713780918728e-07, "loss": 0.2524, "step": 23500 }, { "epoch": 81.63, "learning_rate": 7.492579505300353e-07, "loss": 0.2545, "step": 23510 }, { "epoch": 81.66, "learning_rate": 7.478445229681979e-07, "loss": 0.2838, "step": 23520 }, { "epoch": 81.7, "learning_rate": 7.464310954063605e-07, "loss": 0.25, "step": 23530 }, { "epoch": 81.73, "learning_rate": 7.450176678445229e-07, "loss": 0.2702, "step": 23540 }, { "epoch": 81.77, "learning_rate": 7.436042402826854e-07, "loss": 0.2521, "step": 23550 }, { "epoch": 81.8, "learning_rate": 7.42190812720848e-07, "loss": 0.2537, "step": 23560 }, { "epoch": 81.84, "learning_rate": 7.407773851590105e-07, "loss": 0.2731, "step": 23570 }, { "epoch": 81.87, "learning_rate": 7.39363957597173e-07, "loss": 0.2441, "step": 23580 }, { "epoch": 81.91, "learning_rate": 7.379505300353357e-07, "loss": 0.2541, "step": 23590 }, { "epoch": 81.94, "learning_rate": 7.365371024734982e-07, "loss": 0.2546, "step": 23600 }, { "epoch": 81.98, "learning_rate": 7.351236749116607e-07, "loss": 0.2499, "step": 23610 }, { "epoch": 82.0, "eval_loss": 0.5130564570426941, "eval_runtime": 134.0023, "eval_samples_per_second": 3.97, "eval_steps_per_second": 0.993, "eval_wer": 0.19695314006556533, "step": 23616 }, { "epoch": 82.01, "learning_rate": 7.337102473498233e-07, "loss": 0.2829, "step": 23620 }, { "epoch": 82.05, "learning_rate": 7.322968197879858e-07, "loss": 0.2725, "step": 23630 }, { "epoch": 82.08, "learning_rate": 7.308833922261483e-07, "loss": 0.2439, "step": 23640 }, { "epoch": 82.12, "learning_rate": 7.294699646643108e-07, "loss": 0.2534, "step": 23650 }, { "epoch": 82.15, "learning_rate": 7.280565371024735e-07, "loss": 0.2644, "step": 23660 }, { "epoch": 82.19, "learning_rate": 7.26643109540636e-07, "loss": 0.2402, "step": 23670 }, { "epoch": 82.22, "learning_rate": 7.252296819787985e-07, "loss": 0.2337, "step": 23680 }, { "epoch": 82.26, "learning_rate": 7.238162544169611e-07, "loss": 0.2612, "step": 23690 }, { "epoch": 82.29, "learning_rate": 7.224028268551236e-07, "loss": 0.276, "step": 23700 }, { "epoch": 82.33, "learning_rate": 7.209893992932862e-07, "loss": 0.275, "step": 23710 }, { "epoch": 82.36, "learning_rate": 7.195759717314487e-07, "loss": 0.2353, "step": 23720 }, { "epoch": 82.39, "learning_rate": 7.181625441696113e-07, "loss": 0.2435, "step": 23730 }, { "epoch": 82.43, "learning_rate": 7.167491166077738e-07, "loss": 0.2574, "step": 23740 }, { "epoch": 82.46, "learning_rate": 7.153356890459363e-07, "loss": 0.2834, "step": 23750 }, { "epoch": 82.5, "learning_rate": 7.139222614840989e-07, "loss": 0.2714, "step": 23760 }, { "epoch": 82.53, "learning_rate": 7.125088339222615e-07, "loss": 0.2523, "step": 23770 }, { "epoch": 82.57, "learning_rate": 7.11095406360424e-07, "loss": 0.2729, "step": 23780 }, { "epoch": 82.6, "learning_rate": 7.096819787985865e-07, "loss": 0.2366, "step": 23790 }, { "epoch": 82.64, "learning_rate": 7.082685512367491e-07, "loss": 0.2644, "step": 23800 }, { "epoch": 82.67, "learning_rate": 7.068551236749116e-07, "loss": 0.2382, "step": 23810 }, { "epoch": 82.71, "learning_rate": 7.054416961130741e-07, "loss": 0.2489, "step": 23820 }, { "epoch": 82.74, "learning_rate": 7.040282685512368e-07, "loss": 0.2933, "step": 23830 }, { "epoch": 82.78, "learning_rate": 7.026148409893993e-07, "loss": 0.2437, "step": 23840 }, { "epoch": 82.81, "learning_rate": 7.012014134275618e-07, "loss": 0.2433, "step": 23850 }, { "epoch": 82.85, "learning_rate": 6.997879858657243e-07, "loss": 0.2602, "step": 23860 }, { "epoch": 82.88, "learning_rate": 6.983745583038869e-07, "loss": 0.2693, "step": 23870 }, { "epoch": 82.91, "learning_rate": 6.969611307420494e-07, "loss": 0.2426, "step": 23880 }, { "epoch": 82.95, "learning_rate": 6.95547703180212e-07, "loss": 0.242, "step": 23890 }, { "epoch": 82.98, "learning_rate": 6.941342756183746e-07, "loss": 0.2583, "step": 23900 }, { "epoch": 83.0, "eval_loss": 0.5149600505828857, "eval_runtime": 134.0167, "eval_samples_per_second": 3.97, "eval_steps_per_second": 0.992, "eval_wer": 0.19746737802918302, "step": 23904 }, { "epoch": 83.02, "learning_rate": 6.927208480565371e-07, "loss": 0.2692, "step": 23910 }, { "epoch": 83.06, "learning_rate": 6.913074204946996e-07, "loss": 0.2688, "step": 23920 }, { "epoch": 83.09, "learning_rate": 6.898939929328622e-07, "loss": 0.2601, "step": 23930 }, { "epoch": 83.12, "learning_rate": 6.884805653710247e-07, "loss": 0.2784, "step": 23940 }, { "epoch": 83.16, "learning_rate": 6.870671378091873e-07, "loss": 0.2408, "step": 23950 }, { "epoch": 83.19, "learning_rate": 6.856537102473498e-07, "loss": 0.2512, "step": 23960 }, { "epoch": 83.23, "learning_rate": 6.842402826855124e-07, "loss": 0.2371, "step": 23970 }, { "epoch": 83.26, "learning_rate": 6.828268551236749e-07, "loss": 0.2627, "step": 23980 }, { "epoch": 83.3, "learning_rate": 6.814134275618374e-07, "loss": 0.2642, "step": 23990 }, { "epoch": 83.33, "learning_rate": 6.800000000000001e-07, "loss": 0.2806, "step": 24000 }, { "epoch": 83.37, "learning_rate": 6.785865724381626e-07, "loss": 0.2409, "step": 24010 }, { "epoch": 83.4, "learning_rate": 6.771731448763251e-07, "loss": 0.256, "step": 24020 }, { "epoch": 83.44, "learning_rate": 6.757597173144876e-07, "loss": 0.2399, "step": 24030 }, { "epoch": 83.47, "learning_rate": 6.743462897526502e-07, "loss": 0.2721, "step": 24040 }, { "epoch": 83.51, "learning_rate": 6.729328621908127e-07, "loss": 0.2702, "step": 24050 }, { "epoch": 83.54, "learning_rate": 6.715194346289753e-07, "loss": 0.2252, "step": 24060 }, { "epoch": 83.57, "learning_rate": 6.701060070671379e-07, "loss": 0.2405, "step": 24070 }, { "epoch": 83.61, "learning_rate": 6.686925795053003e-07, "loss": 0.2409, "step": 24080 }, { "epoch": 83.64, "learning_rate": 6.672791519434628e-07, "loss": 0.257, "step": 24090 }, { "epoch": 83.68, "learning_rate": 6.658657243816253e-07, "loss": 0.2642, "step": 24100 }, { "epoch": 83.71, "learning_rate": 6.644522968197879e-07, "loss": 0.2699, "step": 24110 }, { "epoch": 83.75, "learning_rate": 6.630388692579505e-07, "loss": 0.2487, "step": 24120 }, { "epoch": 83.78, "learning_rate": 6.61625441696113e-07, "loss": 0.2505, "step": 24130 }, { "epoch": 83.82, "learning_rate": 6.602120141342756e-07, "loss": 0.2627, "step": 24140 }, { "epoch": 83.85, "learning_rate": 6.587985865724381e-07, "loss": 0.2579, "step": 24150 }, { "epoch": 83.89, "learning_rate": 6.573851590106006e-07, "loss": 0.2434, "step": 24160 }, { "epoch": 83.92, "learning_rate": 6.559717314487631e-07, "loss": 0.2344, "step": 24170 }, { "epoch": 83.96, "learning_rate": 6.545583038869258e-07, "loss": 0.2468, "step": 24180 }, { "epoch": 83.99, "learning_rate": 6.531448763250883e-07, "loss": 0.246, "step": 24190 }, { "epoch": 84.0, "eval_loss": 0.5096983909606934, "eval_runtime": 133.3449, "eval_samples_per_second": 3.99, "eval_steps_per_second": 0.997, "eval_wer": 0.19618178312013884, "step": 24192 }, { "epoch": 84.03, "learning_rate": 6.517314487632508e-07, "loss": 0.2808, "step": 24200 }, { "epoch": 84.06, "learning_rate": 6.503180212014134e-07, "loss": 0.2582, "step": 24210 }, { "epoch": 84.1, "learning_rate": 6.490459363957597e-07, "loss": 0.2613, "step": 24220 }, { "epoch": 84.13, "learning_rate": 6.476325088339223e-07, "loss": 0.2637, "step": 24230 }, { "epoch": 84.17, "learning_rate": 6.462190812720848e-07, "loss": 0.2765, "step": 24240 }, { "epoch": 84.2, "learning_rate": 6.448056537102473e-07, "loss": 0.2515, "step": 24250 }, { "epoch": 84.24, "learning_rate": 6.433922261484098e-07, "loss": 0.2331, "step": 24260 }, { "epoch": 84.27, "learning_rate": 6.419787985865724e-07, "loss": 0.2408, "step": 24270 }, { "epoch": 84.3, "learning_rate": 6.40565371024735e-07, "loss": 0.2706, "step": 24280 }, { "epoch": 84.34, "learning_rate": 6.391519434628975e-07, "loss": 0.2605, "step": 24290 }, { "epoch": 84.37, "learning_rate": 6.377385159010601e-07, "loss": 0.2403, "step": 24300 }, { "epoch": 84.41, "learning_rate": 6.363250883392226e-07, "loss": 0.2646, "step": 24310 }, { "epoch": 84.44, "learning_rate": 6.349116607773851e-07, "loss": 0.262, "step": 24320 }, { "epoch": 84.48, "learning_rate": 6.334982332155476e-07, "loss": 0.2664, "step": 24330 }, { "epoch": 84.51, "learning_rate": 6.320848056537103e-07, "loss": 0.2633, "step": 24340 }, { "epoch": 84.55, "learning_rate": 6.306713780918728e-07, "loss": 0.2278, "step": 24350 }, { "epoch": 84.58, "learning_rate": 6.292579505300353e-07, "loss": 0.2645, "step": 24360 }, { "epoch": 84.62, "learning_rate": 6.278445229681979e-07, "loss": 0.2249, "step": 24370 }, { "epoch": 84.65, "learning_rate": 6.264310954063604e-07, "loss": 0.2587, "step": 24380 }, { "epoch": 84.69, "learning_rate": 6.25017667844523e-07, "loss": 0.2471, "step": 24390 }, { "epoch": 84.72, "learning_rate": 6.236042402826855e-07, "loss": 0.258, "step": 24400 }, { "epoch": 84.75, "learning_rate": 6.221908127208481e-07, "loss": 0.2394, "step": 24410 }, { "epoch": 84.79, "learning_rate": 6.207773851590106e-07, "loss": 0.252, "step": 24420 }, { "epoch": 84.82, "learning_rate": 6.193639575971731e-07, "loss": 0.2727, "step": 24430 }, { "epoch": 84.86, "learning_rate": 6.179505300353357e-07, "loss": 0.2699, "step": 24440 }, { "epoch": 84.89, "learning_rate": 6.165371024734983e-07, "loss": 0.2309, "step": 24450 }, { "epoch": 84.93, "learning_rate": 6.151236749116608e-07, "loss": 0.2637, "step": 24460 }, { "epoch": 84.96, "learning_rate": 6.13851590106007e-07, "loss": 0.245, "step": 24470 }, { "epoch": 85.0, "learning_rate": 6.124381625441695e-07, "loss": 0.272, "step": 24480 }, { "epoch": 85.0, "eval_loss": 0.504280149936676, "eval_runtime": 134.0604, "eval_samples_per_second": 3.968, "eval_steps_per_second": 0.992, "eval_wer": 0.1949604679565469, "step": 24480 }, { "epoch": 85.03, "learning_rate": 6.110247349823321e-07, "loss": 0.2629, "step": 24490 }, { "epoch": 85.07, "learning_rate": 6.096113074204947e-07, "loss": 0.2312, "step": 24500 }, { "epoch": 85.1, "learning_rate": 6.081978798586572e-07, "loss": 0.265, "step": 24510 }, { "epoch": 85.14, "learning_rate": 6.067844522968197e-07, "loss": 0.258, "step": 24520 }, { "epoch": 85.17, "learning_rate": 6.053710247349822e-07, "loss": 0.244, "step": 24530 }, { "epoch": 85.21, "learning_rate": 6.039575971731448e-07, "loss": 0.2407, "step": 24540 }, { "epoch": 85.24, "learning_rate": 6.025441696113074e-07, "loss": 0.2632, "step": 24550 }, { "epoch": 85.28, "learning_rate": 6.011307420494699e-07, "loss": 0.2678, "step": 24560 }, { "epoch": 85.31, "learning_rate": 5.997173144876325e-07, "loss": 0.2483, "step": 24570 }, { "epoch": 85.35, "learning_rate": 5.98303886925795e-07, "loss": 0.2801, "step": 24580 }, { "epoch": 85.38, "learning_rate": 5.968904593639575e-07, "loss": 0.251, "step": 24590 }, { "epoch": 85.42, "learning_rate": 5.954770318021201e-07, "loss": 0.2588, "step": 24600 }, { "epoch": 85.45, "learning_rate": 5.940636042402827e-07, "loss": 0.2543, "step": 24610 }, { "epoch": 85.48, "learning_rate": 5.926501766784452e-07, "loss": 0.2755, "step": 24620 }, { "epoch": 85.52, "learning_rate": 5.912367491166077e-07, "loss": 0.2388, "step": 24630 }, { "epoch": 85.55, "learning_rate": 5.898233215547703e-07, "loss": 0.2517, "step": 24640 }, { "epoch": 85.59, "learning_rate": 5.884098939929328e-07, "loss": 0.2513, "step": 24650 }, { "epoch": 85.62, "learning_rate": 5.869964664310953e-07, "loss": 0.2467, "step": 24660 }, { "epoch": 85.66, "learning_rate": 5.85583038869258e-07, "loss": 0.2617, "step": 24670 }, { "epoch": 85.69, "learning_rate": 5.841696113074205e-07, "loss": 0.2484, "step": 24680 }, { "epoch": 85.73, "learning_rate": 5.82756183745583e-07, "loss": 0.2481, "step": 24690 }, { "epoch": 85.76, "learning_rate": 5.813427561837455e-07, "loss": 0.2393, "step": 24700 }, { "epoch": 85.8, "learning_rate": 5.799293286219081e-07, "loss": 0.2372, "step": 24710 }, { "epoch": 85.83, "learning_rate": 5.785159010600707e-07, "loss": 0.2828, "step": 24720 }, { "epoch": 85.87, "learning_rate": 5.771024734982332e-07, "loss": 0.2796, "step": 24730 }, { "epoch": 85.9, "learning_rate": 5.756890459363958e-07, "loss": 0.2604, "step": 24740 }, { "epoch": 85.94, "learning_rate": 5.742756183745583e-07, "loss": 0.2143, "step": 24750 }, { "epoch": 85.97, "learning_rate": 5.728621908127208e-07, "loss": 0.2601, "step": 24760 }, { "epoch": 86.0, "eval_loss": 0.5090940594673157, "eval_runtime": 134.139, "eval_samples_per_second": 3.966, "eval_steps_per_second": 0.992, "eval_wer": 0.19605322362923444, "step": 24768 }, { "epoch": 86.01, "learning_rate": 5.714487632508833e-07, "loss": 0.2614, "step": 24770 }, { "epoch": 86.04, "learning_rate": 5.70035335689046e-07, "loss": 0.2556, "step": 24780 }, { "epoch": 86.08, "learning_rate": 5.686219081272085e-07, "loss": 0.2451, "step": 24790 }, { "epoch": 86.11, "learning_rate": 5.67208480565371e-07, "loss": 0.2619, "step": 24800 }, { "epoch": 86.15, "learning_rate": 5.657950530035336e-07, "loss": 0.263, "step": 24810 }, { "epoch": 86.18, "learning_rate": 5.643816254416961e-07, "loss": 0.2718, "step": 24820 }, { "epoch": 86.21, "learning_rate": 5.629681978798586e-07, "loss": 0.2349, "step": 24830 }, { "epoch": 86.25, "learning_rate": 5.615547703180213e-07, "loss": 0.2553, "step": 24840 }, { "epoch": 86.28, "learning_rate": 5.601413427561838e-07, "loss": 0.2492, "step": 24850 }, { "epoch": 86.32, "learning_rate": 5.587279151943463e-07, "loss": 0.2549, "step": 24860 }, { "epoch": 86.35, "learning_rate": 5.573144876325088e-07, "loss": 0.2416, "step": 24870 }, { "epoch": 86.39, "learning_rate": 5.559010600706714e-07, "loss": 0.2552, "step": 24880 }, { "epoch": 86.42, "learning_rate": 5.544876325088339e-07, "loss": 0.2318, "step": 24890 }, { "epoch": 86.46, "learning_rate": 5.530742049469965e-07, "loss": 0.2538, "step": 24900 }, { "epoch": 86.49, "learning_rate": 5.516607773851591e-07, "loss": 0.2483, "step": 24910 }, { "epoch": 86.53, "learning_rate": 5.502473498233216e-07, "loss": 0.2677, "step": 24920 }, { "epoch": 86.56, "learning_rate": 5.488339222614841e-07, "loss": 0.2506, "step": 24930 }, { "epoch": 86.6, "learning_rate": 5.474204946996465e-07, "loss": 0.2563, "step": 24940 }, { "epoch": 86.63, "learning_rate": 5.460070671378092e-07, "loss": 0.2429, "step": 24950 }, { "epoch": 86.66, "learning_rate": 5.445936395759717e-07, "loss": 0.259, "step": 24960 }, { "epoch": 86.7, "learning_rate": 5.431802120141342e-07, "loss": 0.2554, "step": 24970 }, { "epoch": 86.73, "learning_rate": 5.417667844522968e-07, "loss": 0.2534, "step": 24980 }, { "epoch": 86.77, "learning_rate": 5.403533568904593e-07, "loss": 0.2392, "step": 24990 }, { "epoch": 86.8, "learning_rate": 5.389399293286218e-07, "loss": 0.27, "step": 25000 }, { "epoch": 86.84, "learning_rate": 5.375265017667843e-07, "loss": 0.2516, "step": 25010 }, { "epoch": 86.87, "learning_rate": 5.36113074204947e-07, "loss": 0.2701, "step": 25020 }, { "epoch": 86.91, "learning_rate": 5.346996466431095e-07, "loss": 0.2528, "step": 25030 }, { "epoch": 86.94, "learning_rate": 5.33286219081272e-07, "loss": 0.2286, "step": 25040 }, { "epoch": 86.98, "learning_rate": 5.318727915194346e-07, "loss": 0.2719, "step": 25050 }, { "epoch": 87.0, "eval_loss": 0.5086585283279419, "eval_runtime": 134.1212, "eval_samples_per_second": 3.967, "eval_steps_per_second": 0.992, "eval_wer": 0.19753165777463522, "step": 25056 }, { "epoch": 87.01, "learning_rate": 5.304593639575971e-07, "loss": 0.2532, "step": 25060 }, { "epoch": 87.05, "learning_rate": 5.290459363957596e-07, "loss": 0.2514, "step": 25070 }, { "epoch": 87.08, "learning_rate": 5.276325088339222e-07, "loss": 0.2552, "step": 25080 }, { "epoch": 87.12, "learning_rate": 5.262190812720848e-07, "loss": 0.265, "step": 25090 }, { "epoch": 87.15, "learning_rate": 5.248056537102473e-07, "loss": 0.2704, "step": 25100 }, { "epoch": 87.19, "learning_rate": 5.233922261484098e-07, "loss": 0.2557, "step": 25110 }, { "epoch": 87.22, "learning_rate": 5.219787985865724e-07, "loss": 0.2781, "step": 25120 }, { "epoch": 87.26, "learning_rate": 5.20565371024735e-07, "loss": 0.2355, "step": 25130 }, { "epoch": 87.29, "learning_rate": 5.191519434628975e-07, "loss": 0.2728, "step": 25140 }, { "epoch": 87.33, "learning_rate": 5.177385159010601e-07, "loss": 0.2635, "step": 25150 }, { "epoch": 87.36, "learning_rate": 5.163250883392226e-07, "loss": 0.2442, "step": 25160 }, { "epoch": 87.39, "learning_rate": 5.149116607773851e-07, "loss": 0.2409, "step": 25170 }, { "epoch": 87.43, "learning_rate": 5.134982332155476e-07, "loss": 0.2497, "step": 25180 }, { "epoch": 87.46, "learning_rate": 5.120848056537103e-07, "loss": 0.263, "step": 25190 }, { "epoch": 87.5, "learning_rate": 5.106713780918728e-07, "loss": 0.2511, "step": 25200 }, { "epoch": 87.53, "learning_rate": 5.092579505300353e-07, "loss": 0.2522, "step": 25210 }, { "epoch": 87.57, "learning_rate": 5.078445229681979e-07, "loss": 0.2686, "step": 25220 }, { "epoch": 87.6, "learning_rate": 5.064310954063604e-07, "loss": 0.2407, "step": 25230 }, { "epoch": 87.64, "learning_rate": 5.050176678445229e-07, "loss": 0.228, "step": 25240 }, { "epoch": 87.67, "learning_rate": 5.036042402826855e-07, "loss": 0.2763, "step": 25250 }, { "epoch": 87.71, "learning_rate": 5.021908127208481e-07, "loss": 0.2378, "step": 25260 }, { "epoch": 87.74, "learning_rate": 5.007773851590106e-07, "loss": 0.2532, "step": 25270 }, { "epoch": 87.78, "learning_rate": 4.993639575971731e-07, "loss": 0.2431, "step": 25280 }, { "epoch": 87.81, "learning_rate": 4.979505300353356e-07, "loss": 0.2216, "step": 25290 }, { "epoch": 87.85, "learning_rate": 4.965371024734982e-07, "loss": 0.2579, "step": 25300 }, { "epoch": 87.88, "learning_rate": 4.951236749116608e-07, "loss": 0.2501, "step": 25310 }, { "epoch": 87.91, "learning_rate": 4.937102473498233e-07, "loss": 0.2612, "step": 25320 }, { "epoch": 87.95, "learning_rate": 4.922968197879858e-07, "loss": 0.2665, "step": 25330 }, { "epoch": 87.98, "learning_rate": 4.908833922261484e-07, "loss": 0.269, "step": 25340 }, { "epoch": 88.0, "eval_loss": 0.5126340389251709, "eval_runtime": 134.1929, "eval_samples_per_second": 3.964, "eval_steps_per_second": 0.991, "eval_wer": 0.1965674615928521, "step": 25344 }, { "epoch": 88.02, "learning_rate": 4.894699646643109e-07, "loss": 0.2832, "step": 25350 }, { "epoch": 88.06, "learning_rate": 4.880565371024734e-07, "loss": 0.2522, "step": 25360 }, { "epoch": 88.09, "learning_rate": 4.866431095406361e-07, "loss": 0.232, "step": 25370 }, { "epoch": 88.12, "learning_rate": 4.852296819787986e-07, "loss": 0.2669, "step": 25380 }, { "epoch": 88.16, "learning_rate": 4.838162544169611e-07, "loss": 0.2461, "step": 25390 }, { "epoch": 88.19, "learning_rate": 4.824028268551237e-07, "loss": 0.2498, "step": 25400 }, { "epoch": 88.23, "learning_rate": 4.809893992932862e-07, "loss": 0.2525, "step": 25410 }, { "epoch": 88.26, "learning_rate": 4.795759717314487e-07, "loss": 0.2603, "step": 25420 }, { "epoch": 88.3, "learning_rate": 4.781625441696113e-07, "loss": 0.2594, "step": 25430 }, { "epoch": 88.33, "learning_rate": 4.7674911660777383e-07, "loss": 0.2422, "step": 25440 }, { "epoch": 88.37, "learning_rate": 4.7533568904593634e-07, "loss": 0.2493, "step": 25450 }, { "epoch": 88.4, "learning_rate": 4.739222614840989e-07, "loss": 0.2786, "step": 25460 }, { "epoch": 88.44, "learning_rate": 4.725088339222615e-07, "loss": 0.2218, "step": 25470 }, { "epoch": 88.47, "learning_rate": 4.71095406360424e-07, "loss": 0.2634, "step": 25480 }, { "epoch": 88.51, "learning_rate": 4.6968197879858656e-07, "loss": 0.2572, "step": 25490 }, { "epoch": 88.54, "learning_rate": 4.682685512367491e-07, "loss": 0.249, "step": 25500 }, { "epoch": 88.57, "learning_rate": 4.6685512367491165e-07, "loss": 0.2547, "step": 25510 }, { "epoch": 88.61, "learning_rate": 4.654416961130742e-07, "loss": 0.2611, "step": 25520 }, { "epoch": 88.64, "learning_rate": 4.6402826855123673e-07, "loss": 0.2664, "step": 25530 }, { "epoch": 88.68, "learning_rate": 4.626148409893993e-07, "loss": 0.2758, "step": 25540 }, { "epoch": 88.71, "learning_rate": 4.612014134275618e-07, "loss": 0.2488, "step": 25550 }, { "epoch": 88.75, "learning_rate": 4.597879858657244e-07, "loss": 0.253, "step": 25560 }, { "epoch": 88.78, "learning_rate": 4.583745583038869e-07, "loss": 0.2381, "step": 25570 }, { "epoch": 88.82, "learning_rate": 4.5696113074204947e-07, "loss": 0.2643, "step": 25580 }, { "epoch": 88.85, "learning_rate": 4.5554770318021204e-07, "loss": 0.2523, "step": 25590 }, { "epoch": 88.89, "learning_rate": 4.5413427561837455e-07, "loss": 0.2507, "step": 25600 }, { "epoch": 88.92, "learning_rate": 4.527208480565371e-07, "loss": 0.2359, "step": 25610 }, { "epoch": 88.96, "learning_rate": 4.5130742049469963e-07, "loss": 0.2561, "step": 25620 }, { "epoch": 88.99, "learning_rate": 4.498939929328622e-07, "loss": 0.2863, "step": 25630 }, { "epoch": 89.0, "eval_loss": 0.5174065232276917, "eval_runtime": 135.3515, "eval_samples_per_second": 3.931, "eval_steps_per_second": 0.983, "eval_wer": 0.1965674615928521, "step": 25632 }, { "epoch": 89.03, "learning_rate": 4.4848056537102467e-07, "loss": 0.2527, "step": 25640 }, { "epoch": 89.06, "learning_rate": 4.4706713780918723e-07, "loss": 0.2613, "step": 25650 }, { "epoch": 89.1, "learning_rate": 4.456537102473498e-07, "loss": 0.2368, "step": 25660 }, { "epoch": 89.13, "learning_rate": 4.442402826855123e-07, "loss": 0.2653, "step": 25670 }, { "epoch": 89.17, "learning_rate": 4.428268551236749e-07, "loss": 0.2636, "step": 25680 }, { "epoch": 89.2, "learning_rate": 4.414134275618374e-07, "loss": 0.2154, "step": 25690 }, { "epoch": 89.24, "learning_rate": 4.3999999999999997e-07, "loss": 0.2606, "step": 25700 }, { "epoch": 89.27, "learning_rate": 4.3858657243816254e-07, "loss": 0.2416, "step": 25710 }, { "epoch": 89.3, "learning_rate": 4.3717314487632505e-07, "loss": 0.2521, "step": 25720 }, { "epoch": 89.34, "learning_rate": 4.357597173144876e-07, "loss": 0.2642, "step": 25730 }, { "epoch": 89.37, "learning_rate": 4.3434628975265014e-07, "loss": 0.247, "step": 25740 }, { "epoch": 89.41, "learning_rate": 4.329328621908127e-07, "loss": 0.2563, "step": 25750 }, { "epoch": 89.44, "learning_rate": 4.315194346289752e-07, "loss": 0.2376, "step": 25760 }, { "epoch": 89.48, "learning_rate": 4.301060070671378e-07, "loss": 0.2545, "step": 25770 }, { "epoch": 89.51, "learning_rate": 4.2869257950530036e-07, "loss": 0.2652, "step": 25780 }, { "epoch": 89.55, "learning_rate": 4.2727915194346287e-07, "loss": 0.2539, "step": 25790 }, { "epoch": 89.58, "learning_rate": 4.2586572438162544e-07, "loss": 0.2437, "step": 25800 }, { "epoch": 89.62, "learning_rate": 4.2445229681978796e-07, "loss": 0.2495, "step": 25810 }, { "epoch": 89.65, "learning_rate": 4.230388692579505e-07, "loss": 0.2779, "step": 25820 }, { "epoch": 89.69, "learning_rate": 4.216254416961131e-07, "loss": 0.271, "step": 25830 }, { "epoch": 89.72, "learning_rate": 4.202120141342756e-07, "loss": 0.2341, "step": 25840 }, { "epoch": 89.75, "learning_rate": 4.187985865724382e-07, "loss": 0.2561, "step": 25850 }, { "epoch": 89.79, "learning_rate": 4.173851590106007e-07, "loss": 0.2337, "step": 25860 }, { "epoch": 89.82, "learning_rate": 4.1597173144876326e-07, "loss": 0.277, "step": 25870 }, { "epoch": 89.86, "learning_rate": 4.145583038869258e-07, "loss": 0.2535, "step": 25880 }, { "epoch": 89.89, "learning_rate": 4.1314487632508834e-07, "loss": 0.2577, "step": 25890 }, { "epoch": 89.93, "learning_rate": 4.117314487632509e-07, "loss": 0.232, "step": 25900 }, { "epoch": 89.96, "learning_rate": 4.103180212014134e-07, "loss": 0.2724, "step": 25910 }, { "epoch": 90.0, "learning_rate": 4.0890459363957594e-07, "loss": 0.2581, "step": 25920 }, { "epoch": 90.0, "eval_loss": 0.5159129500389099, "eval_runtime": 134.2388, "eval_samples_per_second": 3.963, "eval_steps_per_second": 0.991, "eval_wer": 0.19688886032011313, "step": 25920 }, { "epoch": 90.03, "learning_rate": 4.0749116607773846e-07, "loss": 0.2464, "step": 25930 }, { "epoch": 90.07, "learning_rate": 4.0607773851590103e-07, "loss": 0.2409, "step": 25940 }, { "epoch": 90.1, "learning_rate": 4.0466431095406354e-07, "loss": 0.2413, "step": 25950 }, { "epoch": 90.14, "learning_rate": 4.032508833922261e-07, "loss": 0.271, "step": 25960 }, { "epoch": 90.17, "learning_rate": 4.018374558303887e-07, "loss": 0.2487, "step": 25970 }, { "epoch": 90.21, "learning_rate": 4.004240282685512e-07, "loss": 0.2356, "step": 25980 }, { "epoch": 90.24, "learning_rate": 3.9901060070671376e-07, "loss": 0.2434, "step": 25990 }, { "epoch": 90.28, "learning_rate": 3.975971731448763e-07, "loss": 0.2607, "step": 26000 }, { "epoch": 90.31, "learning_rate": 3.9618374558303885e-07, "loss": 0.2515, "step": 26010 }, { "epoch": 90.35, "learning_rate": 3.947703180212014e-07, "loss": 0.2596, "step": 26020 }, { "epoch": 90.38, "learning_rate": 3.9335689045936393e-07, "loss": 0.2541, "step": 26030 }, { "epoch": 90.42, "learning_rate": 3.919434628975265e-07, "loss": 0.2471, "step": 26040 }, { "epoch": 90.45, "learning_rate": 3.90530035335689e-07, "loss": 0.2417, "step": 26050 }, { "epoch": 90.48, "learning_rate": 3.891166077738516e-07, "loss": 0.2659, "step": 26060 }, { "epoch": 90.52, "learning_rate": 3.877031802120141e-07, "loss": 0.2496, "step": 26070 }, { "epoch": 90.55, "learning_rate": 3.8628975265017667e-07, "loss": 0.2371, "step": 26080 }, { "epoch": 90.59, "learning_rate": 3.8487632508833924e-07, "loss": 0.2709, "step": 26090 }, { "epoch": 90.62, "learning_rate": 3.8346289752650175e-07, "loss": 0.238, "step": 26100 }, { "epoch": 90.66, "learning_rate": 3.820494699646643e-07, "loss": 0.2642, "step": 26110 }, { "epoch": 90.69, "learning_rate": 3.8063604240282683e-07, "loss": 0.2699, "step": 26120 }, { "epoch": 90.73, "learning_rate": 3.792226148409894e-07, "loss": 0.2729, "step": 26130 }, { "epoch": 90.76, "learning_rate": 3.7780918727915197e-07, "loss": 0.2473, "step": 26140 }, { "epoch": 90.8, "learning_rate": 3.763957597173145e-07, "loss": 0.27, "step": 26150 }, { "epoch": 90.83, "learning_rate": 3.7498233215547706e-07, "loss": 0.267, "step": 26160 }, { "epoch": 90.87, "learning_rate": 3.7356890459363957e-07, "loss": 0.2617, "step": 26170 }, { "epoch": 90.9, "learning_rate": 3.721554770318021e-07, "loss": 0.2436, "step": 26180 }, { "epoch": 90.94, "learning_rate": 3.707420494699646e-07, "loss": 0.2425, "step": 26190 }, { "epoch": 90.97, "learning_rate": 3.6932862190812717e-07, "loss": 0.26, "step": 26200 }, { "epoch": 91.0, "eval_loss": 0.514625608921051, "eval_runtime": 135.1986, "eval_samples_per_second": 3.935, "eval_steps_per_second": 0.984, "eval_wer": 0.19688886032011313, "step": 26208 }, { "epoch": 91.01, "learning_rate": 3.6791519434628974e-07, "loss": 0.2532, "step": 26210 }, { "epoch": 91.04, "learning_rate": 3.6650176678445225e-07, "loss": 0.2408, "step": 26220 }, { "epoch": 91.08, "learning_rate": 3.650883392226148e-07, "loss": 0.2654, "step": 26230 }, { "epoch": 91.11, "learning_rate": 3.6367491166077734e-07, "loss": 0.2836, "step": 26240 }, { "epoch": 91.15, "learning_rate": 3.622614840989399e-07, "loss": 0.2472, "step": 26250 }, { "epoch": 91.18, "learning_rate": 3.608480565371024e-07, "loss": 0.2489, "step": 26260 }, { "epoch": 91.21, "learning_rate": 3.59434628975265e-07, "loss": 0.2713, "step": 26270 }, { "epoch": 91.25, "learning_rate": 3.5802120141342756e-07, "loss": 0.2338, "step": 26280 }, { "epoch": 91.28, "learning_rate": 3.566077738515901e-07, "loss": 0.2466, "step": 26290 }, { "epoch": 91.32, "learning_rate": 3.5519434628975264e-07, "loss": 0.2362, "step": 26300 }, { "epoch": 91.35, "learning_rate": 3.5378091872791516e-07, "loss": 0.2476, "step": 26310 }, { "epoch": 91.39, "learning_rate": 3.523674911660777e-07, "loss": 0.2393, "step": 26320 }, { "epoch": 91.42, "learning_rate": 3.509540636042403e-07, "loss": 0.2541, "step": 26330 }, { "epoch": 91.46, "learning_rate": 3.495406360424028e-07, "loss": 0.2439, "step": 26340 }, { "epoch": 91.49, "learning_rate": 3.481272084805654e-07, "loss": 0.2573, "step": 26350 }, { "epoch": 91.53, "learning_rate": 3.467137809187279e-07, "loss": 0.2586, "step": 26360 }, { "epoch": 91.56, "learning_rate": 3.4530035335689046e-07, "loss": 0.2369, "step": 26370 }, { "epoch": 91.6, "learning_rate": 3.43886925795053e-07, "loss": 0.2543, "step": 26380 }, { "epoch": 91.63, "learning_rate": 3.4247349823321555e-07, "loss": 0.2695, "step": 26390 }, { "epoch": 91.66, "learning_rate": 3.410600706713781e-07, "loss": 0.2457, "step": 26400 }, { "epoch": 91.7, "learning_rate": 3.3964664310954063e-07, "loss": 0.2456, "step": 26410 }, { "epoch": 91.73, "learning_rate": 3.382332155477032e-07, "loss": 0.2432, "step": 26420 }, { "epoch": 91.77, "learning_rate": 3.368197879858657e-07, "loss": 0.2264, "step": 26430 }, { "epoch": 91.8, "learning_rate": 3.354063604240283e-07, "loss": 0.242, "step": 26440 }, { "epoch": 91.84, "learning_rate": 3.3399293286219085e-07, "loss": 0.2651, "step": 26450 }, { "epoch": 91.87, "learning_rate": 3.325795053003533e-07, "loss": 0.2717, "step": 26460 }, { "epoch": 91.91, "learning_rate": 3.311660777385159e-07, "loss": 0.2417, "step": 26470 }, { "epoch": 91.94, "learning_rate": 3.297526501766784e-07, "loss": 0.2447, "step": 26480 }, { "epoch": 91.98, "learning_rate": 3.2833922261484096e-07, "loss": 0.2796, "step": 26490 }, { "epoch": 92.0, "eval_loss": 0.5150091648101807, "eval_runtime": 134.13, "eval_samples_per_second": 3.966, "eval_steps_per_second": 0.992, "eval_wer": 0.1965674615928521, "step": 26496 }, { "epoch": 92.01, "learning_rate": 3.269257950530035e-07, "loss": 0.2811, "step": 26500 }, { "epoch": 92.05, "learning_rate": 3.2551236749116605e-07, "loss": 0.2589, "step": 26510 }, { "epoch": 92.08, "learning_rate": 3.240989399293286e-07, "loss": 0.2453, "step": 26520 }, { "epoch": 92.12, "learning_rate": 3.2268551236749113e-07, "loss": 0.2482, "step": 26530 }, { "epoch": 92.15, "learning_rate": 3.212720848056537e-07, "loss": 0.2619, "step": 26540 }, { "epoch": 92.19, "learning_rate": 3.198586572438162e-07, "loss": 0.2415, "step": 26550 }, { "epoch": 92.22, "learning_rate": 3.184452296819788e-07, "loss": 0.2459, "step": 26560 }, { "epoch": 92.26, "learning_rate": 3.170318021201413e-07, "loss": 0.253, "step": 26570 }, { "epoch": 92.29, "learning_rate": 3.1561837455830387e-07, "loss": 0.2728, "step": 26580 }, { "epoch": 92.33, "learning_rate": 3.1420494699646644e-07, "loss": 0.255, "step": 26590 }, { "epoch": 92.36, "learning_rate": 3.1279151943462895e-07, "loss": 0.2464, "step": 26600 }, { "epoch": 92.39, "learning_rate": 3.113780918727915e-07, "loss": 0.24, "step": 26610 }, { "epoch": 92.43, "learning_rate": 3.0996466431095404e-07, "loss": 0.2343, "step": 26620 }, { "epoch": 92.46, "learning_rate": 3.085512367491166e-07, "loss": 0.245, "step": 26630 }, { "epoch": 92.5, "learning_rate": 3.0713780918727917e-07, "loss": 0.2556, "step": 26640 }, { "epoch": 92.53, "learning_rate": 3.057243816254417e-07, "loss": 0.2431, "step": 26650 }, { "epoch": 92.57, "learning_rate": 3.0431095406360426e-07, "loss": 0.2274, "step": 26660 }, { "epoch": 92.6, "learning_rate": 3.0289752650176677e-07, "loss": 0.254, "step": 26670 }, { "epoch": 92.64, "learning_rate": 3.0148409893992934e-07, "loss": 0.2559, "step": 26680 }, { "epoch": 92.67, "learning_rate": 3.0007067137809186e-07, "loss": 0.2563, "step": 26690 }, { "epoch": 92.71, "learning_rate": 2.986572438162544e-07, "loss": 0.2375, "step": 26700 }, { "epoch": 92.74, "learning_rate": 2.97243816254417e-07, "loss": 0.2797, "step": 26710 }, { "epoch": 92.78, "learning_rate": 2.9583038869257945e-07, "loss": 0.2366, "step": 26720 }, { "epoch": 92.81, "learning_rate": 2.94416961130742e-07, "loss": 0.2638, "step": 26730 }, { "epoch": 92.85, "learning_rate": 2.9300353356890454e-07, "loss": 0.2595, "step": 26740 }, { "epoch": 92.88, "learning_rate": 2.915901060070671e-07, "loss": 0.2488, "step": 26750 }, { "epoch": 92.91, "learning_rate": 2.901766784452297e-07, "loss": 0.2517, "step": 26760 }, { "epoch": 92.95, "learning_rate": 2.887632508833922e-07, "loss": 0.2589, "step": 26770 }, { "epoch": 92.98, "learning_rate": 2.8734982332155476e-07, "loss": 0.2723, "step": 26780 }, { "epoch": 93.0, "eval_loss": 0.5132827758789062, "eval_runtime": 134.2687, "eval_samples_per_second": 3.962, "eval_steps_per_second": 0.991, "eval_wer": 0.19708169955646976, "step": 26784 }, { "epoch": 93.02, "learning_rate": 2.859363957597173e-07, "loss": 0.2599, "step": 26790 }, { "epoch": 93.06, "learning_rate": 2.8452296819787984e-07, "loss": 0.2383, "step": 26800 }, { "epoch": 93.09, "learning_rate": 2.8310954063604236e-07, "loss": 0.2709, "step": 26810 }, { "epoch": 93.12, "learning_rate": 2.816961130742049e-07, "loss": 0.2514, "step": 26820 }, { "epoch": 93.16, "learning_rate": 2.802826855123675e-07, "loss": 0.2503, "step": 26830 }, { "epoch": 93.19, "learning_rate": 2.7886925795053e-07, "loss": 0.2455, "step": 26840 }, { "epoch": 93.23, "learning_rate": 2.774558303886926e-07, "loss": 0.2576, "step": 26850 }, { "epoch": 93.26, "learning_rate": 2.760424028268551e-07, "loss": 0.2415, "step": 26860 }, { "epoch": 93.3, "learning_rate": 2.7462897526501766e-07, "loss": 0.2765, "step": 26870 }, { "epoch": 93.33, "learning_rate": 2.7321554770318023e-07, "loss": 0.2527, "step": 26880 }, { "epoch": 93.37, "learning_rate": 2.7180212014134275e-07, "loss": 0.2404, "step": 26890 }, { "epoch": 93.4, "learning_rate": 2.703886925795053e-07, "loss": 0.2534, "step": 26900 }, { "epoch": 93.44, "learning_rate": 2.6897526501766783e-07, "loss": 0.2223, "step": 26910 }, { "epoch": 93.47, "learning_rate": 2.675618374558304e-07, "loss": 0.2735, "step": 26920 }, { "epoch": 93.51, "learning_rate": 2.661484098939929e-07, "loss": 0.2666, "step": 26930 }, { "epoch": 93.54, "learning_rate": 2.647349823321555e-07, "loss": 0.2513, "step": 26940 }, { "epoch": 93.57, "learning_rate": 2.6332155477031805e-07, "loss": 0.2531, "step": 26950 }, { "epoch": 93.61, "learning_rate": 2.6190812720848057e-07, "loss": 0.2438, "step": 26960 }, { "epoch": 93.64, "learning_rate": 2.6049469964664313e-07, "loss": 0.2672, "step": 26970 }, { "epoch": 93.68, "learning_rate": 2.5908127208480565e-07, "loss": 0.2743, "step": 26980 }, { "epoch": 93.71, "learning_rate": 2.576678445229682e-07, "loss": 0.2549, "step": 26990 }, { "epoch": 93.75, "learning_rate": 2.562544169611307e-07, "loss": 0.2564, "step": 27000 }, { "epoch": 93.78, "learning_rate": 2.5484098939929325e-07, "loss": 0.2593, "step": 27010 }, { "epoch": 93.82, "learning_rate": 2.534275618374558e-07, "loss": 0.2585, "step": 27020 }, { "epoch": 93.85, "learning_rate": 2.5201413427561833e-07, "loss": 0.2472, "step": 27030 }, { "epoch": 93.89, "learning_rate": 2.506007067137809e-07, "loss": 0.2225, "step": 27040 }, { "epoch": 93.92, "learning_rate": 2.4918727915194347e-07, "loss": 0.2766, "step": 27050 }, { "epoch": 93.96, "learning_rate": 2.47773851590106e-07, "loss": 0.2493, "step": 27060 }, { "epoch": 93.99, "learning_rate": 2.4636042402826855e-07, "loss": 0.249, "step": 27070 }, { "epoch": 94.0, "eval_loss": 0.509568452835083, "eval_runtime": 135.0584, "eval_samples_per_second": 3.939, "eval_steps_per_second": 0.985, "eval_wer": 0.19605322362923444, "step": 27072 }, { "epoch": 94.03, "learning_rate": 2.4494699646643107e-07, "loss": 0.2773, "step": 27080 }, { "epoch": 94.06, "learning_rate": 2.4353356890459364e-07, "loss": 0.2497, "step": 27090 }, { "epoch": 94.1, "learning_rate": 2.421201413427562e-07, "loss": 0.2476, "step": 27100 }, { "epoch": 94.13, "learning_rate": 2.407067137809187e-07, "loss": 0.268, "step": 27110 }, { "epoch": 94.17, "learning_rate": 2.392932862190813e-07, "loss": 0.2523, "step": 27120 }, { "epoch": 94.2, "learning_rate": 2.378798586572438e-07, "loss": 0.2356, "step": 27130 }, { "epoch": 94.24, "learning_rate": 2.3646643109540635e-07, "loss": 0.2633, "step": 27140 }, { "epoch": 94.27, "learning_rate": 2.350530035335689e-07, "loss": 0.2345, "step": 27150 }, { "epoch": 94.3, "learning_rate": 2.3363957597173146e-07, "loss": 0.2828, "step": 27160 }, { "epoch": 94.34, "learning_rate": 2.32226148409894e-07, "loss": 0.259, "step": 27170 }, { "epoch": 94.37, "learning_rate": 2.3081272084805654e-07, "loss": 0.2528, "step": 27180 }, { "epoch": 94.41, "learning_rate": 2.2939929328621908e-07, "loss": 0.2359, "step": 27190 }, { "epoch": 94.44, "learning_rate": 2.279858657243816e-07, "loss": 0.2267, "step": 27200 }, { "epoch": 94.48, "learning_rate": 2.2657243816254414e-07, "loss": 0.2596, "step": 27210 }, { "epoch": 94.51, "learning_rate": 2.251590106007067e-07, "loss": 0.259, "step": 27220 }, { "epoch": 94.55, "learning_rate": 2.2374558303886925e-07, "loss": 0.2455, "step": 27230 }, { "epoch": 94.58, "learning_rate": 2.223321554770318e-07, "loss": 0.268, "step": 27240 }, { "epoch": 94.62, "learning_rate": 2.2091872791519433e-07, "loss": 0.2472, "step": 27250 }, { "epoch": 94.65, "learning_rate": 2.1950530035335688e-07, "loss": 0.2573, "step": 27260 }, { "epoch": 94.69, "learning_rate": 2.1809187279151942e-07, "loss": 0.2845, "step": 27270 }, { "epoch": 94.72, "learning_rate": 2.1667844522968196e-07, "loss": 0.2401, "step": 27280 }, { "epoch": 94.75, "learning_rate": 2.1526501766784453e-07, "loss": 0.2497, "step": 27290 }, { "epoch": 94.79, "learning_rate": 2.1385159010600707e-07, "loss": 0.2693, "step": 27300 }, { "epoch": 94.82, "learning_rate": 2.124381625441696e-07, "loss": 0.2634, "step": 27310 }, { "epoch": 94.86, "learning_rate": 2.1102473498233215e-07, "loss": 0.2539, "step": 27320 }, { "epoch": 94.89, "learning_rate": 2.0961130742049467e-07, "loss": 0.2747, "step": 27330 }, { "epoch": 94.93, "learning_rate": 2.081978798586572e-07, "loss": 0.2487, "step": 27340 }, { "epoch": 94.96, "learning_rate": 2.0678445229681978e-07, "loss": 0.2491, "step": 27350 }, { "epoch": 95.0, "learning_rate": 2.0537102473498232e-07, "loss": 0.266, "step": 27360 }, { "epoch": 95.0, "eval_loss": 0.5116358399391174, "eval_runtime": 134.7906, "eval_samples_per_second": 3.947, "eval_steps_per_second": 0.987, "eval_wer": 0.19637462235649547, "step": 27360 }, { "epoch": 95.03, "learning_rate": 2.0395759717314486e-07, "loss": 0.2359, "step": 27370 }, { "epoch": 95.07, "learning_rate": 2.025441696113074e-07, "loss": 0.2421, "step": 27380 }, { "epoch": 95.1, "learning_rate": 2.0113074204946995e-07, "loss": 0.2358, "step": 27390 }, { "epoch": 95.14, "learning_rate": 1.997173144876325e-07, "loss": 0.2741, "step": 27400 }, { "epoch": 95.17, "learning_rate": 1.9830388692579506e-07, "loss": 0.2423, "step": 27410 }, { "epoch": 95.21, "learning_rate": 1.968904593639576e-07, "loss": 0.2617, "step": 27420 }, { "epoch": 95.24, "learning_rate": 1.9547703180212014e-07, "loss": 0.2387, "step": 27430 }, { "epoch": 95.28, "learning_rate": 1.9406360424028268e-07, "loss": 0.2223, "step": 27440 }, { "epoch": 95.31, "learning_rate": 1.9265017667844522e-07, "loss": 0.2613, "step": 27450 }, { "epoch": 95.35, "learning_rate": 1.9123674911660777e-07, "loss": 0.2723, "step": 27460 }, { "epoch": 95.38, "learning_rate": 1.898233215547703e-07, "loss": 0.2495, "step": 27470 }, { "epoch": 95.42, "learning_rate": 1.8840989399293285e-07, "loss": 0.2446, "step": 27480 }, { "epoch": 95.45, "learning_rate": 1.869964664310954e-07, "loss": 0.2454, "step": 27490 }, { "epoch": 95.48, "learning_rate": 1.8558303886925793e-07, "loss": 0.2713, "step": 27500 }, { "epoch": 95.52, "learning_rate": 1.8416961130742048e-07, "loss": 0.2616, "step": 27510 }, { "epoch": 95.55, "learning_rate": 1.8275618374558302e-07, "loss": 0.2538, "step": 27520 }, { "epoch": 95.59, "learning_rate": 1.8134275618374559e-07, "loss": 0.2452, "step": 27530 }, { "epoch": 95.62, "learning_rate": 1.7992932862190813e-07, "loss": 0.2413, "step": 27540 }, { "epoch": 95.66, "learning_rate": 1.7851590106007067e-07, "loss": 0.2753, "step": 27550 }, { "epoch": 95.69, "learning_rate": 1.771024734982332e-07, "loss": 0.2428, "step": 27560 }, { "epoch": 95.73, "learning_rate": 1.7568904593639575e-07, "loss": 0.2359, "step": 27570 }, { "epoch": 95.76, "learning_rate": 1.742756183745583e-07, "loss": 0.2472, "step": 27580 }, { "epoch": 95.8, "learning_rate": 1.7286219081272086e-07, "loss": 0.2241, "step": 27590 }, { "epoch": 95.83, "learning_rate": 1.714487632508834e-07, "loss": 0.2494, "step": 27600 }, { "epoch": 95.87, "learning_rate": 1.7003533568904592e-07, "loss": 0.2686, "step": 27610 }, { "epoch": 95.9, "learning_rate": 1.6862190812720846e-07, "loss": 0.2426, "step": 27620 }, { "epoch": 95.94, "learning_rate": 1.67208480565371e-07, "loss": 0.2698, "step": 27630 }, { "epoch": 95.97, "learning_rate": 1.6579505300353355e-07, "loss": 0.2683, "step": 27640 }, { "epoch": 96.0, "eval_loss": 0.5132885575294495, "eval_runtime": 135.195, "eval_samples_per_second": 3.935, "eval_steps_per_second": 0.984, "eval_wer": 0.1966960210837565, "step": 27648 }, { "epoch": 96.01, "learning_rate": 1.643816254416961e-07, "loss": 0.2756, "step": 27650 }, { "epoch": 96.04, "learning_rate": 1.6296819787985866e-07, "loss": 0.264, "step": 27660 }, { "epoch": 96.08, "learning_rate": 1.615547703180212e-07, "loss": 0.2275, "step": 27670 }, { "epoch": 96.11, "learning_rate": 1.6014134275618374e-07, "loss": 0.2498, "step": 27680 }, { "epoch": 96.15, "learning_rate": 1.5872791519434628e-07, "loss": 0.2453, "step": 27690 }, { "epoch": 96.18, "learning_rate": 1.5731448763250883e-07, "loss": 0.2527, "step": 27700 }, { "epoch": 96.21, "learning_rate": 1.5590106007067137e-07, "loss": 0.2548, "step": 27710 }, { "epoch": 96.25, "learning_rate": 1.5448763250883394e-07, "loss": 0.2589, "step": 27720 }, { "epoch": 96.28, "learning_rate": 1.5307420494699648e-07, "loss": 0.2361, "step": 27730 }, { "epoch": 96.32, "learning_rate": 1.51660777385159e-07, "loss": 0.2798, "step": 27740 }, { "epoch": 96.35, "learning_rate": 1.5024734982332153e-07, "loss": 0.2742, "step": 27750 }, { "epoch": 96.39, "learning_rate": 1.4883392226148408e-07, "loss": 0.2475, "step": 27760 }, { "epoch": 96.42, "learning_rate": 1.4742049469964662e-07, "loss": 0.237, "step": 27770 }, { "epoch": 96.46, "learning_rate": 1.4600706713780919e-07, "loss": 0.2548, "step": 27780 }, { "epoch": 96.49, "learning_rate": 1.4459363957597173e-07, "loss": 0.2458, "step": 27790 }, { "epoch": 96.53, "learning_rate": 1.4318021201413427e-07, "loss": 0.2448, "step": 27800 }, { "epoch": 96.56, "learning_rate": 1.417667844522968e-07, "loss": 0.2604, "step": 27810 }, { "epoch": 96.6, "learning_rate": 1.4035335689045935e-07, "loss": 0.252, "step": 27820 }, { "epoch": 96.63, "learning_rate": 1.389399293286219e-07, "loss": 0.2356, "step": 27830 }, { "epoch": 96.66, "learning_rate": 1.3752650176678446e-07, "loss": 0.2531, "step": 27840 }, { "epoch": 96.7, "learning_rate": 1.36113074204947e-07, "loss": 0.2657, "step": 27850 }, { "epoch": 96.73, "learning_rate": 1.3469964664310955e-07, "loss": 0.2601, "step": 27860 }, { "epoch": 96.77, "learning_rate": 1.332862190812721e-07, "loss": 0.2507, "step": 27870 }, { "epoch": 96.8, "learning_rate": 1.318727915194346e-07, "loss": 0.2657, "step": 27880 }, { "epoch": 96.84, "learning_rate": 1.3045936395759715e-07, "loss": 0.2588, "step": 27890 }, { "epoch": 96.87, "learning_rate": 1.2904593639575972e-07, "loss": 0.2474, "step": 27900 }, { "epoch": 96.91, "learning_rate": 1.2763250883392226e-07, "loss": 0.2616, "step": 27910 }, { "epoch": 96.94, "learning_rate": 1.262190812720848e-07, "loss": 0.2405, "step": 27920 }, { "epoch": 96.98, "learning_rate": 1.2480565371024734e-07, "loss": 0.2451, "step": 27930 }, { "epoch": 97.0, "eval_loss": 0.5141022205352783, "eval_runtime": 134.2101, "eval_samples_per_second": 3.964, "eval_steps_per_second": 0.991, "eval_wer": 0.19650318184739987, "step": 27936 }, { "epoch": 97.01, "learning_rate": 1.2339222614840988e-07, "loss": 0.2512, "step": 27940 }, { "epoch": 97.05, "learning_rate": 1.2197879858657243e-07, "loss": 0.2491, "step": 27950 }, { "epoch": 97.08, "learning_rate": 1.2056537102473497e-07, "loss": 0.2663, "step": 27960 }, { "epoch": 97.12, "learning_rate": 1.1915194346289752e-07, "loss": 0.2532, "step": 27970 }, { "epoch": 97.15, "learning_rate": 1.1773851590106006e-07, "loss": 0.263, "step": 27980 }, { "epoch": 97.19, "learning_rate": 1.163250883392226e-07, "loss": 0.2544, "step": 27990 }, { "epoch": 97.22, "learning_rate": 1.1491166077738515e-07, "loss": 0.2543, "step": 28000 }, { "epoch": 97.26, "learning_rate": 1.134982332155477e-07, "loss": 0.2582, "step": 28010 }, { "epoch": 97.29, "learning_rate": 1.1208480565371025e-07, "loss": 0.2577, "step": 28020 }, { "epoch": 97.33, "learning_rate": 1.1067137809187279e-07, "loss": 0.2445, "step": 28030 }, { "epoch": 97.36, "learning_rate": 1.0925795053003534e-07, "loss": 0.2692, "step": 28040 }, { "epoch": 97.39, "learning_rate": 1.0784452296819787e-07, "loss": 0.2461, "step": 28050 }, { "epoch": 97.43, "learning_rate": 1.0643109540636041e-07, "loss": 0.2136, "step": 28060 }, { "epoch": 97.46, "learning_rate": 1.0501766784452297e-07, "loss": 0.2604, "step": 28070 }, { "epoch": 97.5, "learning_rate": 1.0360424028268551e-07, "loss": 0.2517, "step": 28080 }, { "epoch": 97.53, "learning_rate": 1.0219081272084805e-07, "loss": 0.247, "step": 28090 }, { "epoch": 97.57, "learning_rate": 1.0077738515901061e-07, "loss": 0.2481, "step": 28100 }, { "epoch": 97.6, "learning_rate": 9.936395759717315e-08, "loss": 0.2215, "step": 28110 }, { "epoch": 97.64, "learning_rate": 9.795053003533568e-08, "loss": 0.2549, "step": 28120 }, { "epoch": 97.67, "learning_rate": 9.653710247349822e-08, "loss": 0.2656, "step": 28130 }, { "epoch": 97.71, "learning_rate": 9.512367491166077e-08, "loss": 0.2415, "step": 28140 }, { "epoch": 97.74, "learning_rate": 9.371024734982332e-08, "loss": 0.2388, "step": 28150 }, { "epoch": 97.78, "learning_rate": 9.229681978798586e-08, "loss": 0.2437, "step": 28160 }, { "epoch": 97.81, "learning_rate": 9.088339222614841e-08, "loss": 0.2621, "step": 28170 }, { "epoch": 97.85, "learning_rate": 8.946996466431094e-08, "loss": 0.2629, "step": 28180 }, { "epoch": 97.88, "learning_rate": 8.805653710247348e-08, "loss": 0.2346, "step": 28190 }, { "epoch": 97.91, "learning_rate": 8.664310954063604e-08, "loss": 0.2638, "step": 28200 }, { "epoch": 97.95, "learning_rate": 8.522968197879858e-08, "loss": 0.2465, "step": 28210 }, { "epoch": 97.98, "learning_rate": 8.381625441696112e-08, "loss": 0.2723, "step": 28220 }, { "epoch": 98.0, "eval_loss": 0.5122572779655457, "eval_runtime": 135.6766, "eval_samples_per_second": 3.921, "eval_steps_per_second": 0.98, "eval_wer": 0.19624606286559104, "step": 28224 }, { "epoch": 98.02, "learning_rate": 8.240282685512368e-08, "loss": 0.2508, "step": 28230 }, { "epoch": 98.06, "learning_rate": 8.098939929328622e-08, "loss": 0.2573, "step": 28240 }, { "epoch": 98.09, "learning_rate": 7.957597173144875e-08, "loss": 0.2363, "step": 28250 }, { "epoch": 98.12, "learning_rate": 7.81625441696113e-08, "loss": 0.2677, "step": 28260 }, { "epoch": 98.16, "learning_rate": 7.674911660777385e-08, "loss": 0.2611, "step": 28270 }, { "epoch": 98.19, "learning_rate": 7.533568904593639e-08, "loss": 0.2331, "step": 28280 }, { "epoch": 98.23, "learning_rate": 7.392226148409894e-08, "loss": 0.2688, "step": 28290 }, { "epoch": 98.26, "learning_rate": 7.250883392226148e-08, "loss": 0.2321, "step": 28300 }, { "epoch": 98.3, "learning_rate": 7.109540636042403e-08, "loss": 0.278, "step": 28310 }, { "epoch": 98.33, "learning_rate": 6.968197879858657e-08, "loss": 0.2502, "step": 28320 }, { "epoch": 98.37, "learning_rate": 6.826855123674911e-08, "loss": 0.2497, "step": 28330 }, { "epoch": 98.4, "learning_rate": 6.685512367491165e-08, "loss": 0.2593, "step": 28340 }, { "epoch": 98.44, "learning_rate": 6.544169611307421e-08, "loss": 0.25, "step": 28350 }, { "epoch": 98.47, "learning_rate": 6.402826855123675e-08, "loss": 0.2518, "step": 28360 }, { "epoch": 98.51, "learning_rate": 6.261484098939929e-08, "loss": 0.2586, "step": 28370 }, { "epoch": 98.54, "learning_rate": 6.120141342756183e-08, "loss": 0.2632, "step": 28380 }, { "epoch": 98.57, "learning_rate": 5.978798586572437e-08, "loss": 0.2588, "step": 28390 }, { "epoch": 98.61, "learning_rate": 5.837455830388692e-08, "loss": 0.2575, "step": 28400 }, { "epoch": 98.64, "learning_rate": 5.6961130742049465e-08, "loss": 0.2669, "step": 28410 }, { "epoch": 98.68, "learning_rate": 5.5547703180212014e-08, "loss": 0.2753, "step": 28420 }, { "epoch": 98.71, "learning_rate": 5.4134275618374555e-08, "loss": 0.2383, "step": 28430 }, { "epoch": 98.75, "learning_rate": 5.27208480565371e-08, "loss": 0.2534, "step": 28440 }, { "epoch": 98.78, "learning_rate": 5.1307420494699646e-08, "loss": 0.2444, "step": 28450 }, { "epoch": 98.82, "learning_rate": 4.989399293286219e-08, "loss": 0.2627, "step": 28460 }, { "epoch": 98.85, "learning_rate": 4.848056537102473e-08, "loss": 0.2374, "step": 28470 }, { "epoch": 98.89, "learning_rate": 4.706713780918728e-08, "loss": 0.2649, "step": 28480 }, { "epoch": 98.92, "learning_rate": 4.565371024734982e-08, "loss": 0.2567, "step": 28490 }, { "epoch": 98.96, "learning_rate": 4.424028268551237e-08, "loss": 0.251, "step": 28500 }, { "epoch": 98.99, "learning_rate": 4.282685512367491e-08, "loss": 0.2527, "step": 28510 }, { "epoch": 99.0, "eval_loss": 0.5119685530662537, "eval_runtime": 134.8373, "eval_samples_per_second": 3.945, "eval_steps_per_second": 0.986, "eval_wer": 0.1965674615928521, "step": 28512 }, { "epoch": 99.03, "learning_rate": 4.141342756183745e-08, "loss": 0.2849, "step": 28520 }, { "epoch": 99.06, "learning_rate": 4e-08, "loss": 0.2756, "step": 28530 }, { "epoch": 99.1, "learning_rate": 3.858657243816254e-08, "loss": 0.2378, "step": 28540 }, { "epoch": 99.13, "learning_rate": 3.7173144876325085e-08, "loss": 0.2709, "step": 28550 }, { "epoch": 99.17, "learning_rate": 3.575971731448763e-08, "loss": 0.2569, "step": 28560 }, { "epoch": 99.2, "learning_rate": 3.4346289752650175e-08, "loss": 0.2597, "step": 28570 }, { "epoch": 99.24, "learning_rate": 3.293286219081272e-08, "loss": 0.2418, "step": 28580 }, { "epoch": 99.27, "learning_rate": 3.1519434628975265e-08, "loss": 0.239, "step": 28590 }, { "epoch": 99.3, "learning_rate": 3.010600706713781e-08, "loss": 0.2535, "step": 28600 }, { "epoch": 99.34, "learning_rate": 2.8692579505300353e-08, "loss": 0.2642, "step": 28610 }, { "epoch": 99.37, "learning_rate": 2.7279151943462894e-08, "loss": 0.2302, "step": 28620 }, { "epoch": 99.41, "learning_rate": 2.5865724381625443e-08, "loss": 0.2619, "step": 28630 }, { "epoch": 99.44, "learning_rate": 2.4452296819787985e-08, "loss": 0.232, "step": 28640 }, { "epoch": 99.48, "learning_rate": 2.3038869257950527e-08, "loss": 0.2763, "step": 28650 }, { "epoch": 99.51, "learning_rate": 2.1625441696113075e-08, "loss": 0.2569, "step": 28660 }, { "epoch": 99.55, "learning_rate": 2.0212014134275617e-08, "loss": 0.2466, "step": 28670 }, { "epoch": 99.58, "learning_rate": 1.8798586572438162e-08, "loss": 0.2511, "step": 28680 }, { "epoch": 99.62, "learning_rate": 1.7385159010600704e-08, "loss": 0.2401, "step": 28690 }, { "epoch": 99.65, "learning_rate": 1.597173144876325e-08, "loss": 0.2573, "step": 28700 }, { "epoch": 99.69, "learning_rate": 1.4558303886925795e-08, "loss": 0.2663, "step": 28710 }, { "epoch": 99.72, "learning_rate": 1.314487632508834e-08, "loss": 0.2237, "step": 28720 }, { "epoch": 99.75, "learning_rate": 1.1731448763250882e-08, "loss": 0.2567, "step": 28730 }, { "epoch": 99.79, "learning_rate": 1.0318021201413427e-08, "loss": 0.2448, "step": 28740 }, { "epoch": 99.82, "learning_rate": 8.90459363957597e-09, "loss": 0.2673, "step": 28750 }, { "epoch": 99.86, "learning_rate": 7.491166077738516e-09, "loss": 0.2539, "step": 28760 }, { "epoch": 99.89, "learning_rate": 6.077738515901059e-09, "loss": 0.2329, "step": 28770 }, { "epoch": 99.93, "learning_rate": 4.6643109540636045e-09, "loss": 0.24, "step": 28780 }, { "epoch": 99.96, "learning_rate": 3.250883392226148e-09, "loss": 0.2402, "step": 28790 }, { "epoch": 100.0, "learning_rate": 1.8374558303886924e-09, "loss": 0.2604, "step": 28800 }, { "epoch": 100.0, "eval_loss": 0.5110756158828735, "eval_runtime": 135.2128, "eval_samples_per_second": 3.935, "eval_steps_per_second": 0.984, "eval_wer": 0.19605322362923444, "step": 28800 }, { "epoch": 100.0, "step": 28800, "total_flos": 2.718335465990856e+20, "train_loss": 0.26551002427107756, "train_runtime": 210411.5326, "train_samples_per_second": 2.194, "train_steps_per_second": 0.137 } ], "max_steps": 28800, "num_train_epochs": 100, "total_flos": 2.718335465990856e+20, "trial_name": null, "trial_params": null }