{ "best_metric": 32.33012890539655, "best_model_checkpoint": "whisper-small-mn-12/checkpoint-5000", "epoch": 26.343519494204426, "global_step": 25000, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.03, "learning_rate": 4.2000000000000006e-07, "loss": 4.8182, "step": 25 }, { "epoch": 0.05, "learning_rate": 9.200000000000001e-07, "loss": 3.6025, "step": 50 }, { "epoch": 0.08, "learning_rate": 1.42e-06, "loss": 2.8181, "step": 75 }, { "epoch": 0.11, "learning_rate": 1.9200000000000003e-06, "loss": 2.2375, "step": 100 }, { "epoch": 0.13, "learning_rate": 2.42e-06, "loss": 1.7575, "step": 125 }, { "epoch": 0.16, "learning_rate": 2.92e-06, "loss": 1.4302, "step": 150 }, { "epoch": 0.18, "learning_rate": 3.4200000000000007e-06, "loss": 1.2102, "step": 175 }, { "epoch": 0.21, "learning_rate": 3.920000000000001e-06, "loss": 1.0671, "step": 200 }, { "epoch": 0.24, "learning_rate": 4.42e-06, "loss": 0.9255, "step": 225 }, { "epoch": 0.26, "learning_rate": 4.92e-06, "loss": 0.8504, "step": 250 }, { "epoch": 0.29, "learning_rate": 5.420000000000001e-06, "loss": 0.7788, "step": 275 }, { "epoch": 0.32, "learning_rate": 5.92e-06, "loss": 0.7109, "step": 300 }, { "epoch": 0.34, "learning_rate": 6.42e-06, "loss": 0.6795, "step": 325 }, { "epoch": 0.37, "learning_rate": 6.92e-06, "loss": 0.6383, "step": 350 }, { "epoch": 0.4, "learning_rate": 7.420000000000001e-06, "loss": 0.6071, "step": 375 }, { "epoch": 0.42, "learning_rate": 7.92e-06, "loss": 0.5714, "step": 400 }, { "epoch": 0.45, "learning_rate": 8.42e-06, "loss": 0.5448, "step": 425 }, { "epoch": 0.47, "learning_rate": 8.920000000000001e-06, "loss": 0.5279, "step": 450 }, { "epoch": 0.5, "learning_rate": 9.42e-06, "loss": 0.502, "step": 475 }, { "epoch": 0.53, "learning_rate": 9.920000000000002e-06, "loss": 0.4805, "step": 500 }, { "epoch": 0.55, "learning_rate": 9.991428571428573e-06, "loss": 0.4473, "step": 525 }, { "epoch": 0.58, "learning_rate": 9.981224489795918e-06, "loss": 0.4452, "step": 550 }, { "epoch": 0.61, "learning_rate": 9.971020408163266e-06, "loss": 0.4317, "step": 575 }, { "epoch": 0.63, "learning_rate": 9.960816326530613e-06, "loss": 0.4213, "step": 600 }, { "epoch": 0.66, "learning_rate": 9.95061224489796e-06, "loss": 0.4045, "step": 625 }, { "epoch": 0.68, "learning_rate": 9.940408163265307e-06, "loss": 0.4063, "step": 650 }, { "epoch": 0.71, "learning_rate": 9.930204081632654e-06, "loss": 0.4023, "step": 675 }, { "epoch": 0.74, "learning_rate": 9.920000000000002e-06, "loss": 0.3893, "step": 700 }, { "epoch": 0.76, "learning_rate": 9.909795918367347e-06, "loss": 0.382, "step": 725 }, { "epoch": 0.79, "learning_rate": 9.899591836734695e-06, "loss": 0.3822, "step": 750 }, { "epoch": 0.82, "learning_rate": 9.88938775510204e-06, "loss": 0.3608, "step": 775 }, { "epoch": 0.84, "learning_rate": 9.87918367346939e-06, "loss": 0.3661, "step": 800 }, { "epoch": 0.87, "learning_rate": 9.868979591836736e-06, "loss": 0.3623, "step": 825 }, { "epoch": 0.9, "learning_rate": 9.858775510204083e-06, "loss": 0.3527, "step": 850 }, { "epoch": 0.92, "learning_rate": 9.848571428571429e-06, "loss": 0.3541, "step": 875 }, { "epoch": 0.95, "learning_rate": 9.838367346938776e-06, "loss": 0.3376, "step": 900 }, { "epoch": 0.97, "learning_rate": 9.828163265306124e-06, "loss": 0.3309, "step": 925 }, { "epoch": 1.0, "learning_rate": 9.81795918367347e-06, "loss": 0.3311, "step": 950 }, { "epoch": 1.03, "learning_rate": 9.807755102040817e-06, "loss": 0.3086, "step": 975 }, { "epoch": 1.05, "learning_rate": 9.797551020408163e-06, "loss": 0.3012, "step": 1000 }, { "epoch": 1.05, "eval_cer": 17.673927151105712, "eval_loss": 0.3748841881752014, "eval_runtime": 564.5983, "eval_samples_per_second": 0.737, "eval_steps_per_second": 0.023, "eval_wer": 43.23792877430632, "step": 1000 }, { "epoch": 1.08, "learning_rate": 9.78734693877551e-06, "loss": 0.3029, "step": 1025 }, { "epoch": 1.11, "learning_rate": 9.777142857142858e-06, "loss": 0.2934, "step": 1050 }, { "epoch": 1.13, "learning_rate": 9.766938775510205e-06, "loss": 0.2973, "step": 1075 }, { "epoch": 1.16, "learning_rate": 9.756734693877551e-06, "loss": 0.2965, "step": 1100 }, { "epoch": 1.19, "learning_rate": 9.746530612244899e-06, "loss": 0.2958, "step": 1125 }, { "epoch": 1.21, "learning_rate": 9.736326530612246e-06, "loss": 0.2932, "step": 1150 }, { "epoch": 1.24, "learning_rate": 9.726122448979592e-06, "loss": 0.2983, "step": 1175 }, { "epoch": 1.26, "learning_rate": 9.71591836734694e-06, "loss": 0.2921, "step": 1200 }, { "epoch": 1.29, "learning_rate": 9.705714285714287e-06, "loss": 0.2883, "step": 1225 }, { "epoch": 1.32, "learning_rate": 9.695510204081633e-06, "loss": 0.2841, "step": 1250 }, { "epoch": 1.34, "learning_rate": 9.68530612244898e-06, "loss": 0.2758, "step": 1275 }, { "epoch": 1.37, "learning_rate": 9.675102040816328e-06, "loss": 0.2802, "step": 1300 }, { "epoch": 1.4, "learning_rate": 9.664897959183675e-06, "loss": 0.2751, "step": 1325 }, { "epoch": 1.42, "learning_rate": 9.654693877551021e-06, "loss": 0.2803, "step": 1350 }, { "epoch": 1.45, "learning_rate": 9.644489795918368e-06, "loss": 0.2833, "step": 1375 }, { "epoch": 1.48, "learning_rate": 9.634285714285714e-06, "loss": 0.2714, "step": 1400 }, { "epoch": 1.5, "learning_rate": 9.624081632653062e-06, "loss": 0.2795, "step": 1425 }, { "epoch": 1.53, "learning_rate": 9.61387755102041e-06, "loss": 0.2738, "step": 1450 }, { "epoch": 1.55, "learning_rate": 9.603673469387755e-06, "loss": 0.267, "step": 1475 }, { "epoch": 1.58, "learning_rate": 9.593469387755102e-06, "loss": 0.2659, "step": 1500 }, { "epoch": 1.61, "learning_rate": 9.58326530612245e-06, "loss": 0.2688, "step": 1525 }, { "epoch": 1.63, "learning_rate": 9.573061224489797e-06, "loss": 0.2642, "step": 1550 }, { "epoch": 1.66, "learning_rate": 9.562857142857143e-06, "loss": 0.262, "step": 1575 }, { "epoch": 1.69, "learning_rate": 9.55265306122449e-06, "loss": 0.2639, "step": 1600 }, { "epoch": 1.71, "learning_rate": 9.542448979591837e-06, "loss": 0.2665, "step": 1625 }, { "epoch": 1.74, "learning_rate": 9.532244897959184e-06, "loss": 0.2548, "step": 1650 }, { "epoch": 1.77, "learning_rate": 9.522040816326532e-06, "loss": 0.2637, "step": 1675 }, { "epoch": 1.79, "learning_rate": 9.511836734693877e-06, "loss": 0.2569, "step": 1700 }, { "epoch": 1.82, "learning_rate": 9.501632653061226e-06, "loss": 0.258, "step": 1725 }, { "epoch": 1.84, "learning_rate": 9.491428571428572e-06, "loss": 0.2532, "step": 1750 }, { "epoch": 1.87, "learning_rate": 9.48122448979592e-06, "loss": 0.2519, "step": 1775 }, { "epoch": 1.9, "learning_rate": 9.471020408163266e-06, "loss": 0.2532, "step": 1800 }, { "epoch": 1.92, "learning_rate": 9.460816326530613e-06, "loss": 0.258, "step": 1825 }, { "epoch": 1.95, "learning_rate": 9.45061224489796e-06, "loss": 0.2572, "step": 1850 }, { "epoch": 1.98, "learning_rate": 9.440408163265306e-06, "loss": 0.2594, "step": 1875 }, { "epoch": 2.0, "learning_rate": 9.430204081632654e-06, "loss": 0.2473, "step": 1900 }, { "epoch": 2.03, "learning_rate": 9.42e-06, "loss": 0.2181, "step": 1925 }, { "epoch": 2.05, "learning_rate": 9.409795918367349e-06, "loss": 0.2157, "step": 1950 }, { "epoch": 2.08, "learning_rate": 9.399591836734695e-06, "loss": 0.2112, "step": 1975 }, { "epoch": 2.11, "learning_rate": 9.389387755102042e-06, "loss": 0.2171, "step": 2000 }, { "epoch": 2.11, "eval_cer": 15.202921942859044, "eval_loss": 0.30115559697151184, "eval_runtime": 563.7553, "eval_samples_per_second": 0.738, "eval_steps_per_second": 0.023, "eval_wer": 36.743500109241864, "step": 2000 }, { "epoch": 2.13, "learning_rate": 9.379183673469388e-06, "loss": 0.2155, "step": 2025 }, { "epoch": 2.16, "learning_rate": 9.368979591836735e-06, "loss": 0.2168, "step": 2050 }, { "epoch": 2.19, "learning_rate": 9.358775510204083e-06, "loss": 0.2145, "step": 2075 }, { "epoch": 2.21, "learning_rate": 9.348571428571429e-06, "loss": 0.2144, "step": 2100 }, { "epoch": 2.24, "learning_rate": 9.338367346938776e-06, "loss": 0.2123, "step": 2125 }, { "epoch": 2.27, "learning_rate": 9.328163265306122e-06, "loss": 0.2209, "step": 2150 }, { "epoch": 2.29, "learning_rate": 9.317959183673471e-06, "loss": 0.2082, "step": 2175 }, { "epoch": 2.32, "learning_rate": 9.307755102040817e-06, "loss": 0.2076, "step": 2200 }, { "epoch": 2.34, "learning_rate": 9.297551020408164e-06, "loss": 0.2116, "step": 2225 }, { "epoch": 2.37, "learning_rate": 9.287346938775512e-06, "loss": 0.2053, "step": 2250 }, { "epoch": 2.4, "learning_rate": 9.277142857142858e-06, "loss": 0.2152, "step": 2275 }, { "epoch": 2.42, "learning_rate": 9.266938775510205e-06, "loss": 0.211, "step": 2300 }, { "epoch": 2.45, "learning_rate": 9.256734693877551e-06, "loss": 0.2136, "step": 2325 }, { "epoch": 2.48, "learning_rate": 9.246530612244898e-06, "loss": 0.2184, "step": 2350 }, { "epoch": 2.5, "learning_rate": 9.236326530612246e-06, "loss": 0.2045, "step": 2375 }, { "epoch": 2.53, "learning_rate": 9.226122448979593e-06, "loss": 0.214, "step": 2400 }, { "epoch": 2.56, "learning_rate": 9.215918367346939e-06, "loss": 0.211, "step": 2425 }, { "epoch": 2.58, "learning_rate": 9.205714285714287e-06, "loss": 0.2159, "step": 2450 }, { "epoch": 2.61, "learning_rate": 9.195510204081634e-06, "loss": 0.2185, "step": 2475 }, { "epoch": 2.63, "learning_rate": 9.18530612244898e-06, "loss": 0.2119, "step": 2500 }, { "epoch": 2.66, "learning_rate": 9.175102040816327e-06, "loss": 0.2108, "step": 2525 }, { "epoch": 2.69, "learning_rate": 9.164897959183673e-06, "loss": 0.215, "step": 2550 }, { "epoch": 2.71, "learning_rate": 9.15469387755102e-06, "loss": 0.2119, "step": 2575 }, { "epoch": 2.74, "learning_rate": 9.144489795918368e-06, "loss": 0.2169, "step": 2600 }, { "epoch": 2.77, "learning_rate": 9.134285714285716e-06, "loss": 0.2131, "step": 2625 }, { "epoch": 2.79, "learning_rate": 9.124081632653063e-06, "loss": 0.2124, "step": 2650 }, { "epoch": 2.82, "learning_rate": 9.113877551020409e-06, "loss": 0.2052, "step": 2675 }, { "epoch": 2.85, "learning_rate": 9.103673469387756e-06, "loss": 0.2102, "step": 2700 }, { "epoch": 2.87, "learning_rate": 9.093469387755102e-06, "loss": 0.2112, "step": 2725 }, { "epoch": 2.9, "learning_rate": 9.08326530612245e-06, "loss": 0.2108, "step": 2750 }, { "epoch": 2.92, "learning_rate": 9.073061224489797e-06, "loss": 0.2087, "step": 2775 }, { "epoch": 2.95, "learning_rate": 9.062857142857143e-06, "loss": 0.2087, "step": 2800 }, { "epoch": 2.98, "learning_rate": 9.05265306122449e-06, "loss": 0.2018, "step": 2825 }, { "epoch": 3.0, "learning_rate": 9.042448979591838e-06, "loss": 0.1943, "step": 2850 }, { "epoch": 3.03, "learning_rate": 9.032244897959185e-06, "loss": 0.1703, "step": 2875 }, { "epoch": 3.06, "learning_rate": 9.022040816326531e-06, "loss": 0.1695, "step": 2900 }, { "epoch": 3.08, "learning_rate": 9.011836734693879e-06, "loss": 0.179, "step": 2925 }, { "epoch": 3.11, "learning_rate": 9.001632653061224e-06, "loss": 0.1776, "step": 2950 }, { "epoch": 3.13, "learning_rate": 8.991428571428572e-06, "loss": 0.1765, "step": 2975 }, { "epoch": 3.16, "learning_rate": 8.98122448979592e-06, "loss": 0.1732, "step": 3000 }, { "epoch": 3.16, "eval_cer": 13.756094314192055, "eval_loss": 0.28230398893356323, "eval_runtime": 563.7636, "eval_samples_per_second": 0.738, "eval_steps_per_second": 0.023, "eval_wer": 33.42254752020975, "step": 3000 }, { "epoch": 3.19, "learning_rate": 8.971020408163265e-06, "loss": 0.1757, "step": 3025 }, { "epoch": 3.21, "learning_rate": 8.960816326530613e-06, "loss": 0.1745, "step": 3050 }, { "epoch": 3.24, "learning_rate": 8.95061224489796e-06, "loss": 0.1728, "step": 3075 }, { "epoch": 3.27, "learning_rate": 8.940408163265308e-06, "loss": 0.1706, "step": 3100 }, { "epoch": 3.29, "learning_rate": 8.930204081632654e-06, "loss": 0.1754, "step": 3125 }, { "epoch": 3.32, "learning_rate": 8.920000000000001e-06, "loss": 0.1721, "step": 3150 }, { "epoch": 3.35, "learning_rate": 8.909795918367348e-06, "loss": 0.1738, "step": 3175 }, { "epoch": 3.37, "learning_rate": 8.899591836734694e-06, "loss": 0.1722, "step": 3200 }, { "epoch": 3.4, "learning_rate": 8.889387755102042e-06, "loss": 0.1789, "step": 3225 }, { "epoch": 3.42, "learning_rate": 8.879183673469388e-06, "loss": 0.1811, "step": 3250 }, { "epoch": 3.45, "learning_rate": 8.868979591836735e-06, "loss": 0.1759, "step": 3275 }, { "epoch": 3.48, "learning_rate": 8.858775510204083e-06, "loss": 0.1762, "step": 3300 }, { "epoch": 3.5, "learning_rate": 8.84857142857143e-06, "loss": 0.1723, "step": 3325 }, { "epoch": 3.53, "learning_rate": 8.838367346938776e-06, "loss": 0.168, "step": 3350 }, { "epoch": 3.56, "learning_rate": 8.828163265306123e-06, "loss": 0.1761, "step": 3375 }, { "epoch": 3.58, "learning_rate": 8.81795918367347e-06, "loss": 0.1686, "step": 3400 }, { "epoch": 3.61, "learning_rate": 8.807755102040817e-06, "loss": 0.1714, "step": 3425 }, { "epoch": 3.64, "learning_rate": 8.797551020408164e-06, "loss": 0.17, "step": 3450 }, { "epoch": 3.66, "learning_rate": 8.78734693877551e-06, "loss": 0.1742, "step": 3475 }, { "epoch": 3.69, "learning_rate": 8.777142857142857e-06, "loss": 0.1703, "step": 3500 }, { "epoch": 3.71, "learning_rate": 8.766938775510205e-06, "loss": 0.1718, "step": 3525 }, { "epoch": 3.74, "learning_rate": 8.756734693877552e-06, "loss": 0.1701, "step": 3550 }, { "epoch": 3.77, "learning_rate": 8.7465306122449e-06, "loss": 0.1806, "step": 3575 }, { "epoch": 3.79, "learning_rate": 8.736326530612246e-06, "loss": 0.1728, "step": 3600 }, { "epoch": 3.82, "learning_rate": 8.726122448979593e-06, "loss": 0.1723, "step": 3625 }, { "epoch": 3.85, "learning_rate": 8.715918367346939e-06, "loss": 0.1777, "step": 3650 }, { "epoch": 3.87, "learning_rate": 8.705714285714286e-06, "loss": 0.1698, "step": 3675 }, { "epoch": 3.9, "learning_rate": 8.695510204081634e-06, "loss": 0.1696, "step": 3700 }, { "epoch": 3.93, "learning_rate": 8.68530612244898e-06, "loss": 0.1754, "step": 3725 }, { "epoch": 3.95, "learning_rate": 8.675102040816327e-06, "loss": 0.1689, "step": 3750 }, { "epoch": 3.98, "learning_rate": 8.664897959183675e-06, "loss": 0.1723, "step": 3775 }, { "epoch": 4.0, "learning_rate": 8.654693877551022e-06, "loss": 0.1701, "step": 3800 }, { "epoch": 4.03, "learning_rate": 8.644489795918368e-06, "loss": 0.1364, "step": 3825 }, { "epoch": 4.06, "learning_rate": 8.634285714285715e-06, "loss": 0.1422, "step": 3850 }, { "epoch": 4.08, "learning_rate": 8.624081632653061e-06, "loss": 0.1436, "step": 3875 }, { "epoch": 4.11, "learning_rate": 8.613877551020409e-06, "loss": 0.1381, "step": 3900 }, { "epoch": 4.14, "learning_rate": 8.603673469387756e-06, "loss": 0.1364, "step": 3925 }, { "epoch": 4.16, "learning_rate": 8.593469387755102e-06, "loss": 0.1338, "step": 3950 }, { "epoch": 4.19, "learning_rate": 8.58326530612245e-06, "loss": 0.1377, "step": 3975 }, { "epoch": 4.21, "learning_rate": 8.573061224489797e-06, "loss": 0.145, "step": 4000 }, { "epoch": 4.21, "eval_cer": 13.243589530259413, "eval_loss": 0.28217431902885437, "eval_runtime": 565.0992, "eval_samples_per_second": 0.736, "eval_steps_per_second": 0.023, "eval_wer": 32.4994537906926, "step": 4000 }, { "epoch": 4.24, "learning_rate": 8.562857142857144e-06, "loss": 0.1409, "step": 4025 }, { "epoch": 4.27, "learning_rate": 8.55265306122449e-06, "loss": 0.1412, "step": 4050 }, { "epoch": 4.29, "learning_rate": 8.542448979591838e-06, "loss": 0.1428, "step": 4075 }, { "epoch": 4.32, "learning_rate": 8.532244897959185e-06, "loss": 0.139, "step": 4100 }, { "epoch": 4.35, "learning_rate": 8.522040816326531e-06, "loss": 0.1419, "step": 4125 }, { "epoch": 4.37, "learning_rate": 8.511836734693878e-06, "loss": 0.1413, "step": 4150 }, { "epoch": 4.4, "learning_rate": 8.501632653061224e-06, "loss": 0.1334, "step": 4175 }, { "epoch": 4.43, "learning_rate": 8.491428571428572e-06, "loss": 0.1397, "step": 4200 }, { "epoch": 4.45, "learning_rate": 8.48122448979592e-06, "loss": 0.1477, "step": 4225 }, { "epoch": 4.48, "learning_rate": 8.471020408163267e-06, "loss": 0.1444, "step": 4250 }, { "epoch": 4.5, "learning_rate": 8.460816326530612e-06, "loss": 0.1398, "step": 4275 }, { "epoch": 4.53, "learning_rate": 8.45061224489796e-06, "loss": 0.15, "step": 4300 }, { "epoch": 4.56, "learning_rate": 8.440408163265307e-06, "loss": 0.1461, "step": 4325 }, { "epoch": 4.58, "learning_rate": 8.430204081632653e-06, "loss": 0.1387, "step": 4350 }, { "epoch": 4.61, "learning_rate": 8.42e-06, "loss": 0.1455, "step": 4375 }, { "epoch": 4.64, "learning_rate": 8.409795918367346e-06, "loss": 0.1388, "step": 4400 }, { "epoch": 4.66, "learning_rate": 8.399591836734694e-06, "loss": 0.1437, "step": 4425 }, { "epoch": 4.69, "learning_rate": 8.389387755102041e-06, "loss": 0.1452, "step": 4450 }, { "epoch": 4.72, "learning_rate": 8.379183673469389e-06, "loss": 0.1475, "step": 4475 }, { "epoch": 4.74, "learning_rate": 8.368979591836735e-06, "loss": 0.1495, "step": 4500 }, { "epoch": 4.77, "learning_rate": 8.358775510204082e-06, "loss": 0.148, "step": 4525 }, { "epoch": 4.79, "learning_rate": 8.34857142857143e-06, "loss": 0.1438, "step": 4550 }, { "epoch": 4.82, "learning_rate": 8.338367346938776e-06, "loss": 0.1437, "step": 4575 }, { "epoch": 4.85, "learning_rate": 8.328163265306123e-06, "loss": 0.1389, "step": 4600 }, { "epoch": 4.87, "learning_rate": 8.31795918367347e-06, "loss": 0.1496, "step": 4625 }, { "epoch": 4.9, "learning_rate": 8.307755102040816e-06, "loss": 0.1451, "step": 4650 }, { "epoch": 4.93, "learning_rate": 8.297551020408164e-06, "loss": 0.1442, "step": 4675 }, { "epoch": 4.95, "learning_rate": 8.287346938775511e-06, "loss": 0.1546, "step": 4700 }, { "epoch": 4.98, "learning_rate": 8.277142857142859e-06, "loss": 0.1442, "step": 4725 }, { "epoch": 5.01, "learning_rate": 8.266938775510205e-06, "loss": 0.1429, "step": 4750 }, { "epoch": 5.03, "learning_rate": 8.256734693877552e-06, "loss": 0.106, "step": 4775 }, { "epoch": 5.06, "learning_rate": 8.246530612244898e-06, "loss": 0.1083, "step": 4800 }, { "epoch": 5.08, "learning_rate": 8.236326530612245e-06, "loss": 0.1111, "step": 4825 }, { "epoch": 5.11, "learning_rate": 8.226122448979593e-06, "loss": 0.115, "step": 4850 }, { "epoch": 5.14, "learning_rate": 8.215918367346939e-06, "loss": 0.1118, "step": 4875 }, { "epoch": 5.16, "learning_rate": 8.205714285714286e-06, "loss": 0.1097, "step": 4900 }, { "epoch": 5.19, "learning_rate": 8.195510204081634e-06, "loss": 0.1201, "step": 4925 }, { "epoch": 5.22, "learning_rate": 8.185306122448981e-06, "loss": 0.1183, "step": 4950 }, { "epoch": 5.24, "learning_rate": 8.175102040816327e-06, "loss": 0.1106, "step": 4975 }, { "epoch": 5.27, "learning_rate": 8.164897959183674e-06, "loss": 0.1159, "step": 5000 }, { "epoch": 5.27, "eval_cer": 13.34925204253124, "eval_loss": 0.29488590359687805, "eval_runtime": 564.4303, "eval_samples_per_second": 0.737, "eval_steps_per_second": 0.023, "eval_wer": 32.33012890539655, "step": 5000 }, { "epoch": 5.3, "learning_rate": 8.15469387755102e-06, "loss": 0.1147, "step": 5025 }, { "epoch": 5.32, "learning_rate": 8.144489795918368e-06, "loss": 0.1186, "step": 5050 }, { "epoch": 5.35, "learning_rate": 8.134285714285715e-06, "loss": 0.1168, "step": 5075 }, { "epoch": 5.37, "learning_rate": 8.124081632653061e-06, "loss": 0.1132, "step": 5100 }, { "epoch": 5.4, "learning_rate": 8.11387755102041e-06, "loss": 0.1099, "step": 5125 }, { "epoch": 5.43, "learning_rate": 8.103673469387756e-06, "loss": 0.1157, "step": 5150 }, { "epoch": 5.45, "learning_rate": 8.093469387755103e-06, "loss": 0.1131, "step": 5175 }, { "epoch": 5.48, "learning_rate": 8.083265306122449e-06, "loss": 0.1167, "step": 5200 }, { "epoch": 5.51, "learning_rate": 8.073061224489797e-06, "loss": 0.1213, "step": 5225 }, { "epoch": 5.53, "learning_rate": 8.062857142857144e-06, "loss": 0.1182, "step": 5250 }, { "epoch": 5.56, "learning_rate": 8.05265306122449e-06, "loss": 0.116, "step": 5275 }, { "epoch": 5.58, "learning_rate": 8.042448979591837e-06, "loss": 0.1174, "step": 5300 }, { "epoch": 5.61, "learning_rate": 8.032244897959183e-06, "loss": 0.1201, "step": 5325 }, { "epoch": 5.64, "learning_rate": 8.022040816326532e-06, "loss": 0.1173, "step": 5350 }, { "epoch": 5.66, "learning_rate": 8.011836734693878e-06, "loss": 0.1131, "step": 5375 }, { "epoch": 5.69, "learning_rate": 8.001632653061226e-06, "loss": 0.1242, "step": 5400 }, { "epoch": 5.72, "learning_rate": 7.991428571428571e-06, "loss": 0.1171, "step": 5425 }, { "epoch": 5.74, "learning_rate": 7.981224489795919e-06, "loss": 0.1193, "step": 5450 }, { "epoch": 5.77, "learning_rate": 7.971020408163266e-06, "loss": 0.1122, "step": 5475 }, { "epoch": 5.8, "learning_rate": 7.960816326530612e-06, "loss": 0.1139, "step": 5500 }, { "epoch": 5.82, "learning_rate": 7.95061224489796e-06, "loss": 0.1185, "step": 5525 }, { "epoch": 5.85, "learning_rate": 7.940408163265307e-06, "loss": 0.1151, "step": 5550 }, { "epoch": 5.87, "learning_rate": 7.930204081632655e-06, "loss": 0.1179, "step": 5575 }, { "epoch": 5.9, "learning_rate": 7.92e-06, "loss": 0.1145, "step": 5600 }, { "epoch": 5.93, "learning_rate": 7.909795918367348e-06, "loss": 0.1166, "step": 5625 }, { "epoch": 5.95, "learning_rate": 7.899591836734695e-06, "loss": 0.1216, "step": 5650 }, { "epoch": 5.98, "learning_rate": 7.889387755102041e-06, "loss": 0.1182, "step": 5675 }, { "epoch": 6.01, "learning_rate": 7.879183673469389e-06, "loss": 0.1128, "step": 5700 }, { "epoch": 6.03, "learning_rate": 7.868979591836734e-06, "loss": 0.0898, "step": 5725 }, { "epoch": 6.06, "learning_rate": 7.858775510204082e-06, "loss": 0.0839, "step": 5750 }, { "epoch": 6.09, "learning_rate": 7.84857142857143e-06, "loss": 0.0866, "step": 5775 }, { "epoch": 6.11, "learning_rate": 7.838367346938777e-06, "loss": 0.0857, "step": 5800 }, { "epoch": 6.14, "learning_rate": 7.828163265306123e-06, "loss": 0.091, "step": 5825 }, { "epoch": 6.16, "learning_rate": 7.81795918367347e-06, "loss": 0.0874, "step": 5850 }, { "epoch": 6.19, "learning_rate": 7.807755102040818e-06, "loss": 0.085, "step": 5875 }, { "epoch": 6.22, "learning_rate": 7.797551020408163e-06, "loss": 0.0888, "step": 5900 }, { "epoch": 6.24, "learning_rate": 7.787346938775511e-06, "loss": 0.0903, "step": 5925 }, { "epoch": 6.27, "learning_rate": 7.777142857142857e-06, "loss": 0.0884, "step": 5950 }, { "epoch": 6.3, "learning_rate": 7.766938775510204e-06, "loss": 0.0913, "step": 5975 }, { "epoch": 6.32, "learning_rate": 7.756734693877552e-06, "loss": 0.0863, "step": 6000 }, { "epoch": 6.32, "eval_cer": 13.389187480240277, "eval_loss": 0.311605304479599, "eval_runtime": 564.9334, "eval_samples_per_second": 0.736, "eval_steps_per_second": 0.023, "eval_wer": 32.723399606729295, "step": 6000 }, { "epoch": 6.35, "learning_rate": 7.7465306122449e-06, "loss": 0.0905, "step": 6025 }, { "epoch": 6.38, "learning_rate": 7.736326530612247e-06, "loss": 0.0891, "step": 6050 }, { "epoch": 6.4, "learning_rate": 7.726122448979592e-06, "loss": 0.0932, "step": 6075 }, { "epoch": 6.43, "learning_rate": 7.71591836734694e-06, "loss": 0.0902, "step": 6100 }, { "epoch": 6.45, "learning_rate": 7.705714285714286e-06, "loss": 0.0923, "step": 6125 }, { "epoch": 6.48, "learning_rate": 7.695510204081633e-06, "loss": 0.0937, "step": 6150 }, { "epoch": 6.51, "learning_rate": 7.68530612244898e-06, "loss": 0.0902, "step": 6175 }, { "epoch": 6.53, "learning_rate": 7.675102040816327e-06, "loss": 0.0937, "step": 6200 }, { "epoch": 6.56, "learning_rate": 7.664897959183674e-06, "loss": 0.09, "step": 6225 }, { "epoch": 6.59, "learning_rate": 7.654693877551021e-06, "loss": 0.089, "step": 6250 }, { "epoch": 6.61, "learning_rate": 7.644489795918369e-06, "loss": 0.0925, "step": 6275 }, { "epoch": 6.64, "learning_rate": 7.634285714285715e-06, "loss": 0.0873, "step": 6300 }, { "epoch": 6.66, "learning_rate": 7.624081632653062e-06, "loss": 0.0941, "step": 6325 }, { "epoch": 6.69, "learning_rate": 7.613877551020409e-06, "loss": 0.0925, "step": 6350 }, { "epoch": 6.72, "learning_rate": 7.6036734693877555e-06, "loss": 0.0929, "step": 6375 }, { "epoch": 6.74, "learning_rate": 7.593469387755102e-06, "loss": 0.096, "step": 6400 }, { "epoch": 6.77, "learning_rate": 7.58326530612245e-06, "loss": 0.0962, "step": 6425 }, { "epoch": 6.8, "learning_rate": 7.573061224489796e-06, "loss": 0.0955, "step": 6450 }, { "epoch": 6.82, "learning_rate": 7.562857142857144e-06, "loss": 0.0937, "step": 6475 }, { "epoch": 6.85, "learning_rate": 7.55265306122449e-06, "loss": 0.0918, "step": 6500 }, { "epoch": 6.88, "learning_rate": 7.542448979591838e-06, "loss": 0.0932, "step": 6525 }, { "epoch": 6.9, "learning_rate": 7.5322448979591845e-06, "loss": 0.0926, "step": 6550 }, { "epoch": 6.93, "learning_rate": 7.522040816326531e-06, "loss": 0.0945, "step": 6575 }, { "epoch": 6.95, "learning_rate": 7.511836734693878e-06, "loss": 0.0935, "step": 6600 }, { "epoch": 6.98, "learning_rate": 7.501632653061225e-06, "loss": 0.0963, "step": 6625 }, { "epoch": 7.01, "learning_rate": 7.491428571428572e-06, "loss": 0.0865, "step": 6650 }, { "epoch": 7.03, "learning_rate": 7.481224489795919e-06, "loss": 0.0641, "step": 6675 }, { "epoch": 7.06, "learning_rate": 7.471020408163266e-06, "loss": 0.0623, "step": 6700 }, { "epoch": 7.09, "learning_rate": 7.4608163265306136e-06, "loss": 0.0668, "step": 6725 }, { "epoch": 7.11, "learning_rate": 7.45061224489796e-06, "loss": 0.0632, "step": 6750 }, { "epoch": 7.14, "learning_rate": 7.440408163265307e-06, "loss": 0.0671, "step": 6775 }, { "epoch": 7.17, "learning_rate": 7.4302040816326535e-06, "loss": 0.0641, "step": 6800 }, { "epoch": 7.19, "learning_rate": 7.420000000000001e-06, "loss": 0.0676, "step": 6825 }, { "epoch": 7.22, "learning_rate": 7.409795918367348e-06, "loss": 0.0682, "step": 6850 }, { "epoch": 7.24, "learning_rate": 7.399591836734694e-06, "loss": 0.0661, "step": 6875 }, { "epoch": 7.27, "learning_rate": 7.389387755102041e-06, "loss": 0.0711, "step": 6900 }, { "epoch": 7.3, "learning_rate": 7.379183673469389e-06, "loss": 0.068, "step": 6925 }, { "epoch": 7.32, "learning_rate": 7.368979591836736e-06, "loss": 0.0692, "step": 6950 }, { "epoch": 7.35, "learning_rate": 7.3587755102040825e-06, "loss": 0.0672, "step": 6975 }, { "epoch": 7.38, "learning_rate": 7.348571428571429e-06, "loss": 0.0685, "step": 7000 }, { "epoch": 7.38, "eval_cer": 13.307652628250993, "eval_loss": 0.33434030413627625, "eval_runtime": 565.4518, "eval_samples_per_second": 0.736, "eval_steps_per_second": 0.023, "eval_wer": 32.47760541839633, "step": 7000 }, { "epoch": 7.4, "learning_rate": 7.338367346938776e-06, "loss": 0.0657, "step": 7025 }, { "epoch": 7.43, "learning_rate": 7.328163265306123e-06, "loss": 0.068, "step": 7050 }, { "epoch": 7.46, "learning_rate": 7.31795918367347e-06, "loss": 0.0708, "step": 7075 }, { "epoch": 7.48, "learning_rate": 7.3077551020408165e-06, "loss": 0.0689, "step": 7100 }, { "epoch": 7.51, "learning_rate": 7.297551020408163e-06, "loss": 0.0728, "step": 7125 }, { "epoch": 7.53, "learning_rate": 7.287346938775511e-06, "loss": 0.0675, "step": 7150 }, { "epoch": 7.56, "learning_rate": 7.277142857142858e-06, "loss": 0.0667, "step": 7175 }, { "epoch": 7.59, "learning_rate": 7.266938775510205e-06, "loss": 0.0692, "step": 7200 }, { "epoch": 7.61, "learning_rate": 7.256734693877551e-06, "loss": 0.0717, "step": 7225 }, { "epoch": 7.64, "learning_rate": 7.246530612244899e-06, "loss": 0.0694, "step": 7250 }, { "epoch": 7.67, "learning_rate": 7.2363265306122455e-06, "loss": 0.0672, "step": 7275 }, { "epoch": 7.69, "learning_rate": 7.226122448979592e-06, "loss": 0.0709, "step": 7300 }, { "epoch": 7.72, "learning_rate": 7.215918367346939e-06, "loss": 0.0686, "step": 7325 }, { "epoch": 7.74, "learning_rate": 7.205714285714286e-06, "loss": 0.0683, "step": 7350 }, { "epoch": 7.77, "learning_rate": 7.195510204081633e-06, "loss": 0.075, "step": 7375 }, { "epoch": 7.8, "learning_rate": 7.1853061224489804e-06, "loss": 0.0688, "step": 7400 }, { "epoch": 7.82, "learning_rate": 7.175102040816327e-06, "loss": 0.0704, "step": 7425 }, { "epoch": 7.85, "learning_rate": 7.1648979591836746e-06, "loss": 0.0706, "step": 7450 }, { "epoch": 7.88, "learning_rate": 7.154693877551021e-06, "loss": 0.072, "step": 7475 }, { "epoch": 7.9, "learning_rate": 7.144489795918368e-06, "loss": 0.0703, "step": 7500 }, { "epoch": 7.93, "learning_rate": 7.1342857142857145e-06, "loss": 0.0726, "step": 7525 }, { "epoch": 7.96, "learning_rate": 7.124081632653061e-06, "loss": 0.0761, "step": 7550 }, { "epoch": 7.98, "learning_rate": 7.113877551020409e-06, "loss": 0.0704, "step": 7575 }, { "epoch": 8.01, "learning_rate": 7.103673469387755e-06, "loss": 0.0659, "step": 7600 }, { "epoch": 8.03, "learning_rate": 7.093469387755103e-06, "loss": 0.0462, "step": 7625 }, { "epoch": 8.06, "learning_rate": 7.08326530612245e-06, "loss": 0.0447, "step": 7650 }, { "epoch": 8.09, "learning_rate": 7.073061224489797e-06, "loss": 0.0479, "step": 7675 }, { "epoch": 8.11, "learning_rate": 7.0628571428571435e-06, "loss": 0.0489, "step": 7700 }, { "epoch": 8.14, "learning_rate": 7.05265306122449e-06, "loss": 0.0466, "step": 7725 }, { "epoch": 8.17, "learning_rate": 7.042448979591837e-06, "loss": 0.0476, "step": 7750 }, { "epoch": 8.19, "learning_rate": 7.032244897959184e-06, "loss": 0.0463, "step": 7775 }, { "epoch": 8.22, "learning_rate": 7.022040816326531e-06, "loss": 0.0488, "step": 7800 }, { "epoch": 8.25, "learning_rate": 7.0118367346938775e-06, "loss": 0.0484, "step": 7825 }, { "epoch": 8.27, "learning_rate": 7.001632653061226e-06, "loss": 0.0481, "step": 7850 }, { "epoch": 8.3, "learning_rate": 6.9914285714285725e-06, "loss": 0.0481, "step": 7875 }, { "epoch": 8.32, "learning_rate": 6.981224489795919e-06, "loss": 0.05, "step": 7900 }, { "epoch": 8.35, "learning_rate": 6.971020408163266e-06, "loss": 0.0487, "step": 7925 }, { "epoch": 8.38, "learning_rate": 6.960816326530612e-06, "loss": 0.0512, "step": 7950 }, { "epoch": 8.4, "learning_rate": 6.95061224489796e-06, "loss": 0.0489, "step": 7975 }, { "epoch": 8.43, "learning_rate": 6.9404081632653065e-06, "loss": 0.0506, "step": 8000 }, { "epoch": 8.43, "eval_cer": 13.77356606818976, "eval_loss": 0.3583739399909973, "eval_runtime": 563.5904, "eval_samples_per_second": 0.738, "eval_steps_per_second": 0.023, "eval_wer": 33.39523705483941, "step": 8000 }, { "epoch": 8.46, "learning_rate": 6.930204081632653e-06, "loss": 0.0494, "step": 8025 }, { "epoch": 8.48, "learning_rate": 6.92e-06, "loss": 0.0487, "step": 8050 }, { "epoch": 8.51, "learning_rate": 6.909795918367348e-06, "loss": 0.0474, "step": 8075 }, { "epoch": 8.54, "learning_rate": 6.899591836734695e-06, "loss": 0.0529, "step": 8100 }, { "epoch": 8.56, "learning_rate": 6.8893877551020414e-06, "loss": 0.0513, "step": 8125 }, { "epoch": 8.59, "learning_rate": 6.879183673469388e-06, "loss": 0.0489, "step": 8150 }, { "epoch": 8.61, "learning_rate": 6.8689795918367355e-06, "loss": 0.0507, "step": 8175 }, { "epoch": 8.64, "learning_rate": 6.858775510204082e-06, "loss": 0.0485, "step": 8200 }, { "epoch": 8.67, "learning_rate": 6.848571428571429e-06, "loss": 0.05, "step": 8225 }, { "epoch": 8.69, "learning_rate": 6.8383673469387755e-06, "loss": 0.0495, "step": 8250 }, { "epoch": 8.72, "learning_rate": 6.828163265306122e-06, "loss": 0.0518, "step": 8275 }, { "epoch": 8.75, "learning_rate": 6.8179591836734704e-06, "loss": 0.0534, "step": 8300 }, { "epoch": 8.77, "learning_rate": 6.807755102040817e-06, "loss": 0.0504, "step": 8325 }, { "epoch": 8.8, "learning_rate": 6.797551020408164e-06, "loss": 0.0492, "step": 8350 }, { "epoch": 8.83, "learning_rate": 6.787346938775511e-06, "loss": 0.052, "step": 8375 }, { "epoch": 8.85, "learning_rate": 6.777142857142858e-06, "loss": 0.0516, "step": 8400 }, { "epoch": 8.88, "learning_rate": 6.7669387755102045e-06, "loss": 0.052, "step": 8425 }, { "epoch": 8.9, "learning_rate": 6.756734693877551e-06, "loss": 0.0527, "step": 8450 }, { "epoch": 8.93, "learning_rate": 6.746530612244898e-06, "loss": 0.0537, "step": 8475 }, { "epoch": 8.96, "learning_rate": 6.736326530612245e-06, "loss": 0.0492, "step": 8500 }, { "epoch": 8.98, "learning_rate": 6.726122448979593e-06, "loss": 0.0522, "step": 8525 }, { "epoch": 9.01, "learning_rate": 6.715918367346939e-06, "loss": 0.0431, "step": 8550 }, { "epoch": 9.04, "learning_rate": 6.705714285714287e-06, "loss": 0.0316, "step": 8575 }, { "epoch": 9.06, "learning_rate": 6.6955102040816335e-06, "loss": 0.0317, "step": 8600 }, { "epoch": 9.09, "learning_rate": 6.68530612244898e-06, "loss": 0.0325, "step": 8625 }, { "epoch": 9.11, "learning_rate": 6.675102040816327e-06, "loss": 0.0301, "step": 8650 }, { "epoch": 9.14, "learning_rate": 6.664897959183673e-06, "loss": 0.0308, "step": 8675 }, { "epoch": 9.17, "learning_rate": 6.654693877551021e-06, "loss": 0.0325, "step": 8700 }, { "epoch": 9.19, "learning_rate": 6.6444897959183675e-06, "loss": 0.0315, "step": 8725 }, { "epoch": 9.22, "learning_rate": 6.634285714285715e-06, "loss": 0.0332, "step": 8750 }, { "epoch": 9.25, "learning_rate": 6.6240816326530625e-06, "loss": 0.0327, "step": 8775 }, { "epoch": 9.27, "learning_rate": 6.613877551020409e-06, "loss": 0.0345, "step": 8800 }, { "epoch": 9.3, "learning_rate": 6.603673469387756e-06, "loss": 0.035, "step": 8825 }, { "epoch": 9.33, "learning_rate": 6.593469387755102e-06, "loss": 0.0342, "step": 8850 }, { "epoch": 9.35, "learning_rate": 6.583265306122449e-06, "loss": 0.0325, "step": 8875 }, { "epoch": 9.38, "learning_rate": 6.5730612244897965e-06, "loss": 0.0326, "step": 8900 }, { "epoch": 9.4, "learning_rate": 6.562857142857143e-06, "loss": 0.0339, "step": 8925 }, { "epoch": 9.43, "learning_rate": 6.55265306122449e-06, "loss": 0.0322, "step": 8950 }, { "epoch": 9.46, "learning_rate": 6.542448979591838e-06, "loss": 0.0321, "step": 8975 }, { "epoch": 9.48, "learning_rate": 6.532244897959185e-06, "loss": 0.0336, "step": 9000 }, { "epoch": 9.48, "eval_cer": 13.84927700217981, "eval_loss": 0.3860664963722229, "eval_runtime": 566.0258, "eval_samples_per_second": 0.735, "eval_steps_per_second": 0.023, "eval_wer": 33.70111426698711, "step": 9000 }, { "epoch": 9.51, "learning_rate": 6.5220408163265314e-06, "loss": 0.0332, "step": 9025 }, { "epoch": 9.54, "learning_rate": 6.511836734693878e-06, "loss": 0.0351, "step": 9050 }, { "epoch": 9.56, "learning_rate": 6.501632653061225e-06, "loss": 0.0341, "step": 9075 }, { "epoch": 9.59, "learning_rate": 6.491428571428572e-06, "loss": 0.0338, "step": 9100 }, { "epoch": 9.62, "learning_rate": 6.481224489795919e-06, "loss": 0.0359, "step": 9125 }, { "epoch": 9.64, "learning_rate": 6.4710204081632655e-06, "loss": 0.0341, "step": 9150 }, { "epoch": 9.67, "learning_rate": 6.460816326530612e-06, "loss": 0.0358, "step": 9175 }, { "epoch": 9.69, "learning_rate": 6.4506122448979604e-06, "loss": 0.0335, "step": 9200 }, { "epoch": 9.72, "learning_rate": 6.440408163265307e-06, "loss": 0.0342, "step": 9225 }, { "epoch": 9.75, "learning_rate": 6.430204081632654e-06, "loss": 0.0354, "step": 9250 }, { "epoch": 9.77, "learning_rate": 6.42e-06, "loss": 0.0351, "step": 9275 }, { "epoch": 9.8, "learning_rate": 6.409795918367348e-06, "loss": 0.0359, "step": 9300 }, { "epoch": 9.83, "learning_rate": 6.3995918367346945e-06, "loss": 0.0349, "step": 9325 }, { "epoch": 9.85, "learning_rate": 6.389387755102041e-06, "loss": 0.0362, "step": 9350 }, { "epoch": 9.88, "learning_rate": 6.379183673469388e-06, "loss": 0.0324, "step": 9375 }, { "epoch": 9.91, "learning_rate": 6.368979591836734e-06, "loss": 0.0347, "step": 9400 }, { "epoch": 9.93, "learning_rate": 6.358775510204083e-06, "loss": 0.0356, "step": 9425 }, { "epoch": 9.96, "learning_rate": 6.348571428571429e-06, "loss": 0.0335, "step": 9450 }, { "epoch": 9.98, "learning_rate": 6.338367346938776e-06, "loss": 0.0363, "step": 9475 }, { "epoch": 10.01, "learning_rate": 6.3281632653061235e-06, "loss": 0.0288, "step": 9500 }, { "epoch": 10.04, "learning_rate": 6.31795918367347e-06, "loss": 0.0203, "step": 9525 }, { "epoch": 10.06, "learning_rate": 6.307755102040817e-06, "loss": 0.021, "step": 9550 }, { "epoch": 10.09, "learning_rate": 6.297551020408163e-06, "loss": 0.0203, "step": 9575 }, { "epoch": 10.12, "learning_rate": 6.28734693877551e-06, "loss": 0.0197, "step": 9600 }, { "epoch": 10.14, "learning_rate": 6.2771428571428575e-06, "loss": 0.0218, "step": 9625 }, { "epoch": 10.17, "learning_rate": 6.266938775510205e-06, "loss": 0.0217, "step": 9650 }, { "epoch": 10.19, "learning_rate": 6.256734693877552e-06, "loss": 0.0201, "step": 9675 }, { "epoch": 10.22, "learning_rate": 6.246530612244899e-06, "loss": 0.0199, "step": 9700 }, { "epoch": 10.25, "learning_rate": 6.236326530612246e-06, "loss": 0.0204, "step": 9725 }, { "epoch": 10.27, "learning_rate": 6.2261224489795924e-06, "loss": 0.0212, "step": 9750 }, { "epoch": 10.3, "learning_rate": 6.215918367346939e-06, "loss": 0.0214, "step": 9775 }, { "epoch": 10.33, "learning_rate": 6.205714285714286e-06, "loss": 0.0213, "step": 9800 }, { "epoch": 10.35, "learning_rate": 6.195510204081633e-06, "loss": 0.0213, "step": 9825 }, { "epoch": 10.38, "learning_rate": 6.18530612244898e-06, "loss": 0.0212, "step": 9850 }, { "epoch": 10.41, "learning_rate": 6.175102040816327e-06, "loss": 0.0208, "step": 9875 }, { "epoch": 10.43, "learning_rate": 6.164897959183675e-06, "loss": 0.0221, "step": 9900 }, { "epoch": 10.46, "learning_rate": 6.1546938775510214e-06, "loss": 0.0218, "step": 9925 }, { "epoch": 10.48, "learning_rate": 6.144489795918368e-06, "loss": 0.0206, "step": 9950 }, { "epoch": 10.51, "learning_rate": 6.134285714285715e-06, "loss": 0.0222, "step": 9975 }, { "epoch": 10.54, "learning_rate": 6.124081632653061e-06, "loss": 0.0215, "step": 10000 }, { "epoch": 10.54, "eval_cer": 14.01401068272959, "eval_loss": 0.4192809462547302, "eval_runtime": 564.3466, "eval_samples_per_second": 0.737, "eval_steps_per_second": 0.023, "eval_wer": 33.70111426698711, "step": 10000 }, { "epoch": 10.56, "learning_rate": 6.114285714285715e-06, "loss": 0.0216, "step": 10025 }, { "epoch": 10.59, "learning_rate": 6.1040816326530616e-06, "loss": 0.0203, "step": 10050 }, { "epoch": 10.62, "learning_rate": 6.093877551020408e-06, "loss": 0.0228, "step": 10075 }, { "epoch": 10.64, "learning_rate": 6.083673469387756e-06, "loss": 0.0243, "step": 10100 }, { "epoch": 10.67, "learning_rate": 6.073469387755102e-06, "loss": 0.023, "step": 10125 }, { "epoch": 10.7, "learning_rate": 6.06326530612245e-06, "loss": 0.0225, "step": 10150 }, { "epoch": 10.72, "learning_rate": 6.0530612244897964e-06, "loss": 0.0234, "step": 10175 }, { "epoch": 10.75, "learning_rate": 6.042857142857144e-06, "loss": 0.0222, "step": 10200 }, { "epoch": 10.77, "learning_rate": 6.0326530612244906e-06, "loss": 0.0223, "step": 10225 }, { "epoch": 10.8, "learning_rate": 6.022448979591837e-06, "loss": 0.0225, "step": 10250 }, { "epoch": 10.83, "learning_rate": 6.012653061224491e-06, "loss": 0.0212, "step": 10275 }, { "epoch": 10.85, "learning_rate": 6.002448979591837e-06, "loss": 0.0222, "step": 10300 }, { "epoch": 10.88, "learning_rate": 5.992244897959184e-06, "loss": 0.0231, "step": 10325 }, { "epoch": 10.91, "learning_rate": 5.982040816326531e-06, "loss": 0.0228, "step": 10350 }, { "epoch": 10.93, "learning_rate": 5.971836734693877e-06, "loss": 0.0228, "step": 10375 }, { "epoch": 10.96, "learning_rate": 5.961632653061225e-06, "loss": 0.0215, "step": 10400 }, { "epoch": 10.99, "learning_rate": 5.951428571428572e-06, "loss": 0.0233, "step": 10425 }, { "epoch": 11.01, "learning_rate": 5.941224489795919e-06, "loss": 0.0188, "step": 10450 }, { "epoch": 11.04, "learning_rate": 5.931020408163266e-06, "loss": 0.0123, "step": 10475 }, { "epoch": 11.06, "learning_rate": 5.920816326530613e-06, "loss": 0.0122, "step": 10500 }, { "epoch": 11.09, "learning_rate": 5.91061224489796e-06, "loss": 0.0128, "step": 10525 }, { "epoch": 11.12, "learning_rate": 5.900408163265306e-06, "loss": 0.013, "step": 10550 }, { "epoch": 11.14, "learning_rate": 5.890204081632653e-06, "loss": 0.0134, "step": 10575 }, { "epoch": 11.17, "learning_rate": 5.8800000000000005e-06, "loss": 0.0126, "step": 10600 }, { "epoch": 11.2, "learning_rate": 5.869795918367347e-06, "loss": 0.0131, "step": 10625 }, { "epoch": 11.22, "learning_rate": 5.859591836734695e-06, "loss": 0.0126, "step": 10650 }, { "epoch": 11.25, "learning_rate": 5.849387755102042e-06, "loss": 0.0128, "step": 10675 }, { "epoch": 11.28, "learning_rate": 5.839183673469389e-06, "loss": 0.013, "step": 10700 }, { "epoch": 11.3, "learning_rate": 5.828979591836735e-06, "loss": 0.0138, "step": 10725 }, { "epoch": 11.33, "learning_rate": 5.818775510204082e-06, "loss": 0.0129, "step": 10750 }, { "epoch": 11.35, "learning_rate": 5.808571428571429e-06, "loss": 0.0125, "step": 10775 }, { "epoch": 11.38, "learning_rate": 5.798367346938776e-06, "loss": 0.0133, "step": 10800 }, { "epoch": 11.41, "learning_rate": 5.788163265306123e-06, "loss": 0.0139, "step": 10825 }, { "epoch": 11.43, "learning_rate": 5.777959183673469e-06, "loss": 0.0123, "step": 10850 }, { "epoch": 11.46, "learning_rate": 5.767755102040818e-06, "loss": 0.0135, "step": 10875 }, { "epoch": 11.49, "learning_rate": 5.757551020408164e-06, "loss": 0.0136, "step": 10900 }, { "epoch": 11.51, "learning_rate": 5.747346938775511e-06, "loss": 0.0136, "step": 10925 }, { "epoch": 11.54, "learning_rate": 5.737142857142858e-06, "loss": 0.0143, "step": 10950 }, { "epoch": 11.56, "learning_rate": 5.726938775510204e-06, "loss": 0.0137, "step": 10975 }, { "epoch": 11.59, "learning_rate": 5.716734693877552e-06, "loss": 0.0141, "step": 11000 }, { "epoch": 11.59, "eval_cer": 14.029818460156083, "eval_loss": 0.4463140070438385, "eval_runtime": 564.6562, "eval_samples_per_second": 0.737, "eval_steps_per_second": 0.023, "eval_wer": 34.03430194450514, "step": 11000 }, { "epoch": 11.62, "learning_rate": 5.706530612244898e-06, "loss": 0.0144, "step": 11025 }, { "epoch": 11.64, "learning_rate": 5.696326530612245e-06, "loss": 0.0126, "step": 11050 }, { "epoch": 11.67, "learning_rate": 5.686122448979592e-06, "loss": 0.014, "step": 11075 }, { "epoch": 11.7, "learning_rate": 5.67591836734694e-06, "loss": 0.0131, "step": 11100 }, { "epoch": 11.72, "learning_rate": 5.665714285714287e-06, "loss": 0.0136, "step": 11125 }, { "epoch": 11.75, "learning_rate": 5.655510204081633e-06, "loss": 0.0129, "step": 11150 }, { "epoch": 11.78, "learning_rate": 5.64530612244898e-06, "loss": 0.0136, "step": 11175 }, { "epoch": 11.8, "learning_rate": 5.635102040816327e-06, "loss": 0.0141, "step": 11200 }, { "epoch": 11.83, "learning_rate": 5.624897959183674e-06, "loss": 0.0139, "step": 11225 }, { "epoch": 11.85, "learning_rate": 5.614693877551021e-06, "loss": 0.0131, "step": 11250 }, { "epoch": 11.88, "learning_rate": 5.604489795918367e-06, "loss": 0.0135, "step": 11275 }, { "epoch": 11.91, "learning_rate": 5.594285714285714e-06, "loss": 0.0141, "step": 11300 }, { "epoch": 11.93, "learning_rate": 5.5840816326530615e-06, "loss": 0.0138, "step": 11325 }, { "epoch": 11.96, "learning_rate": 5.573877551020409e-06, "loss": 0.0137, "step": 11350 }, { "epoch": 11.99, "learning_rate": 5.563673469387756e-06, "loss": 0.0134, "step": 11375 }, { "epoch": 12.01, "learning_rate": 5.553469387755103e-06, "loss": 0.0112, "step": 11400 }, { "epoch": 12.04, "learning_rate": 5.54326530612245e-06, "loss": 0.0082, "step": 11425 }, { "epoch": 12.07, "learning_rate": 5.533061224489796e-06, "loss": 0.0082, "step": 11450 }, { "epoch": 12.09, "learning_rate": 5.522857142857143e-06, "loss": 0.0078, "step": 11475 }, { "epoch": 12.12, "learning_rate": 5.51265306122449e-06, "loss": 0.0077, "step": 11500 }, { "epoch": 12.14, "learning_rate": 5.502448979591837e-06, "loss": 0.008, "step": 11525 }, { "epoch": 12.17, "learning_rate": 5.492244897959184e-06, "loss": 0.0076, "step": 11550 }, { "epoch": 12.2, "learning_rate": 5.482040816326531e-06, "loss": 0.0073, "step": 11575 }, { "epoch": 12.22, "learning_rate": 5.471836734693879e-06, "loss": 0.0081, "step": 11600 }, { "epoch": 12.25, "learning_rate": 5.461632653061225e-06, "loss": 0.0076, "step": 11625 }, { "epoch": 12.28, "learning_rate": 5.451428571428572e-06, "loss": 0.0083, "step": 11650 }, { "epoch": 12.3, "learning_rate": 5.441224489795919e-06, "loss": 0.0079, "step": 11675 }, { "epoch": 12.33, "learning_rate": 5.431020408163265e-06, "loss": 0.0082, "step": 11700 }, { "epoch": 12.36, "learning_rate": 5.420816326530613e-06, "loss": 0.0078, "step": 11725 }, { "epoch": 12.38, "learning_rate": 5.410612244897959e-06, "loss": 0.0084, "step": 11750 }, { "epoch": 12.41, "learning_rate": 5.400408163265306e-06, "loss": 0.0079, "step": 11775 }, { "epoch": 12.43, "learning_rate": 5.390204081632654e-06, "loss": 0.0084, "step": 11800 }, { "epoch": 12.46, "learning_rate": 5.380000000000001e-06, "loss": 0.0084, "step": 11825 }, { "epoch": 12.49, "learning_rate": 5.369795918367348e-06, "loss": 0.0086, "step": 11850 }, { "epoch": 12.51, "learning_rate": 5.359591836734694e-06, "loss": 0.0081, "step": 11875 }, { "epoch": 12.54, "learning_rate": 5.349387755102041e-06, "loss": 0.0082, "step": 11900 }, { "epoch": 12.57, "learning_rate": 5.339183673469388e-06, "loss": 0.008, "step": 11925 }, { "epoch": 12.59, "learning_rate": 5.328979591836735e-06, "loss": 0.0088, "step": 11950 }, { "epoch": 12.62, "learning_rate": 5.318775510204082e-06, "loss": 0.0085, "step": 11975 }, { "epoch": 12.64, "learning_rate": 5.308571428571428e-06, "loss": 0.0089, "step": 12000 }, { "epoch": 12.64, "eval_cer": 13.805181623042747, "eval_loss": 0.46598222851753235, "eval_runtime": 564.4797, "eval_samples_per_second": 0.737, "eval_steps_per_second": 0.023, "eval_wer": 33.61372077780205, "step": 12000 }, { "epoch": 12.67, "learning_rate": 5.298367346938777e-06, "loss": 0.0085, "step": 12025 }, { "epoch": 12.7, "learning_rate": 5.288163265306123e-06, "loss": 0.0086, "step": 12050 }, { "epoch": 12.72, "learning_rate": 5.27795918367347e-06, "loss": 0.0085, "step": 12075 }, { "epoch": 12.75, "learning_rate": 5.2677551020408166e-06, "loss": 0.0086, "step": 12100 }, { "epoch": 12.78, "learning_rate": 5.257551020408164e-06, "loss": 0.0091, "step": 12125 }, { "epoch": 12.8, "learning_rate": 5.247346938775511e-06, "loss": 0.009, "step": 12150 }, { "epoch": 12.83, "learning_rate": 5.237142857142857e-06, "loss": 0.009, "step": 12175 }, { "epoch": 12.86, "learning_rate": 5.226938775510204e-06, "loss": 0.0084, "step": 12200 }, { "epoch": 12.88, "learning_rate": 5.216734693877551e-06, "loss": 0.0086, "step": 12225 }, { "epoch": 12.91, "learning_rate": 5.206530612244899e-06, "loss": 0.0086, "step": 12250 }, { "epoch": 12.93, "learning_rate": 5.196326530612246e-06, "loss": 0.0093, "step": 12275 }, { "epoch": 12.96, "learning_rate": 5.186122448979592e-06, "loss": 0.0091, "step": 12300 }, { "epoch": 12.99, "learning_rate": 5.17591836734694e-06, "loss": 0.0089, "step": 12325 }, { "epoch": 13.01, "learning_rate": 5.165714285714286e-06, "loss": 0.0073, "step": 12350 }, { "epoch": 13.04, "learning_rate": 5.155510204081633e-06, "loss": 0.0055, "step": 12375 }, { "epoch": 13.07, "learning_rate": 5.14530612244898e-06, "loss": 0.0053, "step": 12400 }, { "epoch": 13.09, "learning_rate": 5.135102040816326e-06, "loss": 0.0051, "step": 12425 }, { "epoch": 13.12, "learning_rate": 5.124897959183674e-06, "loss": 0.0053, "step": 12450 }, { "epoch": 13.15, "learning_rate": 5.114693877551021e-06, "loss": 0.0053, "step": 12475 }, { "epoch": 13.17, "learning_rate": 5.104489795918368e-06, "loss": 0.0052, "step": 12500 }, { "epoch": 13.2, "learning_rate": 5.094285714285715e-06, "loss": 0.0052, "step": 12525 }, { "epoch": 13.22, "learning_rate": 5.084081632653062e-06, "loss": 0.0052, "step": 12550 }, { "epoch": 13.25, "learning_rate": 5.073877551020409e-06, "loss": 0.0051, "step": 12575 }, { "epoch": 13.28, "learning_rate": 5.063673469387755e-06, "loss": 0.0053, "step": 12600 }, { "epoch": 13.3, "learning_rate": 5.053469387755102e-06, "loss": 0.005, "step": 12625 }, { "epoch": 13.33, "learning_rate": 5.043265306122449e-06, "loss": 0.0057, "step": 12650 }, { "epoch": 13.36, "learning_rate": 5.033061224489796e-06, "loss": 0.0051, "step": 12675 }, { "epoch": 13.38, "learning_rate": 5.0228571428571435e-06, "loss": 0.0051, "step": 12700 }, { "epoch": 13.41, "learning_rate": 5.01265306122449e-06, "loss": 0.0055, "step": 12725 }, { "epoch": 13.44, "learning_rate": 5.002448979591838e-06, "loss": 0.0054, "step": 12750 }, { "epoch": 13.46, "learning_rate": 4.992244897959184e-06, "loss": 0.005, "step": 12775 }, { "epoch": 13.49, "learning_rate": 4.982040816326531e-06, "loss": 0.0049, "step": 12800 }, { "epoch": 13.51, "learning_rate": 4.9718367346938776e-06, "loss": 0.0049, "step": 12825 }, { "epoch": 13.54, "learning_rate": 4.961632653061225e-06, "loss": 0.0049, "step": 12850 }, { "epoch": 13.57, "learning_rate": 4.951428571428572e-06, "loss": 0.0053, "step": 12875 }, { "epoch": 13.59, "learning_rate": 4.941224489795919e-06, "loss": 0.0054, "step": 12900 }, { "epoch": 13.62, "learning_rate": 4.931020408163266e-06, "loss": 0.0054, "step": 12925 }, { "epoch": 13.65, "learning_rate": 4.9208163265306125e-06, "loss": 0.0053, "step": 12950 }, { "epoch": 13.67, "learning_rate": 4.91061224489796e-06, "loss": 0.0057, "step": 12975 }, { "epoch": 13.7, "learning_rate": 4.900408163265307e-06, "loss": 0.0057, "step": 13000 }, { "epoch": 13.7, "eval_cer": 13.984891092733415, "eval_loss": 0.4913037419319153, "eval_runtime": 564.9186, "eval_samples_per_second": 0.736, "eval_steps_per_second": 0.023, "eval_wer": 33.97968101376448, "step": 13000 }, { "epoch": 13.72, "learning_rate": 4.890204081632653e-06, "loss": 0.0059, "step": 13025 }, { "epoch": 13.75, "learning_rate": 4.880000000000001e-06, "loss": 0.006, "step": 13050 }, { "epoch": 13.78, "learning_rate": 4.869795918367347e-06, "loss": 0.0057, "step": 13075 }, { "epoch": 13.8, "learning_rate": 4.859591836734695e-06, "loss": 0.0062, "step": 13100 }, { "epoch": 13.83, "learning_rate": 4.8493877551020415e-06, "loss": 0.0058, "step": 13125 }, { "epoch": 13.86, "learning_rate": 4.839183673469388e-06, "loss": 0.0058, "step": 13150 }, { "epoch": 13.88, "learning_rate": 4.828979591836735e-06, "loss": 0.0057, "step": 13175 }, { "epoch": 13.91, "learning_rate": 4.818775510204082e-06, "loss": 0.006, "step": 13200 }, { "epoch": 13.94, "learning_rate": 4.808979591836735e-06, "loss": 0.0059, "step": 13225 }, { "epoch": 13.96, "learning_rate": 4.7987755102040824e-06, "loss": 0.0064, "step": 13250 }, { "epoch": 13.99, "learning_rate": 4.788571428571429e-06, "loss": 0.006, "step": 13275 }, { "epoch": 14.01, "learning_rate": 4.778367346938776e-06, "loss": 0.0051, "step": 13300 }, { "epoch": 14.04, "learning_rate": 4.768163265306122e-06, "loss": 0.0039, "step": 13325 }, { "epoch": 14.07, "learning_rate": 4.75795918367347e-06, "loss": 0.0043, "step": 13350 }, { "epoch": 14.09, "learning_rate": 4.747755102040817e-06, "loss": 0.0042, "step": 13375 }, { "epoch": 14.12, "learning_rate": 4.737551020408164e-06, "loss": 0.0043, "step": 13400 }, { "epoch": 14.15, "learning_rate": 4.727346938775511e-06, "loss": 0.0038, "step": 13425 }, { "epoch": 14.17, "learning_rate": 4.717142857142857e-06, "loss": 0.0035, "step": 13450 }, { "epoch": 14.2, "learning_rate": 4.706938775510205e-06, "loss": 0.0038, "step": 13475 }, { "epoch": 14.23, "learning_rate": 4.696734693877551e-06, "loss": 0.0038, "step": 13500 }, { "epoch": 14.25, "learning_rate": 4.686530612244898e-06, "loss": 0.0037, "step": 13525 }, { "epoch": 14.28, "learning_rate": 4.6763265306122455e-06, "loss": 0.0039, "step": 13550 }, { "epoch": 14.3, "learning_rate": 4.666122448979592e-06, "loss": 0.0036, "step": 13575 }, { "epoch": 14.33, "learning_rate": 4.65591836734694e-06, "loss": 0.0037, "step": 13600 }, { "epoch": 14.36, "learning_rate": 4.645714285714286e-06, "loss": 0.0037, "step": 13625 }, { "epoch": 14.38, "learning_rate": 4.635510204081633e-06, "loss": 0.0034, "step": 13650 }, { "epoch": 14.41, "learning_rate": 4.6253061224489795e-06, "loss": 0.0033, "step": 13675 }, { "epoch": 14.44, "learning_rate": 4.615102040816327e-06, "loss": 0.0038, "step": 13700 }, { "epoch": 14.46, "learning_rate": 4.604897959183674e-06, "loss": 0.0035, "step": 13725 }, { "epoch": 14.49, "learning_rate": 4.594693877551021e-06, "loss": 0.0036, "step": 13750 }, { "epoch": 14.52, "learning_rate": 4.584489795918368e-06, "loss": 0.004, "step": 13775 }, { "epoch": 14.54, "learning_rate": 4.574285714285714e-06, "loss": 0.0037, "step": 13800 }, { "epoch": 14.57, "learning_rate": 4.564081632653062e-06, "loss": 0.0039, "step": 13825 }, { "epoch": 14.59, "learning_rate": 4.5538775510204085e-06, "loss": 0.0039, "step": 13850 }, { "epoch": 14.62, "learning_rate": 4.543673469387755e-06, "loss": 0.0038, "step": 13875 }, { "epoch": 14.65, "learning_rate": 4.533469387755103e-06, "loss": 0.0042, "step": 13900 }, { "epoch": 14.67, "learning_rate": 4.523265306122449e-06, "loss": 0.0043, "step": 13925 }, { "epoch": 14.7, "learning_rate": 4.513061224489797e-06, "loss": 0.0041, "step": 13950 }, { "epoch": 14.73, "learning_rate": 4.5028571428571434e-06, "loss": 0.0038, "step": 13975 }, { "epoch": 14.75, "learning_rate": 4.49265306122449e-06, "loss": 0.0039, "step": 14000 }, { "epoch": 14.75, "eval_cer": 14.065593956437095, "eval_loss": 0.5078141689300537, "eval_runtime": 564.1028, "eval_samples_per_second": 0.737, "eval_steps_per_second": 0.023, "eval_wer": 33.99060519991261, "step": 14000 }, { "epoch": 14.78, "learning_rate": 4.482448979591837e-06, "loss": 0.0039, "step": 14025 }, { "epoch": 14.81, "learning_rate": 4.472244897959184e-06, "loss": 0.0042, "step": 14050 }, { "epoch": 14.83, "learning_rate": 4.462040816326531e-06, "loss": 0.0039, "step": 14075 }, { "epoch": 14.86, "learning_rate": 4.451836734693878e-06, "loss": 0.004, "step": 14100 }, { "epoch": 14.88, "learning_rate": 4.441632653061225e-06, "loss": 0.0039, "step": 14125 }, { "epoch": 14.91, "learning_rate": 4.431428571428572e-06, "loss": 0.0038, "step": 14150 }, { "epoch": 14.94, "learning_rate": 4.421224489795919e-06, "loss": 0.004, "step": 14175 }, { "epoch": 14.96, "learning_rate": 4.411020408163266e-06, "loss": 0.0042, "step": 14200 }, { "epoch": 14.99, "learning_rate": 4.400816326530612e-06, "loss": 0.0039, "step": 14225 }, { "epoch": 15.02, "learning_rate": 4.390612244897959e-06, "loss": 0.0035, "step": 14250 }, { "epoch": 15.04, "learning_rate": 4.3804081632653065e-06, "loss": 0.0028, "step": 14275 }, { "epoch": 15.07, "learning_rate": 4.370204081632653e-06, "loss": 0.0027, "step": 14300 }, { "epoch": 15.09, "learning_rate": 4.360000000000001e-06, "loss": 0.0029, "step": 14325 }, { "epoch": 15.12, "learning_rate": 4.349795918367347e-06, "loss": 0.0033, "step": 14350 }, { "epoch": 15.15, "learning_rate": 4.339591836734694e-06, "loss": 0.0026, "step": 14375 }, { "epoch": 15.17, "learning_rate": 4.329387755102041e-06, "loss": 0.0028, "step": 14400 }, { "epoch": 15.2, "learning_rate": 4.319183673469388e-06, "loss": 0.0028, "step": 14425 }, { "epoch": 15.23, "learning_rate": 4.308979591836735e-06, "loss": 0.003, "step": 14450 }, { "epoch": 15.25, "learning_rate": 4.298775510204082e-06, "loss": 0.0027, "step": 14475 }, { "epoch": 15.28, "learning_rate": 4.288571428571429e-06, "loss": 0.0028, "step": 14500 }, { "epoch": 15.31, "learning_rate": 4.278367346938776e-06, "loss": 0.0028, "step": 14525 }, { "epoch": 15.33, "learning_rate": 4.268163265306123e-06, "loss": 0.0028, "step": 14550 }, { "epoch": 15.36, "learning_rate": 4.2579591836734695e-06, "loss": 0.0028, "step": 14575 }, { "epoch": 15.38, "learning_rate": 4.247755102040816e-06, "loss": 0.0031, "step": 14600 }, { "epoch": 15.41, "learning_rate": 4.237551020408164e-06, "loss": 0.0027, "step": 14625 }, { "epoch": 15.44, "learning_rate": 4.22734693877551e-06, "loss": 0.003, "step": 14650 }, { "epoch": 15.46, "learning_rate": 4.217142857142858e-06, "loss": 0.0028, "step": 14675 }, { "epoch": 15.49, "learning_rate": 4.2069387755102044e-06, "loss": 0.0027, "step": 14700 }, { "epoch": 15.52, "learning_rate": 4.196734693877552e-06, "loss": 0.0027, "step": 14725 }, { "epoch": 15.54, "learning_rate": 4.1865306122448986e-06, "loss": 0.0031, "step": 14750 }, { "epoch": 15.57, "learning_rate": 4.176326530612245e-06, "loss": 0.0031, "step": 14775 }, { "epoch": 15.6, "learning_rate": 4.166122448979592e-06, "loss": 0.0033, "step": 14800 }, { "epoch": 15.62, "learning_rate": 4.1559183673469385e-06, "loss": 0.0036, "step": 14825 }, { "epoch": 15.65, "learning_rate": 4.145714285714286e-06, "loss": 0.0031, "step": 14850 }, { "epoch": 15.67, "learning_rate": 4.1355102040816334e-06, "loss": 0.0033, "step": 14875 }, { "epoch": 15.7, "learning_rate": 4.12530612244898e-06, "loss": 0.0033, "step": 14900 }, { "epoch": 15.73, "learning_rate": 4.115102040816327e-06, "loss": 0.0032, "step": 14925 }, { "epoch": 15.75, "learning_rate": 4.104897959183674e-06, "loss": 0.003, "step": 14950 }, { "epoch": 15.78, "learning_rate": 4.094693877551021e-06, "loss": 0.0032, "step": 14975 }, { "epoch": 15.81, "learning_rate": 4.0844897959183675e-06, "loss": 0.0033, "step": 15000 }, { "epoch": 15.81, "eval_cer": 13.919164018170624, "eval_loss": 0.5243561863899231, "eval_runtime": 564.6517, "eval_samples_per_second": 0.737, "eval_steps_per_second": 0.023, "eval_wer": 33.77212147694997, "step": 15000 }, { "epoch": 15.83, "learning_rate": 4.074285714285714e-06, "loss": 0.0031, "step": 15025 }, { "epoch": 15.86, "learning_rate": 4.064081632653062e-06, "loss": 0.003, "step": 15050 }, { "epoch": 15.89, "learning_rate": 4.053877551020409e-06, "loss": 0.0033, "step": 15075 }, { "epoch": 15.91, "learning_rate": 4.043673469387756e-06, "loss": 0.0032, "step": 15100 }, { "epoch": 15.94, "learning_rate": 4.033469387755102e-06, "loss": 0.0033, "step": 15125 }, { "epoch": 15.96, "learning_rate": 4.023265306122449e-06, "loss": 0.0031, "step": 15150 }, { "epoch": 15.99, "learning_rate": 4.0130612244897965e-06, "loss": 0.0035, "step": 15175 }, { "epoch": 16.02, "learning_rate": 4.002857142857143e-06, "loss": 0.003, "step": 15200 }, { "epoch": 16.04, "learning_rate": 3.99265306122449e-06, "loss": 0.0027, "step": 15225 }, { "epoch": 16.07, "learning_rate": 3.982448979591837e-06, "loss": 0.0027, "step": 15250 }, { "epoch": 16.1, "learning_rate": 3.972244897959184e-06, "loss": 0.0024, "step": 15275 }, { "epoch": 16.12, "learning_rate": 3.962040816326531e-06, "loss": 0.0021, "step": 15300 }, { "epoch": 16.15, "learning_rate": 3.951836734693878e-06, "loss": 0.0021, "step": 15325 }, { "epoch": 16.17, "learning_rate": 3.941632653061225e-06, "loss": 0.0024, "step": 15350 }, { "epoch": 16.2, "learning_rate": 3.931428571428571e-06, "loss": 0.0026, "step": 15375 }, { "epoch": 16.23, "learning_rate": 3.921224489795919e-06, "loss": 0.0023, "step": 15400 }, { "epoch": 16.25, "learning_rate": 3.9110204081632654e-06, "loss": 0.0021, "step": 15425 }, { "epoch": 16.28, "learning_rate": 3.900816326530613e-06, "loss": 0.0022, "step": 15450 }, { "epoch": 16.31, "learning_rate": 3.8906122448979595e-06, "loss": 0.0024, "step": 15475 }, { "epoch": 16.33, "learning_rate": 3.880408163265306e-06, "loss": 0.0024, "step": 15500 }, { "epoch": 16.36, "learning_rate": 3.870204081632654e-06, "loss": 0.0023, "step": 15525 }, { "epoch": 16.39, "learning_rate": 3.86e-06, "loss": 0.0024, "step": 15550 }, { "epoch": 16.41, "learning_rate": 3.849795918367347e-06, "loss": 0.0025, "step": 15575 }, { "epoch": 16.44, "learning_rate": 3.8395918367346944e-06, "loss": 0.0024, "step": 15600 }, { "epoch": 16.46, "learning_rate": 3.829387755102041e-06, "loss": 0.0026, "step": 15625 }, { "epoch": 16.49, "learning_rate": 3.8191836734693886e-06, "loss": 0.0023, "step": 15650 }, { "epoch": 16.52, "learning_rate": 3.808979591836735e-06, "loss": 0.0025, "step": 15675 }, { "epoch": 16.54, "learning_rate": 3.798775510204082e-06, "loss": 0.0025, "step": 15700 }, { "epoch": 16.57, "learning_rate": 3.7885714285714285e-06, "loss": 0.0025, "step": 15725 }, { "epoch": 16.6, "learning_rate": 3.778367346938776e-06, "loss": 0.0024, "step": 15750 }, { "epoch": 16.62, "learning_rate": 3.768163265306123e-06, "loss": 0.0025, "step": 15775 }, { "epoch": 16.65, "learning_rate": 3.7579591836734697e-06, "loss": 0.0025, "step": 15800 }, { "epoch": 16.68, "learning_rate": 3.7477551020408163e-06, "loss": 0.0027, "step": 15825 }, { "epoch": 16.7, "learning_rate": 3.7375510204081634e-06, "loss": 0.0026, "step": 15850 }, { "epoch": 16.73, "learning_rate": 3.727346938775511e-06, "loss": 0.0027, "step": 15875 }, { "epoch": 16.75, "learning_rate": 3.7171428571428575e-06, "loss": 0.003, "step": 15900 }, { "epoch": 16.78, "learning_rate": 3.706938775510204e-06, "loss": 0.0027, "step": 15925 }, { "epoch": 16.81, "learning_rate": 3.696734693877551e-06, "loss": 0.0026, "step": 15950 }, { "epoch": 16.83, "learning_rate": 3.6865306122448987e-06, "loss": 0.0024, "step": 15975 }, { "epoch": 16.86, "learning_rate": 3.6763265306122453e-06, "loss": 0.0024, "step": 16000 }, { "epoch": 16.86, "eval_cer": 13.791037822187462, "eval_loss": 0.535828173160553, "eval_runtime": 565.1108, "eval_samples_per_second": 0.736, "eval_steps_per_second": 0.023, "eval_wer": 33.76119729080184, "step": 16000 }, { "epoch": 16.89, "learning_rate": 3.666122448979592e-06, "loss": 0.0026, "step": 16025 }, { "epoch": 16.91, "learning_rate": 3.655918367346939e-06, "loss": 0.0028, "step": 16050 }, { "epoch": 16.94, "learning_rate": 3.6457142857142857e-06, "loss": 0.0025, "step": 16075 }, { "epoch": 16.97, "learning_rate": 3.635510204081633e-06, "loss": 0.0027, "step": 16100 }, { "epoch": 16.99, "learning_rate": 3.6253061224489798e-06, "loss": 0.0028, "step": 16125 }, { "epoch": 17.02, "learning_rate": 3.615102040816327e-06, "loss": 0.0023, "step": 16150 }, { "epoch": 17.04, "learning_rate": 3.6048979591836735e-06, "loss": 0.0019, "step": 16175 }, { "epoch": 17.07, "learning_rate": 3.594693877551021e-06, "loss": 0.002, "step": 16200 }, { "epoch": 17.1, "learning_rate": 3.5844897959183676e-06, "loss": 0.0018, "step": 16225 }, { "epoch": 17.12, "learning_rate": 3.5742857142857147e-06, "loss": 0.0022, "step": 16250 }, { "epoch": 17.15, "learning_rate": 3.5640816326530613e-06, "loss": 0.002, "step": 16275 }, { "epoch": 17.18, "learning_rate": 3.5538775510204084e-06, "loss": 0.0019, "step": 16300 }, { "epoch": 17.2, "learning_rate": 3.5436734693877554e-06, "loss": 0.0021, "step": 16325 }, { "epoch": 17.23, "learning_rate": 3.5334693877551025e-06, "loss": 0.002, "step": 16350 }, { "epoch": 17.26, "learning_rate": 3.523265306122449e-06, "loss": 0.0019, "step": 16375 }, { "epoch": 17.28, "learning_rate": 3.513061224489796e-06, "loss": 0.0022, "step": 16400 }, { "epoch": 17.31, "learning_rate": 3.5028571428571433e-06, "loss": 0.0023, "step": 16425 }, { "epoch": 17.33, "learning_rate": 3.4926530612244903e-06, "loss": 0.0018, "step": 16450 }, { "epoch": 17.36, "learning_rate": 3.482448979591837e-06, "loss": 0.0021, "step": 16475 }, { "epoch": 17.39, "learning_rate": 3.472244897959184e-06, "loss": 0.0019, "step": 16500 }, { "epoch": 17.41, "learning_rate": 3.4620408163265307e-06, "loss": 0.0019, "step": 16525 }, { "epoch": 17.44, "learning_rate": 3.451836734693878e-06, "loss": 0.0017, "step": 16550 }, { "epoch": 17.47, "learning_rate": 3.441632653061225e-06, "loss": 0.0019, "step": 16575 }, { "epoch": 17.49, "learning_rate": 3.431428571428572e-06, "loss": 0.0021, "step": 16600 }, { "epoch": 17.52, "learning_rate": 3.4212244897959185e-06, "loss": 0.0021, "step": 16625 }, { "epoch": 17.54, "learning_rate": 3.411020408163266e-06, "loss": 0.0019, "step": 16650 }, { "epoch": 17.57, "learning_rate": 3.4008163265306126e-06, "loss": 0.0018, "step": 16675 }, { "epoch": 17.6, "learning_rate": 3.3906122448979597e-06, "loss": 0.0019, "step": 16700 }, { "epoch": 17.62, "learning_rate": 3.3804081632653063e-06, "loss": 0.0017, "step": 16725 }, { "epoch": 17.65, "learning_rate": 3.370204081632653e-06, "loss": 0.0018, "step": 16750 }, { "epoch": 17.68, "learning_rate": 3.3600000000000004e-06, "loss": 0.0019, "step": 16775 }, { "epoch": 17.7, "learning_rate": 3.3497959183673475e-06, "loss": 0.0019, "step": 16800 }, { "epoch": 17.73, "learning_rate": 3.339591836734694e-06, "loss": 0.0019, "step": 16825 }, { "epoch": 17.76, "learning_rate": 3.3293877551020408e-06, "loss": 0.002, "step": 16850 }, { "epoch": 17.78, "learning_rate": 3.3191836734693883e-06, "loss": 0.002, "step": 16875 }, { "epoch": 17.81, "learning_rate": 3.308979591836735e-06, "loss": 0.0021, "step": 16900 }, { "epoch": 17.83, "learning_rate": 3.298775510204082e-06, "loss": 0.0018, "step": 16925 }, { "epoch": 17.86, "learning_rate": 3.2885714285714286e-06, "loss": 0.0017, "step": 16950 }, { "epoch": 17.89, "learning_rate": 3.2783673469387757e-06, "loss": 0.0018, "step": 16975 }, { "epoch": 17.91, "learning_rate": 3.2681632653061227e-06, "loss": 0.0018, "step": 17000 }, { "epoch": 17.91, "eval_cer": 13.846781037322994, "eval_loss": 0.546908974647522, "eval_runtime": 565.3766, "eval_samples_per_second": 0.736, "eval_steps_per_second": 0.023, "eval_wer": 33.646493336246444, "step": 17000 }, { "epoch": 17.94, "learning_rate": 3.25795918367347e-06, "loss": 0.0019, "step": 17025 }, { "epoch": 17.97, "learning_rate": 3.2477551020408164e-06, "loss": 0.0022, "step": 17050 }, { "epoch": 17.99, "learning_rate": 3.2375510204081635e-06, "loss": 0.0018, "step": 17075 }, { "epoch": 18.02, "learning_rate": 3.22734693877551e-06, "loss": 0.0016, "step": 17100 }, { "epoch": 18.05, "learning_rate": 3.2171428571428576e-06, "loss": 0.0014, "step": 17125 }, { "epoch": 18.07, "learning_rate": 3.2069387755102043e-06, "loss": 0.0013, "step": 17150 }, { "epoch": 18.1, "learning_rate": 3.1967346938775513e-06, "loss": 0.0014, "step": 17175 }, { "epoch": 18.12, "learning_rate": 3.186530612244898e-06, "loss": 0.0014, "step": 17200 }, { "epoch": 18.15, "learning_rate": 3.1763265306122454e-06, "loss": 0.0016, "step": 17225 }, { "epoch": 18.18, "learning_rate": 3.166122448979592e-06, "loss": 0.0014, "step": 17250 }, { "epoch": 18.2, "learning_rate": 3.1563265306122452e-06, "loss": 0.0013, "step": 17275 }, { "epoch": 18.23, "learning_rate": 3.1461224489795923e-06, "loss": 0.0012, "step": 17300 }, { "epoch": 18.26, "learning_rate": 3.135918367346939e-06, "loss": 0.0013, "step": 17325 }, { "epoch": 18.28, "learning_rate": 3.125714285714286e-06, "loss": 0.0013, "step": 17350 }, { "epoch": 18.31, "learning_rate": 3.115510204081633e-06, "loss": 0.0013, "step": 17375 }, { "epoch": 18.34, "learning_rate": 3.10530612244898e-06, "loss": 0.0012, "step": 17400 }, { "epoch": 18.36, "learning_rate": 3.0951020408163267e-06, "loss": 0.0015, "step": 17425 }, { "epoch": 18.39, "learning_rate": 3.084897959183674e-06, "loss": 0.0013, "step": 17450 }, { "epoch": 18.41, "learning_rate": 3.0746938775510204e-06, "loss": 0.0018, "step": 17475 }, { "epoch": 18.44, "learning_rate": 3.064489795918368e-06, "loss": 0.0012, "step": 17500 }, { "epoch": 18.47, "learning_rate": 3.0542857142857146e-06, "loss": 0.0013, "step": 17525 }, { "epoch": 18.49, "learning_rate": 3.0440816326530616e-06, "loss": 0.0012, "step": 17550 }, { "epoch": 18.52, "learning_rate": 3.0338775510204083e-06, "loss": 0.0011, "step": 17575 }, { "epoch": 18.55, "learning_rate": 3.023673469387755e-06, "loss": 0.001, "step": 17600 }, { "epoch": 18.57, "learning_rate": 3.0134693877551024e-06, "loss": 0.0015, "step": 17625 }, { "epoch": 18.6, "learning_rate": 3.0032653061224495e-06, "loss": 0.0012, "step": 17650 }, { "epoch": 18.62, "learning_rate": 2.993061224489796e-06, "loss": 0.0015, "step": 17675 }, { "epoch": 18.65, "learning_rate": 2.9828571428571427e-06, "loss": 0.0017, "step": 17700 }, { "epoch": 18.68, "learning_rate": 2.9726530612244902e-06, "loss": 0.0018, "step": 17725 }, { "epoch": 18.7, "learning_rate": 2.9624489795918373e-06, "loss": 0.0014, "step": 17750 }, { "epoch": 18.73, "learning_rate": 2.952244897959184e-06, "loss": 0.0012, "step": 17775 }, { "epoch": 18.76, "learning_rate": 2.9420408163265306e-06, "loss": 0.0015, "step": 17800 }, { "epoch": 18.78, "learning_rate": 2.9318367346938776e-06, "loss": 0.0014, "step": 17825 }, { "epoch": 18.81, "learning_rate": 2.921632653061225e-06, "loss": 0.0013, "step": 17850 }, { "epoch": 18.84, "learning_rate": 2.9114285714285717e-06, "loss": 0.0011, "step": 17875 }, { "epoch": 18.86, "learning_rate": 2.9012244897959184e-06, "loss": 0.0014, "step": 17900 }, { "epoch": 18.89, "learning_rate": 2.8910204081632654e-06, "loss": 0.0013, "step": 17925 }, { "epoch": 18.91, "learning_rate": 2.8808163265306125e-06, "loss": 0.0014, "step": 17950 }, { "epoch": 18.94, "learning_rate": 2.8706122448979596e-06, "loss": 0.0017, "step": 17975 }, { "epoch": 18.97, "learning_rate": 2.8604081632653062e-06, "loss": 0.0013, "step": 18000 }, { "epoch": 18.97, "eval_cer": 13.75526232590645, "eval_loss": 0.5613543391227722, "eval_runtime": 565.0787, "eval_samples_per_second": 0.736, "eval_steps_per_second": 0.023, "eval_wer": 33.66834170854271, "step": 18000 }, { "epoch": 18.99, "learning_rate": 2.8502040816326533e-06, "loss": 0.0015, "step": 18025 }, { "epoch": 19.02, "learning_rate": 2.84e-06, "loss": 0.0012, "step": 18050 }, { "epoch": 19.05, "learning_rate": 2.8297959183673474e-06, "loss": 0.0011, "step": 18075 }, { "epoch": 19.07, "learning_rate": 2.819591836734694e-06, "loss": 0.0013, "step": 18100 }, { "epoch": 19.1, "learning_rate": 2.809387755102041e-06, "loss": 0.0012, "step": 18125 }, { "epoch": 19.13, "learning_rate": 2.7991836734693877e-06, "loss": 0.0011, "step": 18150 }, { "epoch": 19.15, "learning_rate": 2.7889795918367352e-06, "loss": 0.0013, "step": 18175 }, { "epoch": 19.18, "learning_rate": 2.778775510204082e-06, "loss": 0.0011, "step": 18200 }, { "epoch": 19.2, "learning_rate": 2.768571428571429e-06, "loss": 0.001, "step": 18225 }, { "epoch": 19.23, "learning_rate": 2.7583673469387756e-06, "loss": 0.0011, "step": 18250 }, { "epoch": 19.26, "learning_rate": 2.7481632653061226e-06, "loss": 0.001, "step": 18275 }, { "epoch": 19.28, "learning_rate": 2.7383673469387758e-06, "loss": 0.001, "step": 18300 }, { "epoch": 19.31, "learning_rate": 2.7281632653061224e-06, "loss": 0.0013, "step": 18325 }, { "epoch": 19.34, "learning_rate": 2.71795918367347e-06, "loss": 0.001, "step": 18350 }, { "epoch": 19.36, "learning_rate": 2.7077551020408165e-06, "loss": 0.0011, "step": 18375 }, { "epoch": 19.39, "learning_rate": 2.6975510204081636e-06, "loss": 0.0013, "step": 18400 }, { "epoch": 19.42, "learning_rate": 2.6873469387755102e-06, "loss": 0.0012, "step": 18425 }, { "epoch": 19.44, "learning_rate": 2.6771428571428577e-06, "loss": 0.0012, "step": 18450 }, { "epoch": 19.47, "learning_rate": 2.6669387755102043e-06, "loss": 0.001, "step": 18475 }, { "epoch": 19.49, "learning_rate": 2.6567346938775514e-06, "loss": 0.001, "step": 18500 }, { "epoch": 19.52, "learning_rate": 2.646530612244898e-06, "loss": 0.001, "step": 18525 }, { "epoch": 19.55, "learning_rate": 2.6363265306122447e-06, "loss": 0.0009, "step": 18550 }, { "epoch": 19.57, "learning_rate": 2.626122448979592e-06, "loss": 0.001, "step": 18575 }, { "epoch": 19.6, "learning_rate": 2.6159183673469392e-06, "loss": 0.0009, "step": 18600 }, { "epoch": 19.63, "learning_rate": 2.605714285714286e-06, "loss": 0.0011, "step": 18625 }, { "epoch": 19.65, "learning_rate": 2.5955102040816325e-06, "loss": 0.001, "step": 18650 }, { "epoch": 19.68, "learning_rate": 2.58530612244898e-06, "loss": 0.0009, "step": 18675 }, { "epoch": 19.7, "learning_rate": 2.575102040816327e-06, "loss": 0.001, "step": 18700 }, { "epoch": 19.73, "learning_rate": 2.5648979591836737e-06, "loss": 0.001, "step": 18725 }, { "epoch": 19.76, "learning_rate": 2.5546938775510203e-06, "loss": 0.0011, "step": 18750 }, { "epoch": 19.78, "learning_rate": 2.5444897959183674e-06, "loss": 0.001, "step": 18775 }, { "epoch": 19.81, "learning_rate": 2.534285714285715e-06, "loss": 0.0012, "step": 18800 }, { "epoch": 19.84, "learning_rate": 2.5240816326530615e-06, "loss": 0.0014, "step": 18825 }, { "epoch": 19.86, "learning_rate": 2.513877551020408e-06, "loss": 0.0012, "step": 18850 }, { "epoch": 19.89, "learning_rate": 2.5036734693877552e-06, "loss": 0.0012, "step": 18875 }, { "epoch": 19.92, "learning_rate": 2.4934693877551023e-06, "loss": 0.0014, "step": 18900 }, { "epoch": 19.94, "learning_rate": 2.4832653061224494e-06, "loss": 0.0013, "step": 18925 }, { "epoch": 19.97, "learning_rate": 2.473061224489796e-06, "loss": 0.0011, "step": 18950 }, { "epoch": 19.99, "learning_rate": 2.462857142857143e-06, "loss": 0.0012, "step": 18975 }, { "epoch": 20.02, "learning_rate": 2.45265306122449e-06, "loss": 0.0014, "step": 19000 }, { "epoch": 20.02, "eval_cer": 13.888380451603242, "eval_loss": 0.5706824064254761, "eval_runtime": 564.8076, "eval_samples_per_second": 0.737, "eval_steps_per_second": 0.023, "eval_wer": 33.65741752239458, "step": 19000 }, { "epoch": 20.05, "learning_rate": 2.4424489795918368e-06, "loss": 0.0011, "step": 19025 }, { "epoch": 20.07, "learning_rate": 2.432244897959184e-06, "loss": 0.0011, "step": 19050 }, { "epoch": 20.1, "learning_rate": 2.422040816326531e-06, "loss": 0.0013, "step": 19075 }, { "epoch": 20.13, "learning_rate": 2.411836734693878e-06, "loss": 0.0013, "step": 19100 }, { "epoch": 20.15, "learning_rate": 2.4016326530612246e-06, "loss": 0.0011, "step": 19125 }, { "epoch": 20.18, "learning_rate": 2.3914285714285716e-06, "loss": 0.0014, "step": 19150 }, { "epoch": 20.21, "learning_rate": 2.3812244897959187e-06, "loss": 0.0011, "step": 19175 }, { "epoch": 20.23, "learning_rate": 2.3710204081632653e-06, "loss": 0.0011, "step": 19200 }, { "epoch": 20.26, "learning_rate": 2.3608163265306124e-06, "loss": 0.001, "step": 19225 }, { "epoch": 20.28, "learning_rate": 2.3506122448979595e-06, "loss": 0.0013, "step": 19250 }, { "epoch": 20.31, "learning_rate": 2.3404081632653065e-06, "loss": 0.0011, "step": 19275 }, { "epoch": 20.34, "learning_rate": 2.330204081632653e-06, "loss": 0.001, "step": 19300 }, { "epoch": 20.36, "learning_rate": 2.3200000000000002e-06, "loss": 0.0011, "step": 19325 }, { "epoch": 20.39, "learning_rate": 2.3097959183673473e-06, "loss": 0.001, "step": 19350 }, { "epoch": 20.42, "learning_rate": 2.299591836734694e-06, "loss": 0.001, "step": 19375 }, { "epoch": 20.44, "learning_rate": 2.289387755102041e-06, "loss": 0.0015, "step": 19400 }, { "epoch": 20.47, "learning_rate": 2.2791836734693876e-06, "loss": 0.0011, "step": 19425 }, { "epoch": 20.5, "learning_rate": 2.268979591836735e-06, "loss": 0.001, "step": 19450 }, { "epoch": 20.52, "learning_rate": 2.2587755102040818e-06, "loss": 0.0008, "step": 19475 }, { "epoch": 20.55, "learning_rate": 2.248571428571429e-06, "loss": 0.0008, "step": 19500 }, { "epoch": 20.57, "learning_rate": 2.2383673469387755e-06, "loss": 0.0009, "step": 19525 }, { "epoch": 20.6, "learning_rate": 2.228163265306123e-06, "loss": 0.0009, "step": 19550 }, { "epoch": 20.63, "learning_rate": 2.2179591836734696e-06, "loss": 0.0009, "step": 19575 }, { "epoch": 20.65, "learning_rate": 2.2077551020408162e-06, "loss": 0.0008, "step": 19600 }, { "epoch": 20.68, "learning_rate": 2.1975510204081633e-06, "loss": 0.0011, "step": 19625 }, { "epoch": 20.71, "learning_rate": 2.1873469387755104e-06, "loss": 0.0008, "step": 19650 }, { "epoch": 20.73, "learning_rate": 2.1771428571428574e-06, "loss": 0.0007, "step": 19675 }, { "epoch": 20.76, "learning_rate": 2.166938775510204e-06, "loss": 0.0007, "step": 19700 }, { "epoch": 20.79, "learning_rate": 2.156734693877551e-06, "loss": 0.0008, "step": 19725 }, { "epoch": 20.81, "learning_rate": 2.146530612244898e-06, "loss": 0.0009, "step": 19750 }, { "epoch": 20.84, "learning_rate": 2.1363265306122452e-06, "loss": 0.0009, "step": 19775 }, { "epoch": 20.86, "learning_rate": 2.126122448979592e-06, "loss": 0.001, "step": 19800 }, { "epoch": 20.89, "learning_rate": 2.115918367346939e-06, "loss": 0.0011, "step": 19825 }, { "epoch": 20.92, "learning_rate": 2.105714285714286e-06, "loss": 0.0009, "step": 19850 }, { "epoch": 20.94, "learning_rate": 2.0955102040816326e-06, "loss": 0.001, "step": 19875 }, { "epoch": 20.97, "learning_rate": 2.0853061224489797e-06, "loss": 0.0007, "step": 19900 }, { "epoch": 21.0, "learning_rate": 2.0751020408163268e-06, "loss": 0.0011, "step": 19925 }, { "epoch": 21.02, "learning_rate": 2.064897959183674e-06, "loss": 0.0008, "step": 19950 }, { "epoch": 21.05, "learning_rate": 2.0546938775510205e-06, "loss": 0.0006, "step": 19975 }, { "epoch": 21.07, "learning_rate": 2.0444897959183675e-06, "loss": 0.0006, "step": 20000 }, { "epoch": 21.07, "eval_cer": 14.076409804149959, "eval_loss": 0.5835161209106445, "eval_runtime": 564.962, "eval_samples_per_second": 0.736, "eval_steps_per_second": 0.023, "eval_wer": 34.06707450294953, "step": 20000 }, { "epoch": 21.1, "learning_rate": 2.0342857142857146e-06, "loss": 0.0008, "step": 20025 }, { "epoch": 21.13, "learning_rate": 2.0240816326530612e-06, "loss": 0.0008, "step": 20050 }, { "epoch": 21.15, "learning_rate": 2.0138775510204083e-06, "loss": 0.0007, "step": 20075 }, { "epoch": 21.18, "learning_rate": 2.0036734693877554e-06, "loss": 0.001, "step": 20100 }, { "epoch": 21.21, "learning_rate": 1.9934693877551024e-06, "loss": 0.0007, "step": 20125 }, { "epoch": 21.23, "learning_rate": 1.983265306122449e-06, "loss": 0.0006, "step": 20150 }, { "epoch": 21.26, "learning_rate": 1.973061224489796e-06, "loss": 0.0007, "step": 20175 }, { "epoch": 21.29, "learning_rate": 1.962857142857143e-06, "loss": 0.0008, "step": 20200 }, { "epoch": 21.31, "learning_rate": 1.95265306122449e-06, "loss": 0.0008, "step": 20225 }, { "epoch": 21.34, "learning_rate": 1.942448979591837e-06, "loss": 0.0007, "step": 20250 }, { "epoch": 21.36, "learning_rate": 1.932244897959184e-06, "loss": 0.0008, "step": 20275 }, { "epoch": 21.39, "learning_rate": 1.922040816326531e-06, "loss": 0.0008, "step": 20300 }, { "epoch": 21.42, "learning_rate": 1.9118367346938776e-06, "loss": 0.0007, "step": 20325 }, { "epoch": 21.44, "learning_rate": 1.9016326530612247e-06, "loss": 0.0007, "step": 20350 }, { "epoch": 21.47, "learning_rate": 1.8914285714285716e-06, "loss": 0.0006, "step": 20375 }, { "epoch": 21.5, "learning_rate": 1.8812244897959186e-06, "loss": 0.0008, "step": 20400 }, { "epoch": 21.52, "learning_rate": 1.8710204081632655e-06, "loss": 0.0008, "step": 20425 }, { "epoch": 21.55, "learning_rate": 1.8608163265306123e-06, "loss": 0.0006, "step": 20450 }, { "epoch": 21.58, "learning_rate": 1.8506122448979594e-06, "loss": 0.0006, "step": 20475 }, { "epoch": 21.6, "learning_rate": 1.8404081632653062e-06, "loss": 0.0006, "step": 20500 }, { "epoch": 21.63, "learning_rate": 1.8302040816326533e-06, "loss": 0.0008, "step": 20525 }, { "epoch": 21.65, "learning_rate": 1.8200000000000002e-06, "loss": 0.0008, "step": 20550 }, { "epoch": 21.68, "learning_rate": 1.8097959183673472e-06, "loss": 0.0007, "step": 20575 }, { "epoch": 21.71, "learning_rate": 1.799591836734694e-06, "loss": 0.0006, "step": 20600 }, { "epoch": 21.73, "learning_rate": 1.789387755102041e-06, "loss": 0.0006, "step": 20625 }, { "epoch": 21.76, "learning_rate": 1.779183673469388e-06, "loss": 0.0009, "step": 20650 }, { "epoch": 21.79, "learning_rate": 1.7689795918367348e-06, "loss": 0.0008, "step": 20675 }, { "epoch": 21.81, "learning_rate": 1.7587755102040819e-06, "loss": 0.0008, "step": 20700 }, { "epoch": 21.84, "learning_rate": 1.7485714285714287e-06, "loss": 0.0007, "step": 20725 }, { "epoch": 21.87, "learning_rate": 1.7383673469387758e-06, "loss": 0.0007, "step": 20750 }, { "epoch": 21.89, "learning_rate": 1.7285714285714287e-06, "loss": 0.0007, "step": 20775 }, { "epoch": 21.92, "learning_rate": 1.7183673469387758e-06, "loss": 0.0007, "step": 20800 }, { "epoch": 21.94, "learning_rate": 1.7081632653061226e-06, "loss": 0.0009, "step": 20825 }, { "epoch": 21.97, "learning_rate": 1.6979591836734697e-06, "loss": 0.0008, "step": 20850 }, { "epoch": 22.0, "learning_rate": 1.6877551020408163e-06, "loss": 0.001, "step": 20875 }, { "epoch": 22.02, "learning_rate": 1.6775510204081636e-06, "loss": 0.0006, "step": 20900 }, { "epoch": 22.05, "learning_rate": 1.6673469387755102e-06, "loss": 0.0006, "step": 20925 }, { "epoch": 22.08, "learning_rate": 1.657142857142857e-06, "loss": 0.0006, "step": 20950 }, { "epoch": 22.1, "learning_rate": 1.6469387755102042e-06, "loss": 0.0005, "step": 20975 }, { "epoch": 22.13, "learning_rate": 1.636734693877551e-06, "loss": 0.0007, "step": 21000 }, { "epoch": 22.13, "eval_cer": 14.077241792435563, "eval_loss": 0.592703104019165, "eval_runtime": 564.5247, "eval_samples_per_second": 0.737, "eval_steps_per_second": 0.023, "eval_wer": 33.974218920690404, "step": 21000 }, { "epoch": 22.15, "learning_rate": 1.626530612244898e-06, "loss": 0.0007, "step": 21025 }, { "epoch": 22.18, "learning_rate": 1.616326530612245e-06, "loss": 0.0006, "step": 21050 }, { "epoch": 22.21, "learning_rate": 1.606122448979592e-06, "loss": 0.0005, "step": 21075 }, { "epoch": 22.23, "learning_rate": 1.5959183673469388e-06, "loss": 0.0006, "step": 21100 }, { "epoch": 22.26, "learning_rate": 1.5857142857142857e-06, "loss": 0.0007, "step": 21125 }, { "epoch": 22.29, "learning_rate": 1.5755102040816328e-06, "loss": 0.0005, "step": 21150 }, { "epoch": 22.31, "learning_rate": 1.5653061224489796e-06, "loss": 0.0005, "step": 21175 }, { "epoch": 22.34, "learning_rate": 1.5551020408163267e-06, "loss": 0.0007, "step": 21200 }, { "epoch": 22.37, "learning_rate": 1.5448979591836735e-06, "loss": 0.0006, "step": 21225 }, { "epoch": 22.39, "learning_rate": 1.5346938775510206e-06, "loss": 0.0005, "step": 21250 }, { "epoch": 22.42, "learning_rate": 1.5244897959183674e-06, "loss": 0.0005, "step": 21275 }, { "epoch": 22.44, "learning_rate": 1.5142857142857145e-06, "loss": 0.0005, "step": 21300 }, { "epoch": 22.47, "learning_rate": 1.5040816326530613e-06, "loss": 0.0006, "step": 21325 }, { "epoch": 22.5, "learning_rate": 1.4938775510204082e-06, "loss": 0.0005, "step": 21350 }, { "epoch": 22.52, "learning_rate": 1.4836734693877553e-06, "loss": 0.0005, "step": 21375 }, { "epoch": 22.55, "learning_rate": 1.473469387755102e-06, "loss": 0.0006, "step": 21400 }, { "epoch": 22.58, "learning_rate": 1.4632653061224492e-06, "loss": 0.0006, "step": 21425 }, { "epoch": 22.6, "learning_rate": 1.453061224489796e-06, "loss": 0.0005, "step": 21450 }, { "epoch": 22.63, "learning_rate": 1.442857142857143e-06, "loss": 0.0005, "step": 21475 }, { "epoch": 22.66, "learning_rate": 1.43265306122449e-06, "loss": 0.0007, "step": 21500 }, { "epoch": 22.68, "learning_rate": 1.422448979591837e-06, "loss": 0.0006, "step": 21525 }, { "epoch": 22.71, "learning_rate": 1.4122448979591838e-06, "loss": 0.0005, "step": 21550 }, { "epoch": 22.73, "learning_rate": 1.4020408163265307e-06, "loss": 0.0005, "step": 21575 }, { "epoch": 22.76, "learning_rate": 1.3918367346938778e-06, "loss": 0.0004, "step": 21600 }, { "epoch": 22.79, "learning_rate": 1.3816326530612246e-06, "loss": 0.0004, "step": 21625 }, { "epoch": 22.81, "learning_rate": 1.3714285714285717e-06, "loss": 0.0005, "step": 21650 }, { "epoch": 22.84, "learning_rate": 1.3612244897959185e-06, "loss": 0.0006, "step": 21675 }, { "epoch": 22.87, "learning_rate": 1.3510204081632656e-06, "loss": 0.0006, "step": 21700 }, { "epoch": 22.89, "learning_rate": 1.3408163265306124e-06, "loss": 0.0005, "step": 21725 }, { "epoch": 22.92, "learning_rate": 1.3306122448979595e-06, "loss": 0.0005, "step": 21750 }, { "epoch": 22.95, "learning_rate": 1.3204081632653063e-06, "loss": 0.0005, "step": 21775 }, { "epoch": 22.97, "learning_rate": 1.310204081632653e-06, "loss": 0.0006, "step": 21800 }, { "epoch": 23.0, "learning_rate": 1.3e-06, "loss": 0.0005, "step": 21825 }, { "epoch": 23.02, "learning_rate": 1.289795918367347e-06, "loss": 0.0004, "step": 21850 }, { "epoch": 23.05, "learning_rate": 1.279591836734694e-06, "loss": 0.0004, "step": 21875 }, { "epoch": 23.08, "learning_rate": 1.2693877551020408e-06, "loss": 0.0004, "step": 21900 }, { "epoch": 23.1, "learning_rate": 1.2591836734693879e-06, "loss": 0.0004, "step": 21925 }, { "epoch": 23.13, "learning_rate": 1.2489795918367347e-06, "loss": 0.0005, "step": 21950 }, { "epoch": 23.16, "learning_rate": 1.2387755102040818e-06, "loss": 0.0005, "step": 21975 }, { "epoch": 23.18, "learning_rate": 1.2285714285714286e-06, "loss": 0.0005, "step": 22000 }, { "epoch": 23.18, "eval_cer": 14.028986471870475, "eval_loss": 0.5993762016296387, "eval_runtime": 564.5393, "eval_samples_per_second": 0.737, "eval_steps_per_second": 0.023, "eval_wer": 34.039764037579204, "step": 22000 }, { "epoch": 23.21, "learning_rate": 1.2183673469387757e-06, "loss": 0.0005, "step": 22025 }, { "epoch": 23.23, "learning_rate": 1.2081632653061225e-06, "loss": 0.0005, "step": 22050 }, { "epoch": 23.26, "learning_rate": 1.1979591836734694e-06, "loss": 0.0004, "step": 22075 }, { "epoch": 23.29, "learning_rate": 1.1877551020408165e-06, "loss": 0.0004, "step": 22100 }, { "epoch": 23.31, "learning_rate": 1.1775510204081633e-06, "loss": 0.0006, "step": 22125 }, { "epoch": 23.34, "learning_rate": 1.1673469387755104e-06, "loss": 0.0004, "step": 22150 }, { "epoch": 23.37, "learning_rate": 1.1571428571428572e-06, "loss": 0.0004, "step": 22175 }, { "epoch": 23.39, "learning_rate": 1.1469387755102043e-06, "loss": 0.0003, "step": 22200 }, { "epoch": 23.42, "learning_rate": 1.1367346938775511e-06, "loss": 0.0004, "step": 22225 }, { "epoch": 23.45, "learning_rate": 1.1265306122448982e-06, "loss": 0.0003, "step": 22250 }, { "epoch": 23.47, "learning_rate": 1.116326530612245e-06, "loss": 0.0004, "step": 22275 }, { "epoch": 23.5, "learning_rate": 1.106122448979592e-06, "loss": 0.0004, "step": 22300 }, { "epoch": 23.52, "learning_rate": 1.0959183673469388e-06, "loss": 0.0004, "step": 22325 }, { "epoch": 23.55, "learning_rate": 1.0857142857142858e-06, "loss": 0.0004, "step": 22350 }, { "epoch": 23.58, "learning_rate": 1.0755102040816327e-06, "loss": 0.0005, "step": 22375 }, { "epoch": 23.6, "learning_rate": 1.0653061224489797e-06, "loss": 0.0005, "step": 22400 }, { "epoch": 23.63, "learning_rate": 1.0551020408163266e-06, "loss": 0.0005, "step": 22425 }, { "epoch": 23.66, "learning_rate": 1.0448979591836736e-06, "loss": 0.0006, "step": 22450 }, { "epoch": 23.68, "learning_rate": 1.0346938775510205e-06, "loss": 0.0004, "step": 22475 }, { "epoch": 23.71, "learning_rate": 1.0244897959183673e-06, "loss": 0.0005, "step": 22500 }, { "epoch": 23.74, "learning_rate": 1.0142857142857144e-06, "loss": 0.0004, "step": 22525 }, { "epoch": 23.76, "learning_rate": 1.0040816326530613e-06, "loss": 0.0005, "step": 22550 }, { "epoch": 23.79, "learning_rate": 9.938775510204083e-07, "loss": 0.0004, "step": 22575 }, { "epoch": 23.81, "learning_rate": 9.836734693877552e-07, "loss": 0.0004, "step": 22600 }, { "epoch": 23.84, "learning_rate": 9.734693877551022e-07, "loss": 0.0004, "step": 22625 }, { "epoch": 23.87, "learning_rate": 9.63265306122449e-07, "loss": 0.0004, "step": 22650 }, { "epoch": 23.89, "learning_rate": 9.53061224489796e-07, "loss": 0.0004, "step": 22675 }, { "epoch": 23.92, "learning_rate": 9.42857142857143e-07, "loss": 0.0004, "step": 22700 }, { "epoch": 23.95, "learning_rate": 9.326530612244898e-07, "loss": 0.0004, "step": 22725 }, { "epoch": 23.97, "learning_rate": 9.224489795918368e-07, "loss": 0.0004, "step": 22750 }, { "epoch": 24.0, "learning_rate": 9.122448979591838e-07, "loss": 0.0004, "step": 22775 }, { "epoch": 24.03, "learning_rate": 9.020408163265307e-07, "loss": 0.0004, "step": 22800 }, { "epoch": 24.05, "learning_rate": 8.918367346938777e-07, "loss": 0.0007, "step": 22825 }, { "epoch": 24.08, "learning_rate": 8.816326530612246e-07, "loss": 0.0004, "step": 22850 }, { "epoch": 24.1, "learning_rate": 8.714285714285716e-07, "loss": 0.0003, "step": 22875 }, { "epoch": 24.13, "learning_rate": 8.612244897959185e-07, "loss": 0.0004, "step": 22900 }, { "epoch": 24.16, "learning_rate": 8.510204081632653e-07, "loss": 0.0003, "step": 22925 }, { "epoch": 24.18, "learning_rate": 8.408163265306122e-07, "loss": 0.0004, "step": 22950 }, { "epoch": 24.21, "learning_rate": 8.306122448979592e-07, "loss": 0.0004, "step": 22975 }, { "epoch": 24.24, "learning_rate": 8.204081632653062e-07, "loss": 0.0004, "step": 23000 }, { "epoch": 24.24, "eval_cer": 13.92165998302744, "eval_loss": 0.606694757938385, "eval_runtime": 564.7849, "eval_samples_per_second": 0.737, "eval_steps_per_second": 0.023, "eval_wer": 33.94690845532008, "step": 23000 }, { "epoch": 24.26, "learning_rate": 8.102040816326531e-07, "loss": 0.0004, "step": 23025 }, { "epoch": 24.29, "learning_rate": 8.000000000000001e-07, "loss": 0.0003, "step": 23050 }, { "epoch": 24.32, "learning_rate": 7.89795918367347e-07, "loss": 0.0003, "step": 23075 }, { "epoch": 24.34, "learning_rate": 7.79591836734694e-07, "loss": 0.0004, "step": 23100 }, { "epoch": 24.37, "learning_rate": 7.693877551020409e-07, "loss": 0.0003, "step": 23125 }, { "epoch": 24.39, "learning_rate": 7.591836734693878e-07, "loss": 0.0006, "step": 23150 }, { "epoch": 24.42, "learning_rate": 7.489795918367347e-07, "loss": 0.0003, "step": 23175 }, { "epoch": 24.45, "learning_rate": 7.387755102040817e-07, "loss": 0.0003, "step": 23200 }, { "epoch": 24.47, "learning_rate": 7.285714285714287e-07, "loss": 0.0003, "step": 23225 }, { "epoch": 24.5, "learning_rate": 7.183673469387756e-07, "loss": 0.0005, "step": 23250 }, { "epoch": 24.53, "learning_rate": 7.081632653061226e-07, "loss": 0.0003, "step": 23275 }, { "epoch": 24.55, "learning_rate": 6.979591836734695e-07, "loss": 0.0004, "step": 23300 }, { "epoch": 24.58, "learning_rate": 6.877551020408165e-07, "loss": 0.0003, "step": 23325 }, { "epoch": 24.6, "learning_rate": 6.775510204081632e-07, "loss": 0.0004, "step": 23350 }, { "epoch": 24.63, "learning_rate": 6.673469387755102e-07, "loss": 0.0003, "step": 23375 }, { "epoch": 24.66, "learning_rate": 6.571428571428571e-07, "loss": 0.0003, "step": 23400 }, { "epoch": 24.68, "learning_rate": 6.469387755102041e-07, "loss": 0.0003, "step": 23425 }, { "epoch": 24.71, "learning_rate": 6.367346938775511e-07, "loss": 0.0003, "step": 23450 }, { "epoch": 24.74, "learning_rate": 6.26530612244898e-07, "loss": 0.0003, "step": 23475 }, { "epoch": 24.76, "learning_rate": 6.163265306122449e-07, "loss": 0.0003, "step": 23500 }, { "epoch": 24.79, "learning_rate": 6.061224489795918e-07, "loss": 0.0003, "step": 23525 }, { "epoch": 24.82, "learning_rate": 5.959183673469388e-07, "loss": 0.0003, "step": 23550 }, { "epoch": 24.84, "learning_rate": 5.857142857142857e-07, "loss": 0.0003, "step": 23575 }, { "epoch": 24.87, "learning_rate": 5.755102040816327e-07, "loss": 0.0003, "step": 23600 }, { "epoch": 24.89, "learning_rate": 5.653061224489796e-07, "loss": 0.0004, "step": 23625 }, { "epoch": 24.92, "learning_rate": 5.551020408163266e-07, "loss": 0.0003, "step": 23650 }, { "epoch": 24.95, "learning_rate": 5.448979591836736e-07, "loss": 0.0003, "step": 23675 }, { "epoch": 24.97, "learning_rate": 5.346938775510205e-07, "loss": 0.0003, "step": 23700 }, { "epoch": 25.0, "learning_rate": 5.244897959183674e-07, "loss": 0.0003, "step": 23725 }, { "epoch": 25.03, "learning_rate": 5.142857142857143e-07, "loss": 0.0005, "step": 23750 }, { "epoch": 25.05, "learning_rate": 5.040816326530613e-07, "loss": 0.0004, "step": 23775 }, { "epoch": 25.08, "learning_rate": 4.938775510204082e-07, "loss": 0.0003, "step": 23800 }, { "epoch": 25.11, "learning_rate": 4.836734693877551e-07, "loss": 0.0003, "step": 23825 }, { "epoch": 25.13, "learning_rate": 4.7346938775510204e-07, "loss": 0.0003, "step": 23850 }, { "epoch": 25.16, "learning_rate": 4.63265306122449e-07, "loss": 0.0003, "step": 23875 }, { "epoch": 25.18, "learning_rate": 4.5306122448979596e-07, "loss": 0.0003, "step": 23900 }, { "epoch": 25.21, "learning_rate": 4.4285714285714286e-07, "loss": 0.0003, "step": 23925 }, { "epoch": 25.24, "learning_rate": 4.326530612244898e-07, "loss": 0.0003, "step": 23950 }, { "epoch": 25.26, "learning_rate": 4.2244897959183677e-07, "loss": 0.0003, "step": 23975 }, { "epoch": 25.29, "learning_rate": 4.1224489795918373e-07, "loss": 0.0003, "step": 24000 }, { "epoch": 25.29, "eval_cer": 13.959099455879661, "eval_loss": 0.6108967065811157, "eval_runtime": 564.9633, "eval_samples_per_second": 0.736, "eval_steps_per_second": 0.023, "eval_wer": 33.96875682761634, "step": 24000 }, { "epoch": 25.32, "learning_rate": 4.020408163265307e-07, "loss": 0.0003, "step": 24025 }, { "epoch": 25.34, "learning_rate": 3.9183673469387754e-07, "loss": 0.0003, "step": 24050 }, { "epoch": 25.37, "learning_rate": 3.816326530612245e-07, "loss": 0.0003, "step": 24075 }, { "epoch": 25.4, "learning_rate": 3.7142857142857145e-07, "loss": 0.0003, "step": 24100 }, { "epoch": 25.42, "learning_rate": 3.612244897959184e-07, "loss": 0.0003, "step": 24125 }, { "epoch": 25.45, "learning_rate": 3.510204081632653e-07, "loss": 0.0003, "step": 24150 }, { "epoch": 25.47, "learning_rate": 3.4081632653061227e-07, "loss": 0.0003, "step": 24175 }, { "epoch": 25.5, "learning_rate": 3.306122448979592e-07, "loss": 0.0003, "step": 24200 }, { "epoch": 25.53, "learning_rate": 3.204081632653062e-07, "loss": 0.0003, "step": 24225 }, { "epoch": 25.55, "learning_rate": 3.102040816326531e-07, "loss": 0.0003, "step": 24250 }, { "epoch": 25.58, "learning_rate": 3.0000000000000004e-07, "loss": 0.0003, "step": 24275 }, { "epoch": 25.61, "learning_rate": 2.8979591836734694e-07, "loss": 0.0003, "step": 24300 }, { "epoch": 25.63, "learning_rate": 2.795918367346939e-07, "loss": 0.0003, "step": 24325 }, { "epoch": 25.66, "learning_rate": 2.6938775510204086e-07, "loss": 0.0003, "step": 24350 }, { "epoch": 25.68, "learning_rate": 2.5918367346938776e-07, "loss": 0.0003, "step": 24375 }, { "epoch": 25.71, "learning_rate": 2.489795918367347e-07, "loss": 0.0003, "step": 24400 }, { "epoch": 25.74, "learning_rate": 2.387755102040816e-07, "loss": 0.0003, "step": 24425 }, { "epoch": 25.76, "learning_rate": 2.285714285714286e-07, "loss": 0.0003, "step": 24450 }, { "epoch": 25.79, "learning_rate": 2.1836734693877553e-07, "loss": 0.0003, "step": 24475 }, { "epoch": 25.82, "learning_rate": 2.0816326530612246e-07, "loss": 0.0003, "step": 24500 }, { "epoch": 25.84, "learning_rate": 1.9795918367346942e-07, "loss": 0.0003, "step": 24525 }, { "epoch": 25.87, "learning_rate": 1.8775510204081635e-07, "loss": 0.0003, "step": 24550 }, { "epoch": 25.9, "learning_rate": 1.7755102040816328e-07, "loss": 0.0003, "step": 24575 }, { "epoch": 25.92, "learning_rate": 1.673469387755102e-07, "loss": 0.0003, "step": 24600 }, { "epoch": 25.95, "learning_rate": 1.5714285714285717e-07, "loss": 0.0003, "step": 24625 }, { "epoch": 25.97, "learning_rate": 1.469387755102041e-07, "loss": 0.0003, "step": 24650 }, { "epoch": 26.0, "learning_rate": 1.3673469387755103e-07, "loss": 0.0003, "step": 24675 }, { "epoch": 26.03, "learning_rate": 1.2653061224489798e-07, "loss": 0.0003, "step": 24700 }, { "epoch": 26.05, "learning_rate": 1.1632653061224491e-07, "loss": 0.0002, "step": 24725 }, { "epoch": 26.08, "learning_rate": 1.0612244897959186e-07, "loss": 0.0002, "step": 24750 }, { "epoch": 26.11, "learning_rate": 9.591836734693879e-08, "loss": 0.0003, "step": 24775 }, { "epoch": 26.13, "learning_rate": 8.571428571428573e-08, "loss": 0.0002, "step": 24800 }, { "epoch": 26.16, "learning_rate": 7.551020408163266e-08, "loss": 0.0002, "step": 24825 }, { "epoch": 26.19, "learning_rate": 6.53061224489796e-08, "loss": 0.0003, "step": 24850 }, { "epoch": 26.21, "learning_rate": 5.510204081632654e-08, "loss": 0.0003, "step": 24875 }, { "epoch": 26.24, "learning_rate": 4.4897959183673476e-08, "loss": 0.0002, "step": 24900 }, { "epoch": 26.26, "learning_rate": 3.469387755102041e-08, "loss": 0.0002, "step": 24925 }, { "epoch": 26.29, "learning_rate": 2.4489795918367346e-08, "loss": 0.0002, "step": 24950 }, { "epoch": 26.32, "learning_rate": 1.4285714285714288e-08, "loss": 0.0003, "step": 24975 }, { "epoch": 26.34, "learning_rate": 4.081632653061225e-09, "loss": 0.0003, "step": 25000 }, { "epoch": 26.34, "eval_cer": 13.83596518961013, "eval_loss": 0.6130102872848511, "eval_runtime": 564.4854, "eval_samples_per_second": 0.737, "eval_steps_per_second": 0.023, "eval_wer": 33.82674240769063, "step": 25000 }, { "epoch": 26.34, "step": 25000, "total_flos": 2.3081579771314176e+20, "train_loss": 0.0802921476102434, "train_runtime": 80869.9548, "train_samples_per_second": 9.892, "train_steps_per_second": 0.309 }, { "epoch": 26.34, "eval_cer": 13.34925204253124, "eval_loss": 0.29488590359687805, "eval_runtime": 564.894, "eval_samples_per_second": 0.736, "eval_steps_per_second": 0.023, "eval_wer": 32.33012890539655, "step": 25000 } ], "max_steps": 25000, "num_train_epochs": 27, "total_flos": 2.3081579771314176e+20, "trial_name": null, "trial_params": null }