{ "best_metric": 0.1691386103630066, "best_model_checkpoint": "facebook/wav2vec2-xls-r-300m-/home/yehor/ext-disk/cv10-with-noise/train.csv/checkpoint-1000", "epoch": 17.1875, "global_step": 22000, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.02, "learning_rate": 1.9e-06, "loss": 1.3873, "step": 20 }, { "epoch": 0.03, "learning_rate": 3.7e-06, "loss": 1.5023, "step": 40 }, { "epoch": 0.05, "learning_rate": 5.7000000000000005e-06, "loss": 1.5009, "step": 60 }, { "epoch": 0.06, "learning_rate": 7.7e-06, "loss": 1.3846, "step": 80 }, { "epoch": 0.08, "learning_rate": 9.7e-06, "loss": 1.4476, "step": 100 }, { "epoch": 0.09, "learning_rate": 1.1700000000000001e-05, "loss": 1.2564, "step": 120 }, { "epoch": 0.11, "learning_rate": 1.3700000000000001e-05, "loss": 1.3335, "step": 140 }, { "epoch": 0.12, "learning_rate": 1.5700000000000002e-05, "loss": 1.3105, "step": 160 }, { "epoch": 0.14, "learning_rate": 1.77e-05, "loss": 1.2823, "step": 180 }, { "epoch": 0.16, "learning_rate": 1.9600000000000002e-05, "loss": 1.3257, "step": 200 }, { "epoch": 0.17, "learning_rate": 2.16e-05, "loss": 1.2603, "step": 220 }, { "epoch": 0.19, "learning_rate": 2.36e-05, "loss": 1.2935, "step": 240 }, { "epoch": 0.2, "learning_rate": 2.5600000000000002e-05, "loss": 1.2542, "step": 260 }, { "epoch": 0.22, "learning_rate": 2.7600000000000003e-05, "loss": 1.2697, "step": 280 }, { "epoch": 0.23, "learning_rate": 2.96e-05, "loss": 1.3247, "step": 300 }, { "epoch": 0.25, "learning_rate": 3.16e-05, "loss": 1.2125, "step": 320 }, { "epoch": 0.27, "learning_rate": 3.3600000000000004e-05, "loss": 1.2742, "step": 340 }, { "epoch": 0.28, "learning_rate": 3.56e-05, "loss": 1.2861, "step": 360 }, { "epoch": 0.3, "learning_rate": 3.76e-05, "loss": 1.2738, "step": 380 }, { "epoch": 0.31, "learning_rate": 3.960000000000001e-05, "loss": 1.3923, "step": 400 }, { "epoch": 0.33, "learning_rate": 4.16e-05, "loss": 1.235, "step": 420 }, { "epoch": 0.34, "learning_rate": 4.36e-05, "loss": 1.3023, "step": 440 }, { "epoch": 0.36, "learning_rate": 4.5600000000000004e-05, "loss": 1.2928, "step": 460 }, { "epoch": 0.38, "learning_rate": 4.76e-05, "loss": 1.2866, "step": 480 }, { "epoch": 0.39, "learning_rate": 4.96e-05, "loss": 1.3532, "step": 500 }, { "epoch": 0.41, "learning_rate": 4.999874902267397e-05, "loss": 1.2502, "step": 520 }, { "epoch": 0.42, "learning_rate": 4.9997185301016416e-05, "loss": 1.3252, "step": 540 }, { "epoch": 0.44, "learning_rate": 4.999562157935888e-05, "loss": 1.3115, "step": 560 }, { "epoch": 0.45, "learning_rate": 4.999405785770133e-05, "loss": 1.2741, "step": 580 }, { "epoch": 0.47, "learning_rate": 4.999249413604379e-05, "loss": 1.338, "step": 600 }, { "epoch": 0.48, "learning_rate": 4.9990930414386236e-05, "loss": 1.236, "step": 620 }, { "epoch": 0.5, "learning_rate": 4.99893666927287e-05, "loss": 1.2748, "step": 640 }, { "epoch": 0.52, "learning_rate": 4.998780297107115e-05, "loss": 1.3075, "step": 660 }, { "epoch": 0.53, "learning_rate": 4.998623924941361e-05, "loss": 1.249, "step": 680 }, { "epoch": 0.55, "learning_rate": 4.998467552775606e-05, "loss": 1.3587, "step": 700 }, { "epoch": 0.56, "learning_rate": 4.998311180609852e-05, "loss": 1.2371, "step": 720 }, { "epoch": 0.58, "learning_rate": 4.998154808444097e-05, "loss": 1.3295, "step": 740 }, { "epoch": 0.59, "learning_rate": 4.997998436278343e-05, "loss": 1.323, "step": 760 }, { "epoch": 0.61, "learning_rate": 4.997842064112588e-05, "loss": 1.2567, "step": 780 }, { "epoch": 0.62, "learning_rate": 4.997685691946834e-05, "loss": 1.3447, "step": 800 }, { "epoch": 0.64, "learning_rate": 4.997529319781079e-05, "loss": 1.2195, "step": 820 }, { "epoch": 0.66, "learning_rate": 4.997372947615325e-05, "loss": 1.2824, "step": 840 }, { "epoch": 0.67, "learning_rate": 4.99721657544957e-05, "loss": 1.2633, "step": 860 }, { "epoch": 0.69, "learning_rate": 4.997060203283816e-05, "loss": 1.2948, "step": 880 }, { "epoch": 0.7, "learning_rate": 4.996903831118061e-05, "loss": 1.2916, "step": 900 }, { "epoch": 0.72, "learning_rate": 4.996747458952307e-05, "loss": 1.263, "step": 920 }, { "epoch": 0.73, "learning_rate": 4.996591086786552e-05, "loss": 1.2602, "step": 940 }, { "epoch": 0.75, "learning_rate": 4.996434714620798e-05, "loss": 1.2901, "step": 960 }, { "epoch": 0.77, "learning_rate": 4.996278342455043e-05, "loss": 1.2749, "step": 980 }, { "epoch": 0.78, "learning_rate": 4.996121970289289e-05, "loss": 1.3405, "step": 1000 }, { "epoch": 0.78, "eval_cer": 0.0811, "eval_loss": 0.1691386103630066, "eval_runtime": 209.1048, "eval_samples_per_second": 18.115, "eval_steps_per_second": 0.569, "eval_wer": 0.3881, "step": 1000 }, { "epoch": 0.8, "learning_rate": 4.995965598123534e-05, "loss": 1.2395, "step": 1020 }, { "epoch": 0.81, "learning_rate": 4.99580922595778e-05, "loss": 1.2685, "step": 1040 }, { "epoch": 0.83, "learning_rate": 4.995652853792025e-05, "loss": 1.2596, "step": 1060 }, { "epoch": 0.84, "learning_rate": 4.995496481626271e-05, "loss": 1.2438, "step": 1080 }, { "epoch": 0.86, "learning_rate": 4.995340109460516e-05, "loss": 1.3028, "step": 1100 }, { "epoch": 0.88, "learning_rate": 4.995183737294762e-05, "loss": 1.2125, "step": 1120 }, { "epoch": 0.89, "learning_rate": 4.995027365129007e-05, "loss": 1.2664, "step": 1140 }, { "epoch": 0.91, "learning_rate": 4.994870992963253e-05, "loss": 1.2806, "step": 1160 }, { "epoch": 0.92, "learning_rate": 4.994714620797498e-05, "loss": 1.2685, "step": 1180 }, { "epoch": 0.94, "learning_rate": 4.994558248631744e-05, "loss": 1.2862, "step": 1200 }, { "epoch": 0.95, "learning_rate": 4.994401876465989e-05, "loss": 1.1859, "step": 1220 }, { "epoch": 0.97, "learning_rate": 4.994245504300235e-05, "loss": 1.2897, "step": 1240 }, { "epoch": 0.98, "learning_rate": 4.99408913213448e-05, "loss": 1.245, "step": 1260 }, { "epoch": 1.0, "learning_rate": 4.993932759968726e-05, "loss": 1.3432, "step": 1280 }, { "epoch": 1.02, "learning_rate": 4.993776387802971e-05, "loss": 1.1923, "step": 1300 }, { "epoch": 1.03, "learning_rate": 4.9936200156372173e-05, "loss": 1.2749, "step": 1320 }, { "epoch": 1.05, "learning_rate": 4.993463643471462e-05, "loss": 1.2846, "step": 1340 }, { "epoch": 1.06, "learning_rate": 4.9933072713057077e-05, "loss": 1.2717, "step": 1360 }, { "epoch": 1.08, "learning_rate": 4.993150899139953e-05, "loss": 1.3046, "step": 1380 }, { "epoch": 1.09, "learning_rate": 4.992994526974199e-05, "loss": 1.2192, "step": 1400 }, { "epoch": 1.11, "learning_rate": 4.992838154808444e-05, "loss": 1.2909, "step": 1420 }, { "epoch": 1.12, "learning_rate": 4.9926817826426896e-05, "loss": 1.2481, "step": 1440 }, { "epoch": 1.14, "learning_rate": 4.992525410476935e-05, "loss": 1.2766, "step": 1460 }, { "epoch": 1.16, "learning_rate": 4.9923690383111806e-05, "loss": 1.2956, "step": 1480 }, { "epoch": 1.17, "learning_rate": 4.992212666145427e-05, "loss": 1.2238, "step": 1500 }, { "epoch": 1.19, "learning_rate": 4.9920562939796716e-05, "loss": 1.2528, "step": 1520 }, { "epoch": 1.2, "learning_rate": 4.991899921813917e-05, "loss": 1.2687, "step": 1540 }, { "epoch": 1.22, "learning_rate": 4.9917435496481626e-05, "loss": 1.2511, "step": 1560 }, { "epoch": 1.23, "learning_rate": 4.991587177482409e-05, "loss": 1.3194, "step": 1580 }, { "epoch": 1.25, "learning_rate": 4.9914308053166536e-05, "loss": 1.2336, "step": 1600 }, { "epoch": 1.27, "learning_rate": 4.991274433150899e-05, "loss": 1.2586, "step": 1620 }, { "epoch": 1.28, "learning_rate": 4.9911180609851446e-05, "loss": 1.2796, "step": 1640 }, { "epoch": 1.3, "learning_rate": 4.990961688819391e-05, "loss": 1.2528, "step": 1660 }, { "epoch": 1.31, "learning_rate": 4.990805316653636e-05, "loss": 1.2877, "step": 1680 }, { "epoch": 1.33, "learning_rate": 4.990648944487881e-05, "loss": 1.2321, "step": 1700 }, { "epoch": 1.34, "learning_rate": 4.9904925723221266e-05, "loss": 1.2896, "step": 1720 }, { "epoch": 1.36, "learning_rate": 4.990336200156373e-05, "loss": 1.272, "step": 1740 }, { "epoch": 1.38, "learning_rate": 4.990179827990618e-05, "loss": 1.2468, "step": 1760 }, { "epoch": 1.39, "learning_rate": 4.990023455824863e-05, "loss": 1.3006, "step": 1780 }, { "epoch": 1.41, "learning_rate": 4.9898670836591086e-05, "loss": 1.2059, "step": 1800 }, { "epoch": 1.42, "learning_rate": 4.989710711493355e-05, "loss": 1.2593, "step": 1820 }, { "epoch": 1.44, "learning_rate": 4.9895543393276e-05, "loss": 1.2779, "step": 1840 }, { "epoch": 1.45, "learning_rate": 4.989397967161845e-05, "loss": 1.2444, "step": 1860 }, { "epoch": 1.47, "learning_rate": 4.9892415949960906e-05, "loss": 1.2703, "step": 1880 }, { "epoch": 1.48, "learning_rate": 4.989085222830336e-05, "loss": 1.2044, "step": 1900 }, { "epoch": 1.5, "learning_rate": 4.988928850664582e-05, "loss": 1.2612, "step": 1920 }, { "epoch": 1.52, "learning_rate": 4.988772478498828e-05, "loss": 1.2238, "step": 1940 }, { "epoch": 1.53, "learning_rate": 4.9886161063330726e-05, "loss": 1.2442, "step": 1960 }, { "epoch": 1.55, "learning_rate": 4.988459734167318e-05, "loss": 1.3162, "step": 1980 }, { "epoch": 1.56, "learning_rate": 4.988303362001564e-05, "loss": 1.2067, "step": 2000 }, { "epoch": 1.56, "eval_cer": 0.0812, "eval_loss": 0.1771017163991928, "eval_runtime": 204.9956, "eval_samples_per_second": 18.478, "eval_steps_per_second": 0.581, "eval_wer": 0.387, "step": 2000 }, { "epoch": 1.58, "learning_rate": 4.98814698983581e-05, "loss": 1.2496, "step": 2020 }, { "epoch": 1.59, "learning_rate": 4.9879906176700546e-05, "loss": 1.207, "step": 2040 }, { "epoch": 1.61, "learning_rate": 4.9878342455043e-05, "loss": 1.2513, "step": 2060 }, { "epoch": 1.62, "learning_rate": 4.987677873338546e-05, "loss": 1.2956, "step": 2080 }, { "epoch": 1.64, "learning_rate": 4.987521501172792e-05, "loss": 1.2087, "step": 2100 }, { "epoch": 1.66, "learning_rate": 4.987365129007037e-05, "loss": 1.286, "step": 2120 }, { "epoch": 1.67, "learning_rate": 4.987208756841282e-05, "loss": 1.254, "step": 2140 }, { "epoch": 1.69, "learning_rate": 4.987052384675528e-05, "loss": 1.2085, "step": 2160 }, { "epoch": 1.7, "learning_rate": 4.986896012509774e-05, "loss": 1.3, "step": 2180 }, { "epoch": 1.72, "learning_rate": 4.986739640344019e-05, "loss": 1.211, "step": 2200 }, { "epoch": 1.73, "learning_rate": 4.986583268178264e-05, "loss": 1.3375, "step": 2220 }, { "epoch": 1.75, "learning_rate": 4.98642689601251e-05, "loss": 1.305, "step": 2240 }, { "epoch": 1.77, "learning_rate": 4.986270523846756e-05, "loss": 1.2224, "step": 2260 }, { "epoch": 1.78, "learning_rate": 4.986114151681001e-05, "loss": 1.3084, "step": 2280 }, { "epoch": 1.8, "learning_rate": 4.985957779515247e-05, "loss": 1.2488, "step": 2300 }, { "epoch": 1.81, "learning_rate": 4.9858014073494915e-05, "loss": 1.2654, "step": 2320 }, { "epoch": 1.83, "learning_rate": 4.985645035183738e-05, "loss": 1.2396, "step": 2340 }, { "epoch": 1.84, "learning_rate": 4.985488663017983e-05, "loss": 1.2673, "step": 2360 }, { "epoch": 1.86, "learning_rate": 4.985340109460516e-05, "loss": 1.3211, "step": 2380 }, { "epoch": 1.88, "learning_rate": 4.985183737294762e-05, "loss": 1.2117, "step": 2400 }, { "epoch": 1.89, "learning_rate": 4.9850273651290076e-05, "loss": 1.2614, "step": 2420 }, { "epoch": 1.91, "learning_rate": 4.9848709929632524e-05, "loss": 1.2526, "step": 2440 }, { "epoch": 1.92, "learning_rate": 4.984714620797498e-05, "loss": 1.2746, "step": 2460 }, { "epoch": 1.94, "learning_rate": 4.984558248631744e-05, "loss": 1.2889, "step": 2480 }, { "epoch": 1.95, "learning_rate": 4.9844018764659896e-05, "loss": 1.1897, "step": 2500 }, { "epoch": 1.97, "learning_rate": 4.984245504300235e-05, "loss": 1.2919, "step": 2520 }, { "epoch": 1.98, "learning_rate": 4.98408913213448e-05, "loss": 1.287, "step": 2540 }, { "epoch": 2.0, "learning_rate": 4.983932759968726e-05, "loss": 1.3291, "step": 2560 }, { "epoch": 2.02, "learning_rate": 4.9837763878029716e-05, "loss": 1.2409, "step": 2580 }, { "epoch": 2.03, "learning_rate": 4.983620015637217e-05, "loss": 1.2328, "step": 2600 }, { "epoch": 2.05, "learning_rate": 4.983463643471462e-05, "loss": 1.2733, "step": 2620 }, { "epoch": 2.06, "learning_rate": 4.9833072713057074e-05, "loss": 1.2412, "step": 2640 }, { "epoch": 2.08, "learning_rate": 4.9831508991399536e-05, "loss": 1.2744, "step": 2660 }, { "epoch": 2.09, "learning_rate": 4.982994526974199e-05, "loss": 1.2137, "step": 2680 }, { "epoch": 2.11, "learning_rate": 4.982838154808444e-05, "loss": 1.2255, "step": 2700 }, { "epoch": 2.12, "learning_rate": 4.9826817826426894e-05, "loss": 1.2593, "step": 2720 }, { "epoch": 2.14, "learning_rate": 4.9825254104769356e-05, "loss": 1.2192, "step": 2740 }, { "epoch": 2.16, "learning_rate": 4.982369038311181e-05, "loss": 1.2736, "step": 2760 }, { "epoch": 2.17, "learning_rate": 4.9822126661454266e-05, "loss": 1.1969, "step": 2780 }, { "epoch": 2.19, "learning_rate": 4.9820562939796714e-05, "loss": 1.2642, "step": 2800 }, { "epoch": 2.2, "learning_rate": 4.9818999218139176e-05, "loss": 1.2489, "step": 2820 }, { "epoch": 2.22, "learning_rate": 4.981743549648163e-05, "loss": 1.2073, "step": 2840 }, { "epoch": 2.23, "learning_rate": 4.9815871774824086e-05, "loss": 1.2976, "step": 2860 }, { "epoch": 2.25, "learning_rate": 4.9814308053166534e-05, "loss": 1.2086, "step": 2880 }, { "epoch": 2.27, "learning_rate": 4.9812744331508996e-05, "loss": 1.3276, "step": 2900 }, { "epoch": 2.28, "learning_rate": 4.981118060985145e-05, "loss": 1.2663, "step": 2920 }, { "epoch": 2.3, "learning_rate": 4.9809616888193906e-05, "loss": 1.2333, "step": 2940 }, { "epoch": 2.31, "learning_rate": 4.980805316653636e-05, "loss": 1.2822, "step": 2960 }, { "epoch": 2.33, "learning_rate": 4.9806489444878815e-05, "loss": 1.2047, "step": 2980 }, { "epoch": 2.34, "learning_rate": 4.980492572322127e-05, "loss": 1.2678, "step": 3000 }, { "epoch": 2.34, "eval_cer": 0.0857, "eval_loss": 0.1775198131799698, "eval_runtime": 205.8124, "eval_samples_per_second": 18.405, "eval_steps_per_second": 0.578, "eval_wer": 0.4054, "step": 3000 }, { "epoch": 2.36, "learning_rate": 4.9803362001563725e-05, "loss": 1.238, "step": 3020 }, { "epoch": 2.38, "learning_rate": 4.980179827990618e-05, "loss": 1.2223, "step": 3040 }, { "epoch": 2.39, "learning_rate": 4.980023455824863e-05, "loss": 1.2509, "step": 3060 }, { "epoch": 2.41, "learning_rate": 4.979867083659109e-05, "loss": 1.1967, "step": 3080 }, { "epoch": 2.42, "learning_rate": 4.9797107114933545e-05, "loss": 1.2329, "step": 3100 }, { "epoch": 2.44, "learning_rate": 4.9795543393276e-05, "loss": 1.2557, "step": 3120 }, { "epoch": 2.45, "learning_rate": 4.9793979671618455e-05, "loss": 1.2301, "step": 3140 }, { "epoch": 2.47, "learning_rate": 4.979241594996091e-05, "loss": 1.3269, "step": 3160 }, { "epoch": 2.48, "learning_rate": 4.9790852228303365e-05, "loss": 1.2115, "step": 3180 }, { "epoch": 2.5, "learning_rate": 4.978928850664582e-05, "loss": 1.2187, "step": 3200 }, { "epoch": 2.52, "learning_rate": 4.9787724784988275e-05, "loss": 1.2468, "step": 3220 }, { "epoch": 2.53, "learning_rate": 4.978616106333073e-05, "loss": 1.2157, "step": 3240 }, { "epoch": 2.55, "learning_rate": 4.9784597341673185e-05, "loss": 1.2824, "step": 3260 }, { "epoch": 2.56, "learning_rate": 4.978303362001564e-05, "loss": 1.2243, "step": 3280 }, { "epoch": 2.58, "learning_rate": 4.9781469898358095e-05, "loss": 1.2637, "step": 3300 }, { "epoch": 2.59, "learning_rate": 4.977990617670055e-05, "loss": 1.2281, "step": 3320 }, { "epoch": 2.61, "learning_rate": 4.9778342455043005e-05, "loss": 1.2227, "step": 3340 }, { "epoch": 2.62, "learning_rate": 4.977677873338546e-05, "loss": 1.3163, "step": 3360 }, { "epoch": 2.64, "learning_rate": 4.9775215011727915e-05, "loss": 1.2271, "step": 3380 }, { "epoch": 2.66, "learning_rate": 4.977365129007037e-05, "loss": 1.2802, "step": 3400 }, { "epoch": 2.67, "learning_rate": 4.9772087568412825e-05, "loss": 1.2588, "step": 3420 }, { "epoch": 2.69, "learning_rate": 4.977052384675528e-05, "loss": 1.2276, "step": 3440 }, { "epoch": 2.7, "learning_rate": 4.9768960125097735e-05, "loss": 1.3012, "step": 3460 }, { "epoch": 2.72, "learning_rate": 4.976739640344019e-05, "loss": 1.2268, "step": 3480 }, { "epoch": 2.73, "learning_rate": 4.9765832681782645e-05, "loss": 1.2364, "step": 3500 }, { "epoch": 2.75, "learning_rate": 4.97642689601251e-05, "loss": 1.2548, "step": 3520 }, { "epoch": 2.77, "learning_rate": 4.9762705238467555e-05, "loss": 1.2396, "step": 3540 }, { "epoch": 2.78, "learning_rate": 4.976114151681001e-05, "loss": 1.2735, "step": 3560 }, { "epoch": 2.8, "learning_rate": 4.9759577795152465e-05, "loss": 1.1825, "step": 3580 }, { "epoch": 2.81, "learning_rate": 4.975801407349492e-05, "loss": 1.2765, "step": 3600 }, { "epoch": 2.83, "learning_rate": 4.9756450351837375e-05, "loss": 1.271, "step": 3620 }, { "epoch": 2.84, "learning_rate": 4.975488663017983e-05, "loss": 1.2182, "step": 3640 }, { "epoch": 2.86, "learning_rate": 4.9753322908522285e-05, "loss": 1.2692, "step": 3660 }, { "epoch": 2.88, "learning_rate": 4.975175918686474e-05, "loss": 1.2052, "step": 3680 }, { "epoch": 2.89, "learning_rate": 4.9750195465207195e-05, "loss": 1.2371, "step": 3700 }, { "epoch": 2.91, "learning_rate": 4.974863174354965e-05, "loss": 1.2511, "step": 3720 }, { "epoch": 2.92, "learning_rate": 4.9747068021892104e-05, "loss": 1.2198, "step": 3740 }, { "epoch": 2.94, "learning_rate": 4.9745504300234566e-05, "loss": 1.3216, "step": 3760 }, { "epoch": 2.95, "learning_rate": 4.9743940578577014e-05, "loss": 1.1973, "step": 3780 }, { "epoch": 2.97, "learning_rate": 4.974237685691947e-05, "loss": 1.2838, "step": 3800 }, { "epoch": 2.98, "learning_rate": 4.9740813135261924e-05, "loss": 1.2279, "step": 3820 }, { "epoch": 3.0, "learning_rate": 4.9739249413604386e-05, "loss": 1.2567, "step": 3840 }, { "epoch": 3.02, "learning_rate": 4.9737685691946834e-05, "loss": 1.2005, "step": 3860 }, { "epoch": 3.03, "learning_rate": 4.973612197028929e-05, "loss": 1.2558, "step": 3880 }, { "epoch": 3.05, "learning_rate": 4.9734558248631744e-05, "loss": 1.2342, "step": 3900 }, { "epoch": 3.06, "learning_rate": 4.97329945269742e-05, "loss": 1.2282, "step": 3920 }, { "epoch": 3.08, "learning_rate": 4.9731430805316654e-05, "loss": 1.2982, "step": 3940 }, { "epoch": 3.09, "learning_rate": 4.972986708365911e-05, "loss": 1.1869, "step": 3960 }, { "epoch": 3.11, "learning_rate": 4.9728303362001564e-05, "loss": 1.2467, "step": 3980 }, { "epoch": 3.12, "learning_rate": 4.972673964034402e-05, "loss": 1.1948, "step": 4000 }, { "epoch": 3.12, "eval_cer": 0.0818, "eval_loss": 0.1827949732542038, "eval_runtime": 203.6961, "eval_samples_per_second": 18.596, "eval_steps_per_second": 0.584, "eval_wer": 0.39, "step": 4000 }, { "epoch": 3.14, "learning_rate": 4.972517591868648e-05, "loss": 1.2302, "step": 4020 }, { "epoch": 3.16, "learning_rate": 4.972361219702893e-05, "loss": 1.2305, "step": 4040 }, { "epoch": 3.17, "learning_rate": 4.9722048475371384e-05, "loss": 1.1915, "step": 4060 }, { "epoch": 3.19, "learning_rate": 4.972048475371384e-05, "loss": 1.2451, "step": 4080 }, { "epoch": 3.2, "learning_rate": 4.97189210320563e-05, "loss": 1.272, "step": 4100 }, { "epoch": 3.22, "learning_rate": 4.971735731039875e-05, "loss": 1.2177, "step": 4120 }, { "epoch": 3.23, "learning_rate": 4.9715793588741204e-05, "loss": 1.2703, "step": 4140 }, { "epoch": 3.25, "learning_rate": 4.971422986708366e-05, "loss": 1.2107, "step": 4160 }, { "epoch": 3.27, "learning_rate": 4.971266614542612e-05, "loss": 1.2415, "step": 4180 }, { "epoch": 3.28, "learning_rate": 4.9711102423768576e-05, "loss": 1.2583, "step": 4200 }, { "epoch": 3.3, "learning_rate": 4.9709538702111024e-05, "loss": 1.239, "step": 4220 }, { "epoch": 3.31, "learning_rate": 4.970797498045348e-05, "loss": 1.28, "step": 4240 }, { "epoch": 3.33, "learning_rate": 4.970641125879594e-05, "loss": 1.1845, "step": 4260 }, { "epoch": 3.34, "learning_rate": 4.9704847537138396e-05, "loss": 1.2771, "step": 4280 }, { "epoch": 3.36, "learning_rate": 4.9703283815480844e-05, "loss": 1.2498, "step": 4300 }, { "epoch": 3.38, "learning_rate": 4.97017200938233e-05, "loss": 1.2496, "step": 4320 }, { "epoch": 3.39, "learning_rate": 4.9700156372165754e-05, "loss": 1.266, "step": 4340 }, { "epoch": 3.41, "learning_rate": 4.9698592650508215e-05, "loss": 1.2179, "step": 4360 }, { "epoch": 3.42, "learning_rate": 4.969702892885067e-05, "loss": 1.2424, "step": 4380 }, { "epoch": 3.44, "learning_rate": 4.969546520719312e-05, "loss": 1.2421, "step": 4400 }, { "epoch": 3.45, "learning_rate": 4.9693901485535574e-05, "loss": 1.2112, "step": 4420 }, { "epoch": 3.47, "learning_rate": 4.9692337763878035e-05, "loss": 1.2812, "step": 4440 }, { "epoch": 3.48, "learning_rate": 4.969077404222049e-05, "loss": 1.1999, "step": 4460 }, { "epoch": 3.5, "learning_rate": 4.968921032056294e-05, "loss": 1.2714, "step": 4480 }, { "epoch": 3.52, "learning_rate": 4.9687646598905393e-05, "loss": 1.2659, "step": 4500 }, { "epoch": 3.53, "learning_rate": 4.9686082877247855e-05, "loss": 1.234, "step": 4520 }, { "epoch": 3.55, "learning_rate": 4.968451915559031e-05, "loss": 1.3003, "step": 4540 }, { "epoch": 3.56, "learning_rate": 4.968295543393276e-05, "loss": 1.1792, "step": 4560 }, { "epoch": 3.58, "learning_rate": 4.968139171227521e-05, "loss": 1.2378, "step": 4580 }, { "epoch": 3.59, "learning_rate": 4.9679827990617675e-05, "loss": 1.1859, "step": 4600 }, { "epoch": 3.61, "learning_rate": 4.967826426896013e-05, "loss": 1.2221, "step": 4620 }, { "epoch": 3.62, "learning_rate": 4.9676700547302585e-05, "loss": 1.3189, "step": 4640 }, { "epoch": 3.64, "learning_rate": 4.967513682564503e-05, "loss": 1.2093, "step": 4660 }, { "epoch": 3.66, "learning_rate": 4.9673573103987495e-05, "loss": 1.2444, "step": 4680 }, { "epoch": 3.67, "learning_rate": 4.967200938232995e-05, "loss": 1.2443, "step": 4700 }, { "epoch": 3.69, "learning_rate": 4.9670445660672405e-05, "loss": 1.2201, "step": 4720 }, { "epoch": 3.7, "learning_rate": 4.966888193901485e-05, "loss": 1.2984, "step": 4740 }, { "epoch": 3.72, "learning_rate": 4.9667318217357315e-05, "loss": 1.1541, "step": 4760 }, { "epoch": 3.73, "learning_rate": 4.966575449569977e-05, "loss": 1.2569, "step": 4780 }, { "epoch": 3.75, "learning_rate": 4.9664190774042225e-05, "loss": 1.2343, "step": 4800 }, { "epoch": 3.77, "learning_rate": 4.966262705238468e-05, "loss": 1.2383, "step": 4820 }, { "epoch": 3.78, "learning_rate": 4.966106333072713e-05, "loss": 1.2854, "step": 4840 }, { "epoch": 3.8, "learning_rate": 4.965949960906959e-05, "loss": 1.2075, "step": 4860 }, { "epoch": 3.81, "learning_rate": 4.9657935887412045e-05, "loss": 1.2634, "step": 4880 }, { "epoch": 3.83, "learning_rate": 4.96563721657545e-05, "loss": 1.2514, "step": 4900 }, { "epoch": 3.84, "learning_rate": 4.965480844409695e-05, "loss": 1.2496, "step": 4920 }, { "epoch": 3.86, "learning_rate": 4.965324472243941e-05, "loss": 1.2448, "step": 4940 }, { "epoch": 3.88, "learning_rate": 4.9651681000781865e-05, "loss": 1.2003, "step": 4960 }, { "epoch": 3.89, "learning_rate": 4.965011727912432e-05, "loss": 1.2258, "step": 4980 }, { "epoch": 3.91, "learning_rate": 4.9648553557466775e-05, "loss": 1.2391, "step": 5000 }, { "epoch": 3.91, "eval_cer": 0.0813, "eval_loss": 0.18853867053985596, "eval_runtime": 232.3133, "eval_samples_per_second": 16.306, "eval_steps_per_second": 0.512, "eval_wer": 0.3882, "step": 5000 }, { "epoch": 3.92, "learning_rate": 4.964698983580923e-05, "loss": 1.1997, "step": 5020 }, { "epoch": 3.94, "learning_rate": 4.9645504300234564e-05, "loss": 1.2773, "step": 5040 }, { "epoch": 3.95, "learning_rate": 4.964394057857701e-05, "loss": 1.1888, "step": 5060 }, { "epoch": 3.97, "learning_rate": 4.964237685691947e-05, "loss": 1.2591, "step": 5080 }, { "epoch": 3.98, "learning_rate": 4.964081313526193e-05, "loss": 1.251, "step": 5100 }, { "epoch": 4.0, "learning_rate": 4.9639249413604384e-05, "loss": 1.2784, "step": 5120 }, { "epoch": 4.02, "learning_rate": 4.963768569194683e-05, "loss": 1.2064, "step": 5140 }, { "epoch": 4.03, "learning_rate": 4.963612197028929e-05, "loss": 1.2284, "step": 5160 }, { "epoch": 4.05, "learning_rate": 4.963455824863175e-05, "loss": 1.2262, "step": 5180 }, { "epoch": 4.06, "learning_rate": 4.9632994526974204e-05, "loss": 1.2599, "step": 5200 }, { "epoch": 4.08, "learning_rate": 4.963143080531666e-05, "loss": 1.2459, "step": 5220 }, { "epoch": 4.09, "learning_rate": 4.962986708365911e-05, "loss": 1.1851, "step": 5240 }, { "epoch": 4.11, "learning_rate": 4.962830336200157e-05, "loss": 1.2696, "step": 5260 }, { "epoch": 4.12, "learning_rate": 4.9626739640344023e-05, "loss": 1.2703, "step": 5280 }, { "epoch": 4.14, "learning_rate": 4.962517591868648e-05, "loss": 1.2191, "step": 5300 }, { "epoch": 4.16, "learning_rate": 4.962361219702893e-05, "loss": 1.2728, "step": 5320 }, { "epoch": 4.17, "learning_rate": 4.962204847537139e-05, "loss": 1.2002, "step": 5340 }, { "epoch": 4.19, "learning_rate": 4.962048475371384e-05, "loss": 1.2316, "step": 5360 }, { "epoch": 4.2, "learning_rate": 4.96189210320563e-05, "loss": 1.22, "step": 5380 }, { "epoch": 4.22, "learning_rate": 4.9617357310398747e-05, "loss": 1.2319, "step": 5400 }, { "epoch": 4.23, "learning_rate": 4.961579358874121e-05, "loss": 1.2072, "step": 5420 }, { "epoch": 4.25, "learning_rate": 4.961422986708366e-05, "loss": 1.2148, "step": 5440 }, { "epoch": 4.27, "learning_rate": 4.961266614542612e-05, "loss": 1.2211, "step": 5460 }, { "epoch": 4.28, "learning_rate": 4.961110242376857e-05, "loss": 1.1976, "step": 5480 }, { "epoch": 4.3, "learning_rate": 4.960953870211102e-05, "loss": 1.2191, "step": 5500 }, { "epoch": 4.31, "learning_rate": 4.960797498045348e-05, "loss": 1.1971, "step": 5520 }, { "epoch": 4.33, "learning_rate": 4.960641125879594e-05, "loss": 1.1755, "step": 5540 }, { "epoch": 4.34, "learning_rate": 4.960484753713839e-05, "loss": 1.2363, "step": 5560 }, { "epoch": 4.36, "learning_rate": 4.960328381548084e-05, "loss": 1.1963, "step": 5580 }, { "epoch": 4.38, "learning_rate": 4.96017200938233e-05, "loss": 1.1846, "step": 5600 }, { "epoch": 4.39, "learning_rate": 4.960015637216576e-05, "loss": 1.2689, "step": 5620 }, { "epoch": 4.41, "learning_rate": 4.959859265050821e-05, "loss": 1.1421, "step": 5640 }, { "epoch": 4.42, "learning_rate": 4.959702892885067e-05, "loss": 1.2535, "step": 5660 }, { "epoch": 4.44, "learning_rate": 4.959546520719312e-05, "loss": 1.2417, "step": 5680 }, { "epoch": 4.45, "learning_rate": 4.959390148553558e-05, "loss": 1.2004, "step": 5700 }, { "epoch": 4.47, "learning_rate": 4.959233776387803e-05, "loss": 1.1777, "step": 5720 }, { "epoch": 4.48, "learning_rate": 4.959077404222049e-05, "loss": 1.1552, "step": 5740 }, { "epoch": 4.5, "learning_rate": 4.958921032056294e-05, "loss": 1.2118, "step": 5760 }, { "epoch": 4.52, "learning_rate": 4.95876465989054e-05, "loss": 1.236, "step": 5780 }, { "epoch": 4.53, "learning_rate": 4.958608287724785e-05, "loss": 1.2112, "step": 5800 }, { "epoch": 4.55, "learning_rate": 4.958451915559031e-05, "loss": 1.2351, "step": 5820 }, { "epoch": 4.56, "learning_rate": 4.958295543393276e-05, "loss": 1.1556, "step": 5840 }, { "epoch": 4.58, "learning_rate": 4.958139171227522e-05, "loss": 1.2655, "step": 5860 }, { "epoch": 4.59, "learning_rate": 4.957982799061767e-05, "loss": 1.2375, "step": 5880 }, { "epoch": 4.61, "learning_rate": 4.957826426896013e-05, "loss": 1.2298, "step": 5900 }, { "epoch": 4.62, "learning_rate": 4.957670054730258e-05, "loss": 1.2429, "step": 5920 }, { "epoch": 4.64, "learning_rate": 4.957513682564504e-05, "loss": 1.1583, "step": 5940 }, { "epoch": 4.66, "learning_rate": 4.957357310398749e-05, "loss": 1.2323, "step": 5960 }, { "epoch": 4.67, "learning_rate": 4.957200938232995e-05, "loss": 1.2378, "step": 5980 }, { "epoch": 4.69, "learning_rate": 4.95704456606724e-05, "loss": 1.1844, "step": 6000 }, { "epoch": 4.69, "eval_cer": 0.0775, "eval_loss": 0.182363361120224, "eval_runtime": 217.3693, "eval_samples_per_second": 17.427, "eval_steps_per_second": 0.547, "eval_wer": 0.3739, "step": 6000 }, { "epoch": 4.7, "learning_rate": 4.956888193901486e-05, "loss": 1.2492, "step": 6020 }, { "epoch": 4.72, "learning_rate": 4.956731821735731e-05, "loss": 1.1634, "step": 6040 }, { "epoch": 4.73, "learning_rate": 4.956575449569977e-05, "loss": 1.2397, "step": 6060 }, { "epoch": 4.75, "learning_rate": 4.956419077404222e-05, "loss": 1.2019, "step": 6080 }, { "epoch": 4.77, "learning_rate": 4.956262705238468e-05, "loss": 1.2111, "step": 6100 }, { "epoch": 4.78, "learning_rate": 4.956106333072713e-05, "loss": 1.2573, "step": 6120 }, { "epoch": 4.8, "learning_rate": 4.955949960906959e-05, "loss": 1.191, "step": 6140 }, { "epoch": 4.81, "learning_rate": 4.955793588741204e-05, "loss": 1.2297, "step": 6160 }, { "epoch": 4.83, "learning_rate": 4.95563721657545e-05, "loss": 1.2067, "step": 6180 }, { "epoch": 4.84, "learning_rate": 4.955480844409695e-05, "loss": 1.1944, "step": 6200 }, { "epoch": 4.86, "learning_rate": 4.955324472243941e-05, "loss": 1.2391, "step": 6220 }, { "epoch": 4.88, "learning_rate": 4.955168100078186e-05, "loss": 1.1761, "step": 6240 }, { "epoch": 4.89, "learning_rate": 4.955011727912432e-05, "loss": 1.2434, "step": 6260 }, { "epoch": 4.91, "learning_rate": 4.954855355746678e-05, "loss": 1.2346, "step": 6280 }, { "epoch": 4.92, "learning_rate": 4.954698983580923e-05, "loss": 1.2137, "step": 6300 }, { "epoch": 4.94, "learning_rate": 4.954542611415168e-05, "loss": 1.2652, "step": 6320 }, { "epoch": 4.95, "learning_rate": 4.954386239249414e-05, "loss": 1.1937, "step": 6340 }, { "epoch": 4.97, "learning_rate": 4.95422986708366e-05, "loss": 1.225, "step": 6360 }, { "epoch": 4.98, "learning_rate": 4.954073494917905e-05, "loss": 1.2629, "step": 6380 }, { "epoch": 5.0, "learning_rate": 4.95391712275215e-05, "loss": 1.256, "step": 6400 }, { "epoch": 5.02, "learning_rate": 4.953760750586396e-05, "loss": 1.1885, "step": 6420 }, { "epoch": 5.03, "learning_rate": 4.953604378420641e-05, "loss": 1.2654, "step": 6440 }, { "epoch": 5.05, "learning_rate": 4.9534480062548874e-05, "loss": 1.178, "step": 6460 }, { "epoch": 5.06, "learning_rate": 4.953291634089132e-05, "loss": 1.185, "step": 6480 }, { "epoch": 5.08, "learning_rate": 4.953135261923378e-05, "loss": 1.2438, "step": 6500 }, { "epoch": 5.09, "learning_rate": 4.952978889757623e-05, "loss": 1.1841, "step": 6520 }, { "epoch": 5.11, "learning_rate": 4.9528225175918694e-05, "loss": 1.2014, "step": 6540 }, { "epoch": 5.12, "learning_rate": 4.952666145426114e-05, "loss": 1.2134, "step": 6560 }, { "epoch": 5.14, "learning_rate": 4.95250977326036e-05, "loss": 1.2219, "step": 6580 }, { "epoch": 5.16, "learning_rate": 4.952353401094605e-05, "loss": 1.2398, "step": 6600 }, { "epoch": 5.17, "learning_rate": 4.9521970289288513e-05, "loss": 1.1636, "step": 6620 }, { "epoch": 5.19, "learning_rate": 4.952040656763096e-05, "loss": 1.1736, "step": 6640 }, { "epoch": 5.2, "learning_rate": 4.951884284597342e-05, "loss": 1.237, "step": 6660 }, { "epoch": 5.22, "learning_rate": 4.951727912431587e-05, "loss": 1.2309, "step": 6680 }, { "epoch": 5.23, "learning_rate": 4.951571540265833e-05, "loss": 1.241, "step": 6700 }, { "epoch": 5.25, "learning_rate": 4.951415168100079e-05, "loss": 1.1852, "step": 6720 }, { "epoch": 5.27, "learning_rate": 4.9512587959343237e-05, "loss": 1.2101, "step": 6740 }, { "epoch": 5.28, "learning_rate": 4.951102423768569e-05, "loss": 1.1873, "step": 6760 }, { "epoch": 5.3, "learning_rate": 4.950946051602815e-05, "loss": 1.1672, "step": 6780 }, { "epoch": 5.31, "learning_rate": 4.950789679437061e-05, "loss": 1.27, "step": 6800 }, { "epoch": 5.33, "learning_rate": 4.9506333072713056e-05, "loss": 1.1752, "step": 6820 }, { "epoch": 5.34, "learning_rate": 4.950476935105551e-05, "loss": 1.206, "step": 6840 }, { "epoch": 5.36, "learning_rate": 4.9503205629397966e-05, "loss": 1.228, "step": 6860 }, { "epoch": 5.38, "learning_rate": 4.950164190774043e-05, "loss": 1.234, "step": 6880 }, { "epoch": 5.39, "learning_rate": 4.950007818608288e-05, "loss": 1.2421, "step": 6900 }, { "epoch": 5.41, "learning_rate": 4.949851446442533e-05, "loss": 1.1855, "step": 6920 }, { "epoch": 5.42, "learning_rate": 4.9496950742767786e-05, "loss": 1.26, "step": 6940 }, { "epoch": 5.44, "learning_rate": 4.949538702111025e-05, "loss": 1.2573, "step": 6960 }, { "epoch": 5.45, "learning_rate": 4.94938232994527e-05, "loss": 1.2045, "step": 6980 }, { "epoch": 5.47, "learning_rate": 4.949225957779515e-05, "loss": 1.2104, "step": 7000 }, { "epoch": 5.47, "eval_cer": 0.0788, "eval_loss": 0.1948978453874588, "eval_runtime": 216.8449, "eval_samples_per_second": 17.469, "eval_steps_per_second": 0.549, "eval_wer": 0.3859, "step": 7000 }, { "epoch": 5.48, "learning_rate": 4.9490695856137606e-05, "loss": 1.1683, "step": 7020 }, { "epoch": 5.5, "learning_rate": 4.948913213448007e-05, "loss": 1.2448, "step": 7040 }, { "epoch": 5.52, "learning_rate": 4.9487646598905395e-05, "loss": 1.2103, "step": 7060 }, { "epoch": 5.53, "learning_rate": 4.948616106333073e-05, "loss": 1.2073, "step": 7080 }, { "epoch": 5.55, "learning_rate": 4.9484597341673185e-05, "loss": 1.2467, "step": 7100 }, { "epoch": 5.56, "learning_rate": 4.948303362001564e-05, "loss": 1.171, "step": 7120 }, { "epoch": 5.58, "learning_rate": 4.9481469898358095e-05, "loss": 1.2299, "step": 7140 }, { "epoch": 5.59, "learning_rate": 4.947990617670055e-05, "loss": 1.235, "step": 7160 }, { "epoch": 5.61, "learning_rate": 4.9478342455043004e-05, "loss": 1.2087, "step": 7180 }, { "epoch": 5.62, "learning_rate": 4.947677873338546e-05, "loss": 1.257, "step": 7200 }, { "epoch": 5.64, "learning_rate": 4.9475215011727914e-05, "loss": 1.154, "step": 7220 }, { "epoch": 5.66, "learning_rate": 4.947365129007037e-05, "loss": 1.2187, "step": 7240 }, { "epoch": 5.67, "learning_rate": 4.9472087568412824e-05, "loss": 1.16, "step": 7260 }, { "epoch": 5.69, "learning_rate": 4.947052384675528e-05, "loss": 1.1965, "step": 7280 }, { "epoch": 5.7, "learning_rate": 4.9468960125097734e-05, "loss": 1.2916, "step": 7300 }, { "epoch": 5.72, "learning_rate": 4.946739640344019e-05, "loss": 1.1897, "step": 7320 }, { "epoch": 5.73, "learning_rate": 4.9465832681782644e-05, "loss": 1.2386, "step": 7340 }, { "epoch": 5.75, "learning_rate": 4.94642689601251e-05, "loss": 1.2106, "step": 7360 }, { "epoch": 5.77, "learning_rate": 4.9462705238467554e-05, "loss": 1.2148, "step": 7380 }, { "epoch": 5.78, "learning_rate": 4.946114151681001e-05, "loss": 1.2698, "step": 7400 }, { "epoch": 5.8, "learning_rate": 4.9459577795152464e-05, "loss": 1.1778, "step": 7420 }, { "epoch": 5.81, "learning_rate": 4.945801407349492e-05, "loss": 1.2407, "step": 7440 }, { "epoch": 5.83, "learning_rate": 4.9456450351837374e-05, "loss": 1.218, "step": 7460 }, { "epoch": 5.84, "learning_rate": 4.945488663017983e-05, "loss": 1.1853, "step": 7480 }, { "epoch": 5.86, "learning_rate": 4.9453322908522284e-05, "loss": 1.231, "step": 7500 }, { "epoch": 5.88, "learning_rate": 4.945175918686474e-05, "loss": 1.1855, "step": 7520 }, { "epoch": 5.89, "learning_rate": 4.9450195465207194e-05, "loss": 1.2287, "step": 7540 }, { "epoch": 5.91, "learning_rate": 4.944863174354965e-05, "loss": 1.2002, "step": 7560 }, { "epoch": 5.92, "learning_rate": 4.9447068021892104e-05, "loss": 1.2184, "step": 7580 }, { "epoch": 5.94, "learning_rate": 4.9445504300234566e-05, "loss": 1.2369, "step": 7600 }, { "epoch": 5.95, "learning_rate": 4.9443940578577014e-05, "loss": 1.1743, "step": 7620 }, { "epoch": 5.97, "learning_rate": 4.944237685691947e-05, "loss": 1.2273, "step": 7640 }, { "epoch": 5.98, "learning_rate": 4.9440813135261924e-05, "loss": 1.2251, "step": 7660 }, { "epoch": 6.0, "learning_rate": 4.9439249413604386e-05, "loss": 1.2241, "step": 7680 }, { "epoch": 6.02, "learning_rate": 4.9437685691946834e-05, "loss": 1.165, "step": 7700 }, { "epoch": 6.03, "learning_rate": 4.943612197028929e-05, "loss": 1.2257, "step": 7720 }, { "epoch": 6.05, "learning_rate": 4.9434558248631744e-05, "loss": 1.2073, "step": 7740 }, { "epoch": 6.06, "learning_rate": 4.9432994526974205e-05, "loss": 1.2371, "step": 7760 }, { "epoch": 6.08, "learning_rate": 4.943143080531666e-05, "loss": 1.2584, "step": 7780 }, { "epoch": 6.09, "learning_rate": 4.942986708365911e-05, "loss": 1.1683, "step": 7800 }, { "epoch": 6.11, "learning_rate": 4.9428303362001564e-05, "loss": 1.2194, "step": 7820 }, { "epoch": 6.12, "learning_rate": 4.942673964034402e-05, "loss": 1.2369, "step": 7840 }, { "epoch": 6.14, "learning_rate": 4.942517591868648e-05, "loss": 1.2147, "step": 7860 }, { "epoch": 6.16, "learning_rate": 4.942361219702893e-05, "loss": 1.2766, "step": 7880 }, { "epoch": 6.17, "learning_rate": 4.9422048475371384e-05, "loss": 1.1701, "step": 7900 }, { "epoch": 6.19, "learning_rate": 4.942048475371384e-05, "loss": 1.2333, "step": 7920 }, { "epoch": 6.2, "learning_rate": 4.94189210320563e-05, "loss": 1.1741, "step": 7940 }, { "epoch": 6.22, "learning_rate": 4.9417357310398755e-05, "loss": 1.2315, "step": 7960 }, { "epoch": 6.23, "learning_rate": 4.9415793588741203e-05, "loss": 1.2349, "step": 7980 }, { "epoch": 6.25, "learning_rate": 4.941422986708366e-05, "loss": 1.1613, "step": 8000 }, { "epoch": 6.25, "eval_cer": 0.0786, "eval_loss": 0.18531309068202972, "eval_runtime": 243.1453, "eval_samples_per_second": 15.579, "eval_steps_per_second": 0.489, "eval_wer": 0.3788, "step": 8000 }, { "epoch": 6.27, "learning_rate": 4.941266614542612e-05, "loss": 1.2077, "step": 8020 }, { "epoch": 6.28, "learning_rate": 4.9411102423768575e-05, "loss": 1.2182, "step": 8040 }, { "epoch": 6.3, "learning_rate": 4.940953870211102e-05, "loss": 1.2086, "step": 8060 }, { "epoch": 6.31, "learning_rate": 4.940797498045348e-05, "loss": 1.2209, "step": 8080 }, { "epoch": 6.33, "learning_rate": 4.940641125879594e-05, "loss": 1.1535, "step": 8100 }, { "epoch": 6.34, "learning_rate": 4.9404847537138395e-05, "loss": 1.2179, "step": 8120 }, { "epoch": 6.36, "learning_rate": 4.940328381548084e-05, "loss": 1.1955, "step": 8140 }, { "epoch": 6.38, "learning_rate": 4.94017200938233e-05, "loss": 1.1731, "step": 8160 }, { "epoch": 6.39, "learning_rate": 4.940015637216576e-05, "loss": 1.1931, "step": 8180 }, { "epoch": 6.41, "learning_rate": 4.9398592650508215e-05, "loss": 1.167, "step": 8200 }, { "epoch": 6.42, "learning_rate": 4.939702892885067e-05, "loss": 1.2239, "step": 8220 }, { "epoch": 6.44, "learning_rate": 4.939546520719312e-05, "loss": 1.2248, "step": 8240 }, { "epoch": 6.45, "learning_rate": 4.939390148553557e-05, "loss": 1.1992, "step": 8260 }, { "epoch": 6.47, "learning_rate": 4.9392337763878035e-05, "loss": 1.2442, "step": 8280 }, { "epoch": 6.48, "learning_rate": 4.939077404222049e-05, "loss": 1.1633, "step": 8300 }, { "epoch": 6.5, "learning_rate": 4.938921032056294e-05, "loss": 1.2167, "step": 8320 }, { "epoch": 6.52, "learning_rate": 4.938764659890539e-05, "loss": 1.1829, "step": 8340 }, { "epoch": 6.53, "learning_rate": 4.9386082877247855e-05, "loss": 1.2181, "step": 8360 }, { "epoch": 6.55, "learning_rate": 4.938451915559031e-05, "loss": 1.2706, "step": 8380 }, { "epoch": 6.56, "learning_rate": 4.9382955433932765e-05, "loss": 1.1758, "step": 8400 }, { "epoch": 6.58, "learning_rate": 4.938139171227521e-05, "loss": 1.2098, "step": 8420 }, { "epoch": 6.59, "learning_rate": 4.9379827990617675e-05, "loss": 1.2032, "step": 8440 }, { "epoch": 6.61, "learning_rate": 4.937826426896013e-05, "loss": 1.2275, "step": 8460 }, { "epoch": 6.62, "learning_rate": 4.9376700547302585e-05, "loss": 1.2327, "step": 8480 }, { "epoch": 6.64, "learning_rate": 4.937513682564503e-05, "loss": 1.1662, "step": 8500 }, { "epoch": 6.66, "learning_rate": 4.9373573103987494e-05, "loss": 1.214, "step": 8520 }, { "epoch": 6.67, "learning_rate": 4.937200938232995e-05, "loss": 1.1788, "step": 8540 }, { "epoch": 6.69, "learning_rate": 4.9370445660672404e-05, "loss": 1.19, "step": 8560 }, { "epoch": 6.7, "learning_rate": 4.936888193901486e-05, "loss": 1.2033, "step": 8580 }, { "epoch": 6.72, "learning_rate": 4.9367318217357314e-05, "loss": 1.1832, "step": 8600 }, { "epoch": 6.73, "learning_rate": 4.936575449569977e-05, "loss": 1.1976, "step": 8620 }, { "epoch": 6.75, "learning_rate": 4.9364190774042224e-05, "loss": 1.1575, "step": 8640 }, { "epoch": 6.77, "learning_rate": 4.936262705238468e-05, "loss": 1.1951, "step": 8660 }, { "epoch": 6.78, "learning_rate": 4.936106333072713e-05, "loss": 1.2353, "step": 8680 }, { "epoch": 6.8, "learning_rate": 4.935949960906959e-05, "loss": 1.1899, "step": 8700 }, { "epoch": 6.81, "learning_rate": 4.9357935887412044e-05, "loss": 1.2149, "step": 8720 }, { "epoch": 6.83, "learning_rate": 4.93563721657545e-05, "loss": 1.2089, "step": 8740 }, { "epoch": 6.84, "learning_rate": 4.935480844409695e-05, "loss": 1.1872, "step": 8760 }, { "epoch": 6.86, "learning_rate": 4.935324472243941e-05, "loss": 1.2313, "step": 8780 }, { "epoch": 6.88, "learning_rate": 4.9351681000781864e-05, "loss": 1.1576, "step": 8800 }, { "epoch": 6.89, "learning_rate": 4.935011727912432e-05, "loss": 1.175, "step": 8820 }, { "epoch": 6.91, "learning_rate": 4.9348553557466774e-05, "loss": 1.2048, "step": 8840 }, { "epoch": 6.92, "learning_rate": 4.934698983580923e-05, "loss": 1.1697, "step": 8860 }, { "epoch": 6.94, "learning_rate": 4.9345426114151684e-05, "loss": 1.2244, "step": 8880 }, { "epoch": 6.95, "learning_rate": 4.934386239249414e-05, "loss": 1.1768, "step": 8900 }, { "epoch": 6.97, "learning_rate": 4.9342298670836594e-05, "loss": 1.242, "step": 8920 }, { "epoch": 6.98, "learning_rate": 4.934073494917905e-05, "loss": 1.2084, "step": 8940 }, { "epoch": 7.0, "learning_rate": 4.9339171227521504e-05, "loss": 1.2426, "step": 8960 }, { "epoch": 7.02, "learning_rate": 4.933760750586396e-05, "loss": 1.1756, "step": 8980 }, { "epoch": 7.03, "learning_rate": 4.9336043784206414e-05, "loss": 1.192, "step": 9000 }, { "epoch": 7.03, "eval_cer": 0.0787, "eval_loss": 0.18708373606204987, "eval_runtime": 243.1858, "eval_samples_per_second": 15.577, "eval_steps_per_second": 0.489, "eval_wer": 0.3767, "step": 9000 }, { "epoch": 7.05, "learning_rate": 4.933448006254887e-05, "loss": 1.2209, "step": 9020 }, { "epoch": 7.06, "learning_rate": 4.9332916340891324e-05, "loss": 1.2009, "step": 9040 }, { "epoch": 7.08, "learning_rate": 4.933135261923378e-05, "loss": 1.2355, "step": 9060 }, { "epoch": 7.09, "learning_rate": 4.9329788897576234e-05, "loss": 1.1415, "step": 9080 }, { "epoch": 7.11, "learning_rate": 4.932822517591869e-05, "loss": 1.2035, "step": 9100 }, { "epoch": 7.12, "learning_rate": 4.9326661454261144e-05, "loss": 1.2272, "step": 9120 }, { "epoch": 7.14, "learning_rate": 4.93250977326036e-05, "loss": 1.1643, "step": 9140 }, { "epoch": 7.16, "learning_rate": 4.9323534010946054e-05, "loss": 1.2402, "step": 9160 }, { "epoch": 7.17, "learning_rate": 4.932197028928851e-05, "loss": 1.1933, "step": 9180 }, { "epoch": 7.19, "learning_rate": 4.9320406567630964e-05, "loss": 1.2193, "step": 9200 }, { "epoch": 7.2, "learning_rate": 4.931884284597342e-05, "loss": 1.1871, "step": 9220 }, { "epoch": 7.22, "learning_rate": 4.9317279124315874e-05, "loss": 1.186, "step": 9240 }, { "epoch": 7.23, "learning_rate": 4.931571540265833e-05, "loss": 1.2193, "step": 9260 }, { "epoch": 7.25, "learning_rate": 4.9314151681000783e-05, "loss": 1.1795, "step": 9280 }, { "epoch": 7.27, "learning_rate": 4.931258795934324e-05, "loss": 1.2275, "step": 9300 }, { "epoch": 7.28, "learning_rate": 4.9311024237685693e-05, "loss": 1.1778, "step": 9320 }, { "epoch": 7.3, "learning_rate": 4.930946051602815e-05, "loss": 1.1746, "step": 9340 }, { "epoch": 7.31, "learning_rate": 4.93078967943706e-05, "loss": 1.2312, "step": 9360 }, { "epoch": 7.33, "learning_rate": 4.930633307271306e-05, "loss": 1.1581, "step": 9380 }, { "epoch": 7.34, "learning_rate": 4.930476935105551e-05, "loss": 1.2374, "step": 9400 }, { "epoch": 7.36, "learning_rate": 4.930320562939797e-05, "loss": 1.1868, "step": 9420 }, { "epoch": 7.38, "learning_rate": 4.930164190774042e-05, "loss": 1.208, "step": 9440 }, { "epoch": 7.39, "learning_rate": 4.9300078186082885e-05, "loss": 1.2142, "step": 9460 }, { "epoch": 7.41, "learning_rate": 4.929851446442533e-05, "loss": 1.1677, "step": 9480 }, { "epoch": 7.42, "learning_rate": 4.929695074276779e-05, "loss": 1.2215, "step": 9500 }, { "epoch": 7.44, "learning_rate": 4.929538702111024e-05, "loss": 1.212, "step": 9520 }, { "epoch": 7.45, "learning_rate": 4.9293823299452705e-05, "loss": 1.1614, "step": 9540 }, { "epoch": 7.47, "learning_rate": 4.929225957779515e-05, "loss": 1.2365, "step": 9560 }, { "epoch": 7.48, "learning_rate": 4.929069585613761e-05, "loss": 1.1695, "step": 9580 }, { "epoch": 7.5, "learning_rate": 4.928913213448006e-05, "loss": 1.2207, "step": 9600 }, { "epoch": 7.52, "learning_rate": 4.928756841282252e-05, "loss": 1.1323, "step": 9620 }, { "epoch": 7.53, "learning_rate": 4.928600469116498e-05, "loss": 1.1878, "step": 9640 }, { "epoch": 7.55, "learning_rate": 4.928444096950743e-05, "loss": 1.2146, "step": 9660 }, { "epoch": 7.56, "learning_rate": 4.928287724784988e-05, "loss": 1.1632, "step": 9680 }, { "epoch": 7.58, "learning_rate": 4.928131352619234e-05, "loss": 1.2028, "step": 9700 }, { "epoch": 7.59, "learning_rate": 4.92797498045348e-05, "loss": 1.1682, "step": 9720 }, { "epoch": 7.61, "learning_rate": 4.927818608287725e-05, "loss": 1.2092, "step": 9740 }, { "epoch": 7.62, "learning_rate": 4.92766223612197e-05, "loss": 1.2433, "step": 9760 }, { "epoch": 7.64, "learning_rate": 4.927505863956216e-05, "loss": 1.1546, "step": 9780 }, { "epoch": 7.66, "learning_rate": 4.927349491790462e-05, "loss": 1.2328, "step": 9800 }, { "epoch": 7.67, "learning_rate": 4.9271931196247075e-05, "loss": 1.1795, "step": 9820 }, { "epoch": 7.69, "learning_rate": 4.927036747458952e-05, "loss": 1.1942, "step": 9840 }, { "epoch": 7.7, "learning_rate": 4.926880375293198e-05, "loss": 1.2614, "step": 9860 }, { "epoch": 7.72, "learning_rate": 4.926724003127444e-05, "loss": 1.1619, "step": 9880 }, { "epoch": 7.73, "learning_rate": 4.9265676309616894e-05, "loss": 1.1962, "step": 9900 }, { "epoch": 7.75, "learning_rate": 4.926411258795934e-05, "loss": 1.1822, "step": 9920 }, { "epoch": 7.77, "learning_rate": 4.92625488663018e-05, "loss": 1.2189, "step": 9940 }, { "epoch": 7.78, "learning_rate": 4.926098514464426e-05, "loss": 1.2327, "step": 9960 }, { "epoch": 7.8, "learning_rate": 4.9259421422986714e-05, "loss": 1.1526, "step": 9980 }, { "epoch": 7.81, "learning_rate": 4.925785770132916e-05, "loss": 1.2293, "step": 10000 }, { "epoch": 7.81, "eval_cer": 0.0832, "eval_loss": 0.1896892637014389, "eval_runtime": 244.7311, "eval_samples_per_second": 15.478, "eval_steps_per_second": 0.486, "eval_wer": 0.3976, "step": 10000 }, { "epoch": 7.83, "learning_rate": 4.925629397967162e-05, "loss": 1.24, "step": 10020 }, { "epoch": 7.84, "learning_rate": 4.925473025801407e-05, "loss": 1.2061, "step": 10040 }, { "epoch": 7.86, "learning_rate": 4.9253166536356534e-05, "loss": 1.2511, "step": 10060 }, { "epoch": 7.88, "learning_rate": 4.925160281469899e-05, "loss": 1.1501, "step": 10080 }, { "epoch": 7.89, "learning_rate": 4.925003909304144e-05, "loss": 1.2169, "step": 10100 }, { "epoch": 7.91, "learning_rate": 4.924847537138389e-05, "loss": 1.1912, "step": 10120 }, { "epoch": 7.92, "learning_rate": 4.9246911649726354e-05, "loss": 1.1837, "step": 10140 }, { "epoch": 7.94, "learning_rate": 4.924534792806881e-05, "loss": 1.2644, "step": 10160 }, { "epoch": 7.95, "learning_rate": 4.924378420641126e-05, "loss": 1.1606, "step": 10180 }, { "epoch": 7.97, "learning_rate": 4.924222048475371e-05, "loss": 1.1905, "step": 10200 }, { "epoch": 7.98, "learning_rate": 4.9240656763096174e-05, "loss": 1.219, "step": 10220 }, { "epoch": 8.0, "learning_rate": 4.923909304143863e-05, "loss": 1.2419, "step": 10240 }, { "epoch": 8.02, "learning_rate": 4.9237529319781084e-05, "loss": 1.151, "step": 10260 }, { "epoch": 8.03, "learning_rate": 4.923596559812353e-05, "loss": 1.1691, "step": 10280 }, { "epoch": 8.05, "learning_rate": 4.9234401876465994e-05, "loss": 1.1762, "step": 10300 }, { "epoch": 8.06, "learning_rate": 4.923283815480845e-05, "loss": 1.1757, "step": 10320 }, { "epoch": 8.08, "learning_rate": 4.9231274433150904e-05, "loss": 1.2532, "step": 10340 }, { "epoch": 8.09, "learning_rate": 4.922971071149335e-05, "loss": 1.188, "step": 10360 }, { "epoch": 8.11, "learning_rate": 4.922822517591869e-05, "loss": 1.2122, "step": 10380 }, { "epoch": 8.12, "learning_rate": 4.922666145426114e-05, "loss": 1.1837, "step": 10400 }, { "epoch": 8.14, "learning_rate": 4.9225097732603596e-05, "loss": 1.1449, "step": 10420 }, { "epoch": 8.16, "learning_rate": 4.922353401094605e-05, "loss": 1.2147, "step": 10440 }, { "epoch": 8.17, "learning_rate": 4.922197028928851e-05, "loss": 1.1529, "step": 10460 }, { "epoch": 8.19, "learning_rate": 4.922040656763097e-05, "loss": 1.2168, "step": 10480 }, { "epoch": 8.2, "learning_rate": 4.9218842845973416e-05, "loss": 1.1955, "step": 10500 }, { "epoch": 8.22, "learning_rate": 4.921727912431587e-05, "loss": 1.1793, "step": 10520 }, { "epoch": 8.23, "learning_rate": 4.921571540265833e-05, "loss": 1.2466, "step": 10540 }, { "epoch": 8.25, "learning_rate": 4.921415168100079e-05, "loss": 1.1512, "step": 10560 }, { "epoch": 8.27, "learning_rate": 4.9212587959343236e-05, "loss": 1.2223, "step": 10580 }, { "epoch": 8.28, "learning_rate": 4.921102423768569e-05, "loss": 1.224, "step": 10600 }, { "epoch": 8.3, "learning_rate": 4.920946051602815e-05, "loss": 1.191, "step": 10620 }, { "epoch": 8.31, "learning_rate": 4.920789679437061e-05, "loss": 1.2194, "step": 10640 }, { "epoch": 8.33, "learning_rate": 4.9206333072713056e-05, "loss": 1.1671, "step": 10660 }, { "epoch": 8.34, "learning_rate": 4.920476935105551e-05, "loss": 1.1897, "step": 10680 }, { "epoch": 8.36, "learning_rate": 4.920320562939797e-05, "loss": 1.1669, "step": 10700 }, { "epoch": 8.38, "learning_rate": 4.920164190774043e-05, "loss": 1.1695, "step": 10720 }, { "epoch": 8.39, "learning_rate": 4.920007818608288e-05, "loss": 1.2647, "step": 10740 }, { "epoch": 8.41, "learning_rate": 4.919851446442533e-05, "loss": 1.1513, "step": 10760 }, { "epoch": 8.42, "learning_rate": 4.9196950742767786e-05, "loss": 1.2199, "step": 10780 }, { "epoch": 8.44, "learning_rate": 4.919538702111025e-05, "loss": 1.1682, "step": 10800 }, { "epoch": 8.45, "learning_rate": 4.91938232994527e-05, "loss": 1.1785, "step": 10820 }, { "epoch": 8.47, "learning_rate": 4.919225957779515e-05, "loss": 1.2391, "step": 10840 }, { "epoch": 8.48, "learning_rate": 4.9190695856137606e-05, "loss": 1.1626, "step": 10860 }, { "epoch": 8.5, "learning_rate": 4.918913213448007e-05, "loss": 1.1882, "step": 10880 }, { "epoch": 8.52, "learning_rate": 4.918756841282252e-05, "loss": 1.188, "step": 10900 }, { "epoch": 8.53, "learning_rate": 4.918600469116498e-05, "loss": 1.2459, "step": 10920 }, { "epoch": 8.55, "learning_rate": 4.9184440969507426e-05, "loss": 1.2485, "step": 10940 }, { "epoch": 8.56, "learning_rate": 4.918287724784989e-05, "loss": 1.1443, "step": 10960 }, { "epoch": 8.58, "learning_rate": 4.918131352619234e-05, "loss": 1.1949, "step": 10980 }, { "epoch": 8.59, "learning_rate": 4.91797498045348e-05, "loss": 1.1967, "step": 11000 }, { "epoch": 8.59, "eval_cer": 0.0856, "eval_loss": 0.18938589096069336, "eval_runtime": 245.3646, "eval_samples_per_second": 15.438, "eval_steps_per_second": 0.485, "eval_wer": 0.4035, "step": 11000 }, { "epoch": 8.61, "learning_rate": 4.9178186082877245e-05, "loss": 1.1999, "step": 11020 }, { "epoch": 8.62, "learning_rate": 4.917662236121971e-05, "loss": 1.2439, "step": 11040 }, { "epoch": 8.64, "learning_rate": 4.917505863956216e-05, "loss": 1.1515, "step": 11060 }, { "epoch": 8.66, "learning_rate": 4.917349491790462e-05, "loss": 1.2248, "step": 11080 }, { "epoch": 8.67, "learning_rate": 4.917193119624707e-05, "loss": 1.2166, "step": 11100 }, { "epoch": 8.69, "learning_rate": 4.917036747458953e-05, "loss": 1.1792, "step": 11120 }, { "epoch": 8.7, "learning_rate": 4.916880375293198e-05, "loss": 1.208, "step": 11140 }, { "epoch": 8.72, "learning_rate": 4.916724003127444e-05, "loss": 1.1584, "step": 11160 }, { "epoch": 8.73, "learning_rate": 4.916567630961689e-05, "loss": 1.2154, "step": 11180 }, { "epoch": 8.75, "learning_rate": 4.916411258795934e-05, "loss": 1.174, "step": 11200 }, { "epoch": 8.77, "learning_rate": 4.91625488663018e-05, "loss": 1.1951, "step": 11220 }, { "epoch": 8.78, "learning_rate": 4.916098514464426e-05, "loss": 1.2363, "step": 11240 }, { "epoch": 8.8, "learning_rate": 4.915942142298671e-05, "loss": 1.1738, "step": 11260 }, { "epoch": 8.81, "learning_rate": 4.915785770132916e-05, "loss": 1.1996, "step": 11280 }, { "epoch": 8.83, "learning_rate": 4.915629397967162e-05, "loss": 1.2094, "step": 11300 }, { "epoch": 8.84, "learning_rate": 4.915473025801408e-05, "loss": 1.1884, "step": 11320 }, { "epoch": 8.86, "learning_rate": 4.915316653635653e-05, "loss": 1.2541, "step": 11340 }, { "epoch": 8.88, "learning_rate": 4.915160281469899e-05, "loss": 1.152, "step": 11360 }, { "epoch": 8.89, "learning_rate": 4.915003909304144e-05, "loss": 1.2148, "step": 11380 }, { "epoch": 8.91, "learning_rate": 4.91484753713839e-05, "loss": 1.2074, "step": 11400 }, { "epoch": 8.92, "learning_rate": 4.914691164972635e-05, "loss": 1.1802, "step": 11420 }, { "epoch": 8.94, "learning_rate": 4.914534792806881e-05, "loss": 1.2463, "step": 11440 }, { "epoch": 8.95, "learning_rate": 4.914378420641126e-05, "loss": 1.1818, "step": 11460 }, { "epoch": 8.97, "learning_rate": 4.9142220484753717e-05, "loss": 1.2322, "step": 11480 }, { "epoch": 8.98, "learning_rate": 4.914065676309617e-05, "loss": 1.254, "step": 11500 }, { "epoch": 9.0, "learning_rate": 4.9139093041438627e-05, "loss": 1.2372, "step": 11520 }, { "epoch": 9.02, "learning_rate": 4.913752931978108e-05, "loss": 1.1879, "step": 11540 }, { "epoch": 9.03, "learning_rate": 4.9135965598123536e-05, "loss": 1.2133, "step": 11560 }, { "epoch": 9.05, "learning_rate": 4.913440187646599e-05, "loss": 1.1999, "step": 11580 }, { "epoch": 9.06, "learning_rate": 4.9132838154808446e-05, "loss": 1.1824, "step": 11600 }, { "epoch": 9.08, "learning_rate": 4.91312744331509e-05, "loss": 1.2318, "step": 11620 }, { "epoch": 9.09, "learning_rate": 4.9129710711493356e-05, "loss": 1.1599, "step": 11640 }, { "epoch": 9.11, "learning_rate": 4.912814698983581e-05, "loss": 1.2229, "step": 11660 }, { "epoch": 9.12, "learning_rate": 4.9126583268178266e-05, "loss": 1.2286, "step": 11680 }, { "epoch": 9.14, "learning_rate": 4.912501954652072e-05, "loss": 1.1919, "step": 11700 }, { "epoch": 9.16, "learning_rate": 4.9123455824863176e-05, "loss": 1.2359, "step": 11720 }, { "epoch": 9.17, "learning_rate": 4.912189210320563e-05, "loss": 1.1815, "step": 11740 }, { "epoch": 9.19, "learning_rate": 4.9120328381548086e-05, "loss": 1.2552, "step": 11760 }, { "epoch": 9.2, "learning_rate": 4.911876465989054e-05, "loss": 1.2085, "step": 11780 }, { "epoch": 9.22, "learning_rate": 4.9117200938232996e-05, "loss": 1.1579, "step": 11800 }, { "epoch": 9.23, "learning_rate": 4.911563721657545e-05, "loss": 1.2166, "step": 11820 }, { "epoch": 9.25, "learning_rate": 4.9114073494917906e-05, "loss": 1.1707, "step": 11840 }, { "epoch": 9.27, "learning_rate": 4.911250977326036e-05, "loss": 1.1854, "step": 11860 }, { "epoch": 9.28, "learning_rate": 4.9110946051602816e-05, "loss": 1.2069, "step": 11880 }, { "epoch": 9.3, "learning_rate": 4.910938232994527e-05, "loss": 1.1684, "step": 11900 }, { "epoch": 9.31, "learning_rate": 4.9107818608287726e-05, "loss": 1.1967, "step": 11920 }, { "epoch": 9.33, "learning_rate": 4.910625488663018e-05, "loss": 1.1769, "step": 11940 }, { "epoch": 9.34, "learning_rate": 4.9104691164972636e-05, "loss": 1.1992, "step": 11960 }, { "epoch": 9.36, "learning_rate": 4.91031274433151e-05, "loss": 1.2044, "step": 11980 }, { "epoch": 9.38, "learning_rate": 4.9101563721657546e-05, "loss": 1.1754, "step": 12000 }, { "epoch": 9.38, "eval_cer": 0.0829, "eval_loss": 0.19095608592033386, "eval_runtime": 245.3799, "eval_samples_per_second": 15.437, "eval_steps_per_second": 0.485, "eval_wer": 0.3922, "step": 12000 }, { "epoch": 9.39, "learning_rate": 4.91e-05, "loss": 1.2142, "step": 12020 }, { "epoch": 9.41, "learning_rate": 4.9098436278342456e-05, "loss": 1.1498, "step": 12040 }, { "epoch": 9.42, "learning_rate": 4.909687255668491e-05, "loss": 1.1881, "step": 12060 }, { "epoch": 9.44, "learning_rate": 4.9095308835027366e-05, "loss": 1.1585, "step": 12080 }, { "epoch": 9.45, "learning_rate": 4.909374511336982e-05, "loss": 1.1474, "step": 12100 }, { "epoch": 9.47, "learning_rate": 4.9092181391712276e-05, "loss": 1.1702, "step": 12120 }, { "epoch": 9.48, "learning_rate": 4.909061767005473e-05, "loss": 1.1375, "step": 12140 }, { "epoch": 9.5, "learning_rate": 4.908905394839719e-05, "loss": 1.2217, "step": 12160 }, { "epoch": 9.52, "learning_rate": 4.908749022673964e-05, "loss": 1.2107, "step": 12180 }, { "epoch": 9.53, "learning_rate": 4.9085926505082096e-05, "loss": 1.1794, "step": 12200 }, { "epoch": 9.55, "learning_rate": 4.908436278342455e-05, "loss": 1.2525, "step": 12220 }, { "epoch": 9.56, "learning_rate": 4.908279906176701e-05, "loss": 1.1603, "step": 12240 }, { "epoch": 9.58, "learning_rate": 4.908123534010946e-05, "loss": 1.2288, "step": 12260 }, { "epoch": 9.59, "learning_rate": 4.9079671618451916e-05, "loss": 1.2037, "step": 12280 }, { "epoch": 9.61, "learning_rate": 4.907810789679437e-05, "loss": 1.196, "step": 12300 }, { "epoch": 9.62, "learning_rate": 4.907654417513683e-05, "loss": 1.2491, "step": 12320 }, { "epoch": 9.64, "learning_rate": 4.907498045347929e-05, "loss": 1.1715, "step": 12340 }, { "epoch": 9.66, "learning_rate": 4.9073416731821735e-05, "loss": 1.1911, "step": 12360 }, { "epoch": 9.67, "learning_rate": 4.907185301016419e-05, "loss": 1.2299, "step": 12380 }, { "epoch": 9.69, "learning_rate": 4.907028928850665e-05, "loss": 1.1497, "step": 12400 }, { "epoch": 9.7, "learning_rate": 4.906872556684911e-05, "loss": 1.2486, "step": 12420 }, { "epoch": 9.72, "learning_rate": 4.9067161845191555e-05, "loss": 1.1787, "step": 12440 }, { "epoch": 9.73, "learning_rate": 4.906559812353401e-05, "loss": 1.197, "step": 12460 }, { "epoch": 9.75, "learning_rate": 4.9064034401876465e-05, "loss": 1.2123, "step": 12480 }, { "epoch": 9.77, "learning_rate": 4.906247068021893e-05, "loss": 1.1911, "step": 12500 }, { "epoch": 9.78, "learning_rate": 4.906090695856138e-05, "loss": 1.2155, "step": 12520 }, { "epoch": 9.8, "learning_rate": 4.905934323690383e-05, "loss": 1.1681, "step": 12540 }, { "epoch": 9.81, "learning_rate": 4.9057779515246285e-05, "loss": 1.2372, "step": 12560 }, { "epoch": 9.83, "learning_rate": 4.905621579358875e-05, "loss": 1.1918, "step": 12580 }, { "epoch": 9.84, "learning_rate": 4.90546520719312e-05, "loss": 1.1717, "step": 12600 }, { "epoch": 9.86, "learning_rate": 4.905308835027365e-05, "loss": 1.2068, "step": 12620 }, { "epoch": 9.88, "learning_rate": 4.9051524628616105e-05, "loss": 1.1475, "step": 12640 }, { "epoch": 9.89, "learning_rate": 4.904996090695857e-05, "loss": 1.2002, "step": 12660 }, { "epoch": 9.91, "learning_rate": 4.904839718530102e-05, "loss": 1.2035, "step": 12680 }, { "epoch": 9.92, "learning_rate": 4.904683346364347e-05, "loss": 1.1718, "step": 12700 }, { "epoch": 9.94, "learning_rate": 4.9045269741985925e-05, "loss": 1.1833, "step": 12720 }, { "epoch": 9.95, "learning_rate": 4.904370602032839e-05, "loss": 1.1648, "step": 12740 }, { "epoch": 9.97, "learning_rate": 4.904214229867084e-05, "loss": 1.2056, "step": 12760 }, { "epoch": 9.98, "learning_rate": 4.9040578577013297e-05, "loss": 1.2315, "step": 12780 }, { "epoch": 10.0, "learning_rate": 4.9039014855355745e-05, "loss": 1.229, "step": 12800 }, { "epoch": 10.02, "learning_rate": 4.9037451133698207e-05, "loss": 1.1447, "step": 12820 }, { "epoch": 10.03, "learning_rate": 4.903588741204066e-05, "loss": 1.1828, "step": 12840 }, { "epoch": 10.05, "learning_rate": 4.9034323690383116e-05, "loss": 1.1961, "step": 12860 }, { "epoch": 10.06, "learning_rate": 4.9032759968725565e-05, "loss": 1.1699, "step": 12880 }, { "epoch": 10.08, "learning_rate": 4.9031196247068026e-05, "loss": 1.2559, "step": 12900 }, { "epoch": 10.09, "learning_rate": 4.902963252541048e-05, "loss": 1.1448, "step": 12920 }, { "epoch": 10.11, "learning_rate": 4.9028068803752936e-05, "loss": 1.1904, "step": 12940 }, { "epoch": 10.12, "learning_rate": 4.902650508209539e-05, "loss": 1.1899, "step": 12960 }, { "epoch": 10.14, "learning_rate": 4.902494136043784e-05, "loss": 1.1995, "step": 12980 }, { "epoch": 10.16, "learning_rate": 4.90233776387803e-05, "loss": 1.2426, "step": 13000 }, { "epoch": 10.16, "eval_cer": 0.0804, "eval_loss": 0.18774890899658203, "eval_runtime": 244.8579, "eval_samples_per_second": 15.47, "eval_steps_per_second": 0.486, "eval_wer": 0.3863, "step": 13000 }, { "epoch": 10.17, "learning_rate": 4.9021813917122756e-05, "loss": 1.1519, "step": 13020 }, { "epoch": 10.19, "learning_rate": 4.902025019546521e-05, "loss": 1.2118, "step": 13040 }, { "epoch": 10.2, "learning_rate": 4.901868647380766e-05, "loss": 1.1595, "step": 13060 }, { "epoch": 10.22, "learning_rate": 4.901712275215012e-05, "loss": 1.1427, "step": 13080 }, { "epoch": 10.23, "learning_rate": 4.9015559030492576e-05, "loss": 1.2165, "step": 13100 }, { "epoch": 10.25, "learning_rate": 4.901399530883503e-05, "loss": 1.1529, "step": 13120 }, { "epoch": 10.27, "learning_rate": 4.9012431587177486e-05, "loss": 1.1892, "step": 13140 }, { "epoch": 10.28, "learning_rate": 4.901086786551994e-05, "loss": 1.2078, "step": 13160 }, { "epoch": 10.3, "learning_rate": 4.9009304143862396e-05, "loss": 1.1962, "step": 13180 }, { "epoch": 10.31, "learning_rate": 4.900774042220485e-05, "loss": 1.2341, "step": 13200 }, { "epoch": 10.33, "learning_rate": 4.9006176700547306e-05, "loss": 1.1535, "step": 13220 }, { "epoch": 10.34, "learning_rate": 4.900461297888976e-05, "loss": 1.2066, "step": 13240 }, { "epoch": 10.36, "learning_rate": 4.9003049257232216e-05, "loss": 1.1856, "step": 13260 }, { "epoch": 10.38, "learning_rate": 4.900148553557467e-05, "loss": 1.1652, "step": 13280 }, { "epoch": 10.39, "learning_rate": 4.8999921813917126e-05, "loss": 1.2259, "step": 13300 }, { "epoch": 10.41, "learning_rate": 4.899835809225958e-05, "loss": 1.1603, "step": 13320 }, { "epoch": 10.42, "learning_rate": 4.8996794370602036e-05, "loss": 1.1947, "step": 13340 }, { "epoch": 10.44, "learning_rate": 4.899523064894449e-05, "loss": 1.2199, "step": 13360 }, { "epoch": 10.45, "learning_rate": 4.8993666927286946e-05, "loss": 1.1641, "step": 13380 }, { "epoch": 10.47, "learning_rate": 4.89921032056294e-05, "loss": 1.1693, "step": 13400 }, { "epoch": 10.48, "learning_rate": 4.8990539483971856e-05, "loss": 1.1736, "step": 13420 }, { "epoch": 10.5, "learning_rate": 4.898897576231431e-05, "loss": 1.2132, "step": 13440 }, { "epoch": 10.52, "learning_rate": 4.8987412040656766e-05, "loss": 1.1995, "step": 13460 }, { "epoch": 10.53, "learning_rate": 4.898584831899922e-05, "loss": 1.2211, "step": 13480 }, { "epoch": 10.55, "learning_rate": 4.8984284597341676e-05, "loss": 1.224, "step": 13500 }, { "epoch": 10.56, "learning_rate": 4.898272087568413e-05, "loss": 1.2119, "step": 13520 }, { "epoch": 10.58, "learning_rate": 4.8981157154026586e-05, "loss": 1.1882, "step": 13540 }, { "epoch": 10.59, "learning_rate": 4.897959343236904e-05, "loss": 1.1475, "step": 13560 }, { "epoch": 10.61, "learning_rate": 4.8978029710711496e-05, "loss": 1.1841, "step": 13580 }, { "epoch": 10.62, "learning_rate": 4.897646598905395e-05, "loss": 1.1989, "step": 13600 }, { "epoch": 10.64, "learning_rate": 4.8974902267396405e-05, "loss": 1.1387, "step": 13620 }, { "epoch": 10.66, "learning_rate": 4.897333854573886e-05, "loss": 1.1657, "step": 13640 }, { "epoch": 10.67, "learning_rate": 4.8971774824081315e-05, "loss": 1.1935, "step": 13660 }, { "epoch": 10.69, "learning_rate": 4.897021110242377e-05, "loss": 1.1882, "step": 13680 }, { "epoch": 10.7, "learning_rate": 4.8968647380766225e-05, "loss": 1.1569, "step": 13700 }, { "epoch": 10.72, "learning_rate": 4.896708365910868e-05, "loss": 1.1564, "step": 13720 }, { "epoch": 10.73, "learning_rate": 4.8965519937451135e-05, "loss": 1.2063, "step": 13740 }, { "epoch": 10.75, "learning_rate": 4.89639562157936e-05, "loss": 1.1985, "step": 13760 }, { "epoch": 10.77, "learning_rate": 4.8962392494136045e-05, "loss": 1.1853, "step": 13780 }, { "epoch": 10.78, "learning_rate": 4.89608287724785e-05, "loss": 1.2082, "step": 13800 }, { "epoch": 10.8, "learning_rate": 4.8959265050820955e-05, "loss": 1.1286, "step": 13820 }, { "epoch": 10.81, "learning_rate": 4.895770132916341e-05, "loss": 1.1737, "step": 13840 }, { "epoch": 10.83, "learning_rate": 4.8956137607505865e-05, "loss": 1.1663, "step": 13860 }, { "epoch": 10.84, "learning_rate": 4.895457388584832e-05, "loss": 1.1624, "step": 13880 }, { "epoch": 10.86, "learning_rate": 4.8953010164190775e-05, "loss": 1.2122, "step": 13900 }, { "epoch": 10.88, "learning_rate": 4.895144644253323e-05, "loss": 1.1553, "step": 13920 }, { "epoch": 10.89, "learning_rate": 4.8949882720875685e-05, "loss": 1.2019, "step": 13940 }, { "epoch": 10.91, "learning_rate": 4.894831899921814e-05, "loss": 1.1752, "step": 13960 }, { "epoch": 10.92, "learning_rate": 4.8946755277560595e-05, "loss": 1.1814, "step": 13980 }, { "epoch": 10.94, "learning_rate": 4.894519155590305e-05, "loss": 1.2416, "step": 14000 }, { "epoch": 10.94, "eval_cer": 0.0815, "eval_loss": 0.19119442999362946, "eval_runtime": 248.9347, "eval_samples_per_second": 15.217, "eval_steps_per_second": 0.478, "eval_wer": 0.3892, "step": 14000 }, { "epoch": 10.95, "learning_rate": 4.894362783424551e-05, "loss": 1.1547, "step": 14020 }, { "epoch": 10.97, "learning_rate": 4.894206411258796e-05, "loss": 1.2016, "step": 14040 }, { "epoch": 10.98, "learning_rate": 4.8940500390930415e-05, "loss": 1.1788, "step": 14060 }, { "epoch": 11.0, "learning_rate": 4.893893666927287e-05, "loss": 1.2398, "step": 14080 }, { "epoch": 11.02, "learning_rate": 4.893737294761533e-05, "loss": 1.16, "step": 14100 }, { "epoch": 11.03, "learning_rate": 4.893580922595778e-05, "loss": 1.2037, "step": 14120 }, { "epoch": 11.05, "learning_rate": 4.8934245504300235e-05, "loss": 1.1217, "step": 14140 }, { "epoch": 11.06, "learning_rate": 4.893268178264269e-05, "loss": 1.19, "step": 14160 }, { "epoch": 11.08, "learning_rate": 4.893111806098515e-05, "loss": 1.1895, "step": 14180 }, { "epoch": 11.09, "learning_rate": 4.8929554339327606e-05, "loss": 1.1583, "step": 14200 }, { "epoch": 11.11, "learning_rate": 4.8927990617670055e-05, "loss": 1.1766, "step": 14220 }, { "epoch": 11.12, "learning_rate": 4.892642689601251e-05, "loss": 1.1734, "step": 14240 }, { "epoch": 11.14, "learning_rate": 4.8924863174354965e-05, "loss": 1.1889, "step": 14260 }, { "epoch": 11.16, "learning_rate": 4.8923299452697426e-05, "loss": 1.2461, "step": 14280 }, { "epoch": 11.17, "learning_rate": 4.8921735731039875e-05, "loss": 1.1572, "step": 14300 }, { "epoch": 11.19, "learning_rate": 4.892017200938233e-05, "loss": 1.1798, "step": 14320 }, { "epoch": 11.2, "learning_rate": 4.8918608287724785e-05, "loss": 1.1734, "step": 14340 }, { "epoch": 11.22, "learning_rate": 4.8917044566067246e-05, "loss": 1.1912, "step": 14360 }, { "epoch": 11.23, "learning_rate": 4.89154808444097e-05, "loss": 1.184, "step": 14380 }, { "epoch": 11.25, "learning_rate": 4.891391712275215e-05, "loss": 1.1295, "step": 14400 }, { "epoch": 11.27, "learning_rate": 4.8912353401094604e-05, "loss": 1.1725, "step": 14420 }, { "epoch": 11.28, "learning_rate": 4.8910789679437066e-05, "loss": 1.1681, "step": 14440 }, { "epoch": 11.3, "learning_rate": 4.890922595777952e-05, "loss": 1.1885, "step": 14460 }, { "epoch": 11.31, "learning_rate": 4.890766223612197e-05, "loss": 1.1737, "step": 14480 }, { "epoch": 11.33, "learning_rate": 4.8906098514464424e-05, "loss": 1.1188, "step": 14500 }, { "epoch": 11.34, "learning_rate": 4.8904534792806886e-05, "loss": 1.1988, "step": 14520 }, { "epoch": 11.36, "learning_rate": 4.890297107114934e-05, "loss": 1.1563, "step": 14540 }, { "epoch": 11.38, "learning_rate": 4.890140734949179e-05, "loss": 1.1871, "step": 14560 }, { "epoch": 11.39, "learning_rate": 4.8899843627834244e-05, "loss": 1.2104, "step": 14580 }, { "epoch": 11.41, "learning_rate": 4.8898279906176706e-05, "loss": 1.1605, "step": 14600 }, { "epoch": 11.42, "learning_rate": 4.889671618451916e-05, "loss": 1.1785, "step": 14620 }, { "epoch": 11.44, "learning_rate": 4.8895152462861616e-05, "loss": 1.1865, "step": 14640 }, { "epoch": 11.45, "learning_rate": 4.889366692728694e-05, "loss": 1.1742, "step": 14660 }, { "epoch": 11.47, "learning_rate": 4.8892103205629405e-05, "loss": 1.1821, "step": 14680 }, { "epoch": 11.48, "learning_rate": 4.889053948397185e-05, "loss": 1.1337, "step": 14700 }, { "epoch": 11.5, "learning_rate": 4.888897576231431e-05, "loss": 1.1592, "step": 14720 }, { "epoch": 11.52, "learning_rate": 4.888741204065676e-05, "loss": 1.1671, "step": 14740 }, { "epoch": 11.53, "learning_rate": 4.8885848318999225e-05, "loss": 1.167, "step": 14760 }, { "epoch": 11.55, "learning_rate": 4.888428459734167e-05, "loss": 1.2166, "step": 14780 }, { "epoch": 11.56, "learning_rate": 4.888272087568413e-05, "loss": 1.1214, "step": 14800 }, { "epoch": 11.58, "learning_rate": 4.888115715402658e-05, "loss": 1.2262, "step": 14820 }, { "epoch": 11.59, "learning_rate": 4.8879593432369045e-05, "loss": 1.1824, "step": 14840 }, { "epoch": 11.61, "learning_rate": 4.88780297107115e-05, "loss": 1.1686, "step": 14860 }, { "epoch": 11.62, "learning_rate": 4.887646598905395e-05, "loss": 1.2229, "step": 14880 }, { "epoch": 11.64, "learning_rate": 4.88749022673964e-05, "loss": 1.1398, "step": 14900 }, { "epoch": 11.66, "learning_rate": 4.8873338545738865e-05, "loss": 1.1781, "step": 14920 }, { "epoch": 11.67, "learning_rate": 4.887177482408132e-05, "loss": 1.1953, "step": 14940 }, { "epoch": 11.69, "learning_rate": 4.887021110242377e-05, "loss": 1.1927, "step": 14960 }, { "epoch": 11.7, "learning_rate": 4.886864738076622e-05, "loss": 1.1869, "step": 14980 }, { "epoch": 11.72, "learning_rate": 4.886708365910868e-05, "loss": 1.1675, "step": 15000 }, { "epoch": 11.72, "eval_cer": 0.0789, "eval_loss": 0.18456652760505676, "eval_runtime": 245.963, "eval_samples_per_second": 15.401, "eval_steps_per_second": 0.484, "eval_wer": 0.3816, "step": 15000 }, { "epoch": 11.73, "learning_rate": 4.886551993745114e-05, "loss": 1.2032, "step": 15020 }, { "epoch": 11.75, "learning_rate": 4.8863956215793595e-05, "loss": 1.188, "step": 15040 }, { "epoch": 11.77, "learning_rate": 4.886239249413604e-05, "loss": 1.1456, "step": 15060 }, { "epoch": 11.78, "learning_rate": 4.88608287724785e-05, "loss": 1.177, "step": 15080 }, { "epoch": 11.8, "learning_rate": 4.885926505082096e-05, "loss": 1.1718, "step": 15100 }, { "epoch": 11.81, "learning_rate": 4.8857701329163415e-05, "loss": 1.2119, "step": 15120 }, { "epoch": 11.83, "learning_rate": 4.885613760750586e-05, "loss": 1.1755, "step": 15140 }, { "epoch": 11.84, "learning_rate": 4.885457388584832e-05, "loss": 1.1624, "step": 15160 }, { "epoch": 11.86, "learning_rate": 4.885301016419078e-05, "loss": 1.1739, "step": 15180 }, { "epoch": 11.88, "learning_rate": 4.8851446442533234e-05, "loss": 1.1431, "step": 15200 }, { "epoch": 11.89, "learning_rate": 4.884988272087568e-05, "loss": 1.1937, "step": 15220 }, { "epoch": 11.91, "learning_rate": 4.884831899921814e-05, "loss": 1.2121, "step": 15240 }, { "epoch": 11.92, "learning_rate": 4.88467552775606e-05, "loss": 1.1911, "step": 15260 }, { "epoch": 11.94, "learning_rate": 4.8845191555903054e-05, "loss": 1.2446, "step": 15280 }, { "epoch": 11.95, "learning_rate": 4.884362783424551e-05, "loss": 1.1642, "step": 15300 }, { "epoch": 11.97, "learning_rate": 4.884206411258796e-05, "loss": 1.1891, "step": 15320 }, { "epoch": 11.98, "learning_rate": 4.884050039093042e-05, "loss": 1.224, "step": 15340 }, { "epoch": 12.0, "learning_rate": 4.8838936669272874e-05, "loss": 1.1916, "step": 15360 }, { "epoch": 12.02, "learning_rate": 4.883737294761533e-05, "loss": 1.1201, "step": 15380 }, { "epoch": 12.03, "learning_rate": 4.883580922595778e-05, "loss": 1.1812, "step": 15400 }, { "epoch": 12.05, "learning_rate": 4.883424550430023e-05, "loss": 1.1958, "step": 15420 }, { "epoch": 12.06, "learning_rate": 4.8832681782642694e-05, "loss": 1.1896, "step": 15440 }, { "epoch": 12.08, "learning_rate": 4.883111806098515e-05, "loss": 1.2025, "step": 15460 }, { "epoch": 12.09, "learning_rate": 4.8829554339327604e-05, "loss": 1.1121, "step": 15480 }, { "epoch": 12.11, "learning_rate": 4.882799061767005e-05, "loss": 1.1672, "step": 15500 }, { "epoch": 12.12, "learning_rate": 4.8826426896012514e-05, "loss": 1.1715, "step": 15520 }, { "epoch": 12.14, "learning_rate": 4.882486317435497e-05, "loss": 1.151, "step": 15540 }, { "epoch": 12.16, "learning_rate": 4.8823299452697424e-05, "loss": 1.2102, "step": 15560 }, { "epoch": 12.17, "learning_rate": 4.882173573103987e-05, "loss": 1.1419, "step": 15580 }, { "epoch": 12.19, "learning_rate": 4.8820172009382334e-05, "loss": 1.172, "step": 15600 }, { "epoch": 12.2, "learning_rate": 4.881860828772479e-05, "loss": 1.1639, "step": 15620 }, { "epoch": 12.22, "learning_rate": 4.8817044566067244e-05, "loss": 1.1795, "step": 15640 }, { "epoch": 12.23, "learning_rate": 4.88154808444097e-05, "loss": 1.1707, "step": 15660 }, { "epoch": 12.25, "learning_rate": 4.8813917122752154e-05, "loss": 1.1257, "step": 15680 }, { "epoch": 12.27, "learning_rate": 4.881235340109461e-05, "loss": 1.1522, "step": 15700 }, { "epoch": 12.28, "learning_rate": 4.8810789679437064e-05, "loss": 1.1947, "step": 15720 }, { "epoch": 12.3, "learning_rate": 4.880922595777952e-05, "loss": 1.1543, "step": 15740 }, { "epoch": 12.31, "learning_rate": 4.8807662236121974e-05, "loss": 1.1727, "step": 15760 }, { "epoch": 12.33, "learning_rate": 4.880609851446443e-05, "loss": 1.168, "step": 15780 }, { "epoch": 12.34, "learning_rate": 4.8804534792806884e-05, "loss": 1.1697, "step": 15800 }, { "epoch": 12.36, "learning_rate": 4.880297107114934e-05, "loss": 1.165, "step": 15820 }, { "epoch": 12.38, "learning_rate": 4.880140734949179e-05, "loss": 1.173, "step": 15840 }, { "epoch": 12.39, "learning_rate": 4.879984362783425e-05, "loss": 1.1901, "step": 15860 }, { "epoch": 12.41, "learning_rate": 4.8798279906176704e-05, "loss": 1.1655, "step": 15880 }, { "epoch": 12.42, "learning_rate": 4.879671618451916e-05, "loss": 1.2008, "step": 15900 }, { "epoch": 12.44, "learning_rate": 4.8795152462861613e-05, "loss": 1.1677, "step": 15920 }, { "epoch": 12.45, "learning_rate": 4.879358874120407e-05, "loss": 1.1869, "step": 15940 }, { "epoch": 12.47, "learning_rate": 4.8792025019546523e-05, "loss": 1.1645, "step": 15960 }, { "epoch": 12.48, "learning_rate": 4.879046129788898e-05, "loss": 1.161, "step": 15980 }, { "epoch": 12.5, "learning_rate": 4.878889757623143e-05, "loss": 1.1826, "step": 16000 }, { "epoch": 12.5, "eval_cer": 0.0854, "eval_loss": 0.1922062337398529, "eval_runtime": 244.5223, "eval_samples_per_second": 15.491, "eval_steps_per_second": 0.487, "eval_wer": 0.3997, "step": 16000 }, { "epoch": 12.52, "learning_rate": 4.878733385457389e-05, "loss": 1.1852, "step": 16020 }, { "epoch": 12.53, "learning_rate": 4.878577013291634e-05, "loss": 1.1673, "step": 16040 }, { "epoch": 12.55, "learning_rate": 4.87842064112588e-05, "loss": 1.1785, "step": 16060 }, { "epoch": 12.56, "learning_rate": 4.878264268960125e-05, "loss": 1.1502, "step": 16080 }, { "epoch": 12.58, "learning_rate": 4.878107896794371e-05, "loss": 1.1263, "step": 16100 }, { "epoch": 12.59, "learning_rate": 4.877951524628616e-05, "loss": 1.148, "step": 16120 }, { "epoch": 12.61, "learning_rate": 4.877795152462862e-05, "loss": 1.2102, "step": 16140 }, { "epoch": 12.62, "learning_rate": 4.877638780297107e-05, "loss": 1.1756, "step": 16160 }, { "epoch": 12.64, "learning_rate": 4.877482408131353e-05, "loss": 1.1316, "step": 16180 }, { "epoch": 12.66, "learning_rate": 4.877326035965598e-05, "loss": 1.2307, "step": 16200 }, { "epoch": 12.67, "learning_rate": 4.877169663799844e-05, "loss": 1.1523, "step": 16220 }, { "epoch": 12.69, "learning_rate": 4.877013291634089e-05, "loss": 1.1857, "step": 16240 }, { "epoch": 12.7, "learning_rate": 4.876856919468335e-05, "loss": 1.1858, "step": 16260 }, { "epoch": 12.72, "learning_rate": 4.87670054730258e-05, "loss": 1.1377, "step": 16280 }, { "epoch": 12.73, "learning_rate": 4.876544175136826e-05, "loss": 1.1537, "step": 16300 }, { "epoch": 12.75, "learning_rate": 4.876387802971071e-05, "loss": 1.1709, "step": 16320 }, { "epoch": 12.77, "learning_rate": 4.876231430805317e-05, "loss": 1.1508, "step": 16340 }, { "epoch": 12.78, "learning_rate": 4.876075058639562e-05, "loss": 1.174, "step": 16360 }, { "epoch": 12.8, "learning_rate": 4.875918686473808e-05, "loss": 1.1664, "step": 16380 }, { "epoch": 12.81, "learning_rate": 4.875762314308053e-05, "loss": 1.2039, "step": 16400 }, { "epoch": 12.83, "learning_rate": 4.875605942142299e-05, "loss": 1.1306, "step": 16420 }, { "epoch": 12.84, "learning_rate": 4.875449569976544e-05, "loss": 1.1812, "step": 16440 }, { "epoch": 12.86, "learning_rate": 4.87529319781079e-05, "loss": 1.1865, "step": 16460 }, { "epoch": 12.88, "learning_rate": 4.875136825645035e-05, "loss": 1.1347, "step": 16480 }, { "epoch": 12.89, "learning_rate": 4.874980453479281e-05, "loss": 1.1758, "step": 16500 }, { "epoch": 12.91, "learning_rate": 4.874824081313526e-05, "loss": 1.1682, "step": 16520 }, { "epoch": 12.92, "learning_rate": 4.8746677091477724e-05, "loss": 1.1735, "step": 16540 }, { "epoch": 12.94, "learning_rate": 4.874511336982017e-05, "loss": 1.1933, "step": 16560 }, { "epoch": 12.95, "learning_rate": 4.874354964816263e-05, "loss": 1.1225, "step": 16580 }, { "epoch": 12.97, "learning_rate": 4.874198592650508e-05, "loss": 1.2051, "step": 16600 }, { "epoch": 12.98, "learning_rate": 4.8740422204847544e-05, "loss": 1.1968, "step": 16620 }, { "epoch": 13.0, "learning_rate": 4.873885848318999e-05, "loss": 1.1752, "step": 16640 }, { "epoch": 13.02, "learning_rate": 4.873729476153245e-05, "loss": 1.1096, "step": 16660 }, { "epoch": 13.03, "learning_rate": 4.87357310398749e-05, "loss": 1.1696, "step": 16680 }, { "epoch": 13.05, "learning_rate": 4.8734167318217364e-05, "loss": 1.1415, "step": 16700 }, { "epoch": 13.06, "learning_rate": 4.873260359655982e-05, "loss": 1.1218, "step": 16720 }, { "epoch": 13.08, "learning_rate": 4.873103987490227e-05, "loss": 1.1996, "step": 16740 }, { "epoch": 13.09, "learning_rate": 4.872947615324472e-05, "loss": 1.1376, "step": 16760 }, { "epoch": 13.11, "learning_rate": 4.872791243158718e-05, "loss": 1.1655, "step": 16780 }, { "epoch": 13.12, "learning_rate": 4.872642689601251e-05, "loss": 1.1384, "step": 16800 }, { "epoch": 13.14, "learning_rate": 4.8724863174354967e-05, "loss": 1.1627, "step": 16820 }, { "epoch": 13.16, "learning_rate": 4.872329945269742e-05, "loss": 1.1401, "step": 16840 }, { "epoch": 13.17, "learning_rate": 4.8721735731039876e-05, "loss": 1.1333, "step": 16860 }, { "epoch": 13.19, "learning_rate": 4.872017200938233e-05, "loss": 1.1548, "step": 16880 }, { "epoch": 13.2, "learning_rate": 4.8718608287724786e-05, "loss": 1.132, "step": 16900 }, { "epoch": 13.22, "learning_rate": 4.871712275215012e-05, "loss": 1.1768, "step": 16920 }, { "epoch": 13.23, "learning_rate": 4.8715559030492576e-05, "loss": 1.109, "step": 16940 }, { "epoch": 13.25, "learning_rate": 4.871399530883503e-05, "loss": 1.147, "step": 16960 }, { "epoch": 13.27, "learning_rate": 4.8712431587177486e-05, "loss": 1.1738, "step": 16980 }, { "epoch": 13.28, "learning_rate": 4.871086786551994e-05, "loss": 1.148, "step": 17000 }, { "epoch": 13.28, "eval_cer": 0.0828, "eval_loss": 0.18761275708675385, "eval_runtime": 244.6215, "eval_samples_per_second": 15.485, "eval_steps_per_second": 0.486, "eval_wer": 0.3898, "step": 17000 }, { "epoch": 13.3, "learning_rate": 4.8709304143862396e-05, "loss": 1.1733, "step": 17020 }, { "epoch": 13.31, "learning_rate": 4.870774042220485e-05, "loss": 1.1974, "step": 17040 }, { "epoch": 13.33, "learning_rate": 4.8706176700547306e-05, "loss": 1.1558, "step": 17060 }, { "epoch": 13.34, "learning_rate": 4.870461297888976e-05, "loss": 1.186, "step": 17080 }, { "epoch": 13.36, "learning_rate": 4.8703049257232215e-05, "loss": 1.1332, "step": 17100 }, { "epoch": 13.38, "learning_rate": 4.870148553557467e-05, "loss": 1.1782, "step": 17120 }, { "epoch": 13.39, "learning_rate": 4.8699921813917125e-05, "loss": 1.1785, "step": 17140 }, { "epoch": 13.41, "learning_rate": 4.869835809225958e-05, "loss": 1.166, "step": 17160 }, { "epoch": 13.42, "learning_rate": 4.8696794370602035e-05, "loss": 1.1979, "step": 17180 }, { "epoch": 13.44, "learning_rate": 4.869523064894449e-05, "loss": 1.1414, "step": 17200 }, { "epoch": 13.45, "learning_rate": 4.8693666927286945e-05, "loss": 1.1455, "step": 17220 }, { "epoch": 13.47, "learning_rate": 4.86921032056294e-05, "loss": 1.1537, "step": 17240 }, { "epoch": 13.48, "learning_rate": 4.8690539483971855e-05, "loss": 1.1575, "step": 17260 }, { "epoch": 13.5, "learning_rate": 4.868897576231431e-05, "loss": 1.1579, "step": 17280 }, { "epoch": 13.52, "learning_rate": 4.8687412040656765e-05, "loss": 1.1656, "step": 17300 }, { "epoch": 13.53, "learning_rate": 4.868584831899922e-05, "loss": 1.1675, "step": 17320 }, { "epoch": 13.55, "learning_rate": 4.8684284597341675e-05, "loss": 1.2138, "step": 17340 }, { "epoch": 13.56, "learning_rate": 4.868272087568413e-05, "loss": 1.1301, "step": 17360 }, { "epoch": 13.58, "learning_rate": 4.8681157154026585e-05, "loss": 1.1552, "step": 17380 }, { "epoch": 13.59, "learning_rate": 4.867959343236904e-05, "loss": 1.1376, "step": 17400 }, { "epoch": 13.61, "learning_rate": 4.8678029710711495e-05, "loss": 1.1714, "step": 17420 }, { "epoch": 13.62, "learning_rate": 4.867646598905395e-05, "loss": 1.1686, "step": 17440 }, { "epoch": 13.64, "learning_rate": 4.8674902267396405e-05, "loss": 1.1236, "step": 17460 }, { "epoch": 13.66, "learning_rate": 4.867333854573886e-05, "loss": 1.1567, "step": 17480 }, { "epoch": 13.67, "learning_rate": 4.8671774824081315e-05, "loss": 1.1608, "step": 17500 }, { "epoch": 13.69, "learning_rate": 4.867021110242377e-05, "loss": 1.1632, "step": 17520 }, { "epoch": 13.7, "learning_rate": 4.8668647380766225e-05, "loss": 1.2273, "step": 17540 }, { "epoch": 13.72, "learning_rate": 4.866708365910868e-05, "loss": 1.1069, "step": 17560 }, { "epoch": 13.73, "learning_rate": 4.8665519937451135e-05, "loss": 1.1656, "step": 17580 }, { "epoch": 13.75, "learning_rate": 4.8663956215793597e-05, "loss": 1.1594, "step": 17600 }, { "epoch": 13.77, "learning_rate": 4.8662392494136045e-05, "loss": 1.185, "step": 17620 }, { "epoch": 13.78, "learning_rate": 4.86608287724785e-05, "loss": 1.2104, "step": 17640 }, { "epoch": 13.8, "learning_rate": 4.8659265050820955e-05, "loss": 1.1383, "step": 17660 }, { "epoch": 13.81, "learning_rate": 4.8657701329163416e-05, "loss": 1.1756, "step": 17680 }, { "epoch": 13.83, "learning_rate": 4.8656137607505865e-05, "loss": 1.1335, "step": 17700 }, { "epoch": 13.84, "learning_rate": 4.865457388584832e-05, "loss": 1.1498, "step": 17720 }, { "epoch": 13.86, "learning_rate": 4.8653010164190775e-05, "loss": 1.1368, "step": 17740 }, { "epoch": 13.88, "learning_rate": 4.865144644253323e-05, "loss": 1.1209, "step": 17760 }, { "epoch": 13.89, "learning_rate": 4.864988272087569e-05, "loss": 1.1654, "step": 17780 }, { "epoch": 13.91, "learning_rate": 4.864831899921814e-05, "loss": 1.1498, "step": 17800 }, { "epoch": 13.92, "learning_rate": 4.8646755277560594e-05, "loss": 1.1404, "step": 17820 }, { "epoch": 13.94, "learning_rate": 4.864519155590305e-05, "loss": 1.2145, "step": 17840 }, { "epoch": 13.95, "learning_rate": 4.864362783424551e-05, "loss": 1.1609, "step": 17860 }, { "epoch": 13.97, "learning_rate": 4.864206411258796e-05, "loss": 1.1979, "step": 17880 }, { "epoch": 13.98, "learning_rate": 4.8640500390930414e-05, "loss": 1.1774, "step": 17900 }, { "epoch": 14.0, "learning_rate": 4.863893666927287e-05, "loss": 1.1568, "step": 17920 }, { "epoch": 14.02, "learning_rate": 4.863737294761533e-05, "loss": 1.136, "step": 17940 }, { "epoch": 14.03, "learning_rate": 4.863580922595778e-05, "loss": 1.1775, "step": 17960 }, { "epoch": 14.05, "learning_rate": 4.8634245504300234e-05, "loss": 1.1362, "step": 17980 }, { "epoch": 14.06, "learning_rate": 4.863268178264269e-05, "loss": 1.1777, "step": 18000 }, { "epoch": 14.06, "eval_cer": 0.0804, "eval_loss": 0.18586616218090057, "eval_runtime": 246.5469, "eval_samples_per_second": 15.364, "eval_steps_per_second": 0.483, "eval_wer": 0.3878, "step": 18000 }, { "epoch": 14.08, "learning_rate": 4.863111806098515e-05, "loss": 1.1598, "step": 18020 }, { "epoch": 14.09, "learning_rate": 4.8629554339327606e-05, "loss": 1.1073, "step": 18040 }, { "epoch": 14.11, "learning_rate": 4.8627990617670054e-05, "loss": 1.169, "step": 18060 }, { "epoch": 14.12, "learning_rate": 4.862642689601251e-05, "loss": 1.1408, "step": 18080 }, { "epoch": 14.14, "learning_rate": 4.862486317435497e-05, "loss": 1.1616, "step": 18100 }, { "epoch": 14.16, "learning_rate": 4.8623299452697426e-05, "loss": 1.2081, "step": 18120 }, { "epoch": 14.17, "learning_rate": 4.8621735731039874e-05, "loss": 1.1554, "step": 18140 }, { "epoch": 14.19, "learning_rate": 4.862017200938233e-05, "loss": 1.1503, "step": 18160 }, { "epoch": 14.2, "learning_rate": 4.8618608287724784e-05, "loss": 1.1661, "step": 18180 }, { "epoch": 14.22, "learning_rate": 4.8617044566067246e-05, "loss": 1.1622, "step": 18200 }, { "epoch": 14.23, "learning_rate": 4.86154808444097e-05, "loss": 1.1587, "step": 18220 }, { "epoch": 14.25, "learning_rate": 4.861391712275215e-05, "loss": 1.1371, "step": 18240 }, { "epoch": 14.27, "learning_rate": 4.8612353401094604e-05, "loss": 1.1652, "step": 18260 }, { "epoch": 14.28, "learning_rate": 4.8610789679437066e-05, "loss": 1.1833, "step": 18280 }, { "epoch": 14.3, "learning_rate": 4.860922595777952e-05, "loss": 1.1738, "step": 18300 }, { "epoch": 14.31, "learning_rate": 4.860766223612197e-05, "loss": 1.1846, "step": 18320 }, { "epoch": 14.33, "learning_rate": 4.8606098514464424e-05, "loss": 1.1396, "step": 18340 }, { "epoch": 14.34, "learning_rate": 4.8604534792806886e-05, "loss": 1.1628, "step": 18360 }, { "epoch": 14.36, "learning_rate": 4.860297107114934e-05, "loss": 1.1034, "step": 18380 }, { "epoch": 14.38, "learning_rate": 4.8601407349491795e-05, "loss": 1.1421, "step": 18400 }, { "epoch": 14.39, "learning_rate": 4.8599843627834244e-05, "loss": 1.2098, "step": 18420 }, { "epoch": 14.41, "learning_rate": 4.8598279906176705e-05, "loss": 1.1358, "step": 18440 }, { "epoch": 14.42, "learning_rate": 4.859671618451916e-05, "loss": 1.1678, "step": 18460 }, { "epoch": 14.44, "learning_rate": 4.8595152462861615e-05, "loss": 1.1643, "step": 18480 }, { "epoch": 14.45, "learning_rate": 4.8593588741204064e-05, "loss": 1.1368, "step": 18500 }, { "epoch": 14.47, "learning_rate": 4.8592025019546525e-05, "loss": 1.174, "step": 18520 }, { "epoch": 14.48, "learning_rate": 4.859046129788898e-05, "loss": 1.1279, "step": 18540 }, { "epoch": 14.5, "learning_rate": 4.8588897576231435e-05, "loss": 1.1861, "step": 18560 }, { "epoch": 14.52, "learning_rate": 4.8587333854573883e-05, "loss": 1.1511, "step": 18580 }, { "epoch": 14.53, "learning_rate": 4.858577013291634e-05, "loss": 1.1681, "step": 18600 }, { "epoch": 14.55, "learning_rate": 4.85842064112588e-05, "loss": 1.1565, "step": 18620 }, { "epoch": 14.56, "learning_rate": 4.8582642689601255e-05, "loss": 1.1347, "step": 18640 }, { "epoch": 14.58, "learning_rate": 4.858107896794371e-05, "loss": 1.1777, "step": 18660 }, { "epoch": 14.59, "learning_rate": 4.857951524628616e-05, "loss": 1.1596, "step": 18680 }, { "epoch": 14.61, "learning_rate": 4.857795152462862e-05, "loss": 1.133, "step": 18700 }, { "epoch": 14.62, "learning_rate": 4.8576387802971075e-05, "loss": 1.2194, "step": 18720 }, { "epoch": 14.64, "learning_rate": 4.857482408131353e-05, "loss": 1.1124, "step": 18740 }, { "epoch": 14.66, "learning_rate": 4.857326035965598e-05, "loss": 1.1767, "step": 18760 }, { "epoch": 14.67, "learning_rate": 4.857169663799844e-05, "loss": 1.1511, "step": 18780 }, { "epoch": 14.69, "learning_rate": 4.8570132916340895e-05, "loss": 1.1409, "step": 18800 }, { "epoch": 14.7, "learning_rate": 4.856856919468335e-05, "loss": 1.1719, "step": 18820 }, { "epoch": 14.72, "learning_rate": 4.8567005473025805e-05, "loss": 1.1155, "step": 18840 }, { "epoch": 14.73, "learning_rate": 4.856544175136826e-05, "loss": 1.1715, "step": 18860 }, { "epoch": 14.75, "learning_rate": 4.8563878029710715e-05, "loss": 1.1459, "step": 18880 }, { "epoch": 14.77, "learning_rate": 4.856231430805317e-05, "loss": 1.1414, "step": 18900 }, { "epoch": 14.78, "learning_rate": 4.8560750586395625e-05, "loss": 1.1647, "step": 18920 }, { "epoch": 14.8, "learning_rate": 4.855918686473808e-05, "loss": 1.1296, "step": 18940 }, { "epoch": 14.81, "learning_rate": 4.8557623143080535e-05, "loss": 1.1897, "step": 18960 }, { "epoch": 14.83, "learning_rate": 4.855605942142299e-05, "loss": 1.1533, "step": 18980 }, { "epoch": 14.84, "learning_rate": 4.8554495699765445e-05, "loss": 1.1694, "step": 19000 }, { "epoch": 14.84, "eval_cer": 0.0829, "eval_loss": 0.19008716940879822, "eval_runtime": 246.2181, "eval_samples_per_second": 15.385, "eval_steps_per_second": 0.483, "eval_wer": 0.3929, "step": 19000 }, { "epoch": 14.86, "learning_rate": 4.85529319781079e-05, "loss": 1.2248, "step": 19020 }, { "epoch": 14.88, "learning_rate": 4.8551368256450355e-05, "loss": 1.1043, "step": 19040 }, { "epoch": 14.89, "learning_rate": 4.854980453479281e-05, "loss": 1.1726, "step": 19060 }, { "epoch": 14.91, "learning_rate": 4.8548240813135265e-05, "loss": 1.1381, "step": 19080 }, { "epoch": 14.92, "learning_rate": 4.854667709147772e-05, "loss": 1.1395, "step": 19100 }, { "epoch": 14.94, "learning_rate": 4.8545113369820175e-05, "loss": 1.1746, "step": 19120 }, { "epoch": 14.95, "learning_rate": 4.854354964816263e-05, "loss": 1.1346, "step": 19140 }, { "epoch": 14.97, "learning_rate": 4.8541985926505084e-05, "loss": 1.2079, "step": 19160 }, { "epoch": 14.98, "learning_rate": 4.854042220484754e-05, "loss": 1.1531, "step": 19180 }, { "epoch": 15.0, "learning_rate": 4.8538858483189994e-05, "loss": 1.1763, "step": 19200 }, { "epoch": 15.02, "learning_rate": 4.853729476153245e-05, "loss": 1.1046, "step": 19220 }, { "epoch": 15.03, "learning_rate": 4.8535731039874904e-05, "loss": 1.1477, "step": 19240 }, { "epoch": 15.05, "learning_rate": 4.853416731821736e-05, "loss": 1.1154, "step": 19260 }, { "epoch": 15.06, "learning_rate": 4.8532603596559814e-05, "loss": 1.1563, "step": 19280 }, { "epoch": 15.08, "learning_rate": 4.853103987490227e-05, "loss": 1.1585, "step": 19300 }, { "epoch": 15.09, "learning_rate": 4.8529476153244724e-05, "loss": 1.1264, "step": 19320 }, { "epoch": 15.11, "learning_rate": 4.852791243158718e-05, "loss": 1.1514, "step": 19340 }, { "epoch": 15.12, "learning_rate": 4.8526348709929634e-05, "loss": 1.154, "step": 19360 }, { "epoch": 15.14, "learning_rate": 4.852478498827209e-05, "loss": 1.1311, "step": 19380 }, { "epoch": 15.16, "learning_rate": 4.8523221266614544e-05, "loss": 1.1969, "step": 19400 }, { "epoch": 15.17, "learning_rate": 4.8521657544957e-05, "loss": 1.1301, "step": 19420 }, { "epoch": 15.19, "learning_rate": 4.8520093823299454e-05, "loss": 1.19, "step": 19440 }, { "epoch": 15.2, "learning_rate": 4.8518530101641916e-05, "loss": 1.1474, "step": 19460 }, { "epoch": 15.22, "learning_rate": 4.8516966379984364e-05, "loss": 1.1537, "step": 19480 }, { "epoch": 15.23, "learning_rate": 4.851540265832682e-05, "loss": 1.1203, "step": 19500 }, { "epoch": 15.25, "learning_rate": 4.8513838936669274e-05, "loss": 1.1399, "step": 19520 }, { "epoch": 15.27, "learning_rate": 4.851227521501173e-05, "loss": 1.1511, "step": 19540 }, { "epoch": 15.28, "learning_rate": 4.8510711493354184e-05, "loss": 1.1531, "step": 19560 }, { "epoch": 15.3, "learning_rate": 4.850914777169664e-05, "loss": 1.1713, "step": 19580 }, { "epoch": 15.31, "learning_rate": 4.8507584050039094e-05, "loss": 1.1686, "step": 19600 }, { "epoch": 15.33, "learning_rate": 4.850602032838155e-05, "loss": 1.1277, "step": 19620 }, { "epoch": 15.34, "learning_rate": 4.850445660672401e-05, "loss": 1.1651, "step": 19640 }, { "epoch": 15.36, "learning_rate": 4.850289288506646e-05, "loss": 1.1556, "step": 19660 }, { "epoch": 15.38, "learning_rate": 4.8501329163408914e-05, "loss": 1.1293, "step": 19680 }, { "epoch": 15.39, "learning_rate": 4.849976544175137e-05, "loss": 1.1985, "step": 19700 }, { "epoch": 15.41, "learning_rate": 4.849820172009383e-05, "loss": 1.1221, "step": 19720 }, { "epoch": 15.42, "learning_rate": 4.849663799843628e-05, "loss": 1.2045, "step": 19740 }, { "epoch": 15.44, "learning_rate": 4.8495074276778734e-05, "loss": 1.1562, "step": 19760 }, { "epoch": 15.45, "learning_rate": 4.849351055512119e-05, "loss": 1.1498, "step": 19780 }, { "epoch": 15.47, "learning_rate": 4.849194683346365e-05, "loss": 1.1779, "step": 19800 }, { "epoch": 15.48, "learning_rate": 4.8490383111806105e-05, "loss": 1.1398, "step": 19820 }, { "epoch": 15.5, "learning_rate": 4.8488819390148554e-05, "loss": 1.1581, "step": 19840 }, { "epoch": 15.52, "learning_rate": 4.848725566849101e-05, "loss": 1.153, "step": 19860 }, { "epoch": 15.53, "learning_rate": 4.848569194683347e-05, "loss": 1.1495, "step": 19880 }, { "epoch": 15.55, "learning_rate": 4.8484128225175925e-05, "loss": 1.1831, "step": 19900 }, { "epoch": 15.56, "learning_rate": 4.8482564503518373e-05, "loss": 1.1109, "step": 19920 }, { "epoch": 15.58, "learning_rate": 4.848100078186083e-05, "loss": 1.169, "step": 19940 }, { "epoch": 15.59, "learning_rate": 4.8479437060203283e-05, "loss": 1.1777, "step": 19960 }, { "epoch": 15.61, "learning_rate": 4.8477873338545745e-05, "loss": 1.1507, "step": 19980 }, { "epoch": 15.62, "learning_rate": 4.847630961688819e-05, "loss": 1.1945, "step": 20000 }, { "epoch": 15.62, "eval_cer": 0.0775, "eval_loss": 0.18442465364933014, "eval_runtime": 240.5647, "eval_samples_per_second": 15.746, "eval_steps_per_second": 0.495, "eval_wer": 0.376, "step": 20000 }, { "epoch": 15.64, "learning_rate": 4.847474589523065e-05, "loss": 1.125, "step": 20020 }, { "epoch": 15.66, "learning_rate": 4.84731821735731e-05, "loss": 1.1647, "step": 20040 }, { "epoch": 15.67, "learning_rate": 4.8471618451915565e-05, "loss": 1.143, "step": 20060 }, { "epoch": 15.69, "learning_rate": 4.847005473025802e-05, "loss": 1.1475, "step": 20080 }, { "epoch": 15.7, "learning_rate": 4.846849100860047e-05, "loss": 1.1612, "step": 20100 }, { "epoch": 15.72, "learning_rate": 4.846692728694292e-05, "loss": 1.1428, "step": 20120 }, { "epoch": 15.73, "learning_rate": 4.8465363565285385e-05, "loss": 1.1755, "step": 20140 }, { "epoch": 15.75, "learning_rate": 4.846379984362784e-05, "loss": 1.1903, "step": 20160 }, { "epoch": 15.77, "learning_rate": 4.846223612197029e-05, "loss": 1.1589, "step": 20180 }, { "epoch": 15.78, "learning_rate": 4.846067240031274e-05, "loss": 1.182, "step": 20200 }, { "epoch": 15.8, "learning_rate": 4.8459108678655205e-05, "loss": 1.1342, "step": 20220 }, { "epoch": 15.81, "learning_rate": 4.845754495699766e-05, "loss": 1.1593, "step": 20240 }, { "epoch": 15.83, "learning_rate": 4.8455981235340115e-05, "loss": 1.1551, "step": 20260 }, { "epoch": 15.84, "learning_rate": 4.845441751368256e-05, "loss": 1.1496, "step": 20280 }, { "epoch": 15.86, "learning_rate": 4.8452853792025025e-05, "loss": 1.1702, "step": 20300 }, { "epoch": 15.88, "learning_rate": 4.845129007036748e-05, "loss": 1.1246, "step": 20320 }, { "epoch": 15.89, "learning_rate": 4.8449726348709935e-05, "loss": 1.2002, "step": 20340 }, { "epoch": 15.91, "learning_rate": 4.844816262705238e-05, "loss": 1.1657, "step": 20360 }, { "epoch": 15.92, "learning_rate": 4.844659890539484e-05, "loss": 1.1546, "step": 20380 }, { "epoch": 15.94, "learning_rate": 4.84450351837373e-05, "loss": 1.2016, "step": 20400 }, { "epoch": 15.95, "learning_rate": 4.8443471462079755e-05, "loss": 1.1471, "step": 20420 }, { "epoch": 15.97, "learning_rate": 4.844190774042221e-05, "loss": 1.1461, "step": 20440 }, { "epoch": 15.98, "learning_rate": 4.844034401876466e-05, "loss": 1.1629, "step": 20460 }, { "epoch": 16.0, "learning_rate": 4.843878029710712e-05, "loss": 1.1828, "step": 20480 }, { "epoch": 16.02, "learning_rate": 4.8437216575449574e-05, "loss": 1.1329, "step": 20500 }, { "epoch": 16.03, "learning_rate": 4.843565285379203e-05, "loss": 1.1624, "step": 20520 }, { "epoch": 16.05, "learning_rate": 4.843408913213448e-05, "loss": 1.12, "step": 20540 }, { "epoch": 16.06, "learning_rate": 4.843252541047694e-05, "loss": 1.1454, "step": 20560 }, { "epoch": 16.08, "learning_rate": 4.8430961688819394e-05, "loss": 1.1941, "step": 20580 }, { "epoch": 16.09, "learning_rate": 4.842939796716185e-05, "loss": 1.1502, "step": 20600 }, { "epoch": 16.11, "learning_rate": 4.84278342455043e-05, "loss": 1.1393, "step": 20620 }, { "epoch": 16.12, "learning_rate": 4.842627052384676e-05, "loss": 1.1612, "step": 20640 }, { "epoch": 16.14, "learning_rate": 4.8424706802189214e-05, "loss": 1.171, "step": 20660 }, { "epoch": 16.16, "learning_rate": 4.842314308053167e-05, "loss": 1.1776, "step": 20680 }, { "epoch": 16.17, "learning_rate": 4.8421579358874124e-05, "loss": 1.1385, "step": 20700 }, { "epoch": 16.19, "learning_rate": 4.842001563721658e-05, "loss": 1.1383, "step": 20720 }, { "epoch": 16.2, "learning_rate": 4.8418451915559034e-05, "loss": 1.1197, "step": 20740 }, { "epoch": 16.22, "learning_rate": 4.841688819390149e-05, "loss": 1.1815, "step": 20760 }, { "epoch": 16.23, "learning_rate": 4.8415324472243944e-05, "loss": 1.1207, "step": 20780 }, { "epoch": 16.25, "learning_rate": 4.841376075058639e-05, "loss": 1.146, "step": 20800 }, { "epoch": 16.27, "learning_rate": 4.8412197028928854e-05, "loss": 1.1393, "step": 20820 }, { "epoch": 16.28, "learning_rate": 4.841063330727131e-05, "loss": 1.1733, "step": 20840 }, { "epoch": 16.3, "learning_rate": 4.8409069585613764e-05, "loss": 1.1429, "step": 20860 }, { "epoch": 16.31, "learning_rate": 4.840750586395622e-05, "loss": 1.1457, "step": 20880 }, { "epoch": 16.33, "learning_rate": 4.8405942142298674e-05, "loss": 1.1384, "step": 20900 }, { "epoch": 16.34, "learning_rate": 4.840437842064113e-05, "loss": 1.1341, "step": 20920 }, { "epoch": 16.36, "learning_rate": 4.8402892885066456e-05, "loss": 1.1213, "step": 20940 }, { "epoch": 16.38, "learning_rate": 4.840132916340892e-05, "loss": 1.1548, "step": 20960 }, { "epoch": 16.39, "learning_rate": 4.839976544175137e-05, "loss": 1.222, "step": 20980 }, { "epoch": 16.41, "learning_rate": 4.839820172009383e-05, "loss": 1.1319, "step": 21000 }, { "epoch": 16.41, "eval_cer": 0.084, "eval_loss": 0.18227259814739227, "eval_runtime": 244.2989, "eval_samples_per_second": 15.506, "eval_steps_per_second": 0.487, "eval_wer": 0.3982, "step": 21000 }, { "epoch": 16.42, "learning_rate": 4.8396637998436276e-05, "loss": 1.1107, "step": 21020 }, { "epoch": 16.44, "learning_rate": 4.839507427677874e-05, "loss": 1.1529, "step": 21040 }, { "epoch": 16.45, "learning_rate": 4.839351055512119e-05, "loss": 1.1631, "step": 21060 }, { "epoch": 16.47, "learning_rate": 4.839194683346365e-05, "loss": 1.1938, "step": 21080 }, { "epoch": 16.48, "learning_rate": 4.83903831118061e-05, "loss": 1.1445, "step": 21100 }, { "epoch": 16.5, "learning_rate": 4.838881939014855e-05, "loss": 1.1876, "step": 21120 }, { "epoch": 16.52, "learning_rate": 4.838725566849101e-05, "loss": 1.1768, "step": 21140 }, { "epoch": 16.53, "learning_rate": 4.838569194683347e-05, "loss": 1.1804, "step": 21160 }, { "epoch": 16.55, "learning_rate": 4.838412822517592e-05, "loss": 1.1554, "step": 21180 }, { "epoch": 16.56, "learning_rate": 4.838256450351837e-05, "loss": 1.1142, "step": 21200 }, { "epoch": 16.58, "learning_rate": 4.838100078186083e-05, "loss": 1.1522, "step": 21220 }, { "epoch": 16.59, "learning_rate": 4.837943706020329e-05, "loss": 1.1725, "step": 21240 }, { "epoch": 16.61, "learning_rate": 4.837787333854574e-05, "loss": 1.1762, "step": 21260 }, { "epoch": 16.62, "learning_rate": 4.837630961688819e-05, "loss": 1.1931, "step": 21280 }, { "epoch": 16.64, "learning_rate": 4.837474589523065e-05, "loss": 1.1316, "step": 21300 }, { "epoch": 16.66, "learning_rate": 4.837318217357311e-05, "loss": 1.1951, "step": 21320 }, { "epoch": 16.67, "learning_rate": 4.837161845191556e-05, "loss": 1.1435, "step": 21340 }, { "epoch": 16.69, "learning_rate": 4.837005473025802e-05, "loss": 1.1277, "step": 21360 }, { "epoch": 16.7, "learning_rate": 4.836849100860047e-05, "loss": 1.146, "step": 21380 }, { "epoch": 16.72, "learning_rate": 4.836692728694293e-05, "loss": 1.135, "step": 21400 }, { "epoch": 16.73, "learning_rate": 4.836536356528538e-05, "loss": 1.1617, "step": 21420 }, { "epoch": 16.75, "learning_rate": 4.836379984362784e-05, "loss": 1.1334, "step": 21440 }, { "epoch": 16.77, "learning_rate": 4.836223612197029e-05, "loss": 1.1331, "step": 21460 }, { "epoch": 16.78, "learning_rate": 4.836067240031275e-05, "loss": 1.1421, "step": 21480 }, { "epoch": 16.8, "learning_rate": 4.83591086786552e-05, "loss": 1.1451, "step": 21500 }, { "epoch": 16.81, "learning_rate": 4.835754495699766e-05, "loss": 1.1886, "step": 21520 }, { "epoch": 16.83, "learning_rate": 4.835598123534011e-05, "loss": 1.1163, "step": 21540 }, { "epoch": 16.84, "learning_rate": 4.835441751368257e-05, "loss": 1.1493, "step": 21560 }, { "epoch": 16.86, "learning_rate": 4.835285379202502e-05, "loss": 1.1823, "step": 21580 }, { "epoch": 16.88, "learning_rate": 4.835129007036748e-05, "loss": 1.1318, "step": 21600 }, { "epoch": 16.89, "learning_rate": 4.834972634870993e-05, "loss": 1.1867, "step": 21620 }, { "epoch": 16.91, "learning_rate": 4.834816262705239e-05, "loss": 1.1309, "step": 21640 }, { "epoch": 16.92, "learning_rate": 4.834659890539484e-05, "loss": 1.1501, "step": 21660 }, { "epoch": 16.94, "learning_rate": 4.83450351837373e-05, "loss": 1.204, "step": 21680 }, { "epoch": 16.95, "learning_rate": 4.834347146207975e-05, "loss": 1.1156, "step": 21700 }, { "epoch": 16.97, "learning_rate": 4.834190774042221e-05, "loss": 1.209, "step": 21720 }, { "epoch": 16.98, "learning_rate": 4.834034401876466e-05, "loss": 1.1512, "step": 21740 }, { "epoch": 17.0, "learning_rate": 4.833878029710712e-05, "loss": 1.1769, "step": 21760 }, { "epoch": 17.02, "learning_rate": 4.833721657544957e-05, "loss": 1.1215, "step": 21780 }, { "epoch": 17.03, "learning_rate": 4.833565285379203e-05, "loss": 1.1486, "step": 21800 }, { "epoch": 17.05, "learning_rate": 4.833408913213448e-05, "loss": 1.1195, "step": 21820 }, { "epoch": 17.06, "learning_rate": 4.833252541047694e-05, "loss": 1.142, "step": 21840 }, { "epoch": 17.08, "learning_rate": 4.833096168881939e-05, "loss": 1.1703, "step": 21860 }, { "epoch": 17.09, "learning_rate": 4.832939796716185e-05, "loss": 1.1266, "step": 21880 }, { "epoch": 17.11, "learning_rate": 4.83278342455043e-05, "loss": 1.1735, "step": 21900 }, { "epoch": 17.12, "learning_rate": 4.832627052384676e-05, "loss": 1.1406, "step": 21920 }, { "epoch": 17.14, "learning_rate": 4.832470680218921e-05, "loss": 1.1208, "step": 21940 }, { "epoch": 17.16, "learning_rate": 4.832314308053167e-05, "loss": 1.2007, "step": 21960 }, { "epoch": 17.17, "learning_rate": 4.832157935887412e-05, "loss": 1.1268, "step": 21980 }, { "epoch": 17.19, "learning_rate": 4.832001563721658e-05, "loss": 1.1404, "step": 22000 }, { "epoch": 17.19, "eval_cer": 0.0867, "eval_loss": 0.1880631446838379, "eval_runtime": 241.4865, "eval_samples_per_second": 15.686, "eval_steps_per_second": 0.493, "eval_wer": 0.4047, "step": 22000 } ], "max_steps": 640000, "num_train_epochs": 500, "total_flos": 1.0148810152762456e+20, "trial_name": null, "trial_params": null }