diff --git "a/trainer_state.json" "b/trainer_state.json" --- "a/trainer_state.json" +++ "b/trainer_state.json" @@ -1,8 +1,8 @@ { "best_metric": null, "best_model_checkpoint": null, - "epoch": 24.146917358985572, - "global_step": 27600, + "epoch": 39.982072584171405, + "global_step": 45700, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, @@ -17124,11 +17124,11231 @@ "eval_runtime": 1390.8693, "eval_samples_per_second": 6.298, "step": 27600 + }, + { + "epoch": 24.16, + "learning_rate": 0.00012041223404255319, + "loss": 0.3487, + "step": 27610 + }, + { + "epoch": 24.16, + "learning_rate": 0.00012034574468085106, + "loss": 0.366, + "step": 27620 + }, + { + "epoch": 24.17, + "learning_rate": 0.00012027925531914893, + "loss": 0.2586, + "step": 27630 + }, + { + "epoch": 24.18, + "learning_rate": 0.00012021276595744681, + "loss": 0.3973, + "step": 27640 + }, + { + "epoch": 24.19, + "learning_rate": 0.00012014627659574468, + "loss": 0.2663, + "step": 27650 + }, + { + "epoch": 24.2, + "learning_rate": 0.00012007978723404253, + "loss": 0.3069, + "step": 27660 + }, + { + "epoch": 24.21, + "learning_rate": 0.0001200132978723404, + "loss": 0.365, + "step": 27670 + }, + { + "epoch": 24.22, + "learning_rate": 0.00011994680851063829, + "loss": 0.2283, + "step": 27680 + }, + { + "epoch": 24.23, + "learning_rate": 0.00011988031914893616, + "loss": 0.3685, + "step": 27690 + }, + { + "epoch": 24.23, + "learning_rate": 0.00011981382978723403, + "loss": 0.2769, + "step": 27700 + }, + { + "epoch": 24.24, + "learning_rate": 0.0001197473404255319, + "loss": 0.3237, + "step": 27710 + }, + { + "epoch": 24.25, + "learning_rate": 0.00011968085106382978, + "loss": 0.3313, + "step": 27720 + }, + { + "epoch": 24.26, + "learning_rate": 0.00011961436170212765, + "loss": 0.2045, + "step": 27730 + }, + { + "epoch": 24.27, + "learning_rate": 0.00011954787234042552, + "loss": 0.3746, + "step": 27740 + }, + { + "epoch": 24.28, + "learning_rate": 0.00011948138297872339, + "loss": 0.2782, + "step": 27750 + }, + { + "epoch": 24.29, + "learning_rate": 0.00011941489361702127, + "loss": 0.2805, + "step": 27760 + }, + { + "epoch": 24.3, + "learning_rate": 0.00011934840425531914, + "loss": 0.3367, + "step": 27770 + }, + { + "epoch": 24.3, + "learning_rate": 0.00011928191489361701, + "loss": 0.2286, + "step": 27780 + }, + { + "epoch": 24.31, + "learning_rate": 0.00011921542553191488, + "loss": 0.3823, + "step": 27790 + }, + { + "epoch": 24.32, + "learning_rate": 0.00011914893617021277, + "loss": 0.2959, + "step": 27800 + }, + { + "epoch": 24.33, + "learning_rate": 0.00011908244680851064, + "loss": 0.3402, + "step": 27810 + }, + { + "epoch": 24.34, + "learning_rate": 0.0001190159574468085, + "loss": 0.4104, + "step": 27820 + }, + { + "epoch": 24.35, + "learning_rate": 0.00011894946808510638, + "loss": 0.235, + "step": 27830 + }, + { + "epoch": 24.36, + "learning_rate": 0.00011888297872340423, + "loss": 0.3524, + "step": 27840 + }, + { + "epoch": 24.37, + "learning_rate": 0.00011881648936170212, + "loss": 0.2977, + "step": 27850 + }, + { + "epoch": 24.37, + "learning_rate": 0.00011874999999999999, + "loss": 0.3181, + "step": 27860 + }, + { + "epoch": 24.38, + "learning_rate": 0.00011868351063829786, + "loss": 0.3665, + "step": 27870 + }, + { + "epoch": 24.39, + "learning_rate": 0.00011861702127659573, + "loss": 0.2661, + "step": 27880 + }, + { + "epoch": 24.4, + "learning_rate": 0.00011855053191489361, + "loss": 0.3731, + "step": 27890 + }, + { + "epoch": 24.41, + "learning_rate": 0.00011848404255319148, + "loss": 0.2666, + "step": 27900 + }, + { + "epoch": 24.42, + "learning_rate": 0.00011841755319148935, + "loss": 0.3244, + "step": 27910 + }, + { + "epoch": 24.43, + "learning_rate": 0.00011835106382978722, + "loss": 0.3023, + "step": 27920 + }, + { + "epoch": 24.44, + "learning_rate": 0.0001182845744680851, + "loss": 0.2821, + "step": 27930 + }, + { + "epoch": 24.44, + "learning_rate": 0.00011821808510638297, + "loss": 0.3681, + "step": 27940 + }, + { + "epoch": 24.45, + "learning_rate": 0.00011815159574468084, + "loss": 0.2815, + "step": 27950 + }, + { + "epoch": 24.46, + "learning_rate": 0.00011808510638297871, + "loss": 0.3543, + "step": 27960 + }, + { + "epoch": 24.47, + "learning_rate": 0.0001180186170212766, + "loss": 0.3648, + "step": 27970 + }, + { + "epoch": 24.48, + "learning_rate": 0.00011795212765957447, + "loss": 0.2333, + "step": 27980 + }, + { + "epoch": 24.49, + "learning_rate": 0.00011788563829787234, + "loss": 0.3323, + "step": 27990 + }, + { + "epoch": 24.5, + "learning_rate": 0.0001178191489361702, + "loss": 0.2663, + "step": 28000 + }, + { + "epoch": 24.51, + "learning_rate": 0.00011775265957446806, + "loss": 0.315, + "step": 28010 + }, + { + "epoch": 24.51, + "learning_rate": 0.00011768617021276594, + "loss": 0.3894, + "step": 28020 + }, + { + "epoch": 24.52, + "learning_rate": 0.00011761968085106381, + "loss": 0.2131, + "step": 28030 + }, + { + "epoch": 24.53, + "learning_rate": 0.00011755319148936168, + "loss": 0.3683, + "step": 28040 + }, + { + "epoch": 24.54, + "learning_rate": 0.00011748670212765955, + "loss": 0.3299, + "step": 28050 + }, + { + "epoch": 24.55, + "learning_rate": 0.00011742021276595744, + "loss": 0.3791, + "step": 28060 + }, + { + "epoch": 24.56, + "learning_rate": 0.00011735372340425531, + "loss": 0.316, + "step": 28070 + }, + { + "epoch": 24.57, + "learning_rate": 0.00011728723404255318, + "loss": 0.1813, + "step": 28080 + }, + { + "epoch": 24.58, + "learning_rate": 0.00011722074468085105, + "loss": 0.4137, + "step": 28090 + }, + { + "epoch": 24.58, + "learning_rate": 0.00011715425531914893, + "loss": 0.339, + "step": 28100 + }, + { + "epoch": 24.59, + "learning_rate": 0.0001170877659574468, + "loss": 0.3131, + "step": 28110 + }, + { + "epoch": 24.6, + "learning_rate": 0.00011702127659574467, + "loss": 0.3275, + "step": 28120 + }, + { + "epoch": 24.61, + "learning_rate": 0.00011695478723404254, + "loss": 0.2415, + "step": 28130 + }, + { + "epoch": 24.62, + "learning_rate": 0.00011688829787234042, + "loss": 0.3616, + "step": 28140 + }, + { + "epoch": 24.63, + "learning_rate": 0.0001168218085106383, + "loss": 0.2763, + "step": 28150 + }, + { + "epoch": 24.64, + "learning_rate": 0.00011675531914893616, + "loss": 0.322, + "step": 28160 + }, + { + "epoch": 24.65, + "learning_rate": 0.00011668882978723403, + "loss": 0.3409, + "step": 28170 + }, + { + "epoch": 24.65, + "learning_rate": 0.00011662234042553192, + "loss": 0.2211, + "step": 28180 + }, + { + "epoch": 24.66, + "learning_rate": 0.00011655585106382977, + "loss": 0.3776, + "step": 28190 + }, + { + "epoch": 24.67, + "learning_rate": 0.00011648936170212764, + "loss": 0.222, + "step": 28200 + }, + { + "epoch": 24.67, + "eval_cer1": 0.26410317004827655, + "eval_cer2": 0.24482362592288762, + "eval_cer3": 0.22005880431231623, + "eval_cer4": 0.22228661579574358, + "eval_cer5": 0.2461995753715499, + "eval_loss": 1.0298795700073242, + "eval_runtime": 1393.0381, + "eval_samples_per_second": 6.288, + "step": 28200 + }, + { + "epoch": 24.68, + "learning_rate": 0.00011642287234042551, + "loss": 0.2923, + "step": 28210 + }, + { + "epoch": 24.69, + "learning_rate": 0.00011635638297872338, + "loss": 0.3683, + "step": 28220 + }, + { + "epoch": 24.7, + "learning_rate": 0.00011628989361702127, + "loss": 0.2434, + "step": 28230 + }, + { + "epoch": 24.71, + "learning_rate": 0.00011622340425531914, + "loss": 0.4182, + "step": 28240 + }, + { + "epoch": 24.72, + "learning_rate": 0.000116156914893617, + "loss": 0.2704, + "step": 28250 + }, + { + "epoch": 24.72, + "learning_rate": 0.00011609042553191489, + "loss": 0.3601, + "step": 28260 + }, + { + "epoch": 24.73, + "learning_rate": 0.00011602393617021276, + "loss": 0.3556, + "step": 28270 + }, + { + "epoch": 24.74, + "learning_rate": 0.00011595744680851063, + "loss": 0.3134, + "step": 28280 + }, + { + "epoch": 24.75, + "learning_rate": 0.0001158909574468085, + "loss": 0.3979, + "step": 28290 + }, + { + "epoch": 24.76, + "learning_rate": 0.00011582446808510638, + "loss": 0.3138, + "step": 28300 + }, + { + "epoch": 24.77, + "learning_rate": 0.00011575797872340425, + "loss": 0.313, + "step": 28310 + }, + { + "epoch": 24.78, + "learning_rate": 0.00011569148936170212, + "loss": 0.4034, + "step": 28320 + }, + { + "epoch": 24.79, + "learning_rate": 0.00011562499999999999, + "loss": 0.2587, + "step": 28330 + }, + { + "epoch": 24.79, + "learning_rate": 0.00011555851063829787, + "loss": 0.424, + "step": 28340 + }, + { + "epoch": 24.8, + "learning_rate": 0.00011549202127659574, + "loss": 0.2582, + "step": 28350 + }, + { + "epoch": 24.81, + "learning_rate": 0.0001154255319148936, + "loss": 0.3311, + "step": 28360 + }, + { + "epoch": 24.82, + "learning_rate": 0.00011535904255319147, + "loss": 0.3179, + "step": 28370 + }, + { + "epoch": 24.83, + "learning_rate": 0.00011529255319148934, + "loss": 0.2749, + "step": 28380 + }, + { + "epoch": 24.84, + "learning_rate": 0.00011522606382978722, + "loss": 0.3305, + "step": 28390 + }, + { + "epoch": 24.85, + "learning_rate": 0.0001151595744680851, + "loss": 0.2761, + "step": 28400 + }, + { + "epoch": 24.86, + "learning_rate": 0.00011509308510638296, + "loss": 0.3303, + "step": 28410 + }, + { + "epoch": 24.86, + "learning_rate": 0.00011502659574468083, + "loss": 0.3448, + "step": 28420 + }, + { + "epoch": 24.87, + "learning_rate": 0.00011496010638297872, + "loss": 0.2466, + "step": 28430 + }, + { + "epoch": 24.88, + "learning_rate": 0.00011489361702127659, + "loss": 0.3966, + "step": 28440 + }, + { + "epoch": 24.89, + "learning_rate": 0.00011482712765957446, + "loss": 0.3506, + "step": 28450 + }, + { + "epoch": 24.9, + "learning_rate": 0.00011476063829787233, + "loss": 0.3235, + "step": 28460 + }, + { + "epoch": 24.91, + "learning_rate": 0.00011469414893617021, + "loss": 0.3684, + "step": 28470 + }, + { + "epoch": 24.92, + "learning_rate": 0.00011462765957446808, + "loss": 0.2624, + "step": 28480 + }, + { + "epoch": 24.93, + "learning_rate": 0.00011456117021276595, + "loss": 0.3806, + "step": 28490 + }, + { + "epoch": 24.93, + "learning_rate": 0.00011449468085106382, + "loss": 0.3107, + "step": 28500 + }, + { + "epoch": 24.94, + "learning_rate": 0.0001144281914893617, + "loss": 0.3286, + "step": 28510 + }, + { + "epoch": 24.95, + "learning_rate": 0.00011436170212765957, + "loss": 0.3494, + "step": 28520 + }, + { + "epoch": 24.96, + "learning_rate": 0.00011429521276595744, + "loss": 0.2631, + "step": 28530 + }, + { + "epoch": 24.97, + "learning_rate": 0.0001142287234042553, + "loss": 0.4061, + "step": 28540 + }, + { + "epoch": 24.98, + "learning_rate": 0.00011416223404255317, + "loss": 0.338, + "step": 28550 + }, + { + "epoch": 24.99, + "learning_rate": 0.00011409574468085105, + "loss": 0.3178, + "step": 28560 + }, + { + "epoch": 25.0, + "learning_rate": 0.00011402925531914892, + "loss": 0.3179, + "step": 28570 + }, + { + "epoch": 25.0, + "learning_rate": 0.00011396276595744679, + "loss": 0.385, + "step": 28580 + }, + { + "epoch": 25.01, + "learning_rate": 0.00011389627659574466, + "loss": 0.2982, + "step": 28590 + }, + { + "epoch": 25.02, + "learning_rate": 0.00011382978723404255, + "loss": 0.2012, + "step": 28600 + }, + { + "epoch": 25.03, + "learning_rate": 0.00011376329787234042, + "loss": 0.3847, + "step": 28610 + }, + { + "epoch": 25.04, + "learning_rate": 0.00011369680851063829, + "loss": 0.2064, + "step": 28620 + }, + { + "epoch": 25.05, + "learning_rate": 0.00011363031914893616, + "loss": 0.3712, + "step": 28630 + }, + { + "epoch": 25.06, + "learning_rate": 0.00011356382978723404, + "loss": 0.2774, + "step": 28640 + }, + { + "epoch": 25.07, + "learning_rate": 0.00011349734042553191, + "loss": 0.2524, + "step": 28650 + }, + { + "epoch": 25.07, + "learning_rate": 0.00011343085106382978, + "loss": 0.3973, + "step": 28660 + }, + { + "epoch": 25.08, + "learning_rate": 0.00011336436170212765, + "loss": 0.3135, + "step": 28670 + }, + { + "epoch": 25.09, + "learning_rate": 0.00011329787234042553, + "loss": 0.3289, + "step": 28680 + }, + { + "epoch": 25.1, + "learning_rate": 0.0001132313829787234, + "loss": 0.3378, + "step": 28690 + }, + { + "epoch": 25.11, + "learning_rate": 0.00011316489361702127, + "loss": 0.2178, + "step": 28700 + }, + { + "epoch": 25.12, + "learning_rate": 0.00011309840425531914, + "loss": 0.3284, + "step": 28710 + }, + { + "epoch": 25.13, + "learning_rate": 0.000113031914893617, + "loss": 0.2575, + "step": 28720 + }, + { + "epoch": 25.14, + "learning_rate": 0.00011296542553191488, + "loss": 0.2954, + "step": 28730 + }, + { + "epoch": 25.14, + "learning_rate": 0.00011289893617021275, + "loss": 0.3236, + "step": 28740 + }, + { + "epoch": 25.15, + "learning_rate": 0.00011283244680851062, + "loss": 0.2868, + "step": 28750 + }, + { + "epoch": 25.16, + "learning_rate": 0.00011276595744680849, + "loss": 0.3504, + "step": 28760 + }, + { + "epoch": 25.17, + "learning_rate": 0.00011269946808510637, + "loss": 0.2782, + "step": 28770 + }, + { + "epoch": 25.18, + "learning_rate": 0.00011263297872340424, + "loss": 0.3037, + "step": 28780 + }, + { + "epoch": 25.19, + "learning_rate": 0.00011256648936170211, + "loss": 0.301, + "step": 28790 + }, + { + "epoch": 25.2, + "learning_rate": 0.0001125, + "loss": 0.1542, + "step": 28800 + }, + { + "epoch": 25.2, + "eval_cer1": 0.2662300394990041, + "eval_cer2": 0.2460377358490566, + "eval_cer3": 0.22182293368180334, + "eval_cer4": 0.22531311375124763, + "eval_cer5": 0.2511252653927813, + "eval_loss": 1.031542420387268, + "eval_runtime": 1388.9896, + "eval_samples_per_second": 6.307, + "step": 28800 + }, + { + "epoch": 25.21, + "learning_rate": 0.00011243351063829787, + "loss": 0.3888, + "step": 28810 + }, + { + "epoch": 25.21, + "learning_rate": 0.00011236702127659574, + "loss": 0.2533, + "step": 28820 + }, + { + "epoch": 25.22, + "learning_rate": 0.0001123005319148936, + "loss": 0.2479, + "step": 28830 + }, + { + "epoch": 25.23, + "learning_rate": 0.00011223404255319149, + "loss": 0.3047, + "step": 28840 + }, + { + "epoch": 25.24, + "learning_rate": 0.00011216755319148936, + "loss": 0.2549, + "step": 28850 + }, + { + "epoch": 25.25, + "learning_rate": 0.00011210106382978723, + "loss": 0.3615, + "step": 28860 + }, + { + "epoch": 25.26, + "learning_rate": 0.0001120345744680851, + "loss": 0.2239, + "step": 28870 + }, + { + "epoch": 25.27, + "learning_rate": 0.00011196808510638298, + "loss": 0.3013, + "step": 28880 + }, + { + "epoch": 25.28, + "learning_rate": 0.00011190159574468084, + "loss": 0.3175, + "step": 28890 + }, + { + "epoch": 25.28, + "learning_rate": 0.00011183510638297871, + "loss": 0.2417, + "step": 28900 + }, + { + "epoch": 25.29, + "learning_rate": 0.00011176861702127658, + "loss": 0.3697, + "step": 28910 + }, + { + "epoch": 25.3, + "learning_rate": 0.00011170212765957445, + "loss": 0.212, + "step": 28920 + }, + { + "epoch": 25.31, + "learning_rate": 0.00011163563829787233, + "loss": 0.2745, + "step": 28930 + }, + { + "epoch": 25.32, + "learning_rate": 0.0001115691489361702, + "loss": 0.2807, + "step": 28940 + }, + { + "epoch": 25.33, + "learning_rate": 0.00011150265957446807, + "loss": 0.2511, + "step": 28950 + }, + { + "epoch": 25.34, + "learning_rate": 0.00011143617021276594, + "loss": 0.3959, + "step": 28960 + }, + { + "epoch": 25.35, + "learning_rate": 0.00011136968085106383, + "loss": 0.2386, + "step": 28970 + }, + { + "epoch": 25.35, + "learning_rate": 0.0001113031914893617, + "loss": 0.298, + "step": 28980 + }, + { + "epoch": 25.36, + "learning_rate": 0.00011123670212765956, + "loss": 0.2845, + "step": 28990 + }, + { + "epoch": 25.37, + "learning_rate": 0.00011117021276595743, + "loss": 0.2314, + "step": 29000 + }, + { + "epoch": 25.38, + "learning_rate": 0.00011110372340425532, + "loss": 0.3337, + "step": 29010 + }, + { + "epoch": 25.39, + "learning_rate": 0.00011103723404255319, + "loss": 0.2058, + "step": 29020 + }, + { + "epoch": 25.4, + "learning_rate": 0.00011097074468085106, + "loss": 0.321, + "step": 29030 + }, + { + "epoch": 25.41, + "learning_rate": 0.00011090425531914893, + "loss": 0.2684, + "step": 29040 + }, + { + "epoch": 25.42, + "learning_rate": 0.00011083776595744681, + "loss": 0.2413, + "step": 29050 + }, + { + "epoch": 25.42, + "learning_rate": 0.00011077127659574468, + "loss": 0.3861, + "step": 29060 + }, + { + "epoch": 25.43, + "learning_rate": 0.00011070478723404254, + "loss": 0.2986, + "step": 29070 + }, + { + "epoch": 25.44, + "learning_rate": 0.00011063829787234041, + "loss": 0.3379, + "step": 29080 + }, + { + "epoch": 25.45, + "learning_rate": 0.00011057180851063828, + "loss": 0.3142, + "step": 29090 + }, + { + "epoch": 25.46, + "learning_rate": 0.00011050531914893616, + "loss": 0.2539, + "step": 29100 + }, + { + "epoch": 25.47, + "learning_rate": 0.00011043882978723403, + "loss": 0.3516, + "step": 29110 + }, + { + "epoch": 25.48, + "learning_rate": 0.0001103723404255319, + "loss": 0.2485, + "step": 29120 + }, + { + "epoch": 25.49, + "learning_rate": 0.00011030585106382977, + "loss": 0.3034, + "step": 29130 + }, + { + "epoch": 25.49, + "learning_rate": 0.00011023936170212765, + "loss": 0.277, + "step": 29140 + }, + { + "epoch": 25.5, + "learning_rate": 0.00011017287234042552, + "loss": 0.2316, + "step": 29150 + }, + { + "epoch": 25.51, + "learning_rate": 0.00011010638297872339, + "loss": 0.4195, + "step": 29160 + }, + { + "epoch": 25.52, + "learning_rate": 0.00011003989361702126, + "loss": 0.23, + "step": 29170 + }, + { + "epoch": 25.53, + "learning_rate": 0.00010997340425531915, + "loss": 0.2978, + "step": 29180 + }, + { + "epoch": 25.54, + "learning_rate": 0.00010990691489361702, + "loss": 0.3391, + "step": 29190 + }, + { + "epoch": 25.55, + "learning_rate": 0.00010984042553191489, + "loss": 0.1991, + "step": 29200 + }, + { + "epoch": 25.56, + "learning_rate": 0.00010977393617021276, + "loss": 0.3993, + "step": 29210 + }, + { + "epoch": 25.56, + "learning_rate": 0.00010970744680851064, + "loss": 0.2638, + "step": 29220 + }, + { + "epoch": 25.57, + "learning_rate": 0.00010964095744680851, + "loss": 0.3625, + "step": 29230 + }, + { + "epoch": 25.58, + "learning_rate": 0.00010957446808510638, + "loss": 0.3122, + "step": 29240 + }, + { + "epoch": 25.59, + "learning_rate": 0.00010950797872340424, + "loss": 0.2126, + "step": 29250 + }, + { + "epoch": 25.6, + "learning_rate": 0.0001094414893617021, + "loss": 0.406, + "step": 29260 + }, + { + "epoch": 25.61, + "learning_rate": 0.00010937499999999999, + "loss": 0.2267, + "step": 29270 + }, + { + "epoch": 25.62, + "learning_rate": 0.00010930851063829786, + "loss": 0.3175, + "step": 29280 + }, + { + "epoch": 25.63, + "learning_rate": 0.00010924202127659573, + "loss": 0.3189, + "step": 29290 + }, + { + "epoch": 25.63, + "learning_rate": 0.0001091755319148936, + "loss": 0.257, + "step": 29300 + }, + { + "epoch": 25.64, + "learning_rate": 0.00010910904255319148, + "loss": 0.4239, + "step": 29310 + }, + { + "epoch": 25.65, + "learning_rate": 0.00010904255319148935, + "loss": 0.2385, + "step": 29320 + }, + { + "epoch": 25.66, + "learning_rate": 0.00010897606382978722, + "loss": 0.3217, + "step": 29330 + }, + { + "epoch": 25.67, + "learning_rate": 0.00010890957446808509, + "loss": 0.3226, + "step": 29340 + }, + { + "epoch": 25.68, + "learning_rate": 0.00010884308510638297, + "loss": 0.2415, + "step": 29350 + }, + { + "epoch": 25.69, + "learning_rate": 0.00010877659574468084, + "loss": 0.3817, + "step": 29360 + }, + { + "epoch": 25.7, + "learning_rate": 0.00010871010638297871, + "loss": 0.2583, + "step": 29370 + }, + { + "epoch": 25.7, + "learning_rate": 0.0001086436170212766, + "loss": 0.2834, + "step": 29380 + }, + { + "epoch": 25.71, + "learning_rate": 0.00010857712765957447, + "loss": 0.2794, + "step": 29390 + }, + { + "epoch": 25.72, + "learning_rate": 0.00010851063829787234, + "loss": 0.1729, + "step": 29400 + }, + { + "epoch": 25.72, + "eval_cer1": 0.267681712298707, + "eval_cer2": 0.24278917145200984, + "eval_cer3": 0.22316236524011762, + "eval_cer4": 0.22119192504588042, + "eval_cer5": 0.24900212314225054, + "eval_loss": 1.0280529260635376, + "eval_runtime": 1436.5418, + "eval_samples_per_second": 6.098, + "step": 29400 + }, + { + "epoch": 25.73, + "learning_rate": 0.00010844414893617021, + "loss": 0.3493, + "step": 29410 + }, + { + "epoch": 25.74, + "learning_rate": 0.00010837765957446806, + "loss": 0.2696, + "step": 29420 + }, + { + "epoch": 25.75, + "learning_rate": 0.00010831117021276595, + "loss": 0.3302, + "step": 29430 + }, + { + "epoch": 25.76, + "learning_rate": 0.00010824468085106382, + "loss": 0.2726, + "step": 29440 + }, + { + "epoch": 25.77, + "learning_rate": 0.00010817819148936169, + "loss": 0.2387, + "step": 29450 + }, + { + "epoch": 25.77, + "learning_rate": 0.00010811170212765956, + "loss": 0.3647, + "step": 29460 + }, + { + "epoch": 25.78, + "learning_rate": 0.00010804521276595744, + "loss": 0.2755, + "step": 29470 + }, + { + "epoch": 25.79, + "learning_rate": 0.00010797872340425531, + "loss": 0.3482, + "step": 29480 + }, + { + "epoch": 25.8, + "learning_rate": 0.00010791223404255318, + "loss": 0.2567, + "step": 29490 + }, + { + "epoch": 25.81, + "learning_rate": 0.00010784574468085105, + "loss": 0.2231, + "step": 29500 + }, + { + "epoch": 25.82, + "learning_rate": 0.00010777925531914893, + "loss": 0.3515, + "step": 29510 + }, + { + "epoch": 25.83, + "learning_rate": 0.0001077127659574468, + "loss": 0.2851, + "step": 29520 + }, + { + "epoch": 25.84, + "learning_rate": 0.00010764627659574467, + "loss": 0.3146, + "step": 29530 + }, + { + "epoch": 25.84, + "learning_rate": 0.00010757978723404254, + "loss": 0.2861, + "step": 29540 + }, + { + "epoch": 25.85, + "learning_rate": 0.00010751329787234043, + "loss": 0.2163, + "step": 29550 + }, + { + "epoch": 25.86, + "learning_rate": 0.0001074468085106383, + "loss": 0.4086, + "step": 29560 + }, + { + "epoch": 25.87, + "learning_rate": 0.00010738031914893617, + "loss": 0.2442, + "step": 29570 + }, + { + "epoch": 25.88, + "learning_rate": 0.00010731382978723404, + "loss": 0.3528, + "step": 29580 + }, + { + "epoch": 25.89, + "learning_rate": 0.00010724734042553192, + "loss": 0.3322, + "step": 29590 + }, + { + "epoch": 25.9, + "learning_rate": 0.00010718085106382978, + "loss": 0.2295, + "step": 29600 + }, + { + "epoch": 25.91, + "learning_rate": 0.00010711436170212765, + "loss": 0.4222, + "step": 29610 + }, + { + "epoch": 25.91, + "learning_rate": 0.00010704787234042552, + "loss": 0.3143, + "step": 29620 + }, + { + "epoch": 25.92, + "learning_rate": 0.00010698138297872338, + "loss": 0.3276, + "step": 29630 + }, + { + "epoch": 25.93, + "learning_rate": 0.00010691489361702127, + "loss": 0.3264, + "step": 29640 + }, + { + "epoch": 25.94, + "learning_rate": 0.00010684840425531914, + "loss": 0.2424, + "step": 29650 + }, + { + "epoch": 25.95, + "learning_rate": 0.00010678191489361701, + "loss": 0.4745, + "step": 29660 + }, + { + "epoch": 25.96, + "learning_rate": 0.00010671542553191488, + "loss": 0.2372, + "step": 29670 + }, + { + "epoch": 25.97, + "learning_rate": 0.00010664893617021276, + "loss": 0.3653, + "step": 29680 + }, + { + "epoch": 25.98, + "learning_rate": 0.00010658244680851063, + "loss": 0.3214, + "step": 29690 + }, + { + "epoch": 25.98, + "learning_rate": 0.0001065159574468085, + "loss": 0.2353, + "step": 29700 + }, + { + "epoch": 25.99, + "learning_rate": 0.00010644946808510637, + "loss": 0.4505, + "step": 29710 + }, + { + "epoch": 26.0, + "learning_rate": 0.00010638297872340425, + "loss": 0.4167, + "step": 29720 + }, + { + "epoch": 26.01, + "learning_rate": 0.00010631648936170212, + "loss": 0.3344, + "step": 29730 + }, + { + "epoch": 26.02, + "learning_rate": 0.00010625, + "loss": 0.1992, + "step": 29740 + }, + { + "epoch": 26.03, + "learning_rate": 0.00010618351063829786, + "loss": 0.3313, + "step": 29750 + }, + { + "epoch": 26.04, + "learning_rate": 0.00010611702127659575, + "loss": 0.2653, + "step": 29760 + }, + { + "epoch": 26.05, + "learning_rate": 0.0001060505319148936, + "loss": 0.2799, + "step": 29770 + }, + { + "epoch": 26.05, + "learning_rate": 0.00010598404255319147, + "loss": 0.3272, + "step": 29780 + }, + { + "epoch": 26.06, + "learning_rate": 0.00010591755319148934, + "loss": 0.2237, + "step": 29790 + }, + { + "epoch": 26.07, + "learning_rate": 0.00010585106382978721, + "loss": 0.3129, + "step": 29800 + }, + { + "epoch": 26.08, + "learning_rate": 0.0001057845744680851, + "loss": 0.2481, + "step": 29810 + }, + { + "epoch": 26.09, + "learning_rate": 0.00010571808510638297, + "loss": 0.2451, + "step": 29820 + }, + { + "epoch": 26.1, + "learning_rate": 0.00010565159574468084, + "loss": 0.3068, + "step": 29830 + }, + { + "epoch": 26.11, + "learning_rate": 0.0001055851063829787, + "loss": 0.1691, + "step": 29840 + }, + { + "epoch": 26.12, + "learning_rate": 0.00010551861702127659, + "loss": 0.3205, + "step": 29850 + }, + { + "epoch": 26.12, + "learning_rate": 0.00010545212765957446, + "loss": 0.2891, + "step": 29860 + }, + { + "epoch": 26.13, + "learning_rate": 0.00010538563829787233, + "loss": 0.2392, + "step": 29870 + }, + { + "epoch": 26.14, + "learning_rate": 0.0001053191489361702, + "loss": 0.2937, + "step": 29880 + }, + { + "epoch": 26.15, + "learning_rate": 0.00010525265957446808, + "loss": 0.2255, + "step": 29890 + }, + { + "epoch": 26.16, + "learning_rate": 0.00010518617021276595, + "loss": 0.3463, + "step": 29900 + }, + { + "epoch": 26.17, + "learning_rate": 0.00010511968085106382, + "loss": 0.2503, + "step": 29910 + }, + { + "epoch": 26.18, + "learning_rate": 0.00010505319148936169, + "loss": 0.2524, + "step": 29920 + }, + { + "epoch": 26.19, + "learning_rate": 0.00010498670212765958, + "loss": 0.3409, + "step": 29930 + }, + { + "epoch": 26.19, + "learning_rate": 0.00010492021276595745, + "loss": 0.2799, + "step": 29940 + }, + { + "epoch": 26.2, + "learning_rate": 0.0001048537234042553, + "loss": 0.2942, + "step": 29950 + }, + { + "epoch": 26.21, + "learning_rate": 0.00010478723404255317, + "loss": 0.242, + "step": 29960 + }, + { + "epoch": 26.22, + "learning_rate": 0.00010472074468085106, + "loss": 0.2646, + "step": 29970 + }, + { + "epoch": 26.23, + "learning_rate": 0.00010465425531914892, + "loss": 0.3402, + "step": 29980 + }, + { + "epoch": 26.24, + "learning_rate": 0.0001045877659574468, + "loss": 0.2402, + "step": 29990 + }, + { + "epoch": 26.25, + "learning_rate": 0.00010452127659574466, + "loss": 0.3621, + "step": 30000 + }, + { + "epoch": 26.25, + "eval_cer1": 0.2643394888761352, + "eval_cer2": 0.2462346185397867, + "eval_cer3": 0.22322770336491343, + "eval_cer4": 0.22151389291348722, + "eval_cer5": 0.24934182590233545, + "eval_loss": 1.029146671295166, + "eval_runtime": 1485.1015, + "eval_samples_per_second": 5.899, + "step": 30000 + }, + { + "epoch": 26.26, + "learning_rate": 0.00010445478723404255, + "loss": 0.264, + "step": 30010 + }, + { + "epoch": 26.26, + "learning_rate": 0.00010438829787234042, + "loss": 0.3064, + "step": 30020 + }, + { + "epoch": 26.27, + "learning_rate": 0.00010432180851063829, + "loss": 0.3571, + "step": 30030 + }, + { + "epoch": 26.28, + "learning_rate": 0.00010425531914893616, + "loss": 0.2181, + "step": 30040 + }, + { + "epoch": 26.29, + "learning_rate": 0.00010418882978723404, + "loss": 0.3138, + "step": 30050 + }, + { + "epoch": 26.3, + "learning_rate": 0.00010412234042553191, + "loss": 0.2597, + "step": 30060 + }, + { + "epoch": 26.31, + "learning_rate": 0.00010405585106382978, + "loss": 0.2329, + "step": 30070 + }, + { + "epoch": 26.32, + "learning_rate": 0.00010398936170212765, + "loss": 0.3073, + "step": 30080 + }, + { + "epoch": 26.33, + "learning_rate": 0.00010392287234042553, + "loss": 0.288, + "step": 30090 + }, + { + "epoch": 26.33, + "learning_rate": 0.0001038563829787234, + "loss": 0.3471, + "step": 30100 + }, + { + "epoch": 26.34, + "learning_rate": 0.00010378989361702127, + "loss": 0.2624, + "step": 30110 + }, + { + "epoch": 26.35, + "learning_rate": 0.00010372340425531914, + "loss": 0.1944, + "step": 30120 + }, + { + "epoch": 26.36, + "learning_rate": 0.000103656914893617, + "loss": 0.3337, + "step": 30130 + }, + { + "epoch": 26.37, + "learning_rate": 0.00010359042553191488, + "loss": 0.234, + "step": 30140 + }, + { + "epoch": 26.38, + "learning_rate": 0.00010352393617021275, + "loss": 0.3417, + "step": 30150 + }, + { + "epoch": 26.39, + "learning_rate": 0.00010345744680851062, + "loss": 0.2358, + "step": 30160 + }, + { + "epoch": 26.4, + "learning_rate": 0.00010339095744680849, + "loss": 0.2113, + "step": 30170 + }, + { + "epoch": 26.4, + "learning_rate": 0.00010332446808510638, + "loss": 0.2894, + "step": 30180 + }, + { + "epoch": 26.41, + "learning_rate": 0.00010325797872340425, + "loss": 0.2099, + "step": 30190 + }, + { + "epoch": 26.42, + "learning_rate": 0.00010319148936170212, + "loss": 0.2764, + "step": 30200 + }, + { + "epoch": 26.43, + "learning_rate": 0.00010312499999999999, + "loss": 0.2588, + "step": 30210 + }, + { + "epoch": 26.44, + "learning_rate": 0.00010305851063829787, + "loss": 0.2498, + "step": 30220 + }, + { + "epoch": 26.45, + "learning_rate": 0.00010299202127659574, + "loss": 0.329, + "step": 30230 + }, + { + "epoch": 26.46, + "learning_rate": 0.00010292553191489361, + "loss": 0.2544, + "step": 30240 + }, + { + "epoch": 26.47, + "learning_rate": 0.00010285904255319148, + "loss": 0.3048, + "step": 30250 + }, + { + "epoch": 26.47, + "learning_rate": 0.00010279255319148936, + "loss": 0.3024, + "step": 30260 + }, + { + "epoch": 26.48, + "learning_rate": 0.00010272606382978723, + "loss": 0.2467, + "step": 30270 + }, + { + "epoch": 26.49, + "learning_rate": 0.0001026595744680851, + "loss": 0.2897, + "step": 30280 + }, + { + "epoch": 26.5, + "learning_rate": 0.00010259308510638297, + "loss": 0.1755, + "step": 30290 + }, + { + "epoch": 26.51, + "learning_rate": 0.00010252659574468083, + "loss": 0.3278, + "step": 30300 + }, + { + "epoch": 26.52, + "learning_rate": 0.00010246010638297871, + "loss": 0.225, + "step": 30310 + }, + { + "epoch": 26.53, + "learning_rate": 0.00010239361702127658, + "loss": 0.2449, + "step": 30320 + }, + { + "epoch": 26.54, + "learning_rate": 0.00010232712765957445, + "loss": 0.3354, + "step": 30330 + }, + { + "epoch": 26.54, + "learning_rate": 0.00010226063829787232, + "loss": 0.1819, + "step": 30340 + }, + { + "epoch": 26.55, + "learning_rate": 0.0001021941489361702, + "loss": 0.3612, + "step": 30350 + }, + { + "epoch": 26.56, + "learning_rate": 0.00010212765957446807, + "loss": 0.2227, + "step": 30360 + }, + { + "epoch": 26.57, + "learning_rate": 0.00010206117021276594, + "loss": 0.2445, + "step": 30370 + }, + { + "epoch": 26.58, + "learning_rate": 0.00010199468085106381, + "loss": 0.356, + "step": 30380 + }, + { + "epoch": 26.59, + "learning_rate": 0.0001019281914893617, + "loss": 0.2124, + "step": 30390 + }, + { + "epoch": 26.6, + "learning_rate": 0.00010186170212765957, + "loss": 0.3383, + "step": 30400 + }, + { + "epoch": 26.61, + "learning_rate": 0.00010179521276595744, + "loss": 0.2547, + "step": 30410 + }, + { + "epoch": 26.61, + "learning_rate": 0.00010172872340425531, + "loss": 0.2601, + "step": 30420 + }, + { + "epoch": 26.62, + "learning_rate": 0.00010166223404255319, + "loss": 0.2998, + "step": 30430 + }, + { + "epoch": 26.63, + "learning_rate": 0.00010159574468085106, + "loss": 0.2124, + "step": 30440 + }, + { + "epoch": 26.64, + "learning_rate": 0.00010152925531914893, + "loss": 0.3025, + "step": 30450 + }, + { + "epoch": 26.65, + "learning_rate": 0.0001014627659574468, + "loss": 0.2691, + "step": 30460 + }, + { + "epoch": 26.66, + "learning_rate": 0.00010139627659574468, + "loss": 0.2575, + "step": 30470 + }, + { + "epoch": 26.67, + "learning_rate": 0.00010132978723404254, + "loss": 0.3434, + "step": 30480 + }, + { + "epoch": 26.68, + "learning_rate": 0.00010126329787234041, + "loss": 0.2434, + "step": 30490 + }, + { + "epoch": 26.68, + "learning_rate": 0.00010119680851063828, + "loss": 0.2925, + "step": 30500 + }, + { + "epoch": 26.69, + "learning_rate": 0.00010113031914893616, + "loss": 0.2326, + "step": 30510 + }, + { + "epoch": 26.7, + "learning_rate": 0.00010106382978723403, + "loss": 0.2828, + "step": 30520 + }, + { + "epoch": 26.71, + "learning_rate": 0.0001009973404255319, + "loss": 0.3347, + "step": 30530 + }, + { + "epoch": 26.72, + "learning_rate": 0.00010093085106382977, + "loss": 0.234, + "step": 30540 + }, + { + "epoch": 26.73, + "learning_rate": 0.00010086436170212766, + "loss": 0.2724, + "step": 30550 + }, + { + "epoch": 26.74, + "learning_rate": 0.00010079787234042553, + "loss": 0.1898, + "step": 30560 + }, + { + "epoch": 26.75, + "learning_rate": 0.0001007313829787234, + "loss": 0.2782, + "step": 30570 + }, + { + "epoch": 26.75, + "learning_rate": 0.00010066489361702127, + "loss": 0.3117, + "step": 30580 + }, + { + "epoch": 26.76, + "learning_rate": 0.00010059840425531915, + "loss": 0.2017, + "step": 30590 + }, + { + "epoch": 26.77, + "learning_rate": 0.00010053191489361702, + "loss": 0.3229, + "step": 30600 + }, + { + "epoch": 26.77, + "eval_cer1": 0.2588366361702846, + "eval_cer2": 0.24249384741591468, + "eval_cer3": 0.21767396275726886, + "eval_cer4": 0.21581506165684664, + "eval_cer5": 0.24305732484076434, + "eval_loss": 1.0247892141342163, + "eval_runtime": 1507.0564, + "eval_samples_per_second": 5.813, + "step": 30600 + }, + { + "epoch": 26.78, + "learning_rate": 0.00010046542553191489, + "loss": 0.2657, + "step": 30610 + }, + { + "epoch": 26.79, + "learning_rate": 0.00010039893617021276, + "loss": 0.3272, + "step": 30620 + }, + { + "epoch": 26.8, + "learning_rate": 0.00010033244680851064, + "loss": 0.2785, + "step": 30630 + }, + { + "epoch": 26.81, + "learning_rate": 0.00010026595744680851, + "loss": 0.2101, + "step": 30640 + }, + { + "epoch": 26.82, + "learning_rate": 0.00010019946808510638, + "loss": 0.3562, + "step": 30650 + }, + { + "epoch": 26.82, + "learning_rate": 0.00010013297872340424, + "loss": 0.2505, + "step": 30660 + }, + { + "epoch": 26.83, + "learning_rate": 0.00010006648936170211, + "loss": 0.245, + "step": 30670 + }, + { + "epoch": 26.84, + "learning_rate": 9.999999999999999e-05, + "loss": 0.3345, + "step": 30680 + }, + { + "epoch": 26.85, + "learning_rate": 9.993351063829786e-05, + "loss": 0.2022, + "step": 30690 + }, + { + "epoch": 26.86, + "learning_rate": 9.986702127659573e-05, + "loss": 0.3151, + "step": 30700 + }, + { + "epoch": 26.87, + "learning_rate": 9.98005319148936e-05, + "loss": 0.2485, + "step": 30710 + }, + { + "epoch": 26.88, + "learning_rate": 9.973404255319148e-05, + "loss": 0.2156, + "step": 30720 + }, + { + "epoch": 26.89, + "learning_rate": 9.966755319148935e-05, + "loss": 0.2992, + "step": 30730 + }, + { + "epoch": 26.89, + "learning_rate": 9.960106382978722e-05, + "loss": 0.2467, + "step": 30740 + }, + { + "epoch": 26.9, + "learning_rate": 9.95345744680851e-05, + "loss": 0.2973, + "step": 30750 + }, + { + "epoch": 26.91, + "learning_rate": 9.946808510638298e-05, + "loss": 0.214, + "step": 30760 + }, + { + "epoch": 26.92, + "learning_rate": 9.940159574468085e-05, + "loss": 0.2341, + "step": 30770 + }, + { + "epoch": 26.93, + "learning_rate": 9.933510638297872e-05, + "loss": 0.3063, + "step": 30780 + }, + { + "epoch": 26.94, + "learning_rate": 9.926861702127659e-05, + "loss": 0.2117, + "step": 30790 + }, + { + "epoch": 26.95, + "learning_rate": 9.920212765957447e-05, + "loss": 0.3313, + "step": 30800 + }, + { + "epoch": 26.95, + "learning_rate": 9.913563829787234e-05, + "loss": 0.2516, + "step": 30810 + }, + { + "epoch": 26.96, + "learning_rate": 9.906914893617021e-05, + "loss": 0.2664, + "step": 30820 + }, + { + "epoch": 26.97, + "learning_rate": 9.900265957446807e-05, + "loss": 0.2853, + "step": 30830 + }, + { + "epoch": 26.98, + "learning_rate": 9.893617021276594e-05, + "loss": 0.2072, + "step": 30840 + }, + { + "epoch": 26.99, + "learning_rate": 9.886968085106382e-05, + "loss": 0.3216, + "step": 30850 + }, + { + "epoch": 27.0, + "learning_rate": 9.880319148936169e-05, + "loss": 0.2569, + "step": 30860 + }, + { + "epoch": 27.01, + "learning_rate": 9.873670212765956e-05, + "loss": 0.3426, + "step": 30870 + }, + { + "epoch": 27.02, + "learning_rate": 9.867021276595743e-05, + "loss": 0.2115, + "step": 30880 + }, + { + "epoch": 27.03, + "learning_rate": 9.860372340425531e-05, + "loss": 0.2323, + "step": 30890 + }, + { + "epoch": 27.03, + "learning_rate": 9.853723404255318e-05, + "loss": 0.2537, + "step": 30900 + }, + { + "epoch": 27.04, + "learning_rate": 9.847074468085105e-05, + "loss": 0.1648, + "step": 30910 + }, + { + "epoch": 27.05, + "learning_rate": 9.840425531914892e-05, + "loss": 0.2771, + "step": 30920 + }, + { + "epoch": 27.06, + "learning_rate": 9.83377659574468e-05, + "loss": 0.2452, + "step": 30930 + }, + { + "epoch": 27.07, + "learning_rate": 9.827127659574468e-05, + "loss": 0.2119, + "step": 30940 + }, + { + "epoch": 27.08, + "learning_rate": 9.820478723404255e-05, + "loss": 0.2509, + "step": 30950 + }, + { + "epoch": 27.09, + "learning_rate": 9.813829787234042e-05, + "loss": 0.1906, + "step": 30960 + }, + { + "epoch": 27.1, + "learning_rate": 9.80718085106383e-05, + "loss": 0.3401, + "step": 30970 + }, + { + "epoch": 27.1, + "learning_rate": 9.800531914893617e-05, + "loss": 0.2194, + "step": 30980 + }, + { + "epoch": 27.11, + "learning_rate": 9.793882978723404e-05, + "loss": 0.2698, + "step": 30990 + }, + { + "epoch": 27.12, + "learning_rate": 9.787234042553191e-05, + "loss": 0.2353, + "step": 31000 + }, + { + "epoch": 27.13, + "learning_rate": 9.780585106382976e-05, + "loss": 0.1978, + "step": 31010 + }, + { + "epoch": 27.14, + "learning_rate": 9.773936170212765e-05, + "loss": 0.3344, + "step": 31020 + }, + { + "epoch": 27.15, + "learning_rate": 9.767287234042552e-05, + "loss": 0.2526, + "step": 31030 + }, + { + "epoch": 27.16, + "learning_rate": 9.760638297872339e-05, + "loss": 0.2375, + "step": 31040 + }, + { + "epoch": 27.17, + "learning_rate": 9.753989361702127e-05, + "loss": 0.2096, + "step": 31050 + }, + { + "epoch": 27.17, + "learning_rate": 9.747340425531914e-05, + "loss": 0.1563, + "step": 31060 + }, + { + "epoch": 27.18, + "learning_rate": 9.740691489361701e-05, + "loss": 0.2449, + "step": 31070 + }, + { + "epoch": 27.19, + "learning_rate": 9.734042553191488e-05, + "loss": 0.1953, + "step": 31080 + }, + { + "epoch": 27.2, + "learning_rate": 9.727393617021276e-05, + "loss": 0.2934, + "step": 31090 + }, + { + "epoch": 27.21, + "learning_rate": 9.720744680851063e-05, + "loss": 0.2217, + "step": 31100 + }, + { + "epoch": 27.22, + "learning_rate": 9.71409574468085e-05, + "loss": 0.1701, + "step": 31110 + }, + { + "epoch": 27.23, + "learning_rate": 9.707446808510637e-05, + "loss": 0.3106, + "step": 31120 + }, + { + "epoch": 27.24, + "learning_rate": 9.700797872340426e-05, + "loss": 0.2108, + "step": 31130 + }, + { + "epoch": 27.24, + "learning_rate": 9.694148936170213e-05, + "loss": 0.272, + "step": 31140 + }, + { + "epoch": 27.25, + "learning_rate": 9.6875e-05, + "loss": 0.254, + "step": 31150 + }, + { + "epoch": 27.26, + "learning_rate": 9.680851063829787e-05, + "loss": 0.1927, + "step": 31160 + }, + { + "epoch": 27.27, + "learning_rate": 9.674202127659575e-05, + "loss": 0.3339, + "step": 31170 + }, + { + "epoch": 27.28, + "learning_rate": 9.66755319148936e-05, + "loss": 0.1941, + "step": 31180 + }, + { + "epoch": 27.29, + "learning_rate": 9.660904255319148e-05, + "loss": 0.2352, + "step": 31190 + }, + { + "epoch": 27.3, + "learning_rate": 9.654255319148935e-05, + "loss": 0.2997, + "step": 31200 + }, + { + "epoch": 27.3, + "eval_cer1": 0.26143614327672937, + "eval_cer2": 0.2374405250205086, + "eval_cer3": 0.2174779483828814, + "eval_cer4": 0.21674876847290642, + "eval_cer5": 0.24670912951167728, + "eval_loss": 1.0207247734069824, + "eval_runtime": 1456.0036, + "eval_samples_per_second": 6.016, + "step": 31200 + }, + { + "epoch": 27.31, + "learning_rate": 9.647606382978722e-05, + "loss": 0.1265, + "step": 31210 + }, + { + "epoch": 27.31, + "learning_rate": 9.64095744680851e-05, + "loss": 0.3038, + "step": 31220 + }, + { + "epoch": 27.32, + "learning_rate": 9.634308510638297e-05, + "loss": 0.1978, + "step": 31230 + }, + { + "epoch": 27.33, + "learning_rate": 9.627659574468084e-05, + "loss": 0.237, + "step": 31240 + }, + { + "epoch": 27.34, + "learning_rate": 9.621010638297871e-05, + "loss": 0.2628, + "step": 31250 + }, + { + "epoch": 27.35, + "learning_rate": 9.614361702127659e-05, + "loss": 0.2, + "step": 31260 + }, + { + "epoch": 27.36, + "learning_rate": 9.607712765957446e-05, + "loss": 0.294, + "step": 31270 + }, + { + "epoch": 27.37, + "learning_rate": 9.601063829787233e-05, + "loss": 0.2154, + "step": 31280 + }, + { + "epoch": 27.38, + "learning_rate": 9.59441489361702e-05, + "loss": 0.3139, + "step": 31290 + }, + { + "epoch": 27.38, + "learning_rate": 9.587765957446809e-05, + "loss": 0.2583, + "step": 31300 + }, + { + "epoch": 27.39, + "learning_rate": 9.581117021276596e-05, + "loss": 0.217, + "step": 31310 + }, + { + "epoch": 27.4, + "learning_rate": 9.574468085106382e-05, + "loss": 0.2996, + "step": 31320 + }, + { + "epoch": 27.41, + "learning_rate": 9.56781914893617e-05, + "loss": 0.2456, + "step": 31330 + }, + { + "epoch": 27.42, + "learning_rate": 9.561170212765958e-05, + "loss": 0.245, + "step": 31340 + }, + { + "epoch": 27.43, + "learning_rate": 9.554521276595745e-05, + "loss": 0.2713, + "step": 31350 + }, + { + "epoch": 27.44, + "learning_rate": 9.54787234042553e-05, + "loss": 0.2011, + "step": 31360 + }, + { + "epoch": 27.45, + "learning_rate": 9.541223404255317e-05, + "loss": 0.3593, + "step": 31370 + }, + { + "epoch": 27.45, + "learning_rate": 9.534574468085104e-05, + "loss": 0.2025, + "step": 31380 + }, + { + "epoch": 27.46, + "learning_rate": 9.527925531914893e-05, + "loss": 0.2873, + "step": 31390 + }, + { + "epoch": 27.47, + "learning_rate": 9.52127659574468e-05, + "loss": 0.2647, + "step": 31400 + }, + { + "epoch": 27.48, + "learning_rate": 9.514627659574467e-05, + "loss": 0.1944, + "step": 31410 + }, + { + "epoch": 27.49, + "learning_rate": 9.507978723404254e-05, + "loss": 0.2805, + "step": 31420 + }, + { + "epoch": 27.5, + "learning_rate": 9.501329787234042e-05, + "loss": 0.2372, + "step": 31430 + }, + { + "epoch": 27.51, + "learning_rate": 9.494680851063829e-05, + "loss": 0.2594, + "step": 31440 + }, + { + "epoch": 27.52, + "learning_rate": 9.488031914893616e-05, + "loss": 0.2737, + "step": 31450 + }, + { + "epoch": 27.52, + "learning_rate": 9.481382978723403e-05, + "loss": 0.2055, + "step": 31460 + }, + { + "epoch": 27.53, + "learning_rate": 9.474734042553191e-05, + "loss": 0.3222, + "step": 31470 + }, + { + "epoch": 27.54, + "learning_rate": 9.468085106382978e-05, + "loss": 0.2843, + "step": 31480 + }, + { + "epoch": 27.55, + "learning_rate": 9.461436170212765e-05, + "loss": 0.2622, + "step": 31490 + }, + { + "epoch": 27.56, + "learning_rate": 9.454787234042552e-05, + "loss": 0.2502, + "step": 31500 + }, + { + "epoch": 27.57, + "learning_rate": 9.44813829787234e-05, + "loss": 0.1612, + "step": 31510 + }, + { + "epoch": 27.58, + "learning_rate": 9.441489361702128e-05, + "loss": 0.2919, + "step": 31520 + }, + { + "epoch": 27.59, + "learning_rate": 9.434840425531915e-05, + "loss": 0.2328, + "step": 31530 + }, + { + "epoch": 27.59, + "learning_rate": 9.4281914893617e-05, + "loss": 0.283, + "step": 31540 + }, + { + "epoch": 27.6, + "learning_rate": 9.421542553191487e-05, + "loss": 0.2663, + "step": 31550 + }, + { + "epoch": 27.61, + "learning_rate": 9.414893617021276e-05, + "loss": 0.1909, + "step": 31560 + }, + { + "epoch": 27.62, + "learning_rate": 9.408244680851063e-05, + "loss": 0.3346, + "step": 31570 + }, + { + "epoch": 27.63, + "learning_rate": 9.40159574468085e-05, + "loss": 0.2552, + "step": 31580 + }, + { + "epoch": 27.64, + "learning_rate": 9.394946808510637e-05, + "loss": 0.279, + "step": 31590 + }, + { + "epoch": 27.65, + "learning_rate": 9.388297872340425e-05, + "loss": 0.2329, + "step": 31600 + }, + { + "epoch": 27.66, + "learning_rate": 9.381648936170212e-05, + "loss": 0.1384, + "step": 31610 + }, + { + "epoch": 27.66, + "learning_rate": 9.374999999999999e-05, + "loss": 0.2982, + "step": 31620 + }, + { + "epoch": 27.67, + "learning_rate": 9.368351063829787e-05, + "loss": 0.243, + "step": 31630 + }, + { + "epoch": 27.68, + "learning_rate": 9.361702127659574e-05, + "loss": 0.2628, + "step": 31640 + }, + { + "epoch": 27.69, + "learning_rate": 9.355053191489361e-05, + "loss": 0.2297, + "step": 31650 + }, + { + "epoch": 27.7, + "learning_rate": 9.348404255319148e-05, + "loss": 0.1579, + "step": 31660 + }, + { + "epoch": 27.71, + "learning_rate": 9.341755319148936e-05, + "loss": 0.3486, + "step": 31670 + }, + { + "epoch": 27.72, + "learning_rate": 9.335106382978723e-05, + "loss": 0.1826, + "step": 31680 + }, + { + "epoch": 27.72, + "learning_rate": 9.32845744680851e-05, + "loss": 0.2471, + "step": 31690 + }, + { + "epoch": 27.73, + "learning_rate": 9.321808510638297e-05, + "loss": 0.3142, + "step": 31700 + }, + { + "epoch": 27.74, + "learning_rate": 9.315159574468083e-05, + "loss": 0.2355, + "step": 31710 + }, + { + "epoch": 27.75, + "learning_rate": 9.308510638297871e-05, + "loss": 0.3302, + "step": 31720 + }, + { + "epoch": 27.76, + "learning_rate": 9.301861702127658e-05, + "loss": 0.2433, + "step": 31730 + }, + { + "epoch": 27.77, + "learning_rate": 9.295212765957445e-05, + "loss": 0.2156, + "step": 31740 + }, + { + "epoch": 27.78, + "learning_rate": 9.288563829787232e-05, + "loss": 0.2943, + "step": 31750 + }, + { + "epoch": 27.79, + "learning_rate": 9.281914893617021e-05, + "loss": 0.1814, + "step": 31760 + }, + { + "epoch": 27.79, + "learning_rate": 9.275265957446808e-05, + "loss": 0.3136, + "step": 31770 + }, + { + "epoch": 27.8, + "learning_rate": 9.268617021276595e-05, + "loss": 0.2177, + "step": 31780 + }, + { + "epoch": 27.81, + "learning_rate": 9.261968085106382e-05, + "loss": 0.279, + "step": 31790 + }, + { + "epoch": 27.82, + "learning_rate": 9.25531914893617e-05, + "loss": 0.2461, + "step": 31800 + }, + { + "epoch": 27.82, + "eval_cer1": 0.2556632119104689, + "eval_cer2": 0.23543888433141918, + "eval_cer3": 0.2131656321463574, + "eval_cer4": 0.21317492514247077, + "eval_cer5": 0.23855626326963908, + "eval_loss": 1.0181804895401, + "eval_runtime": 1437.34, + "eval_samples_per_second": 6.095, + "step": 31800 + }, + { + "epoch": 27.83, + "learning_rate": 9.248670212765957e-05, + "loss": 0.1999, + "step": 31810 + }, + { + "epoch": 27.84, + "learning_rate": 9.242021276595744e-05, + "loss": 0.3005, + "step": 31820 + }, + { + "epoch": 27.85, + "learning_rate": 9.235372340425531e-05, + "loss": 0.2197, + "step": 31830 + }, + { + "epoch": 27.86, + "learning_rate": 9.228723404255319e-05, + "loss": 0.2352, + "step": 31840 + }, + { + "epoch": 27.86, + "learning_rate": 9.222074468085106e-05, + "loss": 0.2733, + "step": 31850 + }, + { + "epoch": 27.87, + "learning_rate": 9.215425531914893e-05, + "loss": 0.2026, + "step": 31860 + }, + { + "epoch": 27.88, + "learning_rate": 9.20877659574468e-05, + "loss": 0.3294, + "step": 31870 + }, + { + "epoch": 27.89, + "learning_rate": 9.202127659574469e-05, + "loss": 0.2265, + "step": 31880 + }, + { + "epoch": 27.9, + "learning_rate": 9.195478723404254e-05, + "loss": 0.2553, + "step": 31890 + }, + { + "epoch": 27.91, + "learning_rate": 9.188829787234041e-05, + "loss": 0.2758, + "step": 31900 + }, + { + "epoch": 27.92, + "learning_rate": 9.182180851063828e-05, + "loss": 0.183, + "step": 31910 + }, + { + "epoch": 27.93, + "learning_rate": 9.175531914893615e-05, + "loss": 0.332, + "step": 31920 + }, + { + "epoch": 27.93, + "learning_rate": 9.168882978723404e-05, + "loss": 0.1728, + "step": 31930 + }, + { + "epoch": 27.94, + "learning_rate": 9.16223404255319e-05, + "loss": 0.2965, + "step": 31940 + }, + { + "epoch": 27.95, + "learning_rate": 9.155585106382978e-05, + "loss": 0.2349, + "step": 31950 + }, + { + "epoch": 27.96, + "learning_rate": 9.148936170212764e-05, + "loss": 0.2084, + "step": 31960 + }, + { + "epoch": 27.97, + "learning_rate": 9.142287234042553e-05, + "loss": 0.322, + "step": 31970 + }, + { + "epoch": 27.98, + "learning_rate": 9.13563829787234e-05, + "loss": 0.2388, + "step": 31980 + }, + { + "epoch": 27.99, + "learning_rate": 9.128989361702127e-05, + "loss": 0.1909, + "step": 31990 + }, + { + "epoch": 28.0, + "learning_rate": 9.122340425531914e-05, + "loss": 0.1898, + "step": 32000 + }, + { + "epoch": 28.01, + "learning_rate": 9.115691489361702e-05, + "loss": 0.2849, + "step": 32010 + }, + { + "epoch": 28.01, + "learning_rate": 9.109042553191489e-05, + "loss": 0.2579, + "step": 32020 + }, + { + "epoch": 28.02, + "learning_rate": 9.102393617021276e-05, + "loss": 0.1564, + "step": 32030 + }, + { + "epoch": 28.03, + "learning_rate": 9.095744680851063e-05, + "loss": 0.2738, + "step": 32040 + }, + { + "epoch": 28.04, + "learning_rate": 9.089095744680851e-05, + "loss": 0.1675, + "step": 32050 + }, + { + "epoch": 28.05, + "learning_rate": 9.082446808510638e-05, + "loss": 0.3122, + "step": 32060 + }, + { + "epoch": 28.06, + "learning_rate": 9.075797872340424e-05, + "loss": 0.2452, + "step": 32070 + }, + { + "epoch": 28.07, + "learning_rate": 9.069148936170211e-05, + "loss": 0.2378, + "step": 32080 + }, + { + "epoch": 28.08, + "learning_rate": 9.062499999999998e-05, + "loss": 0.2339, + "step": 32090 + }, + { + "epoch": 28.08, + "learning_rate": 9.055851063829786e-05, + "loss": 0.245, + "step": 32100 + }, + { + "epoch": 28.09, + "learning_rate": 9.049202127659573e-05, + "loss": 0.269, + "step": 32110 + }, + { + "epoch": 28.1, + "learning_rate": 9.04255319148936e-05, + "loss": 0.2235, + "step": 32120 + }, + { + "epoch": 28.11, + "learning_rate": 9.035904255319147e-05, + "loss": 0.2386, + "step": 32130 + }, + { + "epoch": 28.12, + "learning_rate": 9.029255319148936e-05, + "loss": 0.2266, + "step": 32140 + }, + { + "epoch": 28.13, + "learning_rate": 9.022606382978723e-05, + "loss": 0.2106, + "step": 32150 + }, + { + "epoch": 28.14, + "learning_rate": 9.01595744680851e-05, + "loss": 0.2506, + "step": 32160 + }, + { + "epoch": 28.15, + "learning_rate": 9.009308510638297e-05, + "loss": 0.1846, + "step": 32170 + }, + { + "epoch": 28.15, + "learning_rate": 9.002659574468085e-05, + "loss": 0.1618, + "step": 32180 + }, + { + "epoch": 28.16, + "learning_rate": 8.996010638297872e-05, + "loss": 0.2715, + "step": 32190 + }, + { + "epoch": 28.17, + "learning_rate": 8.989361702127659e-05, + "loss": 0.179, + "step": 32200 + }, + { + "epoch": 28.18, + "learning_rate": 8.982712765957447e-05, + "loss": 0.2847, + "step": 32210 + }, + { + "epoch": 28.19, + "learning_rate": 8.976063829787234e-05, + "loss": 0.1758, + "step": 32220 + }, + { + "epoch": 28.2, + "learning_rate": 8.969414893617021e-05, + "loss": 0.2159, + "step": 32230 + }, + { + "epoch": 28.21, + "learning_rate": 8.962765957446807e-05, + "loss": 0.2823, + "step": 32240 + }, + { + "epoch": 28.22, + "learning_rate": 8.956117021276594e-05, + "loss": 0.1597, + "step": 32250 + }, + { + "epoch": 28.22, + "learning_rate": 8.949468085106382e-05, + "loss": 0.3012, + "step": 32260 + }, + { + "epoch": 28.23, + "learning_rate": 8.942819148936169e-05, + "loss": 0.2111, + "step": 32270 + }, + { + "epoch": 28.24, + "learning_rate": 8.936170212765956e-05, + "loss": 0.2427, + "step": 32280 + }, + { + "epoch": 28.25, + "learning_rate": 8.929521276595743e-05, + "loss": 0.2423, + "step": 32290 + }, + { + "epoch": 28.26, + "learning_rate": 8.922872340425532e-05, + "loss": 0.2037, + "step": 32300 + }, + { + "epoch": 28.27, + "learning_rate": 8.916223404255318e-05, + "loss": 0.2299, + "step": 32310 + }, + { + "epoch": 28.28, + "learning_rate": 8.909574468085105e-05, + "loss": 0.2302, + "step": 32320 + }, + { + "epoch": 28.29, + "learning_rate": 8.902925531914892e-05, + "loss": 0.2138, + "step": 32330 + }, + { + "epoch": 28.29, + "learning_rate": 8.896276595744681e-05, + "loss": 0.301, + "step": 32340 + }, + { + "epoch": 28.3, + "learning_rate": 8.889627659574468e-05, + "loss": 0.1965, + "step": 32350 + }, + { + "epoch": 28.31, + "learning_rate": 8.882978723404255e-05, + "loss": 0.295, + "step": 32360 + }, + { + "epoch": 28.32, + "learning_rate": 8.876329787234042e-05, + "loss": 0.2105, + "step": 32370 + }, + { + "epoch": 28.33, + "learning_rate": 8.86968085106383e-05, + "loss": 0.1953, + "step": 32380 + }, + { + "epoch": 28.34, + "learning_rate": 8.863031914893617e-05, + "loss": 0.3007, + "step": 32390 + }, + { + "epoch": 28.35, + "learning_rate": 8.856382978723404e-05, + "loss": 0.1532, + "step": 32400 + }, + { + "epoch": 28.35, + "eval_cer1": 0.2568785658823132, + "eval_cer2": 0.23668580803937653, + "eval_cer3": 0.2134923227703365, + "eval_cer4": 0.21584725844360733, + "eval_cer5": 0.24016985138004246, + "eval_loss": 1.0208557844161987, + "eval_runtime": 1460.2588, + "eval_samples_per_second": 5.999, + "step": 32400 + }, + { + "epoch": 28.36, + "learning_rate": 8.849734042553191e-05, + "loss": 0.2277, + "step": 32410 + }, + { + "epoch": 28.36, + "learning_rate": 8.843085106382977e-05, + "loss": 0.1995, + "step": 32420 + }, + { + "epoch": 28.37, + "learning_rate": 8.836436170212765e-05, + "loss": 0.1582, + "step": 32430 + }, + { + "epoch": 28.38, + "learning_rate": 8.829787234042552e-05, + "loss": 0.3057, + "step": 32440 + }, + { + "epoch": 28.39, + "learning_rate": 8.823138297872339e-05, + "loss": 0.1396, + "step": 32450 + }, + { + "epoch": 28.4, + "learning_rate": 8.816489361702126e-05, + "loss": 0.2855, + "step": 32460 + }, + { + "epoch": 28.41, + "learning_rate": 8.809840425531914e-05, + "loss": 0.2354, + "step": 32470 + }, + { + "epoch": 28.42, + "learning_rate": 8.803191489361701e-05, + "loss": 0.168, + "step": 32480 + }, + { + "epoch": 28.43, + "learning_rate": 8.796542553191488e-05, + "loss": 0.3093, + "step": 32490 + }, + { + "epoch": 28.43, + "learning_rate": 8.789893617021275e-05, + "loss": 0.177, + "step": 32500 + }, + { + "epoch": 28.44, + "learning_rate": 8.783244680851064e-05, + "loss": 0.2213, + "step": 32510 + }, + { + "epoch": 28.45, + "learning_rate": 8.77659574468085e-05, + "loss": 0.2438, + "step": 32520 + }, + { + "epoch": 28.46, + "learning_rate": 8.769946808510638e-05, + "loss": 0.2138, + "step": 32530 + }, + { + "epoch": 28.47, + "learning_rate": 8.763297872340425e-05, + "loss": 0.3195, + "step": 32540 + }, + { + "epoch": 28.48, + "learning_rate": 8.756648936170213e-05, + "loss": 0.1386, + "step": 32550 + }, + { + "epoch": 28.49, + "learning_rate": 8.75e-05, + "loss": 0.2627, + "step": 32560 + }, + { + "epoch": 28.49, + "learning_rate": 8.743351063829787e-05, + "loss": 0.2102, + "step": 32570 + }, + { + "epoch": 28.5, + "learning_rate": 8.736702127659574e-05, + "loss": 0.2127, + "step": 32580 + }, + { + "epoch": 28.51, + "learning_rate": 8.73005319148936e-05, + "loss": 0.326, + "step": 32590 + }, + { + "epoch": 28.52, + "learning_rate": 8.723404255319148e-05, + "loss": 0.2089, + "step": 32600 + }, + { + "epoch": 28.53, + "learning_rate": 8.716755319148935e-05, + "loss": 0.2495, + "step": 32610 + }, + { + "epoch": 28.54, + "learning_rate": 8.710106382978722e-05, + "loss": 0.2482, + "step": 32620 + }, + { + "epoch": 28.55, + "learning_rate": 8.703457446808509e-05, + "loss": 0.1889, + "step": 32630 + }, + { + "epoch": 28.56, + "learning_rate": 8.696808510638297e-05, + "loss": 0.3184, + "step": 32640 + }, + { + "epoch": 28.56, + "learning_rate": 8.690159574468084e-05, + "loss": 0.1858, + "step": 32650 + }, + { + "epoch": 28.57, + "learning_rate": 8.683510638297871e-05, + "loss": 0.2492, + "step": 32660 + }, + { + "epoch": 28.58, + "learning_rate": 8.676861702127658e-05, + "loss": 0.215, + "step": 32670 + }, + { + "epoch": 28.59, + "learning_rate": 8.670212765957446e-05, + "loss": 0.1269, + "step": 32680 + }, + { + "epoch": 28.6, + "learning_rate": 8.663563829787233e-05, + "loss": 0.2923, + "step": 32690 + }, + { + "epoch": 28.61, + "learning_rate": 8.65691489361702e-05, + "loss": 0.1782, + "step": 32700 + }, + { + "epoch": 28.62, + "learning_rate": 8.650265957446807e-05, + "loss": 0.2827, + "step": 32710 + }, + { + "epoch": 28.63, + "learning_rate": 8.643617021276596e-05, + "loss": 0.2357, + "step": 32720 + }, + { + "epoch": 28.63, + "learning_rate": 8.636968085106383e-05, + "loss": 0.1844, + "step": 32730 + }, + { + "epoch": 28.64, + "learning_rate": 8.63031914893617e-05, + "loss": 0.2596, + "step": 32740 + }, + { + "epoch": 28.65, + "learning_rate": 8.623670212765957e-05, + "loss": 0.1641, + "step": 32750 + }, + { + "epoch": 28.66, + "learning_rate": 8.617021276595745e-05, + "loss": 0.2588, + "step": 32760 + }, + { + "epoch": 28.67, + "learning_rate": 8.610372340425531e-05, + "loss": 0.2082, + "step": 32770 + }, + { + "epoch": 28.68, + "learning_rate": 8.603723404255318e-05, + "loss": 0.1696, + "step": 32780 + }, + { + "epoch": 28.69, + "learning_rate": 8.597074468085105e-05, + "loss": 0.2652, + "step": 32790 + }, + { + "epoch": 28.7, + "learning_rate": 8.590425531914893e-05, + "loss": 0.1763, + "step": 32800 + }, + { + "epoch": 28.7, + "learning_rate": 8.58377659574468e-05, + "loss": 0.2386, + "step": 32810 + }, + { + "epoch": 28.71, + "learning_rate": 8.577127659574467e-05, + "loss": 0.2928, + "step": 32820 + }, + { + "epoch": 28.72, + "learning_rate": 8.570478723404254e-05, + "loss": 0.1688, + "step": 32830 + }, + { + "epoch": 28.73, + "learning_rate": 8.563829787234042e-05, + "loss": 0.3004, + "step": 32840 + }, + { + "epoch": 28.74, + "learning_rate": 8.557180851063829e-05, + "loss": 0.2131, + "step": 32850 + }, + { + "epoch": 28.75, + "learning_rate": 8.550531914893616e-05, + "loss": 0.2091, + "step": 32860 + }, + { + "epoch": 28.76, + "learning_rate": 8.543882978723403e-05, + "loss": 0.1967, + "step": 32870 + }, + { + "epoch": 28.77, + "learning_rate": 8.537234042553192e-05, + "loss": 0.1664, + "step": 32880 + }, + { + "epoch": 28.77, + "learning_rate": 8.530585106382979e-05, + "loss": 0.3386, + "step": 32890 + }, + { + "epoch": 28.78, + "learning_rate": 8.523936170212766e-05, + "loss": 0.213, + "step": 32900 + }, + { + "epoch": 28.79, + "learning_rate": 8.517287234042553e-05, + "loss": 0.267, + "step": 32910 + }, + { + "epoch": 28.8, + "learning_rate": 8.510638297872341e-05, + "loss": 0.2418, + "step": 32920 + }, + { + "epoch": 28.81, + "learning_rate": 8.503989361702128e-05, + "loss": 0.1753, + "step": 32930 + }, + { + "epoch": 28.82, + "learning_rate": 8.497340425531915e-05, + "loss": 0.3012, + "step": 32940 + }, + { + "epoch": 28.83, + "learning_rate": 8.4906914893617e-05, + "loss": 0.1924, + "step": 32950 + }, + { + "epoch": 28.84, + "learning_rate": 8.484042553191487e-05, + "loss": 0.269, + "step": 32960 + }, + { + "epoch": 28.84, + "learning_rate": 8.477393617021276e-05, + "loss": 0.2638, + "step": 32970 + }, + { + "epoch": 28.85, + "learning_rate": 8.470744680851063e-05, + "loss": 0.241, + "step": 32980 + }, + { + "epoch": 28.86, + "learning_rate": 8.46409574468085e-05, + "loss": 0.2674, + "step": 32990 + }, + { + "epoch": 28.87, + "learning_rate": 8.457446808510637e-05, + "loss": 0.1705, + "step": 33000 + }, + { + "epoch": 28.87, + "eval_cer1": 0.2563046487289423, + "eval_cer2": 0.23186218211648893, + "eval_cer3": 0.21114015027768704, + "eval_cer4": 0.21430181267909462, + "eval_cer5": 0.23736730360934183, + "eval_loss": 1.0212068557739258, + "eval_runtime": 1463.899, + "eval_samples_per_second": 5.984, + "step": 33000 + }, + { + "epoch": 28.88, + "learning_rate": 8.450797872340425e-05, + "loss": 0.2879, + "step": 33010 + }, + { + "epoch": 28.89, + "learning_rate": 8.444148936170212e-05, + "loss": 0.2216, + "step": 33020 + }, + { + "epoch": 28.9, + "learning_rate": 8.437499999999999e-05, + "loss": 0.1741, + "step": 33030 + }, + { + "epoch": 28.91, + "learning_rate": 8.430851063829786e-05, + "loss": 0.2827, + "step": 33040 + }, + { + "epoch": 28.91, + "learning_rate": 8.424202127659574e-05, + "loss": 0.1643, + "step": 33050 + }, + { + "epoch": 28.92, + "learning_rate": 8.417553191489361e-05, + "loss": 0.2935, + "step": 33060 + }, + { + "epoch": 28.93, + "learning_rate": 8.410904255319148e-05, + "loss": 0.2283, + "step": 33070 + }, + { + "epoch": 28.94, + "learning_rate": 8.404255319148935e-05, + "loss": 0.178, + "step": 33080 + }, + { + "epoch": 28.95, + "learning_rate": 8.397606382978724e-05, + "loss": 0.2698, + "step": 33090 + }, + { + "epoch": 28.96, + "learning_rate": 8.390957446808511e-05, + "loss": 0.178, + "step": 33100 + }, + { + "epoch": 28.97, + "learning_rate": 8.384308510638298e-05, + "loss": 0.2781, + "step": 33110 + }, + { + "epoch": 28.98, + "learning_rate": 8.377659574468083e-05, + "loss": 0.2213, + "step": 33120 + }, + { + "epoch": 28.98, + "learning_rate": 8.37101063829787e-05, + "loss": 0.1796, + "step": 33130 + }, + { + "epoch": 28.99, + "learning_rate": 8.364361702127659e-05, + "loss": 0.2551, + "step": 33140 + }, + { + "epoch": 29.0, + "learning_rate": 8.357712765957446e-05, + "loss": 0.2451, + "step": 33150 + }, + { + "epoch": 29.01, + "learning_rate": 8.351063829787233e-05, + "loss": 0.2655, + "step": 33160 + }, + { + "epoch": 29.02, + "learning_rate": 8.34441489361702e-05, + "loss": 0.1502, + "step": 33170 + }, + { + "epoch": 29.03, + "learning_rate": 8.337765957446808e-05, + "loss": 0.3193, + "step": 33180 + }, + { + "epoch": 29.04, + "learning_rate": 8.331117021276595e-05, + "loss": 0.2363, + "step": 33190 + }, + { + "epoch": 29.05, + "learning_rate": 8.324468085106382e-05, + "loss": 0.2369, + "step": 33200 + }, + { + "epoch": 29.06, + "learning_rate": 8.317819148936169e-05, + "loss": 0.2447, + "step": 33210 + }, + { + "epoch": 29.06, + "learning_rate": 8.311170212765957e-05, + "loss": 0.1887, + "step": 33220 + }, + { + "epoch": 29.07, + "learning_rate": 8.304521276595744e-05, + "loss": 0.2976, + "step": 33230 + }, + { + "epoch": 29.08, + "learning_rate": 8.297872340425531e-05, + "loss": 0.1867, + "step": 33240 + }, + { + "epoch": 29.09, + "learning_rate": 8.291223404255318e-05, + "loss": 0.2073, + "step": 33250 + }, + { + "epoch": 29.1, + "learning_rate": 8.284574468085107e-05, + "loss": 0.2768, + "step": 33260 + }, + { + "epoch": 29.11, + "learning_rate": 8.277925531914894e-05, + "loss": 0.1858, + "step": 33270 + }, + { + "epoch": 29.12, + "learning_rate": 8.27127659574468e-05, + "loss": 0.2429, + "step": 33280 + }, + { + "epoch": 29.13, + "learning_rate": 8.264627659574468e-05, + "loss": 0.2358, + "step": 33290 + }, + { + "epoch": 29.13, + "learning_rate": 8.257978723404254e-05, + "loss": 0.1802, + "step": 33300 + }, + { + "epoch": 29.14, + "learning_rate": 8.251329787234041e-05, + "loss": 0.2441, + "step": 33310 + }, + { + "epoch": 29.15, + "learning_rate": 8.244680851063828e-05, + "loss": 0.1722, + "step": 33320 + }, + { + "epoch": 29.16, + "learning_rate": 8.238031914893615e-05, + "loss": 0.2812, + "step": 33330 + }, + { + "epoch": 29.17, + "learning_rate": 8.231382978723404e-05, + "loss": 0.1838, + "step": 33340 + }, + { + "epoch": 29.18, + "learning_rate": 8.224734042553191e-05, + "loss": 0.2453, + "step": 33350 + }, + { + "epoch": 29.19, + "learning_rate": 8.218085106382978e-05, + "loss": 0.2567, + "step": 33360 + }, + { + "epoch": 29.2, + "learning_rate": 8.211436170212765e-05, + "loss": 0.1684, + "step": 33370 + }, + { + "epoch": 29.2, + "learning_rate": 8.204787234042553e-05, + "loss": 0.2686, + "step": 33380 + }, + { + "epoch": 29.21, + "learning_rate": 8.19813829787234e-05, + "loss": 0.1972, + "step": 33390 + }, + { + "epoch": 29.22, + "learning_rate": 8.191489361702127e-05, + "loss": 0.2457, + "step": 33400 + }, + { + "epoch": 29.23, + "learning_rate": 8.184840425531914e-05, + "loss": 0.234, + "step": 33410 + }, + { + "epoch": 29.24, + "learning_rate": 8.178191489361702e-05, + "loss": 0.1775, + "step": 33420 + }, + { + "epoch": 29.25, + "learning_rate": 8.17154255319149e-05, + "loss": 0.2568, + "step": 33430 + }, + { + "epoch": 29.26, + "learning_rate": 8.164893617021276e-05, + "loss": 0.2197, + "step": 33440 + }, + { + "epoch": 29.26, + "learning_rate": 8.158244680851063e-05, + "loss": 0.2684, + "step": 33450 + }, + { + "epoch": 29.27, + "learning_rate": 8.151595744680852e-05, + "loss": 0.193, + "step": 33460 + }, + { + "epoch": 29.28, + "learning_rate": 8.144946808510639e-05, + "loss": 0.1507, + "step": 33470 + }, + { + "epoch": 29.29, + "learning_rate": 8.138297872340424e-05, + "loss": 0.2676, + "step": 33480 + }, + { + "epoch": 29.3, + "learning_rate": 8.131648936170211e-05, + "loss": 0.1801, + "step": 33490 + }, + { + "epoch": 29.31, + "learning_rate": 8.124999999999998e-05, + "loss": 0.2234, + "step": 33500 + }, + { + "epoch": 29.32, + "learning_rate": 8.118351063829787e-05, + "loss": 0.2621, + "step": 33510 + }, + { + "epoch": 29.33, + "learning_rate": 8.111702127659574e-05, + "loss": 0.1889, + "step": 33520 + }, + { + "epoch": 29.33, + "learning_rate": 8.10505319148936e-05, + "loss": 0.2506, + "step": 33530 + }, + { + "epoch": 29.34, + "learning_rate": 8.098404255319148e-05, + "loss": 0.1947, + "step": 33540 + }, + { + "epoch": 29.35, + "learning_rate": 8.091755319148936e-05, + "loss": 0.2078, + "step": 33550 + }, + { + "epoch": 29.36, + "learning_rate": 8.085106382978723e-05, + "loss": 0.21, + "step": 33560 + }, + { + "epoch": 29.37, + "learning_rate": 8.07845744680851e-05, + "loss": 0.1593, + "step": 33570 + }, + { + "epoch": 29.38, + "learning_rate": 8.071808510638297e-05, + "loss": 0.2212, + "step": 33580 + }, + { + "epoch": 29.39, + "learning_rate": 8.065159574468085e-05, + "loss": 0.19, + "step": 33590 + }, + { + "epoch": 29.4, + "learning_rate": 8.058510638297872e-05, + "loss": 0.2509, + "step": 33600 + }, + { + "epoch": 29.4, + "eval_cer1": 0.2500253198744134, + "eval_cer2": 0.23245283018867924, + "eval_cer3": 0.2085592943482522, + "eval_cer4": 0.20979426253259925, + "eval_cer5": 0.23923566878980893, + "eval_loss": 1.024003505706787, + "eval_runtime": 1456.5951, + "eval_samples_per_second": 6.014, + "step": 33600 + }, + { + "epoch": 29.4, + "learning_rate": 8.051861702127659e-05, + "loss": 0.2267, + "step": 33610 + }, + { + "epoch": 29.41, + "learning_rate": 8.045212765957446e-05, + "loss": 0.1334, + "step": 33620 + }, + { + "epoch": 29.42, + "learning_rate": 8.038563829787235e-05, + "loss": 0.2582, + "step": 33630 + }, + { + "epoch": 29.43, + "learning_rate": 8.031914893617021e-05, + "loss": 0.1532, + "step": 33640 + }, + { + "epoch": 29.44, + "learning_rate": 8.025265957446807e-05, + "loss": 0.1622, + "step": 33650 + }, + { + "epoch": 29.45, + "learning_rate": 8.018617021276594e-05, + "loss": 0.2012, + "step": 33660 + }, + { + "epoch": 29.46, + "learning_rate": 8.011968085106381e-05, + "loss": 0.1545, + "step": 33670 + }, + { + "epoch": 29.47, + "learning_rate": 8.00531914893617e-05, + "loss": 0.2547, + "step": 33680 + }, + { + "epoch": 29.47, + "learning_rate": 7.998670212765956e-05, + "loss": 0.2239, + "step": 33690 + }, + { + "epoch": 29.48, + "learning_rate": 7.992021276595743e-05, + "loss": 0.1635, + "step": 33700 + }, + { + "epoch": 29.49, + "learning_rate": 7.98537234042553e-05, + "loss": 0.2212, + "step": 33710 + }, + { + "epoch": 29.5, + "learning_rate": 7.978723404255319e-05, + "loss": 0.1767, + "step": 33720 + }, + { + "epoch": 29.51, + "learning_rate": 7.972074468085106e-05, + "loss": 0.2599, + "step": 33730 + }, + { + "epoch": 29.52, + "learning_rate": 7.965425531914893e-05, + "loss": 0.1697, + "step": 33740 + }, + { + "epoch": 29.53, + "learning_rate": 7.95877659574468e-05, + "loss": 0.2097, + "step": 33750 + }, + { + "epoch": 29.54, + "learning_rate": 7.952127659574468e-05, + "loss": 0.1848, + "step": 33760 + }, + { + "epoch": 29.54, + "learning_rate": 7.945478723404255e-05, + "loss": 0.1143, + "step": 33770 + }, + { + "epoch": 29.55, + "learning_rate": 7.938829787234042e-05, + "loss": 0.2369, + "step": 33780 + }, + { + "epoch": 29.56, + "learning_rate": 7.932180851063829e-05, + "loss": 0.1898, + "step": 33790 + }, + { + "epoch": 29.57, + "learning_rate": 7.925531914893617e-05, + "loss": 0.2223, + "step": 33800 + }, + { + "epoch": 29.58, + "learning_rate": 7.918882978723404e-05, + "loss": 0.2357, + "step": 33810 + }, + { + "epoch": 29.59, + "learning_rate": 7.912234042553191e-05, + "loss": 0.1632, + "step": 33820 + }, + { + "epoch": 29.6, + "learning_rate": 7.905585106382977e-05, + "loss": 0.2716, + "step": 33830 + }, + { + "epoch": 29.61, + "learning_rate": 7.898936170212764e-05, + "loss": 0.1898, + "step": 33840 + }, + { + "epoch": 29.61, + "learning_rate": 7.892287234042552e-05, + "loss": 0.2387, + "step": 33850 + }, + { + "epoch": 29.62, + "learning_rate": 7.885638297872339e-05, + "loss": 0.2356, + "step": 33860 + }, + { + "epoch": 29.63, + "learning_rate": 7.878989361702126e-05, + "loss": 0.1348, + "step": 33870 + }, + { + "epoch": 29.64, + "learning_rate": 7.872340425531915e-05, + "loss": 0.2727, + "step": 33880 + }, + { + "epoch": 29.65, + "learning_rate": 7.865691489361702e-05, + "loss": 0.1605, + "step": 33890 + }, + { + "epoch": 29.66, + "learning_rate": 7.859042553191489e-05, + "loss": 0.2063, + "step": 33900 + }, + { + "epoch": 29.67, + "learning_rate": 7.852393617021276e-05, + "loss": 0.2162, + "step": 33910 + }, + { + "epoch": 29.68, + "learning_rate": 7.845744680851064e-05, + "loss": 0.1417, + "step": 33920 + }, + { + "epoch": 29.68, + "learning_rate": 7.839095744680851e-05, + "loss": 0.2569, + "step": 33930 + }, + { + "epoch": 29.69, + "learning_rate": 7.832446808510638e-05, + "loss": 0.1614, + "step": 33940 + }, + { + "epoch": 29.7, + "learning_rate": 7.825797872340425e-05, + "loss": 0.2097, + "step": 33950 + }, + { + "epoch": 29.71, + "learning_rate": 7.819148936170213e-05, + "loss": 0.2294, + "step": 33960 + }, + { + "epoch": 29.72, + "learning_rate": 7.8125e-05, + "loss": 0.1658, + "step": 33970 + }, + { + "epoch": 29.73, + "learning_rate": 7.805851063829787e-05, + "loss": 0.2696, + "step": 33980 + }, + { + "epoch": 29.74, + "learning_rate": 7.799202127659574e-05, + "loss": 0.1842, + "step": 33990 + }, + { + "epoch": 29.75, + "learning_rate": 7.79255319148936e-05, + "loss": 0.245, + "step": 34000 + }, + { + "epoch": 29.75, + "learning_rate": 7.785904255319148e-05, + "loss": 0.203, + "step": 34010 + }, + { + "epoch": 29.76, + "learning_rate": 7.779255319148935e-05, + "loss": 0.1773, + "step": 34020 + }, + { + "epoch": 29.77, + "learning_rate": 7.772606382978722e-05, + "loss": 0.2509, + "step": 34030 + }, + { + "epoch": 29.78, + "learning_rate": 7.765957446808509e-05, + "loss": 0.1625, + "step": 34040 + }, + { + "epoch": 29.79, + "learning_rate": 7.759308510638297e-05, + "loss": 0.1995, + "step": 34050 + }, + { + "epoch": 29.8, + "learning_rate": 7.752659574468084e-05, + "loss": 0.2076, + "step": 34060 + }, + { + "epoch": 29.81, + "learning_rate": 7.746010638297871e-05, + "loss": 0.1542, + "step": 34070 + }, + { + "epoch": 29.82, + "learning_rate": 7.739361702127658e-05, + "loss": 0.244, + "step": 34080 + }, + { + "epoch": 29.82, + "learning_rate": 7.732712765957447e-05, + "loss": 0.1696, + "step": 34090 + }, + { + "epoch": 29.83, + "learning_rate": 7.726063829787234e-05, + "loss": 0.2242, + "step": 34100 + }, + { + "epoch": 29.84, + "learning_rate": 7.71941489361702e-05, + "loss": 0.2145, + "step": 34110 + }, + { + "epoch": 29.85, + "learning_rate": 7.712765957446808e-05, + "loss": 0.2206, + "step": 34120 + }, + { + "epoch": 29.86, + "learning_rate": 7.706117021276596e-05, + "loss": 0.2733, + "step": 34130 + }, + { + "epoch": 29.87, + "learning_rate": 7.699468085106383e-05, + "loss": 0.2063, + "step": 34140 + }, + { + "epoch": 29.88, + "learning_rate": 7.69281914893617e-05, + "loss": 0.1992, + "step": 34150 + }, + { + "epoch": 29.89, + "learning_rate": 7.686170212765957e-05, + "loss": 0.234, + "step": 34160 + }, + { + "epoch": 29.89, + "learning_rate": 7.679521276595745e-05, + "loss": 0.1824, + "step": 34170 + }, + { + "epoch": 29.9, + "learning_rate": 7.672872340425531e-05, + "loss": 0.2341, + "step": 34180 + }, + { + "epoch": 29.91, + "learning_rate": 7.666223404255318e-05, + "loss": 0.1896, + "step": 34190 + }, + { + "epoch": 29.92, + "learning_rate": 7.659574468085105e-05, + "loss": 0.1796, + "step": 34200 + }, + { + "epoch": 29.92, + "eval_cer1": 0.251274433678809, + "eval_cer2": 0.22956521739130434, + "eval_cer3": 0.20859196341065012, + "eval_cer4": 0.2114041018706333, + "eval_cer5": 0.2356687898089172, + "eval_loss": 1.0192776918411255, + "eval_runtime": 1443.2517, + "eval_samples_per_second": 6.07, + "step": 34200 + }, + { + "epoch": 29.93, + "learning_rate": 7.652925531914892e-05, + "loss": 0.277, + "step": 34210 + }, + { + "epoch": 29.94, + "learning_rate": 7.64627659574468e-05, + "loss": 0.1345, + "step": 34220 + }, + { + "epoch": 29.95, + "learning_rate": 7.639627659574467e-05, + "loss": 0.2297, + "step": 34230 + }, + { + "epoch": 29.96, + "learning_rate": 7.632978723404254e-05, + "loss": 0.1807, + "step": 34240 + }, + { + "epoch": 29.96, + "learning_rate": 7.626329787234041e-05, + "loss": 0.1728, + "step": 34250 + }, + { + "epoch": 29.97, + "learning_rate": 7.61968085106383e-05, + "loss": 0.2002, + "step": 34260 + }, + { + "epoch": 29.98, + "learning_rate": 7.613031914893617e-05, + "loss": 0.1273, + "step": 34270 + }, + { + "epoch": 29.99, + "learning_rate": 7.606382978723404e-05, + "loss": 0.216, + "step": 34280 + }, + { + "epoch": 30.0, + "learning_rate": 7.59973404255319e-05, + "loss": 0.1523, + "step": 34290 + }, + { + "epoch": 30.01, + "learning_rate": 7.593085106382979e-05, + "loss": 0.2616, + "step": 34300 + }, + { + "epoch": 30.02, + "learning_rate": 7.586436170212766e-05, + "loss": 0.1171, + "step": 34310 + }, + { + "epoch": 30.03, + "learning_rate": 7.579787234042553e-05, + "loss": 0.1971, + "step": 34320 + }, + { + "epoch": 30.03, + "learning_rate": 7.57313829787234e-05, + "loss": 0.2014, + "step": 34330 + }, + { + "epoch": 30.04, + "learning_rate": 7.566489361702128e-05, + "loss": 0.1554, + "step": 34340 + }, + { + "epoch": 30.05, + "learning_rate": 7.559840425531915e-05, + "loss": 0.2091, + "step": 34350 + }, + { + "epoch": 30.06, + "learning_rate": 7.553191489361701e-05, + "loss": 0.1912, + "step": 34360 + }, + { + "epoch": 30.07, + "learning_rate": 7.546542553191488e-05, + "loss": 0.2322, + "step": 34370 + }, + { + "epoch": 30.08, + "learning_rate": 7.539893617021275e-05, + "loss": 0.1863, + "step": 34380 + }, + { + "epoch": 30.09, + "learning_rate": 7.533244680851063e-05, + "loss": 0.14, + "step": 34390 + }, + { + "epoch": 30.1, + "learning_rate": 7.52659574468085e-05, + "loss": 0.2368, + "step": 34400 + }, + { + "epoch": 30.1, + "learning_rate": 7.519946808510637e-05, + "loss": 0.167, + "step": 34410 + }, + { + "epoch": 30.11, + "learning_rate": 7.513297872340424e-05, + "loss": 0.1898, + "step": 34420 + }, + { + "epoch": 30.12, + "learning_rate": 7.506648936170212e-05, + "loss": 0.1717, + "step": 34430 + }, + { + "epoch": 30.13, + "learning_rate": 7.5e-05, + "loss": 0.1582, + "step": 34440 + }, + { + "epoch": 30.14, + "learning_rate": 7.493351063829786e-05, + "loss": 0.2903, + "step": 34450 + }, + { + "epoch": 30.15, + "learning_rate": 7.486702127659575e-05, + "loss": 0.1414, + "step": 34460 + }, + { + "epoch": 30.16, + "learning_rate": 7.480053191489362e-05, + "loss": 0.2035, + "step": 34470 + }, + { + "epoch": 30.17, + "learning_rate": 7.473404255319149e-05, + "loss": 0.1856, + "step": 34480 + }, + { + "epoch": 30.17, + "learning_rate": 7.466755319148936e-05, + "loss": 0.1483, + "step": 34490 + }, + { + "epoch": 30.18, + "learning_rate": 7.460106382978723e-05, + "loss": 0.2859, + "step": 34500 + }, + { + "epoch": 30.19, + "learning_rate": 7.45345744680851e-05, + "loss": 0.1655, + "step": 34510 + }, + { + "epoch": 30.2, + "learning_rate": 7.446808510638297e-05, + "loss": 0.247, + "step": 34520 + }, + { + "epoch": 30.21, + "learning_rate": 7.440159574468085e-05, + "loss": 0.1813, + "step": 34530 + }, + { + "epoch": 30.22, + "learning_rate": 7.433510638297872e-05, + "loss": 0.203, + "step": 34540 + }, + { + "epoch": 30.23, + "learning_rate": 7.426861702127659e-05, + "loss": 0.2259, + "step": 34550 + }, + { + "epoch": 30.24, + "learning_rate": 7.420212765957446e-05, + "loss": 0.1762, + "step": 34560 + }, + { + "epoch": 30.24, + "learning_rate": 7.413563829787234e-05, + "loss": 0.2374, + "step": 34570 + }, + { + "epoch": 30.25, + "learning_rate": 7.40691489361702e-05, + "loss": 0.1781, + "step": 34580 + }, + { + "epoch": 30.26, + "learning_rate": 7.400265957446808e-05, + "loss": 0.1523, + "step": 34590 + }, + { + "epoch": 30.27, + "learning_rate": 7.393617021276595e-05, + "loss": 0.24, + "step": 34600 + }, + { + "epoch": 30.28, + "learning_rate": 7.386968085106382e-05, + "loss": 0.1327, + "step": 34610 + }, + { + "epoch": 30.29, + "learning_rate": 7.380319148936169e-05, + "loss": 0.2016, + "step": 34620 + }, + { + "epoch": 30.3, + "learning_rate": 7.373670212765957e-05, + "loss": 0.1542, + "step": 34630 + }, + { + "epoch": 30.31, + "learning_rate": 7.367021276595744e-05, + "loss": 0.1105, + "step": 34640 + }, + { + "epoch": 30.31, + "learning_rate": 7.360372340425531e-05, + "loss": 0.281, + "step": 34650 + }, + { + "epoch": 30.32, + "learning_rate": 7.353723404255318e-05, + "loss": 0.1521, + "step": 34660 + }, + { + "epoch": 30.33, + "learning_rate": 7.347074468085105e-05, + "loss": 0.2439, + "step": 34670 + }, + { + "epoch": 30.34, + "learning_rate": 7.340425531914892e-05, + "loss": 0.2121, + "step": 34680 + }, + { + "epoch": 30.35, + "learning_rate": 7.33377659574468e-05, + "loss": 0.1283, + "step": 34690 + }, + { + "epoch": 30.36, + "learning_rate": 7.327127659574468e-05, + "loss": 0.271, + "step": 34700 + }, + { + "epoch": 30.37, + "learning_rate": 7.320478723404255e-05, + "loss": 0.1568, + "step": 34710 + }, + { + "epoch": 30.38, + "learning_rate": 7.313829787234042e-05, + "loss": 0.244, + "step": 34720 + }, + { + "epoch": 30.38, + "learning_rate": 7.30718085106383e-05, + "loss": 0.1979, + "step": 34730 + }, + { + "epoch": 30.39, + "learning_rate": 7.300531914893617e-05, + "loss": 0.1656, + "step": 34740 + }, + { + "epoch": 30.4, + "learning_rate": 7.293882978723403e-05, + "loss": 0.2802, + "step": 34750 + }, + { + "epoch": 30.41, + "learning_rate": 7.287234042553191e-05, + "loss": 0.1753, + "step": 34760 + }, + { + "epoch": 30.42, + "learning_rate": 7.280585106382978e-05, + "loss": 0.2025, + "step": 34770 + }, + { + "epoch": 30.43, + "learning_rate": 7.273936170212765e-05, + "loss": 0.1858, + "step": 34780 + }, + { + "epoch": 30.44, + "learning_rate": 7.267287234042552e-05, + "loss": 0.1386, + "step": 34790 + }, + { + "epoch": 30.45, + "learning_rate": 7.26063829787234e-05, + "loss": 0.2326, + "step": 34800 + }, + { + "epoch": 30.45, + "eval_cer1": 0.2481347692515445, + "eval_cer2": 0.2269729286300246, + "eval_cer3": 0.20878797778503758, + "eval_cer4": 0.2079590456872404, + "eval_cer5": 0.23447983014861995, + "eval_loss": 1.0198484659194946, + "eval_runtime": 1437.4715, + "eval_samples_per_second": 6.094, + "step": 34800 + }, + { + "epoch": 30.45, + "learning_rate": 7.253989361702127e-05, + "loss": 0.1268, + "step": 34810 + }, + { + "epoch": 30.46, + "learning_rate": 7.247340425531914e-05, + "loss": 0.2117, + "step": 34820 + }, + { + "epoch": 30.47, + "learning_rate": 7.240691489361701e-05, + "loss": 0.1934, + "step": 34830 + }, + { + "epoch": 30.48, + "learning_rate": 7.234042553191488e-05, + "loss": 0.1513, + "step": 34840 + }, + { + "epoch": 30.49, + "learning_rate": 7.227393617021275e-05, + "loss": 0.3037, + "step": 34850 + }, + { + "epoch": 30.5, + "learning_rate": 7.220744680851064e-05, + "loss": 0.1452, + "step": 34860 + }, + { + "epoch": 30.51, + "learning_rate": 7.21409574468085e-05, + "loss": 0.2373, + "step": 34870 + }, + { + "epoch": 30.52, + "learning_rate": 7.207446808510638e-05, + "loss": 0.1649, + "step": 34880 + }, + { + "epoch": 30.52, + "learning_rate": 7.200797872340425e-05, + "loss": 0.1545, + "step": 34890 + }, + { + "epoch": 30.53, + "learning_rate": 7.194148936170213e-05, + "loss": 0.2858, + "step": 34900 + }, + { + "epoch": 30.54, + "learning_rate": 7.1875e-05, + "loss": 0.1672, + "step": 34910 + }, + { + "epoch": 30.55, + "learning_rate": 7.180851063829787e-05, + "loss": 0.2481, + "step": 34920 + }, + { + "epoch": 30.56, + "learning_rate": 7.174202127659574e-05, + "loss": 0.1707, + "step": 34930 + }, + { + "epoch": 30.57, + "learning_rate": 7.167553191489361e-05, + "loss": 0.1076, + "step": 34940 + }, + { + "epoch": 30.58, + "learning_rate": 7.160904255319148e-05, + "loss": 0.2822, + "step": 34950 + }, + { + "epoch": 30.59, + "learning_rate": 7.154255319148935e-05, + "loss": 0.1514, + "step": 34960 + }, + { + "epoch": 30.59, + "learning_rate": 7.147606382978723e-05, + "loss": 0.208, + "step": 34970 + }, + { + "epoch": 30.6, + "learning_rate": 7.14095744680851e-05, + "loss": 0.1355, + "step": 34980 + }, + { + "epoch": 30.61, + "learning_rate": 7.134308510638297e-05, + "loss": 0.1348, + "step": 34990 + }, + { + "epoch": 30.62, + "learning_rate": 7.127659574468084e-05, + "loss": 0.269, + "step": 35000 + }, + { + "epoch": 30.63, + "learning_rate": 7.121010638297872e-05, + "loss": 0.1873, + "step": 35010 + }, + { + "epoch": 30.64, + "learning_rate": 7.114361702127658e-05, + "loss": 0.1941, + "step": 35020 + }, + { + "epoch": 30.65, + "learning_rate": 7.107712765957446e-05, + "loss": 0.1862, + "step": 35030 + }, + { + "epoch": 30.66, + "learning_rate": 7.101063829787233e-05, + "loss": 0.1445, + "step": 35040 + }, + { + "epoch": 30.66, + "learning_rate": 7.09441489361702e-05, + "loss": 0.2834, + "step": 35050 + }, + { + "epoch": 30.67, + "learning_rate": 7.087765957446807e-05, + "loss": 0.1387, + "step": 35060 + }, + { + "epoch": 30.68, + "learning_rate": 7.081117021276596e-05, + "loss": 0.1995, + "step": 35070 + }, + { + "epoch": 30.69, + "learning_rate": 7.074468085106383e-05, + "loss": 0.2047, + "step": 35080 + }, + { + "epoch": 30.7, + "learning_rate": 7.06781914893617e-05, + "loss": 0.1808, + "step": 35090 + }, + { + "epoch": 30.71, + "learning_rate": 7.061170212765957e-05, + "loss": 0.2809, + "step": 35100 + }, + { + "epoch": 30.72, + "learning_rate": 7.054521276595744e-05, + "loss": 0.1712, + "step": 35110 + }, + { + "epoch": 30.73, + "learning_rate": 7.04787234042553e-05, + "loss": 0.2072, + "step": 35120 + }, + { + "epoch": 30.73, + "learning_rate": 7.041223404255319e-05, + "loss": 0.1787, + "step": 35130 + }, + { + "epoch": 30.74, + "learning_rate": 7.034574468085106e-05, + "loss": 0.1476, + "step": 35140 + }, + { + "epoch": 30.75, + "learning_rate": 7.027925531914893e-05, + "loss": 0.2687, + "step": 35150 + }, + { + "epoch": 30.76, + "learning_rate": 7.02127659574468e-05, + "loss": 0.1377, + "step": 35160 + }, + { + "epoch": 30.77, + "learning_rate": 7.014627659574468e-05, + "loss": 0.1818, + "step": 35170 + }, + { + "epoch": 30.78, + "learning_rate": 7.007978723404255e-05, + "loss": 0.1543, + "step": 35180 + }, + { + "epoch": 30.79, + "learning_rate": 7.001329787234041e-05, + "loss": 0.1378, + "step": 35190 + }, + { + "epoch": 30.8, + "learning_rate": 6.994680851063829e-05, + "loss": 0.2284, + "step": 35200 + }, + { + "epoch": 30.8, + "learning_rate": 6.988031914893616e-05, + "loss": 0.1551, + "step": 35210 + }, + { + "epoch": 30.81, + "learning_rate": 6.981382978723403e-05, + "loss": 0.2366, + "step": 35220 + }, + { + "epoch": 30.82, + "learning_rate": 6.97473404255319e-05, + "loss": 0.1739, + "step": 35230 + }, + { + "epoch": 30.83, + "learning_rate": 6.968085106382979e-05, + "loss": 0.1512, + "step": 35240 + }, + { + "epoch": 30.84, + "learning_rate": 6.961436170212766e-05, + "loss": 0.2759, + "step": 35250 + }, + { + "epoch": 30.85, + "learning_rate": 6.954787234042553e-05, + "loss": 0.1957, + "step": 35260 + }, + { + "epoch": 30.86, + "learning_rate": 6.94813829787234e-05, + "loss": 0.1962, + "step": 35270 + }, + { + "epoch": 30.87, + "learning_rate": 6.941489361702126e-05, + "loss": 0.1991, + "step": 35280 + }, + { + "epoch": 30.87, + "learning_rate": 6.934840425531913e-05, + "loss": 0.1228, + "step": 35290 + }, + { + "epoch": 30.88, + "learning_rate": 6.928191489361702e-05, + "loss": 0.2481, + "step": 35300 + }, + { + "epoch": 30.89, + "learning_rate": 6.921542553191489e-05, + "loss": 0.1411, + "step": 35310 + }, + { + "epoch": 30.9, + "learning_rate": 6.914893617021276e-05, + "loss": 0.2211, + "step": 35320 + }, + { + "epoch": 30.91, + "learning_rate": 6.908244680851063e-05, + "loss": 0.1751, + "step": 35330 + }, + { + "epoch": 30.92, + "learning_rate": 6.901595744680851e-05, + "loss": 0.1508, + "step": 35340 + }, + { + "epoch": 30.93, + "learning_rate": 6.894946808510638e-05, + "loss": 0.2826, + "step": 35350 + }, + { + "epoch": 30.94, + "learning_rate": 6.888297872340425e-05, + "loss": 0.1581, + "step": 35360 + }, + { + "epoch": 30.94, + "learning_rate": 6.881648936170212e-05, + "loss": 0.1827, + "step": 35370 + }, + { + "epoch": 30.95, + "learning_rate": 6.874999999999999e-05, + "loss": 0.2392, + "step": 35380 + }, + { + "epoch": 30.96, + "learning_rate": 6.868351063829786e-05, + "loss": 0.1787, + "step": 35390 + }, + { + "epoch": 30.97, + "learning_rate": 6.861702127659574e-05, + "loss": 0.2824, + "step": 35400 + }, + { + "epoch": 30.97, + "eval_cer1": 0.24702069477735392, + "eval_cer2": 0.22720262510254308, + "eval_cer3": 0.20329957530218884, + "eval_cer4": 0.20477156379793296, + "eval_cer5": 0.23125265392781316, + "eval_loss": 1.0153509378433228, + "eval_runtime": 1450.7622, + "eval_samples_per_second": 6.038, + "step": 35400 + }, + { + "epoch": 30.98, + "learning_rate": 6.855053191489361e-05, + "loss": 0.1699, + "step": 35410 + }, + { + "epoch": 30.99, + "learning_rate": 6.848404255319148e-05, + "loss": 0.226, + "step": 35420 + }, + { + "epoch": 31.0, + "learning_rate": 6.841755319148935e-05, + "loss": 0.1506, + "step": 35430 + }, + { + "epoch": 31.01, + "learning_rate": 6.835106382978724e-05, + "loss": 0.2054, + "step": 35440 + }, + { + "epoch": 31.01, + "learning_rate": 6.82845744680851e-05, + "loss": 0.15, + "step": 35450 + }, + { + "epoch": 31.02, + "learning_rate": 6.821808510638296e-05, + "loss": 0.1999, + "step": 35460 + }, + { + "epoch": 31.03, + "learning_rate": 6.815159574468085e-05, + "loss": 0.1846, + "step": 35470 + }, + { + "epoch": 31.04, + "learning_rate": 6.808510638297872e-05, + "loss": 0.1134, + "step": 35480 + }, + { + "epoch": 31.05, + "learning_rate": 6.801861702127659e-05, + "loss": 0.1801, + "step": 35490 + }, + { + "epoch": 31.06, + "learning_rate": 6.795212765957446e-05, + "loss": 0.1895, + "step": 35500 + }, + { + "epoch": 31.07, + "learning_rate": 6.788563829787234e-05, + "loss": 0.134, + "step": 35510 + }, + { + "epoch": 31.08, + "learning_rate": 6.781914893617021e-05, + "loss": 0.2187, + "step": 35520 + }, + { + "epoch": 31.08, + "learning_rate": 6.775265957446808e-05, + "loss": 0.0919, + "step": 35530 + }, + { + "epoch": 31.09, + "learning_rate": 6.768617021276595e-05, + "loss": 0.2195, + "step": 35540 + }, + { + "epoch": 31.1, + "learning_rate": 6.761968085106382e-05, + "loss": 0.1563, + "step": 35550 + }, + { + "epoch": 31.11, + "learning_rate": 6.755319148936169e-05, + "loss": 0.1748, + "step": 35560 + }, + { + "epoch": 31.12, + "learning_rate": 6.748670212765957e-05, + "loss": 0.2085, + "step": 35570 + }, + { + "epoch": 31.13, + "learning_rate": 6.742021276595744e-05, + "loss": 0.1725, + "step": 35580 + }, + { + "epoch": 31.14, + "learning_rate": 6.735372340425531e-05, + "loss": 0.2975, + "step": 35590 + }, + { + "epoch": 31.15, + "learning_rate": 6.728723404255318e-05, + "loss": 0.2054, + "step": 35600 + }, + { + "epoch": 31.15, + "learning_rate": 6.722074468085107e-05, + "loss": 0.1407, + "step": 35610 + }, + { + "epoch": 31.16, + "learning_rate": 6.715425531914893e-05, + "loss": 0.2442, + "step": 35620 + }, + { + "epoch": 31.17, + "learning_rate": 6.70877659574468e-05, + "loss": 0.1284, + "step": 35630 + }, + { + "epoch": 31.18, + "learning_rate": 6.702127659574467e-05, + "loss": 0.2221, + "step": 35640 + }, + { + "epoch": 31.19, + "learning_rate": 6.695478723404254e-05, + "loss": 0.1394, + "step": 35650 + }, + { + "epoch": 31.2, + "learning_rate": 6.688829787234041e-05, + "loss": 0.1529, + "step": 35660 + }, + { + "epoch": 31.21, + "learning_rate": 6.68218085106383e-05, + "loss": 0.2296, + "step": 35670 + }, + { + "epoch": 31.22, + "learning_rate": 6.675531914893617e-05, + "loss": 0.1705, + "step": 35680 + }, + { + "epoch": 31.22, + "learning_rate": 6.668882978723404e-05, + "loss": 0.2917, + "step": 35690 + }, + { + "epoch": 31.23, + "learning_rate": 6.662234042553191e-05, + "loss": 0.1724, + "step": 35700 + }, + { + "epoch": 31.24, + "learning_rate": 6.655585106382979e-05, + "loss": 0.1395, + "step": 35710 + }, + { + "epoch": 31.25, + "learning_rate": 6.648936170212765e-05, + "loss": 0.1632, + "step": 35720 + }, + { + "epoch": 31.26, + "learning_rate": 6.642287234042552e-05, + "loss": 0.1604, + "step": 35730 + }, + { + "epoch": 31.27, + "learning_rate": 6.63563829787234e-05, + "loss": 0.1978, + "step": 35740 + }, + { + "epoch": 31.28, + "learning_rate": 6.628989361702127e-05, + "loss": 0.1793, + "step": 35750 + }, + { + "epoch": 31.29, + "learning_rate": 6.622340425531914e-05, + "loss": 0.123, + "step": 35760 + }, + { + "epoch": 31.29, + "learning_rate": 6.615691489361701e-05, + "loss": 0.1884, + "step": 35770 + }, + { + "epoch": 31.3, + "learning_rate": 6.60904255319149e-05, + "loss": 0.1496, + "step": 35780 + }, + { + "epoch": 31.31, + "learning_rate": 6.602393617021276e-05, + "loss": 0.2296, + "step": 35790 + }, + { + "epoch": 31.32, + "learning_rate": 6.595744680851063e-05, + "loss": 0.165, + "step": 35800 + }, + { + "epoch": 31.33, + "learning_rate": 6.58909574468085e-05, + "loss": 0.2108, + "step": 35810 + }, + { + "epoch": 31.34, + "learning_rate": 6.582446808510637e-05, + "loss": 0.204, + "step": 35820 + }, + { + "epoch": 31.35, + "learning_rate": 6.575797872340424e-05, + "loss": 0.104, + "step": 35830 + }, + { + "epoch": 31.36, + "learning_rate": 6.569148936170213e-05, + "loss": 0.2232, + "step": 35840 + }, + { + "epoch": 31.36, + "learning_rate": 6.5625e-05, + "loss": 0.1981, + "step": 35850 + }, + { + "epoch": 31.37, + "learning_rate": 6.555851063829787e-05, + "loss": 0.1674, + "step": 35860 + }, + { + "epoch": 31.38, + "learning_rate": 6.549202127659574e-05, + "loss": 0.1891, + "step": 35870 + }, + { + "epoch": 31.39, + "learning_rate": 6.542553191489362e-05, + "loss": 0.1355, + "step": 35880 + }, + { + "epoch": 31.4, + "learning_rate": 6.535904255319149e-05, + "loss": 0.2609, + "step": 35890 + }, + { + "epoch": 31.41, + "learning_rate": 6.529255319148936e-05, + "loss": 0.1735, + "step": 35900 + }, + { + "epoch": 31.42, + "learning_rate": 6.522606382978723e-05, + "loss": 0.2064, + "step": 35910 + }, + { + "epoch": 31.43, + "learning_rate": 6.51595744680851e-05, + "loss": 0.1905, + "step": 35920 + }, + { + "epoch": 31.43, + "learning_rate": 6.509308510638297e-05, + "loss": 0.1303, + "step": 35930 + }, + { + "epoch": 31.44, + "learning_rate": 6.502659574468085e-05, + "loss": 0.2222, + "step": 35940 + }, + { + "epoch": 31.45, + "learning_rate": 6.496010638297872e-05, + "loss": 0.162, + "step": 35950 + }, + { + "epoch": 31.46, + "learning_rate": 6.489361702127659e-05, + "loss": 0.1872, + "step": 35960 + }, + { + "epoch": 31.47, + "learning_rate": 6.482712765957446e-05, + "loss": 0.209, + "step": 35970 + }, + { + "epoch": 31.48, + "learning_rate": 6.476063829787234e-05, + "loss": 0.1518, + "step": 35980 + }, + { + "epoch": 31.49, + "learning_rate": 6.46941489361702e-05, + "loss": 0.2252, + "step": 35990 + }, + { + "epoch": 31.5, + "learning_rate": 6.462765957446807e-05, + "loss": 0.1863, + "step": 36000 + }, + { + "epoch": 31.5, + "eval_cer1": 0.2479997299213396, + "eval_cer2": 0.22887612797374898, + "eval_cer3": 0.20476968311009475, + "eval_cer4": 0.20528671238610385, + "eval_cer5": 0.2315923566878981, + "eval_loss": 1.0220904350280762, + "eval_runtime": 1458.0447, + "eval_samples_per_second": 6.008, + "step": 36000 + }, + { + "epoch": 31.5, + "learning_rate": 6.456117021276595e-05, + "loss": 0.1989, + "step": 36010 + }, + { + "epoch": 31.51, + "learning_rate": 6.449468085106382e-05, + "loss": 0.2102, + "step": 36020 + }, + { + "epoch": 31.52, + "learning_rate": 6.44281914893617e-05, + "loss": 0.1113, + "step": 36030 + }, + { + "epoch": 31.53, + "learning_rate": 6.436170212765956e-05, + "loss": 0.1909, + "step": 36040 + }, + { + "epoch": 31.54, + "learning_rate": 6.429521276595745e-05, + "loss": 0.182, + "step": 36050 + }, + { + "epoch": 31.55, + "learning_rate": 6.422872340425532e-05, + "loss": 0.2008, + "step": 36060 + }, + { + "epoch": 31.56, + "learning_rate": 6.416223404255319e-05, + "loss": 0.1781, + "step": 36070 + }, + { + "epoch": 31.57, + "learning_rate": 6.409574468085106e-05, + "loss": 0.1572, + "step": 36080 + }, + { + "epoch": 31.57, + "learning_rate": 6.402925531914893e-05, + "loss": 0.2777, + "step": 36090 + }, + { + "epoch": 31.58, + "learning_rate": 6.39627659574468e-05, + "loss": 0.1278, + "step": 36100 + }, + { + "epoch": 31.59, + "learning_rate": 6.389627659574468e-05, + "loss": 0.202, + "step": 36110 + }, + { + "epoch": 31.6, + "learning_rate": 6.382978723404255e-05, + "loss": 0.2236, + "step": 36120 + }, + { + "epoch": 31.61, + "learning_rate": 6.376329787234042e-05, + "loss": 0.142, + "step": 36130 + }, + { + "epoch": 31.62, + "learning_rate": 6.369680851063829e-05, + "loss": 0.1975, + "step": 36140 + }, + { + "epoch": 31.63, + "learning_rate": 6.363031914893617e-05, + "loss": 0.1676, + "step": 36150 + }, + { + "epoch": 31.64, + "learning_rate": 6.356382978723403e-05, + "loss": 0.1689, + "step": 36160 + }, + { + "epoch": 31.64, + "learning_rate": 6.349734042553191e-05, + "loss": 0.2285, + "step": 36170 + }, + { + "epoch": 31.65, + "learning_rate": 6.343085106382978e-05, + "loss": 0.155, + "step": 36180 + }, + { + "epoch": 31.66, + "learning_rate": 6.336436170212765e-05, + "loss": 0.2309, + "step": 36190 + }, + { + "epoch": 31.67, + "learning_rate": 6.329787234042552e-05, + "loss": 0.184, + "step": 36200 + }, + { + "epoch": 31.68, + "learning_rate": 6.32313829787234e-05, + "loss": 0.1826, + "step": 36210 + }, + { + "epoch": 31.69, + "learning_rate": 6.316489361702128e-05, + "loss": 0.2212, + "step": 36220 + }, + { + "epoch": 31.7, + "learning_rate": 6.309840425531915e-05, + "loss": 0.159, + "step": 36230 + }, + { + "epoch": 31.71, + "learning_rate": 6.303191489361702e-05, + "loss": 0.2025, + "step": 36240 + }, + { + "epoch": 31.71, + "learning_rate": 6.296542553191489e-05, + "loss": 0.1542, + "step": 36250 + }, + { + "epoch": 31.72, + "learning_rate": 6.289893617021276e-05, + "loss": 0.1288, + "step": 36260 + }, + { + "epoch": 31.73, + "learning_rate": 6.283244680851062e-05, + "loss": 0.2373, + "step": 36270 + }, + { + "epoch": 31.74, + "learning_rate": 6.276595744680851e-05, + "loss": 0.1383, + "step": 36280 + }, + { + "epoch": 31.75, + "learning_rate": 6.269946808510638e-05, + "loss": 0.2086, + "step": 36290 + }, + { + "epoch": 31.76, + "learning_rate": 6.263297872340425e-05, + "loss": 0.1667, + "step": 36300 + }, + { + "epoch": 31.77, + "learning_rate": 6.256648936170212e-05, + "loss": 0.1908, + "step": 36310 + }, + { + "epoch": 31.78, + "learning_rate": 6.25e-05, + "loss": 0.1785, + "step": 36320 + }, + { + "epoch": 31.78, + "learning_rate": 6.243351063829787e-05, + "loss": 0.1587, + "step": 36330 + }, + { + "epoch": 31.79, + "learning_rate": 6.236702127659574e-05, + "loss": 0.2122, + "step": 36340 + }, + { + "epoch": 31.8, + "learning_rate": 6.230053191489361e-05, + "loss": 0.1425, + "step": 36350 + }, + { + "epoch": 31.81, + "learning_rate": 6.223404255319148e-05, + "loss": 0.1536, + "step": 36360 + }, + { + "epoch": 31.82, + "learning_rate": 6.216755319148935e-05, + "loss": 0.2013, + "step": 36370 + }, + { + "epoch": 31.83, + "learning_rate": 6.210106382978723e-05, + "loss": 0.1377, + "step": 36380 + }, + { + "epoch": 31.84, + "learning_rate": 6.20345744680851e-05, + "loss": 0.2839, + "step": 36390 + }, + { + "epoch": 31.85, + "learning_rate": 6.196808510638297e-05, + "loss": 0.1767, + "step": 36400 + }, + { + "epoch": 31.85, + "learning_rate": 6.190159574468084e-05, + "loss": 0.1591, + "step": 36410 + }, + { + "epoch": 31.86, + "learning_rate": 6.183510638297873e-05, + "loss": 0.2181, + "step": 36420 + }, + { + "epoch": 31.87, + "learning_rate": 6.176861702127658e-05, + "loss": 0.1447, + "step": 36430 + }, + { + "epoch": 31.88, + "learning_rate": 6.170212765957447e-05, + "loss": 0.1884, + "step": 36440 + }, + { + "epoch": 31.89, + "learning_rate": 6.163563829787234e-05, + "loss": 0.1618, + "step": 36450 + }, + { + "epoch": 31.9, + "learning_rate": 6.15691489361702e-05, + "loss": 0.1807, + "step": 36460 + }, + { + "epoch": 31.91, + "learning_rate": 6.150265957446808e-05, + "loss": 0.2381, + "step": 36470 + }, + { + "epoch": 31.92, + "learning_rate": 6.143617021276596e-05, + "loss": 0.1733, + "step": 36480 + }, + { + "epoch": 31.92, + "learning_rate": 6.136968085106383e-05, + "loss": 0.2248, + "step": 36490 + }, + { + "epoch": 31.93, + "learning_rate": 6.13031914893617e-05, + "loss": 0.1572, + "step": 36500 + }, + { + "epoch": 31.94, + "learning_rate": 6.123670212765957e-05, + "loss": 0.1851, + "step": 36510 + }, + { + "epoch": 31.95, + "learning_rate": 6.117021276595744e-05, + "loss": 0.1769, + "step": 36520 + }, + { + "epoch": 31.96, + "learning_rate": 6.110372340425531e-05, + "loss": 0.2028, + "step": 36530 + }, + { + "epoch": 31.97, + "learning_rate": 6.103723404255318e-05, + "loss": 0.2211, + "step": 36540 + }, + { + "epoch": 31.98, + "learning_rate": 6.0970744680851055e-05, + "loss": 0.1515, + "step": 36550 + }, + { + "epoch": 31.99, + "learning_rate": 6.090425531914893e-05, + "loss": 0.2036, + "step": 36560 + }, + { + "epoch": 31.99, + "learning_rate": 6.08377659574468e-05, + "loss": 0.2045, + "step": 36570 + }, + { + "epoch": 32.0, + "learning_rate": 6.077127659574468e-05, + "loss": 0.1668, + "step": 36580 + }, + { + "epoch": 32.01, + "learning_rate": 6.070478723404255e-05, + "loss": 0.1838, + "step": 36590 + }, + { + "epoch": 32.02, + "learning_rate": 6.063829787234042e-05, + "loss": 0.1024, + "step": 36600 + }, + { + "epoch": 32.02, + "eval_cer1": 0.24729077343776376, + "eval_cer2": 0.22572600492206726, + "eval_cer3": 0.20369160405096373, + "eval_cer4": 0.2060594352683602, + "eval_cer5": 0.22980891719745222, + "eval_loss": 1.019065499305725, + "eval_runtime": 1491.6188, + "eval_samples_per_second": 5.873, + "step": 36600 + }, + { + "epoch": 32.03, + "learning_rate": 6.057180851063829e-05, + "loss": 0.1933, + "step": 36610 + }, + { + "epoch": 32.04, + "learning_rate": 6.0505319148936165e-05, + "loss": 0.1016, + "step": 36620 + }, + { + "epoch": 32.05, + "learning_rate": 6.0438829787234035e-05, + "loss": 0.1433, + "step": 36630 + }, + { + "epoch": 32.06, + "learning_rate": 6.037234042553191e-05, + "loss": 0.1493, + "step": 36640 + }, + { + "epoch": 32.06, + "learning_rate": 6.030585106382978e-05, + "loss": 0.1335, + "step": 36650 + }, + { + "epoch": 32.07, + "learning_rate": 6.023936170212766e-05, + "loss": 0.197, + "step": 36660 + }, + { + "epoch": 32.08, + "learning_rate": 6.017287234042553e-05, + "loss": 0.1322, + "step": 36670 + }, + { + "epoch": 32.09, + "learning_rate": 6.0106382978723404e-05, + "loss": 0.2164, + "step": 36680 + }, + { + "epoch": 32.1, + "learning_rate": 6.003989361702127e-05, + "loss": 0.1514, + "step": 36690 + }, + { + "epoch": 32.11, + "learning_rate": 5.9973404255319144e-05, + "loss": 0.1264, + "step": 36700 + }, + { + "epoch": 32.12, + "learning_rate": 5.9906914893617014e-05, + "loss": 0.228, + "step": 36710 + }, + { + "epoch": 32.13, + "learning_rate": 5.984042553191489e-05, + "loss": 0.1296, + "step": 36720 + }, + { + "epoch": 32.13, + "learning_rate": 5.977393617021276e-05, + "loss": 0.1667, + "step": 36730 + }, + { + "epoch": 32.14, + "learning_rate": 5.970744680851064e-05, + "loss": 0.1611, + "step": 36740 + }, + { + "epoch": 32.15, + "learning_rate": 5.964095744680851e-05, + "loss": 0.1183, + "step": 36750 + }, + { + "epoch": 32.16, + "learning_rate": 5.9574468085106384e-05, + "loss": 0.2053, + "step": 36760 + }, + { + "epoch": 32.17, + "learning_rate": 5.950797872340425e-05, + "loss": 0.1081, + "step": 36770 + }, + { + "epoch": 32.18, + "learning_rate": 5.9441489361702116e-05, + "loss": 0.1968, + "step": 36780 + }, + { + "epoch": 32.19, + "learning_rate": 5.937499999999999e-05, + "loss": 0.2182, + "step": 36790 + }, + { + "epoch": 32.2, + "learning_rate": 5.930851063829786e-05, + "loss": 0.1266, + "step": 36800 + }, + { + "epoch": 32.2, + "learning_rate": 5.924202127659574e-05, + "loss": 0.2033, + "step": 36810 + }, + { + "epoch": 32.21, + "learning_rate": 5.917553191489361e-05, + "loss": 0.1534, + "step": 36820 + }, + { + "epoch": 32.22, + "learning_rate": 5.9109042553191486e-05, + "loss": 0.2102, + "step": 36830 + }, + { + "epoch": 32.23, + "learning_rate": 5.9042553191489356e-05, + "loss": 0.1747, + "step": 36840 + }, + { + "epoch": 32.24, + "learning_rate": 5.897606382978723e-05, + "loss": 0.1205, + "step": 36850 + }, + { + "epoch": 32.25, + "learning_rate": 5.89095744680851e-05, + "loss": 0.2197, + "step": 36860 + }, + { + "epoch": 32.26, + "learning_rate": 5.884308510638297e-05, + "loss": 0.1485, + "step": 36870 + }, + { + "epoch": 32.27, + "learning_rate": 5.877659574468084e-05, + "loss": 0.175, + "step": 36880 + }, + { + "epoch": 32.27, + "learning_rate": 5.871010638297872e-05, + "loss": 0.1541, + "step": 36890 + }, + { + "epoch": 32.28, + "learning_rate": 5.864361702127659e-05, + "loss": 0.1558, + "step": 36900 + }, + { + "epoch": 32.29, + "learning_rate": 5.8577127659574465e-05, + "loss": 0.2099, + "step": 36910 + }, + { + "epoch": 32.3, + "learning_rate": 5.8510638297872335e-05, + "loss": 0.162, + "step": 36920 + }, + { + "epoch": 32.31, + "learning_rate": 5.844414893617021e-05, + "loss": 0.1373, + "step": 36930 + }, + { + "epoch": 32.32, + "learning_rate": 5.837765957446808e-05, + "loss": 0.1741, + "step": 36940 + }, + { + "epoch": 32.33, + "learning_rate": 5.831117021276596e-05, + "loss": 0.1995, + "step": 36950 + }, + { + "epoch": 32.34, + "learning_rate": 5.824468085106382e-05, + "loss": 0.1911, + "step": 36960 + }, + { + "epoch": 32.34, + "learning_rate": 5.817819148936169e-05, + "loss": 0.1841, + "step": 36970 + }, + { + "epoch": 32.35, + "learning_rate": 5.811170212765957e-05, + "loss": 0.1959, + "step": 36980 + }, + { + "epoch": 32.36, + "learning_rate": 5.8045212765957444e-05, + "loss": 0.1653, + "step": 36990 + }, + { + "epoch": 32.37, + "learning_rate": 5.7978723404255314e-05, + "loss": 0.1341, + "step": 37000 + }, + { + "epoch": 32.38, + "learning_rate": 5.791223404255319e-05, + "loss": 0.2119, + "step": 37010 + }, + { + "epoch": 32.39, + "learning_rate": 5.784574468085106e-05, + "loss": 0.1678, + "step": 37020 + }, + { + "epoch": 32.4, + "learning_rate": 5.777925531914894e-05, + "loss": 0.202, + "step": 37030 + }, + { + "epoch": 32.41, + "learning_rate": 5.77127659574468e-05, + "loss": 0.1929, + "step": 37040 + }, + { + "epoch": 32.41, + "learning_rate": 5.764627659574467e-05, + "loss": 0.1508, + "step": 37050 + }, + { + "epoch": 32.42, + "learning_rate": 5.757978723404255e-05, + "loss": 0.2019, + "step": 37060 + }, + { + "epoch": 32.43, + "learning_rate": 5.751329787234042e-05, + "loss": 0.1133, + "step": 37070 + }, + { + "epoch": 32.44, + "learning_rate": 5.7446808510638294e-05, + "loss": 0.1782, + "step": 37080 + }, + { + "epoch": 32.45, + "learning_rate": 5.7380319148936163e-05, + "loss": 0.202, + "step": 37090 + }, + { + "epoch": 32.46, + "learning_rate": 5.731382978723404e-05, + "loss": 0.0962, + "step": 37100 + }, + { + "epoch": 32.47, + "learning_rate": 5.724734042553191e-05, + "loss": 0.2356, + "step": 37110 + }, + { + "epoch": 32.48, + "learning_rate": 5.7180851063829787e-05, + "loss": 0.1182, + "step": 37120 + }, + { + "epoch": 32.48, + "learning_rate": 5.711436170212765e-05, + "loss": 0.2245, + "step": 37130 + }, + { + "epoch": 32.49, + "learning_rate": 5.7047872340425526e-05, + "loss": 0.1999, + "step": 37140 + }, + { + "epoch": 32.5, + "learning_rate": 5.6981382978723396e-05, + "loss": 0.1021, + "step": 37150 + }, + { + "epoch": 32.51, + "learning_rate": 5.691489361702127e-05, + "loss": 0.2284, + "step": 37160 + }, + { + "epoch": 32.52, + "learning_rate": 5.684840425531914e-05, + "loss": 0.1485, + "step": 37170 + }, + { + "epoch": 32.53, + "learning_rate": 5.678191489361702e-05, + "loss": 0.1537, + "step": 37180 + }, + { + "epoch": 32.54, + "learning_rate": 5.671542553191489e-05, + "loss": 0.174, + "step": 37190 + }, + { + "epoch": 32.55, + "learning_rate": 5.6648936170212766e-05, + "loss": 0.1158, + "step": 37200 + }, + { + "epoch": 32.55, + "eval_cer1": 0.24465750649876777, + "eval_cer2": 0.22441345365053322, + "eval_cer3": 0.20300555374060764, + "eval_cer4": 0.20329051160694162, + "eval_cer5": 0.2278556263269639, + "eval_loss": 1.0190215110778809, + "eval_runtime": 1505.7593, + "eval_samples_per_second": 5.818, + "step": 37200 + }, + { + "epoch": 32.55, + "learning_rate": 5.6582446808510636e-05, + "loss": 0.2011, + "step": 37210 + }, + { + "epoch": 32.56, + "learning_rate": 5.65159574468085e-05, + "loss": 0.1392, + "step": 37220 + }, + { + "epoch": 32.57, + "learning_rate": 5.6449468085106375e-05, + "loss": 0.197, + "step": 37230 + }, + { + "epoch": 32.58, + "learning_rate": 5.6382978723404245e-05, + "loss": 0.2074, + "step": 37240 + }, + { + "epoch": 32.59, + "learning_rate": 5.631648936170212e-05, + "loss": 0.1356, + "step": 37250 + }, + { + "epoch": 32.6, + "learning_rate": 5.625e-05, + "loss": 0.1915, + "step": 37260 + }, + { + "epoch": 32.61, + "learning_rate": 5.618351063829787e-05, + "loss": 0.1244, + "step": 37270 + }, + { + "epoch": 32.62, + "learning_rate": 5.6117021276595745e-05, + "loss": 0.198, + "step": 37280 + }, + { + "epoch": 32.62, + "learning_rate": 5.6050531914893615e-05, + "loss": 0.1867, + "step": 37290 + }, + { + "epoch": 32.63, + "learning_rate": 5.598404255319149e-05, + "loss": 0.1066, + "step": 37300 + }, + { + "epoch": 32.64, + "learning_rate": 5.5917553191489355e-05, + "loss": 0.1939, + "step": 37310 + }, + { + "epoch": 32.65, + "learning_rate": 5.5851063829787224e-05, + "loss": 0.1501, + "step": 37320 + }, + { + "epoch": 32.66, + "learning_rate": 5.57845744680851e-05, + "loss": 0.1927, + "step": 37330 + }, + { + "epoch": 32.67, + "learning_rate": 5.571808510638297e-05, + "loss": 0.1846, + "step": 37340 + }, + { + "epoch": 32.68, + "learning_rate": 5.565159574468085e-05, + "loss": 0.1265, + "step": 37350 + }, + { + "epoch": 32.69, + "learning_rate": 5.558510638297872e-05, + "loss": 0.1908, + "step": 37360 + }, + { + "epoch": 32.69, + "learning_rate": 5.5518617021276594e-05, + "loss": 0.1317, + "step": 37370 + }, + { + "epoch": 32.7, + "learning_rate": 5.5452127659574464e-05, + "loss": 0.205, + "step": 37380 + }, + { + "epoch": 32.71, + "learning_rate": 5.538563829787234e-05, + "loss": 0.126, + "step": 37390 + }, + { + "epoch": 32.72, + "learning_rate": 5.5319148936170204e-05, + "loss": 0.1129, + "step": 37400 + }, + { + "epoch": 32.73, + "learning_rate": 5.525265957446808e-05, + "loss": 0.228, + "step": 37410 + }, + { + "epoch": 32.74, + "learning_rate": 5.518617021276595e-05, + "loss": 0.1297, + "step": 37420 + }, + { + "epoch": 32.75, + "learning_rate": 5.511968085106383e-05, + "loss": 0.1907, + "step": 37430 + }, + { + "epoch": 32.76, + "learning_rate": 5.5053191489361697e-05, + "loss": 0.1786, + "step": 37440 + }, + { + "epoch": 32.76, + "learning_rate": 5.498670212765957e-05, + "loss": 0.1634, + "step": 37450 + }, + { + "epoch": 32.77, + "learning_rate": 5.492021276595744e-05, + "loss": 0.203, + "step": 37460 + }, + { + "epoch": 32.78, + "learning_rate": 5.485372340425532e-05, + "loss": 0.1627, + "step": 37470 + }, + { + "epoch": 32.79, + "learning_rate": 5.478723404255319e-05, + "loss": 0.1987, + "step": 37480 + }, + { + "epoch": 32.8, + "learning_rate": 5.472074468085105e-05, + "loss": 0.1761, + "step": 37490 + }, + { + "epoch": 32.81, + "learning_rate": 5.465425531914893e-05, + "loss": 0.152, + "step": 37500 + }, + { + "epoch": 32.82, + "learning_rate": 5.45877659574468e-05, + "loss": 0.2135, + "step": 37510 + }, + { + "epoch": 32.83, + "learning_rate": 5.4521276595744676e-05, + "loss": 0.125, + "step": 37520 + }, + { + "epoch": 32.83, + "learning_rate": 5.4454787234042546e-05, + "loss": 0.1603, + "step": 37530 + }, + { + "epoch": 32.84, + "learning_rate": 5.438829787234042e-05, + "loss": 0.1708, + "step": 37540 + }, + { + "epoch": 32.85, + "learning_rate": 5.43218085106383e-05, + "loss": 0.1065, + "step": 37550 + }, + { + "epoch": 32.86, + "learning_rate": 5.425531914893617e-05, + "loss": 0.196, + "step": 37560 + }, + { + "epoch": 32.87, + "learning_rate": 5.418882978723403e-05, + "loss": 0.1723, + "step": 37570 + }, + { + "epoch": 32.88, + "learning_rate": 5.412234042553191e-05, + "loss": 0.1971, + "step": 37580 + }, + { + "epoch": 32.89, + "learning_rate": 5.405585106382978e-05, + "loss": 0.1574, + "step": 37590 + }, + { + "epoch": 32.9, + "learning_rate": 5.3989361702127655e-05, + "loss": 0.1162, + "step": 37600 + }, + { + "epoch": 32.9, + "learning_rate": 5.3922872340425525e-05, + "loss": 0.2412, + "step": 37610 + }, + { + "epoch": 32.91, + "learning_rate": 5.38563829787234e-05, + "loss": 0.1141, + "step": 37620 + }, + { + "epoch": 32.92, + "learning_rate": 5.378989361702127e-05, + "loss": 0.1784, + "step": 37630 + }, + { + "epoch": 32.93, + "learning_rate": 5.372340425531915e-05, + "loss": 0.1347, + "step": 37640 + }, + { + "epoch": 32.94, + "learning_rate": 5.365691489361702e-05, + "loss": 0.1282, + "step": 37650 + }, + { + "epoch": 32.95, + "learning_rate": 5.359042553191489e-05, + "loss": 0.2386, + "step": 37660 + }, + { + "epoch": 32.96, + "learning_rate": 5.352393617021276e-05, + "loss": 0.1963, + "step": 37670 + }, + { + "epoch": 32.97, + "learning_rate": 5.3457446808510634e-05, + "loss": 0.1499, + "step": 37680 + }, + { + "epoch": 32.97, + "learning_rate": 5.3390957446808504e-05, + "loss": 0.178, + "step": 37690 + }, + { + "epoch": 32.98, + "learning_rate": 5.332446808510638e-05, + "loss": 0.1355, + "step": 37700 + }, + { + "epoch": 32.99, + "learning_rate": 5.325797872340425e-05, + "loss": 0.1921, + "step": 37710 + }, + { + "epoch": 33.0, + "learning_rate": 5.319148936170213e-05, + "loss": 0.1459, + "step": 37720 + }, + { + "epoch": 33.01, + "learning_rate": 5.3125e-05, + "loss": 0.1774, + "step": 37730 + }, + { + "epoch": 33.02, + "learning_rate": 5.3058510638297874e-05, + "loss": 0.1191, + "step": 37740 + }, + { + "epoch": 33.03, + "learning_rate": 5.299202127659574e-05, + "loss": 0.1651, + "step": 37750 + }, + { + "epoch": 33.04, + "learning_rate": 5.292553191489361e-05, + "loss": 0.1144, + "step": 37760 + }, + { + "epoch": 33.04, + "learning_rate": 5.285904255319148e-05, + "loss": 0.1244, + "step": 37770 + }, + { + "epoch": 33.05, + "learning_rate": 5.279255319148935e-05, + "loss": 0.1956, + "step": 37780 + }, + { + "epoch": 33.06, + "learning_rate": 5.272606382978723e-05, + "loss": 0.1146, + "step": 37790 + }, + { + "epoch": 33.07, + "learning_rate": 5.26595744680851e-05, + "loss": 0.1643, + "step": 37800 + }, + { + "epoch": 33.07, + "eval_cer1": 0.24553526214509977, + "eval_cer2": 0.2257588187038556, + "eval_cer3": 0.20202548186867036, + "eval_cer4": 0.20480376058469366, + "eval_cer5": 0.22955414012738853, + "eval_loss": 1.013848066329956, + "eval_runtime": 1534.8488, + "eval_samples_per_second": 5.707, + "step": 37800 + }, + { + "epoch": 33.08, + "learning_rate": 5.2593085106382976e-05, + "loss": 0.1803, + "step": 37810 + }, + { + "epoch": 33.09, + "learning_rate": 5.2526595744680846e-05, + "loss": 0.0995, + "step": 37820 + }, + { + "epoch": 33.1, + "learning_rate": 5.246010638297872e-05, + "loss": 0.1841, + "step": 37830 + }, + { + "epoch": 33.11, + "learning_rate": 5.2393617021276586e-05, + "loss": 0.1286, + "step": 37840 + }, + { + "epoch": 33.11, + "learning_rate": 5.232712765957446e-05, + "loss": 0.1858, + "step": 37850 + }, + { + "epoch": 33.12, + "learning_rate": 5.226063829787233e-05, + "loss": 0.168, + "step": 37860 + }, + { + "epoch": 33.13, + "learning_rate": 5.219414893617021e-05, + "loss": 0.1406, + "step": 37870 + }, + { + "epoch": 33.14, + "learning_rate": 5.212765957446808e-05, + "loss": 0.1917, + "step": 37880 + }, + { + "epoch": 33.15, + "learning_rate": 5.2061170212765955e-05, + "loss": 0.1073, + "step": 37890 + }, + { + "epoch": 33.16, + "learning_rate": 5.1994680851063825e-05, + "loss": 0.1916, + "step": 37900 + }, + { + "epoch": 33.17, + "learning_rate": 5.19281914893617e-05, + "loss": 0.1185, + "step": 37910 + }, + { + "epoch": 33.18, + "learning_rate": 5.186170212765957e-05, + "loss": 0.139, + "step": 37920 + }, + { + "epoch": 33.18, + "learning_rate": 5.179521276595744e-05, + "loss": 0.1536, + "step": 37930 + }, + { + "epoch": 33.19, + "learning_rate": 5.172872340425531e-05, + "loss": 0.1349, + "step": 37940 + }, + { + "epoch": 33.2, + "learning_rate": 5.166223404255319e-05, + "loss": 0.2043, + "step": 37950 + }, + { + "epoch": 33.21, + "learning_rate": 5.159574468085106e-05, + "loss": 0.1508, + "step": 37960 + }, + { + "epoch": 33.22, + "learning_rate": 5.1529255319148935e-05, + "loss": 0.1349, + "step": 37970 + }, + { + "epoch": 33.23, + "learning_rate": 5.1462765957446805e-05, + "loss": 0.1913, + "step": 37980 + }, + { + "epoch": 33.24, + "learning_rate": 5.139627659574468e-05, + "loss": 0.097, + "step": 37990 + }, + { + "epoch": 33.25, + "learning_rate": 5.132978723404255e-05, + "loss": 0.1919, + "step": 38000 + }, + { + "epoch": 33.25, + "learning_rate": 5.1263297872340414e-05, + "loss": 0.1261, + "step": 38010 + }, + { + "epoch": 33.26, + "learning_rate": 5.119680851063829e-05, + "loss": 0.1161, + "step": 38020 + }, + { + "epoch": 33.27, + "learning_rate": 5.113031914893616e-05, + "loss": 0.1809, + "step": 38030 + }, + { + "epoch": 33.28, + "learning_rate": 5.106382978723404e-05, + "loss": 0.1301, + "step": 38040 + }, + { + "epoch": 33.29, + "learning_rate": 5.099734042553191e-05, + "loss": 0.1622, + "step": 38050 + }, + { + "epoch": 33.3, + "learning_rate": 5.0930851063829784e-05, + "loss": 0.1297, + "step": 38060 + }, + { + "epoch": 33.31, + "learning_rate": 5.0864361702127654e-05, + "loss": 0.1397, + "step": 38070 + }, + { + "epoch": 33.32, + "learning_rate": 5.079787234042553e-05, + "loss": 0.21, + "step": 38080 + }, + { + "epoch": 33.32, + "learning_rate": 5.07313829787234e-05, + "loss": 0.1254, + "step": 38090 + }, + { + "epoch": 33.33, + "learning_rate": 5.066489361702127e-05, + "loss": 0.1988, + "step": 38100 + }, + { + "epoch": 33.34, + "learning_rate": 5.059840425531914e-05, + "loss": 0.202, + "step": 38110 + }, + { + "epoch": 33.35, + "learning_rate": 5.0531914893617016e-05, + "loss": 0.1527, + "step": 38120 + }, + { + "epoch": 33.36, + "learning_rate": 5.0465425531914886e-05, + "loss": 0.1954, + "step": 38130 + }, + { + "epoch": 33.37, + "learning_rate": 5.039893617021276e-05, + "loss": 0.1477, + "step": 38140 + }, + { + "epoch": 33.38, + "learning_rate": 5.033244680851063e-05, + "loss": 0.1884, + "step": 38150 + }, + { + "epoch": 33.39, + "learning_rate": 5.026595744680851e-05, + "loss": 0.1478, + "step": 38160 + }, + { + "epoch": 33.39, + "learning_rate": 5.019946808510638e-05, + "loss": 0.0989, + "step": 38170 + }, + { + "epoch": 33.4, + "learning_rate": 5.0132978723404256e-05, + "loss": 0.1832, + "step": 38180 + }, + { + "epoch": 33.41, + "learning_rate": 5.006648936170212e-05, + "loss": 0.155, + "step": 38190 + }, + { + "epoch": 33.42, + "learning_rate": 4.9999999999999996e-05, + "loss": 0.182, + "step": 38200 + }, + { + "epoch": 33.43, + "learning_rate": 4.9933510638297865e-05, + "loss": 0.1499, + "step": 38210 + }, + { + "epoch": 33.44, + "learning_rate": 4.986702127659574e-05, + "loss": 0.1328, + "step": 38220 + }, + { + "epoch": 33.45, + "learning_rate": 4.980053191489361e-05, + "loss": 0.1683, + "step": 38230 + }, + { + "epoch": 33.46, + "learning_rate": 4.973404255319149e-05, + "loss": 0.1151, + "step": 38240 + }, + { + "epoch": 33.46, + "learning_rate": 4.966755319148936e-05, + "loss": 0.2923, + "step": 38250 + }, + { + "epoch": 33.47, + "learning_rate": 4.9601063829787235e-05, + "loss": 0.1262, + "step": 38260 + }, + { + "epoch": 33.48, + "learning_rate": 4.9534574468085105e-05, + "loss": 0.1139, + "step": 38270 + }, + { + "epoch": 33.49, + "learning_rate": 4.946808510638297e-05, + "loss": 0.159, + "step": 38280 + }, + { + "epoch": 33.5, + "learning_rate": 4.9401595744680845e-05, + "loss": 0.1168, + "step": 38290 + }, + { + "epoch": 33.51, + "learning_rate": 4.9335106382978715e-05, + "loss": 0.1923, + "step": 38300 + }, + { + "epoch": 33.52, + "learning_rate": 4.926861702127659e-05, + "loss": 0.1457, + "step": 38310 + }, + { + "epoch": 33.53, + "learning_rate": 4.920212765957446e-05, + "loss": 0.1432, + "step": 38320 + }, + { + "epoch": 33.53, + "learning_rate": 4.913563829787234e-05, + "loss": 0.2057, + "step": 38330 + }, + { + "epoch": 33.54, + "learning_rate": 4.906914893617021e-05, + "loss": 0.147, + "step": 38340 + }, + { + "epoch": 33.55, + "learning_rate": 4.9002659574468084e-05, + "loss": 0.1572, + "step": 38350 + }, + { + "epoch": 33.56, + "learning_rate": 4.8936170212765954e-05, + "loss": 0.1367, + "step": 38360 + }, + { + "epoch": 33.57, + "learning_rate": 4.8869680851063824e-05, + "loss": 0.1115, + "step": 38370 + }, + { + "epoch": 33.58, + "learning_rate": 4.8803191489361694e-05, + "loss": 0.1833, + "step": 38380 + }, + { + "epoch": 33.59, + "learning_rate": 4.873670212765957e-05, + "loss": 0.1337, + "step": 38390 + }, + { + "epoch": 33.6, + "learning_rate": 4.867021276595744e-05, + "loss": 0.1492, + "step": 38400 + }, + { + "epoch": 33.6, + "eval_cer1": 0.24195671989466933, + "eval_cer2": 0.2238884331419196, + "eval_cer3": 0.20062071218556027, + "eval_cer4": 0.20222801764383916, + "eval_cer5": 0.22777070063694269, + "eval_loss": 1.0146465301513672, + "eval_runtime": 1542.8524, + "eval_samples_per_second": 5.678, + "step": 38400 + }, + { + "epoch": 33.6, + "learning_rate": 4.860372340425532e-05, + "loss": 0.1482, + "step": 38410 + }, + { + "epoch": 33.61, + "learning_rate": 4.853723404255319e-05, + "loss": 0.1122, + "step": 38420 + }, + { + "epoch": 33.62, + "learning_rate": 4.847074468085106e-05, + "loss": 0.1743, + "step": 38430 + }, + { + "epoch": 33.63, + "learning_rate": 4.840425531914893e-05, + "loss": 0.1067, + "step": 38440 + }, + { + "epoch": 33.64, + "learning_rate": 4.83377659574468e-05, + "loss": 0.1802, + "step": 38450 + }, + { + "epoch": 33.65, + "learning_rate": 4.827127659574467e-05, + "loss": 0.1531, + "step": 38460 + }, + { + "epoch": 33.66, + "learning_rate": 4.820478723404255e-05, + "loss": 0.1004, + "step": 38470 + }, + { + "epoch": 33.67, + "learning_rate": 4.813829787234042e-05, + "loss": 0.1698, + "step": 38480 + }, + { + "epoch": 33.67, + "learning_rate": 4.8071808510638296e-05, + "loss": 0.1322, + "step": 38490 + }, + { + "epoch": 33.68, + "learning_rate": 4.8005319148936166e-05, + "loss": 0.1583, + "step": 38500 + }, + { + "epoch": 33.69, + "learning_rate": 4.793882978723404e-05, + "loss": 0.1441, + "step": 38510 + }, + { + "epoch": 33.7, + "learning_rate": 4.787234042553191e-05, + "loss": 0.1072, + "step": 38520 + }, + { + "epoch": 33.71, + "learning_rate": 4.780585106382979e-05, + "loss": 0.2303, + "step": 38530 + }, + { + "epoch": 33.72, + "learning_rate": 4.773936170212765e-05, + "loss": 0.1098, + "step": 38540 + }, + { + "epoch": 33.73, + "learning_rate": 4.767287234042552e-05, + "loss": 0.2012, + "step": 38550 + }, + { + "epoch": 33.74, + "learning_rate": 4.76063829787234e-05, + "loss": 0.1565, + "step": 38560 + }, + { + "epoch": 33.74, + "learning_rate": 4.753989361702127e-05, + "loss": 0.1514, + "step": 38570 + }, + { + "epoch": 33.75, + "learning_rate": 4.7473404255319145e-05, + "loss": 0.1792, + "step": 38580 + }, + { + "epoch": 33.76, + "learning_rate": 4.7406914893617015e-05, + "loss": 0.1243, + "step": 38590 + }, + { + "epoch": 33.77, + "learning_rate": 4.734042553191489e-05, + "loss": 0.1715, + "step": 38600 + }, + { + "epoch": 33.78, + "learning_rate": 4.727393617021276e-05, + "loss": 0.1655, + "step": 38610 + }, + { + "epoch": 33.79, + "learning_rate": 4.720744680851064e-05, + "loss": 0.1232, + "step": 38620 + }, + { + "epoch": 33.8, + "learning_rate": 4.71409574468085e-05, + "loss": 0.2047, + "step": 38630 + }, + { + "epoch": 33.81, + "learning_rate": 4.707446808510638e-05, + "loss": 0.1213, + "step": 38640 + }, + { + "epoch": 33.81, + "learning_rate": 4.700797872340425e-05, + "loss": 0.208, + "step": 38650 + }, + { + "epoch": 33.82, + "learning_rate": 4.6941489361702124e-05, + "loss": 0.1373, + "step": 38660 + }, + { + "epoch": 33.83, + "learning_rate": 4.6874999999999994e-05, + "loss": 0.1257, + "step": 38670 + }, + { + "epoch": 33.84, + "learning_rate": 4.680851063829787e-05, + "loss": 0.1834, + "step": 38680 + }, + { + "epoch": 33.85, + "learning_rate": 4.674202127659574e-05, + "loss": 0.1421, + "step": 38690 + }, + { + "epoch": 33.86, + "learning_rate": 4.667553191489362e-05, + "loss": 0.2001, + "step": 38700 + }, + { + "epoch": 33.87, + "learning_rate": 4.660904255319149e-05, + "loss": 0.1378, + "step": 38710 + }, + { + "epoch": 33.88, + "learning_rate": 4.654255319148936e-05, + "loss": 0.1213, + "step": 38720 + }, + { + "epoch": 33.88, + "learning_rate": 4.647606382978723e-05, + "loss": 0.1821, + "step": 38730 + }, + { + "epoch": 33.89, + "learning_rate": 4.6409574468085104e-05, + "loss": 0.1131, + "step": 38740 + }, + { + "epoch": 33.9, + "learning_rate": 4.6343085106382973e-05, + "loss": 0.1603, + "step": 38750 + }, + { + "epoch": 33.91, + "learning_rate": 4.627659574468085e-05, + "loss": 0.113, + "step": 38760 + }, + { + "epoch": 33.92, + "learning_rate": 4.621010638297872e-05, + "loss": 0.1129, + "step": 38770 + }, + { + "epoch": 33.93, + "learning_rate": 4.6143617021276597e-05, + "loss": 0.2015, + "step": 38780 + }, + { + "epoch": 33.94, + "learning_rate": 4.6077127659574466e-05, + "loss": 0.1222, + "step": 38790 + }, + { + "epoch": 33.95, + "learning_rate": 4.601063829787234e-05, + "loss": 0.1914, + "step": 38800 + }, + { + "epoch": 33.95, + "learning_rate": 4.5944148936170206e-05, + "loss": 0.126, + "step": 38810 + }, + { + "epoch": 33.96, + "learning_rate": 4.5877659574468076e-05, + "loss": 0.1028, + "step": 38820 + }, + { + "epoch": 33.97, + "learning_rate": 4.581117021276595e-05, + "loss": 0.2172, + "step": 38830 + }, + { + "epoch": 33.98, + "learning_rate": 4.574468085106382e-05, + "loss": 0.1199, + "step": 38840 + }, + { + "epoch": 33.99, + "learning_rate": 4.56781914893617e-05, + "loss": 0.1487, + "step": 38850 + }, + { + "epoch": 34.0, + "learning_rate": 4.561170212765957e-05, + "loss": 0.1043, + "step": 38860 + }, + { + "epoch": 34.01, + "learning_rate": 4.5545212765957446e-05, + "loss": 0.2112, + "step": 38870 + }, + { + "epoch": 34.02, + "learning_rate": 4.5478723404255315e-05, + "loss": 0.0949, + "step": 38880 + }, + { + "epoch": 34.02, + "learning_rate": 4.541223404255319e-05, + "loss": 0.1886, + "step": 38890 + }, + { + "epoch": 34.03, + "learning_rate": 4.5345744680851055e-05, + "loss": 0.1672, + "step": 38900 + }, + { + "epoch": 34.04, + "learning_rate": 4.527925531914893e-05, + "loss": 0.1078, + "step": 38910 + }, + { + "epoch": 34.05, + "learning_rate": 4.52127659574468e-05, + "loss": 0.1895, + "step": 38920 + }, + { + "epoch": 34.06, + "learning_rate": 4.514627659574468e-05, + "loss": 0.1226, + "step": 38930 + }, + { + "epoch": 34.07, + "learning_rate": 4.507978723404255e-05, + "loss": 0.1443, + "step": 38940 + }, + { + "epoch": 34.08, + "learning_rate": 4.5013297872340425e-05, + "loss": 0.1473, + "step": 38950 + }, + { + "epoch": 34.09, + "learning_rate": 4.4946808510638295e-05, + "loss": 0.1227, + "step": 38960 + }, + { + "epoch": 34.09, + "learning_rate": 4.488031914893617e-05, + "loss": 0.2005, + "step": 38970 + }, + { + "epoch": 34.1, + "learning_rate": 4.4813829787234034e-05, + "loss": 0.1079, + "step": 38980 + }, + { + "epoch": 34.11, + "learning_rate": 4.474734042553191e-05, + "loss": 0.1211, + "step": 38990 + }, + { + "epoch": 34.12, + "learning_rate": 4.468085106382978e-05, + "loss": 0.1407, + "step": 39000 + }, + { + "epoch": 34.12, + "eval_cer1": 0.24107896424833733, + "eval_cer2": 0.22041017227235438, + "eval_cer3": 0.19983665468801046, + "eval_cer4": 0.20065037509256575, + "eval_cer5": 0.22496815286624203, + "eval_loss": 1.0069777965545654, + "eval_runtime": 1496.6002, + "eval_samples_per_second": 5.853, + "step": 39000 + }, + { + "epoch": 34.13, + "learning_rate": 4.461436170212766e-05, + "loss": 0.1235, + "step": 39010 + }, + { + "epoch": 34.14, + "learning_rate": 4.454787234042553e-05, + "loss": 0.1617, + "step": 39020 + }, + { + "epoch": 34.15, + "learning_rate": 4.4481382978723404e-05, + "loss": 0.1348, + "step": 39030 + }, + { + "epoch": 34.16, + "learning_rate": 4.4414893617021274e-05, + "loss": 0.1295, + "step": 39040 + }, + { + "epoch": 34.16, + "learning_rate": 4.434840425531915e-05, + "loss": 0.1374, + "step": 39050 + }, + { + "epoch": 34.17, + "learning_rate": 4.428191489361702e-05, + "loss": 0.0941, + "step": 39060 + }, + { + "epoch": 34.18, + "learning_rate": 4.4215425531914883e-05, + "loss": 0.1427, + "step": 39070 + }, + { + "epoch": 34.19, + "learning_rate": 4.414893617021276e-05, + "loss": 0.1523, + "step": 39080 + }, + { + "epoch": 34.2, + "learning_rate": 4.408244680851063e-05, + "loss": 0.1509, + "step": 39090 + }, + { + "epoch": 34.21, + "learning_rate": 4.4015957446808507e-05, + "loss": 0.145, + "step": 39100 + }, + { + "epoch": 34.22, + "learning_rate": 4.3949468085106376e-05, + "loss": 0.082, + "step": 39110 + }, + { + "epoch": 34.23, + "learning_rate": 4.388297872340425e-05, + "loss": 0.1904, + "step": 39120 + }, + { + "epoch": 34.23, + "learning_rate": 4.381648936170212e-05, + "loss": 0.1774, + "step": 39130 + }, + { + "epoch": 34.24, + "learning_rate": 4.375e-05, + "loss": 0.1419, + "step": 39140 + }, + { + "epoch": 34.25, + "learning_rate": 4.368351063829787e-05, + "loss": 0.1391, + "step": 39150 + }, + { + "epoch": 34.26, + "learning_rate": 4.361702127659574e-05, + "loss": 0.1066, + "step": 39160 + }, + { + "epoch": 34.27, + "learning_rate": 4.355053191489361e-05, + "loss": 0.18, + "step": 39170 + }, + { + "epoch": 34.28, + "learning_rate": 4.3484042553191486e-05, + "loss": 0.1135, + "step": 39180 + }, + { + "epoch": 34.29, + "learning_rate": 4.3417553191489356e-05, + "loss": 0.1729, + "step": 39190 + }, + { + "epoch": 34.3, + "learning_rate": 4.335106382978723e-05, + "loss": 0.1651, + "step": 39200 + }, + { + "epoch": 34.3, + "learning_rate": 4.32845744680851e-05, + "loss": 0.0939, + "step": 39210 + }, + { + "epoch": 34.31, + "learning_rate": 4.321808510638298e-05, + "loss": 0.1724, + "step": 39220 + }, + { + "epoch": 34.32, + "learning_rate": 4.315159574468085e-05, + "loss": 0.112, + "step": 39230 + }, + { + "epoch": 34.33, + "learning_rate": 4.3085106382978725e-05, + "loss": 0.1376, + "step": 39240 + }, + { + "epoch": 34.34, + "learning_rate": 4.301861702127659e-05, + "loss": 0.1764, + "step": 39250 + }, + { + "epoch": 34.35, + "learning_rate": 4.2952127659574465e-05, + "loss": 0.109, + "step": 39260 + }, + { + "epoch": 34.36, + "learning_rate": 4.2885638297872335e-05, + "loss": 0.1782, + "step": 39270 + }, + { + "epoch": 34.37, + "learning_rate": 4.281914893617021e-05, + "loss": 0.1304, + "step": 39280 + }, + { + "epoch": 34.37, + "learning_rate": 4.275265957446808e-05, + "loss": 0.1185, + "step": 39290 + }, + { + "epoch": 34.38, + "learning_rate": 4.268617021276596e-05, + "loss": 0.1418, + "step": 39300 + }, + { + "epoch": 34.39, + "learning_rate": 4.261968085106383e-05, + "loss": 0.1296, + "step": 39310 + }, + { + "epoch": 34.4, + "learning_rate": 4.2553191489361704e-05, + "loss": 0.1881, + "step": 39320 + }, + { + "epoch": 34.41, + "learning_rate": 4.2486702127659574e-05, + "loss": 0.1016, + "step": 39330 + }, + { + "epoch": 34.42, + "learning_rate": 4.242021276595744e-05, + "loss": 0.1431, + "step": 39340 + }, + { + "epoch": 34.43, + "learning_rate": 4.2353723404255314e-05, + "loss": 0.1839, + "step": 39350 + }, + { + "epoch": 34.44, + "learning_rate": 4.2287234042553184e-05, + "loss": 0.0789, + "step": 39360 + }, + { + "epoch": 34.44, + "learning_rate": 4.222074468085106e-05, + "loss": 0.188, + "step": 39370 + }, + { + "epoch": 34.45, + "learning_rate": 4.215425531914893e-05, + "loss": 0.1161, + "step": 39380 + }, + { + "epoch": 34.46, + "learning_rate": 4.208776595744681e-05, + "loss": 0.1397, + "step": 39390 + }, + { + "epoch": 34.47, + "learning_rate": 4.202127659574468e-05, + "loss": 0.1422, + "step": 39400 + }, + { + "epoch": 34.48, + "learning_rate": 4.1954787234042554e-05, + "loss": 0.1735, + "step": 39410 + }, + { + "epoch": 34.49, + "learning_rate": 4.1888297872340417e-05, + "loss": 0.1609, + "step": 39420 + }, + { + "epoch": 34.5, + "learning_rate": 4.182180851063829e-05, + "loss": 0.1292, + "step": 39430 + }, + { + "epoch": 34.51, + "learning_rate": 4.175531914893616e-05, + "loss": 0.1211, + "step": 39440 + }, + { + "epoch": 34.51, + "learning_rate": 4.168882978723404e-05, + "loss": 0.167, + "step": 39450 + }, + { + "epoch": 34.52, + "learning_rate": 4.162234042553191e-05, + "loss": 0.0972, + "step": 39460 + }, + { + "epoch": 34.53, + "learning_rate": 4.1555851063829786e-05, + "loss": 0.2312, + "step": 39470 + }, + { + "epoch": 34.54, + "learning_rate": 4.1489361702127656e-05, + "loss": 0.1365, + "step": 39480 + }, + { + "epoch": 34.55, + "learning_rate": 4.142287234042553e-05, + "loss": 0.1377, + "step": 39490 + }, + { + "epoch": 34.56, + "learning_rate": 4.13563829787234e-05, + "loss": 0.1526, + "step": 39500 + }, + { + "epoch": 34.57, + "learning_rate": 4.128989361702127e-05, + "loss": 0.0841, + "step": 39510 + }, + { + "epoch": 34.58, + "learning_rate": 4.122340425531914e-05, + "loss": 0.1784, + "step": 39520 + }, + { + "epoch": 34.58, + "learning_rate": 4.115691489361702e-05, + "loss": 0.124, + "step": 39530 + }, + { + "epoch": 34.59, + "learning_rate": 4.109042553191489e-05, + "loss": 0.1534, + "step": 39540 + }, + { + "epoch": 34.6, + "learning_rate": 4.1023936170212765e-05, + "loss": 0.1613, + "step": 39550 + }, + { + "epoch": 34.61, + "learning_rate": 4.0957446808510635e-05, + "loss": 0.0884, + "step": 39560 + }, + { + "epoch": 34.62, + "learning_rate": 4.089095744680851e-05, + "loss": 0.1884, + "step": 39570 + }, + { + "epoch": 34.63, + "learning_rate": 4.082446808510638e-05, + "loss": 0.1183, + "step": 39580 + }, + { + "epoch": 34.64, + "learning_rate": 4.075797872340426e-05, + "loss": 0.1589, + "step": 39590 + }, + { + "epoch": 34.65, + "learning_rate": 4.069148936170212e-05, + "loss": 0.1278, + "step": 39600 + }, + { + "epoch": 34.65, + "eval_cer1": 0.23999864960669795, + "eval_cer2": 0.2200820344544709, + "eval_cer3": 0.19836654688010455, + "eval_cer4": 0.20019962007791622, + "eval_cer5": 0.22352441613588112, + "eval_loss": 1.0083574056625366, + "eval_runtime": 1486.0879, + "eval_samples_per_second": 5.895, + "step": 39600 + }, + { + "epoch": 34.65, + "learning_rate": 4.062499999999999e-05, + "loss": 0.1222, + "step": 39610 + }, + { + "epoch": 34.66, + "learning_rate": 4.055851063829787e-05, + "loss": 0.1726, + "step": 39620 + }, + { + "epoch": 34.67, + "learning_rate": 4.049202127659574e-05, + "loss": 0.0871, + "step": 39630 + }, + { + "epoch": 34.68, + "learning_rate": 4.0425531914893614e-05, + "loss": 0.1714, + "step": 39640 + }, + { + "epoch": 34.69, + "learning_rate": 4.0359042553191484e-05, + "loss": 0.1602, + "step": 39650 + }, + { + "epoch": 34.7, + "learning_rate": 4.029255319148936e-05, + "loss": 0.11, + "step": 39660 + }, + { + "epoch": 34.71, + "learning_rate": 4.022606382978723e-05, + "loss": 0.1692, + "step": 39670 + }, + { + "epoch": 34.72, + "learning_rate": 4.015957446808511e-05, + "loss": 0.1655, + "step": 39680 + }, + { + "epoch": 34.72, + "learning_rate": 4.009308510638297e-05, + "loss": 0.1708, + "step": 39690 + }, + { + "epoch": 34.73, + "learning_rate": 4.002659574468085e-05, + "loss": 0.1571, + "step": 39700 + }, + { + "epoch": 34.74, + "learning_rate": 3.996010638297872e-05, + "loss": 0.1156, + "step": 39710 + }, + { + "epoch": 34.75, + "learning_rate": 3.9893617021276594e-05, + "loss": 0.1764, + "step": 39720 + }, + { + "epoch": 34.76, + "learning_rate": 3.9827127659574464e-05, + "loss": 0.1355, + "step": 39730 + }, + { + "epoch": 34.77, + "learning_rate": 3.976063829787234e-05, + "loss": 0.1719, + "step": 39740 + }, + { + "epoch": 34.78, + "learning_rate": 3.969414893617021e-05, + "loss": 0.1769, + "step": 39750 + }, + { + "epoch": 34.79, + "learning_rate": 3.962765957446809e-05, + "loss": 0.1249, + "step": 39760 + }, + { + "epoch": 34.79, + "learning_rate": 3.9561170212765957e-05, + "loss": 0.2027, + "step": 39770 + }, + { + "epoch": 34.8, + "learning_rate": 3.949468085106382e-05, + "loss": 0.1311, + "step": 39780 + }, + { + "epoch": 34.81, + "learning_rate": 3.9428191489361696e-05, + "loss": 0.1555, + "step": 39790 + }, + { + "epoch": 34.82, + "learning_rate": 3.936170212765957e-05, + "loss": 0.1708, + "step": 39800 + }, + { + "epoch": 34.83, + "learning_rate": 3.929521276595744e-05, + "loss": 0.0969, + "step": 39810 + }, + { + "epoch": 34.84, + "learning_rate": 3.922872340425532e-05, + "loss": 0.196, + "step": 39820 + }, + { + "epoch": 34.85, + "learning_rate": 3.916223404255319e-05, + "loss": 0.1006, + "step": 39830 + }, + { + "epoch": 34.86, + "learning_rate": 3.9095744680851066e-05, + "loss": 0.1224, + "step": 39840 + }, + { + "epoch": 34.86, + "learning_rate": 3.9029255319148936e-05, + "loss": 0.1495, + "step": 39850 + }, + { + "epoch": 34.87, + "learning_rate": 3.89627659574468e-05, + "loss": 0.1395, + "step": 39860 + }, + { + "epoch": 34.88, + "learning_rate": 3.8896276595744675e-05, + "loss": 0.1644, + "step": 39870 + }, + { + "epoch": 34.89, + "learning_rate": 3.8829787234042545e-05, + "loss": 0.1101, + "step": 39880 + }, + { + "epoch": 34.9, + "learning_rate": 3.876329787234042e-05, + "loss": 0.1537, + "step": 39890 + }, + { + "epoch": 34.91, + "learning_rate": 3.869680851063829e-05, + "loss": 0.1306, + "step": 39900 + }, + { + "epoch": 34.92, + "learning_rate": 3.863031914893617e-05, + "loss": 0.1225, + "step": 39910 + }, + { + "epoch": 34.93, + "learning_rate": 3.856382978723404e-05, + "loss": 0.159, + "step": 39920 + }, + { + "epoch": 34.93, + "learning_rate": 3.8497340425531915e-05, + "loss": 0.1534, + "step": 39930 + }, + { + "epoch": 34.94, + "learning_rate": 3.8430851063829785e-05, + "loss": 0.156, + "step": 39940 + }, + { + "epoch": 34.95, + "learning_rate": 3.8364361702127655e-05, + "loss": 0.159, + "step": 39950 + }, + { + "epoch": 34.96, + "learning_rate": 3.8297872340425525e-05, + "loss": 0.0931, + "step": 39960 + }, + { + "epoch": 34.97, + "learning_rate": 3.82313829787234e-05, + "loss": 0.1429, + "step": 39970 + }, + { + "epoch": 34.98, + "learning_rate": 3.816489361702127e-05, + "loss": 0.09, + "step": 39980 + }, + { + "epoch": 34.99, + "learning_rate": 3.809840425531915e-05, + "loss": 0.1407, + "step": 39990 + }, + { + "epoch": 35.0, + "learning_rate": 3.803191489361702e-05, + "loss": 0.1235, + "step": 40000 + }, + { + "epoch": 35.0, + "learning_rate": 3.7965425531914894e-05, + "loss": 0.142, + "step": 40010 + }, + { + "epoch": 35.01, + "learning_rate": 3.7898936170212764e-05, + "loss": 0.129, + "step": 40020 + }, + { + "epoch": 35.02, + "learning_rate": 3.783244680851064e-05, + "loss": 0.1412, + "step": 40030 + }, + { + "epoch": 35.03, + "learning_rate": 3.7765957446808504e-05, + "loss": 0.1867, + "step": 40040 + }, + { + "epoch": 35.04, + "learning_rate": 3.7699468085106374e-05, + "loss": 0.1494, + "step": 40050 + }, + { + "epoch": 35.05, + "learning_rate": 3.763297872340425e-05, + "loss": 0.1516, + "step": 40060 + }, + { + "epoch": 35.06, + "learning_rate": 3.756648936170212e-05, + "loss": 0.1196, + "step": 40070 + }, + { + "epoch": 35.07, + "learning_rate": 3.75e-05, + "loss": 0.0981, + "step": 40080 + }, + { + "epoch": 35.07, + "learning_rate": 3.743351063829787e-05, + "loss": 0.1873, + "step": 40090 + }, + { + "epoch": 35.08, + "learning_rate": 3.736702127659574e-05, + "loss": 0.1419, + "step": 40100 + }, + { + "epoch": 35.09, + "learning_rate": 3.730053191489361e-05, + "loss": 0.1577, + "step": 40110 + }, + { + "epoch": 35.1, + "learning_rate": 3.723404255319148e-05, + "loss": 0.119, + "step": 40120 + }, + { + "epoch": 35.11, + "learning_rate": 3.716755319148936e-05, + "loss": 0.1047, + "step": 40130 + }, + { + "epoch": 35.12, + "learning_rate": 3.710106382978723e-05, + "loss": 0.1704, + "step": 40140 + }, + { + "epoch": 35.13, + "learning_rate": 3.70345744680851e-05, + "loss": 0.0919, + "step": 40150 + }, + { + "epoch": 35.14, + "learning_rate": 3.6968085106382976e-05, + "loss": 0.1868, + "step": 40160 + }, + { + "epoch": 35.14, + "learning_rate": 3.6901595744680846e-05, + "loss": 0.1866, + "step": 40170 + }, + { + "epoch": 35.15, + "learning_rate": 3.683510638297872e-05, + "loss": 0.1164, + "step": 40180 + }, + { + "epoch": 35.16, + "learning_rate": 3.676861702127659e-05, + "loss": 0.2095, + "step": 40190 + }, + { + "epoch": 35.17, + "learning_rate": 3.670212765957446e-05, + "loss": 0.099, + "step": 40200 + }, + { + "epoch": 35.17, + "eval_cer1": 0.24020120860200533, + "eval_cer2": 0.2192616899097621, + "eval_cer3": 0.199281280627246, + "eval_cer4": 0.20129431082777938, + "eval_cer5": 0.22309978768577496, + "eval_loss": 1.008385419845581, + "eval_runtime": 1543.4531, + "eval_samples_per_second": 5.676, + "step": 40200 + }, + { + "epoch": 35.18, + "learning_rate": 3.663563829787234e-05, + "loss": 0.1347, + "step": 40210 + }, + { + "epoch": 35.19, + "learning_rate": 3.656914893617021e-05, + "loss": 0.1835, + "step": 40220 + }, + { + "epoch": 35.2, + "learning_rate": 3.6502659574468085e-05, + "loss": 0.0729, + "step": 40230 + }, + { + "epoch": 35.21, + "learning_rate": 3.6436170212765955e-05, + "loss": 0.1931, + "step": 40240 + }, + { + "epoch": 35.21, + "learning_rate": 3.6369680851063825e-05, + "loss": 0.1219, + "step": 40250 + }, + { + "epoch": 35.22, + "learning_rate": 3.63031914893617e-05, + "loss": 0.1385, + "step": 40260 + }, + { + "epoch": 35.23, + "learning_rate": 3.623670212765957e-05, + "loss": 0.1155, + "step": 40270 + }, + { + "epoch": 35.24, + "learning_rate": 3.617021276595744e-05, + "loss": 0.1477, + "step": 40280 + }, + { + "epoch": 35.25, + "learning_rate": 3.610372340425532e-05, + "loss": 0.1494, + "step": 40290 + }, + { + "epoch": 35.26, + "learning_rate": 3.603723404255319e-05, + "loss": 0.1184, + "step": 40300 + }, + { + "epoch": 35.27, + "learning_rate": 3.5970744680851064e-05, + "loss": 0.1607, + "step": 40310 + }, + { + "epoch": 35.28, + "learning_rate": 3.5904255319148934e-05, + "loss": 0.1464, + "step": 40320 + }, + { + "epoch": 35.28, + "learning_rate": 3.5837765957446804e-05, + "loss": 0.0835, + "step": 40330 + }, + { + "epoch": 35.29, + "learning_rate": 3.5771276595744674e-05, + "loss": 0.2003, + "step": 40340 + }, + { + "epoch": 35.3, + "learning_rate": 3.570478723404255e-05, + "loss": 0.1016, + "step": 40350 + }, + { + "epoch": 35.31, + "learning_rate": 3.563829787234042e-05, + "loss": 0.1414, + "step": 40360 + }, + { + "epoch": 35.32, + "learning_rate": 3.557180851063829e-05, + "loss": 0.1927, + "step": 40370 + }, + { + "epoch": 35.33, + "learning_rate": 3.550531914893617e-05, + "loss": 0.1094, + "step": 40380 + }, + { + "epoch": 35.34, + "learning_rate": 3.543882978723404e-05, + "loss": 0.1839, + "step": 40390 + }, + { + "epoch": 35.35, + "learning_rate": 3.5372340425531914e-05, + "loss": 0.1464, + "step": 40400 + }, + { + "epoch": 35.35, + "learning_rate": 3.530585106382978e-05, + "loss": 0.1527, + "step": 40410 + }, + { + "epoch": 35.36, + "learning_rate": 3.523936170212765e-05, + "loss": 0.1579, + "step": 40420 + }, + { + "epoch": 35.37, + "learning_rate": 3.517287234042553e-05, + "loss": 0.0867, + "step": 40430 + }, + { + "epoch": 35.38, + "learning_rate": 3.51063829787234e-05, + "loss": 0.2029, + "step": 40440 + }, + { + "epoch": 35.39, + "learning_rate": 3.5039893617021276e-05, + "loss": 0.1257, + "step": 40450 + }, + { + "epoch": 35.4, + "learning_rate": 3.4973404255319146e-05, + "loss": 0.1365, + "step": 40460 + }, + { + "epoch": 35.41, + "learning_rate": 3.4906914893617016e-05, + "loss": 0.1384, + "step": 40470 + }, + { + "epoch": 35.42, + "learning_rate": 3.484042553191489e-05, + "loss": 0.0956, + "step": 40480 + }, + { + "epoch": 35.42, + "learning_rate": 3.477393617021276e-05, + "loss": 0.1614, + "step": 40490 + }, + { + "epoch": 35.43, + "learning_rate": 3.470744680851063e-05, + "loss": 0.1049, + "step": 40500 + }, + { + "epoch": 35.44, + "learning_rate": 3.464095744680851e-05, + "loss": 0.178, + "step": 40510 + }, + { + "epoch": 35.45, + "learning_rate": 3.457446808510638e-05, + "loss": 0.1336, + "step": 40520 + }, + { + "epoch": 35.46, + "learning_rate": 3.4507978723404256e-05, + "loss": 0.1174, + "step": 40530 + }, + { + "epoch": 35.47, + "learning_rate": 3.4441489361702125e-05, + "loss": 0.2118, + "step": 40540 + }, + { + "epoch": 35.48, + "learning_rate": 3.4374999999999995e-05, + "loss": 0.1328, + "step": 40550 + }, + { + "epoch": 35.49, + "learning_rate": 3.430851063829787e-05, + "loss": 0.1714, + "step": 40560 + }, + { + "epoch": 35.49, + "learning_rate": 3.424202127659574e-05, + "loss": 0.1198, + "step": 40570 + }, + { + "epoch": 35.5, + "learning_rate": 3.417553191489362e-05, + "loss": 0.0927, + "step": 40580 + }, + { + "epoch": 35.51, + "learning_rate": 3.410904255319148e-05, + "loss": 0.1732, + "step": 40590 + }, + { + "epoch": 35.52, + "learning_rate": 3.404255319148936e-05, + "loss": 0.1244, + "step": 40600 + }, + { + "epoch": 35.53, + "learning_rate": 3.397606382978723e-05, + "loss": 0.2341, + "step": 40610 + }, + { + "epoch": 35.54, + "learning_rate": 3.3909574468085105e-05, + "loss": 0.1517, + "step": 40620 + }, + { + "epoch": 35.55, + "learning_rate": 3.3843085106382974e-05, + "loss": 0.1489, + "step": 40630 + }, + { + "epoch": 35.56, + "learning_rate": 3.3776595744680844e-05, + "loss": 0.127, + "step": 40640 + }, + { + "epoch": 35.56, + "learning_rate": 3.371010638297872e-05, + "loss": 0.1652, + "step": 40650 + }, + { + "epoch": 35.57, + "learning_rate": 3.364361702127659e-05, + "loss": 0.174, + "step": 40660 + }, + { + "epoch": 35.58, + "learning_rate": 3.357712765957447e-05, + "loss": 0.135, + "step": 40670 + }, + { + "epoch": 35.59, + "learning_rate": 3.351063829787234e-05, + "loss": 0.0801, + "step": 40680 + }, + { + "epoch": 35.6, + "learning_rate": 3.344414893617021e-05, + "loss": 0.1819, + "step": 40690 + }, + { + "epoch": 35.61, + "learning_rate": 3.3377659574468084e-05, + "loss": 0.1186, + "step": 40700 + }, + { + "epoch": 35.62, + "learning_rate": 3.3311170212765954e-05, + "loss": 0.1495, + "step": 40710 + }, + { + "epoch": 35.63, + "learning_rate": 3.3244680851063824e-05, + "loss": 0.1203, + "step": 40720 + }, + { + "epoch": 35.63, + "learning_rate": 3.31781914893617e-05, + "loss": 0.1432, + "step": 40730 + }, + { + "epoch": 35.64, + "learning_rate": 3.311170212765957e-05, + "loss": 0.1543, + "step": 40740 + }, + { + "epoch": 35.65, + "learning_rate": 3.304521276595745e-05, + "loss": 0.087, + "step": 40750 + }, + { + "epoch": 35.66, + "learning_rate": 3.2978723404255317e-05, + "loss": 0.1792, + "step": 40760 + }, + { + "epoch": 35.67, + "learning_rate": 3.2912234042553186e-05, + "loss": 0.1304, + "step": 40770 + }, + { + "epoch": 35.68, + "learning_rate": 3.284574468085106e-05, + "loss": 0.104, + "step": 40780 + }, + { + "epoch": 35.69, + "learning_rate": 3.277925531914893e-05, + "loss": 0.2009, + "step": 40790 + }, + { + "epoch": 35.7, + "learning_rate": 3.271276595744681e-05, + "loss": 0.1386, + "step": 40800 + }, + { + "epoch": 35.7, + "eval_cer1": 0.2388508152999561, + "eval_cer2": 0.22031173092698933, + "eval_cer3": 0.19771316563214636, + "eval_cer4": 0.1999098489970701, + "eval_cer5": 0.22352441613588112, + "eval_loss": 1.0112673044204712, + "eval_runtime": 1556.0584, + "eval_samples_per_second": 5.63, + "step": 40800 + }, + { + "epoch": 35.7, + "learning_rate": 3.264627659574468e-05, + "loss": 0.172, + "step": 40810 + }, + { + "epoch": 35.71, + "learning_rate": 3.257978723404255e-05, + "loss": 0.1797, + "step": 40820 + }, + { + "epoch": 35.72, + "learning_rate": 3.2513297872340426e-05, + "loss": 0.0897, + "step": 40830 + }, + { + "epoch": 35.73, + "learning_rate": 3.2446808510638296e-05, + "loss": 0.1913, + "step": 40840 + }, + { + "epoch": 35.74, + "learning_rate": 3.238031914893617e-05, + "loss": 0.1018, + "step": 40850 + }, + { + "epoch": 35.75, + "learning_rate": 3.2313829787234035e-05, + "loss": 0.1401, + "step": 40860 + }, + { + "epoch": 35.76, + "learning_rate": 3.224734042553191e-05, + "loss": 0.1213, + "step": 40870 + }, + { + "epoch": 35.77, + "learning_rate": 3.218085106382978e-05, + "loss": 0.1149, + "step": 40880 + }, + { + "epoch": 35.77, + "learning_rate": 3.211436170212766e-05, + "loss": 0.178, + "step": 40890 + }, + { + "epoch": 35.78, + "learning_rate": 3.204787234042553e-05, + "loss": 0.1192, + "step": 40900 + }, + { + "epoch": 35.79, + "learning_rate": 3.19813829787234e-05, + "loss": 0.1409, + "step": 40910 + }, + { + "epoch": 35.8, + "learning_rate": 3.1914893617021275e-05, + "loss": 0.1238, + "step": 40920 + }, + { + "epoch": 35.81, + "learning_rate": 3.1848404255319145e-05, + "loss": 0.0919, + "step": 40930 + }, + { + "epoch": 35.82, + "learning_rate": 3.1781914893617015e-05, + "loss": 0.1689, + "step": 40940 + }, + { + "epoch": 35.83, + "learning_rate": 3.171542553191489e-05, + "loss": 0.1163, + "step": 40950 + }, + { + "epoch": 35.84, + "learning_rate": 3.164893617021276e-05, + "loss": 0.1882, + "step": 40960 + }, + { + "epoch": 35.84, + "learning_rate": 3.158244680851064e-05, + "loss": 0.1289, + "step": 40970 + }, + { + "epoch": 35.85, + "learning_rate": 3.151595744680851e-05, + "loss": 0.0977, + "step": 40980 + }, + { + "epoch": 35.86, + "learning_rate": 3.144946808510638e-05, + "loss": 0.1907, + "step": 40990 + }, + { + "epoch": 35.87, + "learning_rate": 3.1382978723404254e-05, + "loss": 0.0776, + "step": 41000 + }, + { + "epoch": 35.88, + "learning_rate": 3.1316489361702124e-05, + "loss": 0.1848, + "step": 41010 + }, + { + "epoch": 35.89, + "learning_rate": 3.125e-05, + "loss": 0.1513, + "step": 41020 + }, + { + "epoch": 35.9, + "learning_rate": 3.118351063829787e-05, + "loss": 0.0972, + "step": 41030 + }, + { + "epoch": 35.91, + "learning_rate": 3.111702127659574e-05, + "loss": 0.1794, + "step": 41040 + }, + { + "epoch": 35.91, + "learning_rate": 3.105053191489362e-05, + "loss": 0.1136, + "step": 41050 + }, + { + "epoch": 35.92, + "learning_rate": 3.098404255319149e-05, + "loss": 0.1498, + "step": 41060 + }, + { + "epoch": 35.93, + "learning_rate": 3.0917553191489363e-05, + "loss": 0.1377, + "step": 41070 + }, + { + "epoch": 35.94, + "learning_rate": 3.085106382978723e-05, + "loss": 0.1244, + "step": 41080 + }, + { + "epoch": 35.95, + "learning_rate": 3.07845744680851e-05, + "loss": 0.1879, + "step": 41090 + }, + { + "epoch": 35.96, + "learning_rate": 3.071808510638298e-05, + "loss": 0.088, + "step": 41100 + }, + { + "epoch": 35.97, + "learning_rate": 3.065159574468085e-05, + "loss": 0.1639, + "step": 41110 + }, + { + "epoch": 35.98, + "learning_rate": 3.058510638297872e-05, + "loss": 0.1356, + "step": 41120 + }, + { + "epoch": 35.98, + "learning_rate": 3.051861702127659e-05, + "loss": 0.085, + "step": 41130 + }, + { + "epoch": 35.99, + "learning_rate": 3.0452127659574466e-05, + "loss": 0.1946, + "step": 41140 + }, + { + "epoch": 36.0, + "learning_rate": 3.038563829787234e-05, + "loss": 0.1563, + "step": 41150 + }, + { + "epoch": 36.01, + "learning_rate": 3.031914893617021e-05, + "loss": 0.1775, + "step": 41160 + }, + { + "epoch": 36.02, + "learning_rate": 3.0252659574468082e-05, + "loss": 0.1084, + "step": 41170 + }, + { + "epoch": 36.03, + "learning_rate": 3.0186170212765956e-05, + "loss": 0.1816, + "step": 41180 + }, + { + "epoch": 36.04, + "learning_rate": 3.011968085106383e-05, + "loss": 0.1028, + "step": 41190 + }, + { + "epoch": 36.05, + "learning_rate": 3.0053191489361702e-05, + "loss": 0.1037, + "step": 41200 + }, + { + "epoch": 36.05, + "learning_rate": 2.9986702127659572e-05, + "loss": 0.1338, + "step": 41210 + }, + { + "epoch": 36.06, + "learning_rate": 2.9920212765957445e-05, + "loss": 0.0973, + "step": 41220 + }, + { + "epoch": 36.07, + "learning_rate": 2.985372340425532e-05, + "loss": 0.1325, + "step": 41230 + }, + { + "epoch": 36.08, + "learning_rate": 2.9787234042553192e-05, + "loss": 0.1334, + "step": 41240 + }, + { + "epoch": 36.09, + "learning_rate": 2.9720744680851058e-05, + "loss": 0.1332, + "step": 41250 + }, + { + "epoch": 36.1, + "learning_rate": 2.965425531914893e-05, + "loss": 0.1163, + "step": 41260 + }, + { + "epoch": 36.11, + "learning_rate": 2.9587765957446805e-05, + "loss": 0.1061, + "step": 41270 + }, + { + "epoch": 36.12, + "learning_rate": 2.9521276595744678e-05, + "loss": 0.1687, + "step": 41280 + }, + { + "epoch": 36.12, + "learning_rate": 2.945478723404255e-05, + "loss": 0.1137, + "step": 41290 + }, + { + "epoch": 36.13, + "learning_rate": 2.938829787234042e-05, + "loss": 0.1184, + "step": 41300 + }, + { + "epoch": 36.14, + "learning_rate": 2.9321808510638294e-05, + "loss": 0.1434, + "step": 41310 + }, + { + "epoch": 36.15, + "learning_rate": 2.9255319148936168e-05, + "loss": 0.1035, + "step": 41320 + }, + { + "epoch": 36.16, + "learning_rate": 2.918882978723404e-05, + "loss": 0.1808, + "step": 41330 + }, + { + "epoch": 36.17, + "learning_rate": 2.912234042553191e-05, + "loss": 0.0918, + "step": 41340 + }, + { + "epoch": 36.18, + "learning_rate": 2.9055851063829784e-05, + "loss": 0.193, + "step": 41350 + }, + { + "epoch": 36.19, + "learning_rate": 2.8989361702127657e-05, + "loss": 0.1212, + "step": 41360 + }, + { + "epoch": 36.19, + "learning_rate": 2.892287234042553e-05, + "loss": 0.1139, + "step": 41370 + }, + { + "epoch": 36.2, + "learning_rate": 2.88563829787234e-05, + "loss": 0.1598, + "step": 41380 + }, + { + "epoch": 36.21, + "learning_rate": 2.8789893617021274e-05, + "loss": 0.092, + "step": 41390 + }, + { + "epoch": 36.22, + "learning_rate": 2.8723404255319147e-05, + "loss": 0.0897, + "step": 41400 + }, + { + "epoch": 36.22, + "eval_cer1": 0.23685898517943352, + "eval_cer2": 0.21827727645611156, + "eval_cer3": 0.19585102907546553, + "eval_cer4": 0.1993947004088992, + "eval_cer5": 0.22284501061571124, + "eval_loss": 1.0036234855651855, + "eval_runtime": 1549.9985, + "eval_samples_per_second": 5.652, + "step": 41400 + }, + { + "epoch": 36.23, + "learning_rate": 2.865691489361702e-05, + "loss": 0.1451, + "step": 41410 + }, + { + "epoch": 36.24, + "learning_rate": 2.8590425531914893e-05, + "loss": 0.1132, + "step": 41420 + }, + { + "epoch": 36.25, + "learning_rate": 2.8523936170212763e-05, + "loss": 0.1699, + "step": 41430 + }, + { + "epoch": 36.26, + "learning_rate": 2.8457446808510636e-05, + "loss": 0.1317, + "step": 41440 + }, + { + "epoch": 36.26, + "learning_rate": 2.839095744680851e-05, + "loss": 0.1125, + "step": 41450 + }, + { + "epoch": 36.27, + "learning_rate": 2.8324468085106383e-05, + "loss": 0.1419, + "step": 41460 + }, + { + "epoch": 36.28, + "learning_rate": 2.825797872340425e-05, + "loss": 0.125, + "step": 41470 + }, + { + "epoch": 36.29, + "learning_rate": 2.8191489361702123e-05, + "loss": 0.194, + "step": 41480 + }, + { + "epoch": 36.3, + "learning_rate": 2.8125e-05, + "loss": 0.1262, + "step": 41490 + }, + { + "epoch": 36.31, + "learning_rate": 2.8058510638297872e-05, + "loss": 0.0977, + "step": 41500 + }, + { + "epoch": 36.32, + "learning_rate": 2.7992021276595746e-05, + "loss": 0.1209, + "step": 41510 + }, + { + "epoch": 36.33, + "learning_rate": 2.7925531914893612e-05, + "loss": 0.1058, + "step": 41520 + }, + { + "epoch": 36.33, + "learning_rate": 2.7859042553191485e-05, + "loss": 0.152, + "step": 41530 + }, + { + "epoch": 36.34, + "learning_rate": 2.779255319148936e-05, + "loss": 0.1175, + "step": 41540 + }, + { + "epoch": 36.35, + "learning_rate": 2.7726063829787232e-05, + "loss": 0.1104, + "step": 41550 + }, + { + "epoch": 36.36, + "learning_rate": 2.7659574468085102e-05, + "loss": 0.1396, + "step": 41560 + }, + { + "epoch": 36.37, + "learning_rate": 2.7593085106382975e-05, + "loss": 0.1016, + "step": 41570 + }, + { + "epoch": 36.38, + "learning_rate": 2.7526595744680848e-05, + "loss": 0.1598, + "step": 41580 + }, + { + "epoch": 36.39, + "learning_rate": 2.746010638297872e-05, + "loss": 0.1189, + "step": 41590 + }, + { + "epoch": 36.4, + "learning_rate": 2.7393617021276595e-05, + "loss": 0.1271, + "step": 41600 + }, + { + "epoch": 36.4, + "learning_rate": 2.7327127659574465e-05, + "loss": 0.1873, + "step": 41610 + }, + { + "epoch": 36.41, + "learning_rate": 2.7260638297872338e-05, + "loss": 0.0913, + "step": 41620 + }, + { + "epoch": 36.42, + "learning_rate": 2.719414893617021e-05, + "loss": 0.1433, + "step": 41630 + }, + { + "epoch": 36.43, + "learning_rate": 2.7127659574468084e-05, + "loss": 0.1026, + "step": 41640 + }, + { + "epoch": 36.44, + "learning_rate": 2.7061170212765954e-05, + "loss": 0.1118, + "step": 41650 + }, + { + "epoch": 36.45, + "learning_rate": 2.6994680851063827e-05, + "loss": 0.1391, + "step": 41660 + }, + { + "epoch": 36.46, + "learning_rate": 2.69281914893617e-05, + "loss": 0.1105, + "step": 41670 + }, + { + "epoch": 36.47, + "learning_rate": 2.6861702127659574e-05, + "loss": 0.156, + "step": 41680 + }, + { + "epoch": 36.47, + "learning_rate": 2.6795212765957444e-05, + "loss": 0.136, + "step": 41690 + }, + { + "epoch": 36.48, + "learning_rate": 2.6728723404255317e-05, + "loss": 0.1837, + "step": 41700 + }, + { + "epoch": 36.49, + "learning_rate": 2.666223404255319e-05, + "loss": 0.1446, + "step": 41710 + }, + { + "epoch": 36.5, + "learning_rate": 2.6595744680851064e-05, + "loss": 0.0798, + "step": 41720 + }, + { + "epoch": 36.51, + "learning_rate": 2.6529255319148937e-05, + "loss": 0.2184, + "step": 41730 + }, + { + "epoch": 36.52, + "learning_rate": 2.6462765957446803e-05, + "loss": 0.1004, + "step": 41740 + }, + { + "epoch": 36.53, + "learning_rate": 2.6396276595744677e-05, + "loss": 0.1484, + "step": 41750 + }, + { + "epoch": 36.54, + "learning_rate": 2.632978723404255e-05, + "loss": 0.1692, + "step": 41760 + }, + { + "epoch": 36.54, + "learning_rate": 2.6263297872340423e-05, + "loss": 0.1253, + "step": 41770 + }, + { + "epoch": 36.55, + "learning_rate": 2.6196808510638293e-05, + "loss": 0.1479, + "step": 41780 + }, + { + "epoch": 36.56, + "learning_rate": 2.6130319148936166e-05, + "loss": 0.1266, + "step": 41790 + }, + { + "epoch": 36.57, + "learning_rate": 2.606382978723404e-05, + "loss": 0.1164, + "step": 41800 + }, + { + "epoch": 36.58, + "learning_rate": 2.5997340425531913e-05, + "loss": 0.1696, + "step": 41810 + }, + { + "epoch": 36.59, + "learning_rate": 2.5930851063829786e-05, + "loss": 0.1059, + "step": 41820 + }, + { + "epoch": 36.6, + "learning_rate": 2.5864361702127656e-05, + "loss": 0.1654, + "step": 41830 + }, + { + "epoch": 36.61, + "learning_rate": 2.579787234042553e-05, + "loss": 0.1185, + "step": 41840 + }, + { + "epoch": 36.61, + "learning_rate": 2.5731382978723402e-05, + "loss": 0.1207, + "step": 41850 + }, + { + "epoch": 36.62, + "learning_rate": 2.5664893617021276e-05, + "loss": 0.1288, + "step": 41860 + }, + { + "epoch": 36.63, + "learning_rate": 2.5598404255319145e-05, + "loss": 0.1088, + "step": 41870 + }, + { + "epoch": 36.64, + "learning_rate": 2.553191489361702e-05, + "loss": 0.1766, + "step": 41880 + }, + { + "epoch": 36.65, + "learning_rate": 2.5465425531914892e-05, + "loss": 0.1723, + "step": 41890 + }, + { + "epoch": 36.66, + "learning_rate": 2.5398936170212765e-05, + "loss": 0.1406, + "step": 41900 + }, + { + "epoch": 36.67, + "learning_rate": 2.5332446808510635e-05, + "loss": 0.1469, + "step": 41910 + }, + { + "epoch": 36.68, + "learning_rate": 2.5265957446808508e-05, + "loss": 0.1708, + "step": 41920 + }, + { + "epoch": 36.68, + "learning_rate": 2.519946808510638e-05, + "loss": 0.1793, + "step": 41930 + }, + { + "epoch": 36.69, + "learning_rate": 2.5132978723404255e-05, + "loss": 0.1511, + "step": 41940 + }, + { + "epoch": 36.7, + "learning_rate": 2.5066489361702128e-05, + "loss": 0.1295, + "step": 41950 + }, + { + "epoch": 36.71, + "learning_rate": 2.4999999999999998e-05, + "loss": 0.1524, + "step": 41960 + }, + { + "epoch": 36.72, + "learning_rate": 2.493351063829787e-05, + "loss": 0.1046, + "step": 41970 + }, + { + "epoch": 36.73, + "learning_rate": 2.4867021276595744e-05, + "loss": 0.1864, + "step": 41980 + }, + { + "epoch": 36.74, + "learning_rate": 2.4800531914893618e-05, + "loss": 0.1109, + "step": 41990 + }, + { + "epoch": 36.75, + "learning_rate": 2.4734042553191484e-05, + "loss": 0.1244, + "step": 42000 + }, + { + "epoch": 36.75, + "eval_cer1": 0.2372978630025995, + "eval_cer2": 0.2181788351107465, + "eval_cer3": 0.19585102907546553, + "eval_cer4": 0.1998776522103094, + "eval_cer5": 0.22072186836518046, + "eval_loss": 1.0039706230163574, + "eval_runtime": 1541.9518, + "eval_samples_per_second": 5.681, + "step": 42000 + }, + { + "epoch": 36.75, + "learning_rate": 2.4667553191489357e-05, + "loss": 0.1606, + "step": 42010 + }, + { + "epoch": 36.76, + "learning_rate": 2.460106382978723e-05, + "loss": 0.1085, + "step": 42020 + }, + { + "epoch": 36.77, + "learning_rate": 2.4534574468085104e-05, + "loss": 0.1228, + "step": 42030 + }, + { + "epoch": 36.78, + "learning_rate": 2.4468085106382977e-05, + "loss": 0.1182, + "step": 42040 + }, + { + "epoch": 36.79, + "learning_rate": 2.4401595744680847e-05, + "loss": 0.1089, + "step": 42050 + }, + { + "epoch": 36.8, + "learning_rate": 2.433510638297872e-05, + "loss": 0.1315, + "step": 42060 + }, + { + "epoch": 36.81, + "learning_rate": 2.4268617021276593e-05, + "loss": 0.1531, + "step": 42070 + }, + { + "epoch": 36.82, + "learning_rate": 2.4202127659574467e-05, + "loss": 0.1197, + "step": 42080 + }, + { + "epoch": 36.82, + "learning_rate": 2.4135638297872336e-05, + "loss": 0.0993, + "step": 42090 + }, + { + "epoch": 36.83, + "learning_rate": 2.406914893617021e-05, + "loss": 0.1296, + "step": 42100 + }, + { + "epoch": 36.84, + "learning_rate": 2.4002659574468083e-05, + "loss": 0.1423, + "step": 42110 + }, + { + "epoch": 36.85, + "learning_rate": 2.3936170212765956e-05, + "loss": 0.1575, + "step": 42120 + }, + { + "epoch": 36.86, + "learning_rate": 2.3869680851063826e-05, + "loss": 0.1753, + "step": 42130 + }, + { + "epoch": 36.87, + "learning_rate": 2.38031914893617e-05, + "loss": 0.1188, + "step": 42140 + }, + { + "epoch": 36.88, + "learning_rate": 2.3736702127659573e-05, + "loss": 0.0828, + "step": 42150 + }, + { + "epoch": 36.89, + "learning_rate": 2.3670212765957446e-05, + "loss": 0.1592, + "step": 42160 + }, + { + "epoch": 36.89, + "learning_rate": 2.360372340425532e-05, + "loss": 0.0964, + "step": 42170 + }, + { + "epoch": 36.9, + "learning_rate": 2.353723404255319e-05, + "loss": 0.1342, + "step": 42180 + }, + { + "epoch": 36.91, + "learning_rate": 2.3470744680851062e-05, + "loss": 0.1323, + "step": 42190 + }, + { + "epoch": 36.92, + "learning_rate": 2.3404255319148935e-05, + "loss": 0.1646, + "step": 42200 + }, + { + "epoch": 36.93, + "learning_rate": 2.333776595744681e-05, + "loss": 0.1266, + "step": 42210 + }, + { + "epoch": 36.94, + "learning_rate": 2.327127659574468e-05, + "loss": 0.1178, + "step": 42220 + }, + { + "epoch": 36.95, + "learning_rate": 2.3204787234042552e-05, + "loss": 0.1201, + "step": 42230 + }, + { + "epoch": 36.95, + "learning_rate": 2.3138297872340425e-05, + "loss": 0.1122, + "step": 42240 + }, + { + "epoch": 36.96, + "learning_rate": 2.3071808510638298e-05, + "loss": 0.0968, + "step": 42250 + }, + { + "epoch": 36.97, + "learning_rate": 2.300531914893617e-05, + "loss": 0.1401, + "step": 42260 + }, + { + "epoch": 36.98, + "learning_rate": 2.2938829787234038e-05, + "loss": 0.1006, + "step": 42270 + }, + { + "epoch": 36.99, + "learning_rate": 2.287234042553191e-05, + "loss": 0.1264, + "step": 42280 + }, + { + "epoch": 37.0, + "learning_rate": 2.2805851063829784e-05, + "loss": 0.1214, + "step": 42290 + }, + { + "epoch": 37.01, + "learning_rate": 2.2739361702127658e-05, + "loss": 0.1647, + "step": 42300 + }, + { + "epoch": 37.02, + "learning_rate": 2.2672872340425528e-05, + "loss": 0.1074, + "step": 42310 + }, + { + "epoch": 37.03, + "learning_rate": 2.26063829787234e-05, + "loss": 0.1337, + "step": 42320 + }, + { + "epoch": 37.03, + "learning_rate": 2.2539893617021274e-05, + "loss": 0.1182, + "step": 42330 + }, + { + "epoch": 37.04, + "learning_rate": 2.2473404255319147e-05, + "loss": 0.0711, + "step": 42340 + }, + { + "epoch": 37.05, + "learning_rate": 2.2406914893617017e-05, + "loss": 0.1657, + "step": 42350 + }, + { + "epoch": 37.06, + "learning_rate": 2.234042553191489e-05, + "loss": 0.1277, + "step": 42360 + }, + { + "epoch": 37.07, + "learning_rate": 2.2273936170212764e-05, + "loss": 0.1109, + "step": 42370 + }, + { + "epoch": 37.08, + "learning_rate": 2.2207446808510637e-05, + "loss": 0.0971, + "step": 42380 + }, + { + "epoch": 37.09, + "learning_rate": 2.214095744680851e-05, + "loss": 0.1456, + "step": 42390 + }, + { + "epoch": 37.1, + "learning_rate": 2.207446808510638e-05, + "loss": 0.152, + "step": 42400 + }, + { + "epoch": 37.1, + "learning_rate": 2.2007978723404253e-05, + "loss": 0.1133, + "step": 42410 + }, + { + "epoch": 37.11, + "learning_rate": 2.1941489361702127e-05, + "loss": 0.1475, + "step": 42420 + }, + { + "epoch": 37.12, + "learning_rate": 2.1875e-05, + "loss": 0.1154, + "step": 42430 + }, + { + "epoch": 37.13, + "learning_rate": 2.180851063829787e-05, + "loss": 0.0825, + "step": 42440 + }, + { + "epoch": 37.14, + "learning_rate": 2.1742021276595743e-05, + "loss": 0.1414, + "step": 42450 + }, + { + "epoch": 37.15, + "learning_rate": 2.1675531914893616e-05, + "loss": 0.0651, + "step": 42460 + }, + { + "epoch": 37.16, + "learning_rate": 2.160904255319149e-05, + "loss": 0.1204, + "step": 42470 + }, + { + "epoch": 37.17, + "learning_rate": 2.1542553191489363e-05, + "loss": 0.1096, + "step": 42480 + }, + { + "epoch": 37.17, + "learning_rate": 2.1476063829787232e-05, + "loss": 0.1096, + "step": 42490 + }, + { + "epoch": 37.18, + "learning_rate": 2.1409574468085106e-05, + "loss": 0.1601, + "step": 42500 + }, + { + "epoch": 37.19, + "learning_rate": 2.134308510638298e-05, + "loss": 0.1252, + "step": 42510 + }, + { + "epoch": 37.2, + "learning_rate": 2.1276595744680852e-05, + "loss": 0.1271, + "step": 42520 + }, + { + "epoch": 37.21, + "learning_rate": 2.121010638297872e-05, + "loss": 0.1384, + "step": 42530 + }, + { + "epoch": 37.22, + "learning_rate": 2.1143617021276592e-05, + "loss": 0.1017, + "step": 42540 + }, + { + "epoch": 37.23, + "learning_rate": 2.1077127659574465e-05, + "loss": 0.1588, + "step": 42550 + }, + { + "epoch": 37.24, + "learning_rate": 2.101063829787234e-05, + "loss": 0.1206, + "step": 42560 + }, + { + "epoch": 37.24, + "learning_rate": 2.0944148936170208e-05, + "loss": 0.1465, + "step": 42570 + }, + { + "epoch": 37.25, + "learning_rate": 2.087765957446808e-05, + "loss": 0.1189, + "step": 42580 + }, + { + "epoch": 37.26, + "learning_rate": 2.0811170212765955e-05, + "loss": 0.0768, + "step": 42590 + }, + { + "epoch": 37.27, + "learning_rate": 2.0744680851063828e-05, + "loss": 0.1463, + "step": 42600 + }, + { + "epoch": 37.27, + "eval_cer1": 0.2354073123797306, + "eval_cer2": 0.2163084495488105, + "eval_cer3": 0.1961450506370467, + "eval_cer4": 0.1993625036221385, + "eval_cer5": 0.22140127388535033, + "eval_loss": 1.0057064294815063, + "eval_runtime": 1564.0938, + "eval_samples_per_second": 5.601, + "step": 42600 + }, + { + "epoch": 37.28, + "learning_rate": 2.06781914893617e-05, + "loss": 0.1169, + "step": 42610 + }, + { + "epoch": 37.29, + "learning_rate": 2.061170212765957e-05, + "loss": 0.1337, + "step": 42620 + }, + { + "epoch": 37.3, + "learning_rate": 2.0545212765957444e-05, + "loss": 0.1105, + "step": 42630 + }, + { + "epoch": 37.31, + "learning_rate": 2.0478723404255318e-05, + "loss": 0.09, + "step": 42640 + }, + { + "epoch": 37.31, + "learning_rate": 2.041223404255319e-05, + "loss": 0.1582, + "step": 42650 + }, + { + "epoch": 37.32, + "learning_rate": 2.034574468085106e-05, + "loss": 0.122, + "step": 42660 + }, + { + "epoch": 37.33, + "learning_rate": 2.0279255319148934e-05, + "loss": 0.116, + "step": 42670 + }, + { + "epoch": 37.34, + "learning_rate": 2.0212765957446807e-05, + "loss": 0.1463, + "step": 42680 + }, + { + "epoch": 37.35, + "learning_rate": 2.014627659574468e-05, + "loss": 0.1347, + "step": 42690 + }, + { + "epoch": 37.36, + "learning_rate": 2.0079787234042554e-05, + "loss": 0.1479, + "step": 42700 + }, + { + "epoch": 37.37, + "learning_rate": 2.0013297872340424e-05, + "loss": 0.089, + "step": 42710 + }, + { + "epoch": 37.38, + "learning_rate": 1.9946808510638297e-05, + "loss": 0.1684, + "step": 42720 + }, + { + "epoch": 37.38, + "learning_rate": 1.988031914893617e-05, + "loss": 0.1372, + "step": 42730 + }, + { + "epoch": 37.39, + "learning_rate": 1.9813829787234043e-05, + "loss": 0.0881, + "step": 42740 + }, + { + "epoch": 37.4, + "learning_rate": 1.974734042553191e-05, + "loss": 0.1521, + "step": 42750 + }, + { + "epoch": 37.41, + "learning_rate": 1.9680851063829786e-05, + "loss": 0.1081, + "step": 42760 + }, + { + "epoch": 37.42, + "learning_rate": 1.961436170212766e-05, + "loss": 0.1176, + "step": 42770 + }, + { + "epoch": 37.43, + "learning_rate": 1.9547872340425533e-05, + "loss": 0.1111, + "step": 42780 + }, + { + "epoch": 37.44, + "learning_rate": 1.94813829787234e-05, + "loss": 0.0497, + "step": 42790 + }, + { + "epoch": 37.45, + "learning_rate": 1.9414893617021273e-05, + "loss": 0.1563, + "step": 42800 + }, + { + "epoch": 37.45, + "learning_rate": 1.9348404255319146e-05, + "loss": 0.1217, + "step": 42810 + }, + { + "epoch": 37.46, + "learning_rate": 1.928191489361702e-05, + "loss": 0.1374, + "step": 42820 + }, + { + "epoch": 37.47, + "learning_rate": 1.9215425531914892e-05, + "loss": 0.1186, + "step": 42830 + }, + { + "epoch": 37.48, + "learning_rate": 1.9148936170212762e-05, + "loss": 0.0788, + "step": 42840 + }, + { + "epoch": 37.49, + "learning_rate": 1.9082446808510636e-05, + "loss": 0.1521, + "step": 42850 + }, + { + "epoch": 37.5, + "learning_rate": 1.901595744680851e-05, + "loss": 0.0921, + "step": 42860 + }, + { + "epoch": 37.51, + "learning_rate": 1.8949468085106382e-05, + "loss": 0.1623, + "step": 42870 + }, + { + "epoch": 37.52, + "learning_rate": 1.8882978723404252e-05, + "loss": 0.1399, + "step": 42880 + }, + { + "epoch": 37.52, + "learning_rate": 1.8816489361702125e-05, + "loss": 0.0978, + "step": 42890 + }, + { + "epoch": 37.53, + "learning_rate": 1.875e-05, + "loss": 0.1189, + "step": 42900 + }, + { + "epoch": 37.54, + "learning_rate": 1.868351063829787e-05, + "loss": 0.1292, + "step": 42910 + }, + { + "epoch": 37.55, + "learning_rate": 1.861702127659574e-05, + "loss": 0.1143, + "step": 42920 + }, + { + "epoch": 37.56, + "learning_rate": 1.8550531914893615e-05, + "loss": 0.1128, + "step": 42930 + }, + { + "epoch": 37.57, + "learning_rate": 1.8484042553191488e-05, + "loss": 0.0874, + "step": 42940 + }, + { + "epoch": 37.58, + "learning_rate": 1.841755319148936e-05, + "loss": 0.1445, + "step": 42950 + }, + { + "epoch": 37.59, + "learning_rate": 1.835106382978723e-05, + "loss": 0.0936, + "step": 42960 + }, + { + "epoch": 37.59, + "learning_rate": 1.8284574468085104e-05, + "loss": 0.1561, + "step": 42970 + }, + { + "epoch": 37.6, + "learning_rate": 1.8218085106382978e-05, + "loss": 0.1266, + "step": 42980 + }, + { + "epoch": 37.61, + "learning_rate": 1.815159574468085e-05, + "loss": 0.1182, + "step": 42990 + }, + { + "epoch": 37.62, + "learning_rate": 1.808510638297872e-05, + "loss": 0.1726, + "step": 43000 + }, + { + "epoch": 37.63, + "learning_rate": 1.8018617021276594e-05, + "loss": 0.1283, + "step": 43010 + }, + { + "epoch": 37.64, + "learning_rate": 1.7952127659574467e-05, + "loss": 0.1479, + "step": 43020 + }, + { + "epoch": 37.65, + "learning_rate": 1.7885638297872337e-05, + "loss": 0.1097, + "step": 43030 + }, + { + "epoch": 37.66, + "learning_rate": 1.781914893617021e-05, + "loss": 0.1079, + "step": 43040 + }, + { + "epoch": 37.66, + "learning_rate": 1.7752659574468084e-05, + "loss": 0.1865, + "step": 43050 + }, + { + "epoch": 37.67, + "learning_rate": 1.7686170212765957e-05, + "loss": 0.0987, + "step": 43060 + }, + { + "epoch": 37.68, + "learning_rate": 1.7619680851063827e-05, + "loss": 0.1382, + "step": 43070 + }, + { + "epoch": 37.69, + "learning_rate": 1.75531914893617e-05, + "loss": 0.1275, + "step": 43080 + }, + { + "epoch": 37.7, + "learning_rate": 1.7486702127659573e-05, + "loss": 0.1079, + "step": 43090 + }, + { + "epoch": 37.71, + "learning_rate": 1.7420212765957446e-05, + "loss": 0.1814, + "step": 43100 + }, + { + "epoch": 37.72, + "learning_rate": 1.7353723404255316e-05, + "loss": 0.1054, + "step": 43110 + }, + { + "epoch": 37.72, + "learning_rate": 1.728723404255319e-05, + "loss": 0.1195, + "step": 43120 + }, + { + "epoch": 37.73, + "learning_rate": 1.7220744680851063e-05, + "loss": 0.1282, + "step": 43130 + }, + { + "epoch": 37.74, + "learning_rate": 1.7154255319148936e-05, + "loss": 0.1088, + "step": 43140 + }, + { + "epoch": 37.75, + "learning_rate": 1.708776595744681e-05, + "loss": 0.1618, + "step": 43150 + }, + { + "epoch": 37.76, + "learning_rate": 1.702127659574468e-05, + "loss": 0.1032, + "step": 43160 + }, + { + "epoch": 37.77, + "learning_rate": 1.6954787234042552e-05, + "loss": 0.1327, + "step": 43170 + }, + { + "epoch": 37.78, + "learning_rate": 1.6888297872340422e-05, + "loss": 0.1375, + "step": 43180 + }, + { + "epoch": 37.79, + "learning_rate": 1.6821808510638295e-05, + "loss": 0.1235, + "step": 43190 + }, + { + "epoch": 37.79, + "learning_rate": 1.675531914893617e-05, + "loss": 0.1587, + "step": 43200 + }, + { + "epoch": 37.79, + "eval_cer1": 0.23466459606360351, + "eval_cer2": 0.21453650533223953, + "eval_cer3": 0.19454426657954918, + "eval_cer4": 0.19788145143114716, + "eval_cer5": 0.22394904458598727, + "eval_loss": 1.0014487504959106, + "eval_runtime": 1569.3035, + "eval_samples_per_second": 5.582, + "step": 43200 + }, + { + "epoch": 37.8, + "learning_rate": 1.6688829787234042e-05, + "loss": 0.1002, + "step": 43210 + }, + { + "epoch": 37.81, + "learning_rate": 1.6622340425531912e-05, + "loss": 0.124, + "step": 43220 + }, + { + "epoch": 37.82, + "learning_rate": 1.6555851063829785e-05, + "loss": 0.1237, + "step": 43230 + }, + { + "epoch": 37.83, + "learning_rate": 1.6489361702127658e-05, + "loss": 0.0647, + "step": 43240 + }, + { + "epoch": 37.84, + "learning_rate": 1.642287234042553e-05, + "loss": 0.1906, + "step": 43250 + }, + { + "epoch": 37.85, + "learning_rate": 1.6356382978723405e-05, + "loss": 0.1235, + "step": 43260 + }, + { + "epoch": 37.86, + "learning_rate": 1.6289893617021275e-05, + "loss": 0.166, + "step": 43270 + }, + { + "epoch": 37.86, + "learning_rate": 1.6223404255319148e-05, + "loss": 0.1124, + "step": 43280 + }, + { + "epoch": 37.87, + "learning_rate": 1.6156914893617018e-05, + "loss": 0.0905, + "step": 43290 + }, + { + "epoch": 37.88, + "learning_rate": 1.609042553191489e-05, + "loss": 0.1618, + "step": 43300 + }, + { + "epoch": 37.89, + "learning_rate": 1.6023936170212764e-05, + "loss": 0.1168, + "step": 43310 + }, + { + "epoch": 37.9, + "learning_rate": 1.5957446808510637e-05, + "loss": 0.1614, + "step": 43320 + }, + { + "epoch": 37.91, + "learning_rate": 1.5890957446808507e-05, + "loss": 0.1148, + "step": 43330 + }, + { + "epoch": 37.92, + "learning_rate": 1.582446808510638e-05, + "loss": 0.1307, + "step": 43340 + }, + { + "epoch": 37.93, + "learning_rate": 1.5757978723404254e-05, + "loss": 0.1806, + "step": 43350 + }, + { + "epoch": 37.93, + "learning_rate": 1.5691489361702127e-05, + "loss": 0.1288, + "step": 43360 + }, + { + "epoch": 37.94, + "learning_rate": 1.5625e-05, + "loss": 0.1105, + "step": 43370 + }, + { + "epoch": 37.95, + "learning_rate": 1.555851063829787e-05, + "loss": 0.1173, + "step": 43380 + }, + { + "epoch": 37.96, + "learning_rate": 1.5492021276595743e-05, + "loss": 0.0933, + "step": 43390 + }, + { + "epoch": 37.97, + "learning_rate": 1.5425531914893617e-05, + "loss": 0.1813, + "step": 43400 + }, + { + "epoch": 37.98, + "learning_rate": 1.535904255319149e-05, + "loss": 0.1602, + "step": 43410 + }, + { + "epoch": 37.99, + "learning_rate": 1.529255319148936e-05, + "loss": 0.0792, + "step": 43420 + }, + { + "epoch": 38.0, + "learning_rate": 1.5226063829787233e-05, + "loss": 0.0989, + "step": 43430 + }, + { + "epoch": 38.01, + "learning_rate": 1.5159574468085105e-05, + "loss": 0.1657, + "step": 43440 + }, + { + "epoch": 38.01, + "learning_rate": 1.5093085106382978e-05, + "loss": 0.1404, + "step": 43450 + }, + { + "epoch": 38.02, + "learning_rate": 1.5026595744680851e-05, + "loss": 0.1052, + "step": 43460 + }, + { + "epoch": 38.03, + "learning_rate": 1.4960106382978723e-05, + "loss": 0.1304, + "step": 43470 + }, + { + "epoch": 38.04, + "learning_rate": 1.4893617021276596e-05, + "loss": 0.1254, + "step": 43480 + }, + { + "epoch": 38.05, + "learning_rate": 1.4827127659574466e-05, + "loss": 0.1278, + "step": 43490 + }, + { + "epoch": 38.06, + "learning_rate": 1.4760638297872339e-05, + "loss": 0.1127, + "step": 43500 + }, + { + "epoch": 38.07, + "learning_rate": 1.469414893617021e-05, + "loss": 0.1294, + "step": 43510 + }, + { + "epoch": 38.08, + "learning_rate": 1.4627659574468084e-05, + "loss": 0.1611, + "step": 43520 + }, + { + "epoch": 38.08, + "learning_rate": 1.4561170212765955e-05, + "loss": 0.1124, + "step": 43530 + }, + { + "epoch": 38.09, + "learning_rate": 1.4494680851063829e-05, + "loss": 0.1192, + "step": 43540 + }, + { + "epoch": 38.1, + "learning_rate": 1.44281914893617e-05, + "loss": 0.154, + "step": 43550 + }, + { + "epoch": 38.11, + "learning_rate": 1.4361702127659573e-05, + "loss": 0.1034, + "step": 43560 + }, + { + "epoch": 38.12, + "learning_rate": 1.4295212765957447e-05, + "loss": 0.1508, + "step": 43570 + }, + { + "epoch": 38.13, + "learning_rate": 1.4228723404255318e-05, + "loss": 0.1236, + "step": 43580 + }, + { + "epoch": 38.14, + "learning_rate": 1.4162234042553191e-05, + "loss": 0.104, + "step": 43590 + }, + { + "epoch": 38.15, + "learning_rate": 1.4095744680851061e-05, + "loss": 0.1027, + "step": 43600 + }, + { + "epoch": 38.15, + "learning_rate": 1.4029255319148936e-05, + "loss": 0.1292, + "step": 43610 + }, + { + "epoch": 38.16, + "learning_rate": 1.3962765957446806e-05, + "loss": 0.1739, + "step": 43620 + }, + { + "epoch": 38.17, + "learning_rate": 1.389627659574468e-05, + "loss": 0.1245, + "step": 43630 + }, + { + "epoch": 38.18, + "learning_rate": 1.3829787234042551e-05, + "loss": 0.1386, + "step": 43640 + }, + { + "epoch": 38.19, + "learning_rate": 1.3763297872340424e-05, + "loss": 0.0873, + "step": 43650 + }, + { + "epoch": 38.2, + "learning_rate": 1.3696808510638297e-05, + "loss": 0.1246, + "step": 43660 + }, + { + "epoch": 38.21, + "learning_rate": 1.3630319148936169e-05, + "loss": 0.1628, + "step": 43670 + }, + { + "epoch": 38.22, + "learning_rate": 1.3563829787234042e-05, + "loss": 0.0928, + "step": 43680 + }, + { + "epoch": 38.22, + "learning_rate": 1.3497340425531914e-05, + "loss": 0.1445, + "step": 43690 + }, + { + "epoch": 38.23, + "learning_rate": 1.3430851063829787e-05, + "loss": 0.0998, + "step": 43700 + }, + { + "epoch": 38.24, + "learning_rate": 1.3364361702127659e-05, + "loss": 0.0773, + "step": 43710 + }, + { + "epoch": 38.25, + "learning_rate": 1.3297872340425532e-05, + "loss": 0.1396, + "step": 43720 + }, + { + "epoch": 38.26, + "learning_rate": 1.3231382978723402e-05, + "loss": 0.0751, + "step": 43730 + }, + { + "epoch": 38.27, + "learning_rate": 1.3164893617021275e-05, + "loss": 0.1667, + "step": 43740 + }, + { + "epoch": 38.28, + "learning_rate": 1.3098404255319146e-05, + "loss": 0.1049, + "step": 43750 + }, + { + "epoch": 38.29, + "learning_rate": 1.303191489361702e-05, + "loss": 0.0908, + "step": 43760 + }, + { + "epoch": 38.29, + "learning_rate": 1.2965425531914893e-05, + "loss": 0.1269, + "step": 43770 + }, + { + "epoch": 38.3, + "learning_rate": 1.2898936170212765e-05, + "loss": 0.1563, + "step": 43780 + }, + { + "epoch": 38.31, + "learning_rate": 1.2832446808510638e-05, + "loss": 0.1266, + "step": 43790 + }, + { + "epoch": 38.32, + "learning_rate": 1.276595744680851e-05, + "loss": 0.1264, + "step": 43800 + }, + { + "epoch": 38.32, + "eval_cer1": 0.23382060024982276, + "eval_cer2": 0.21447087776866283, + "eval_cer3": 0.19509964064031363, + "eval_cer4": 0.19775266428410446, + "eval_cer5": 0.22174097664543524, + "eval_loss": 0.9986442923545837, + "eval_runtime": 1526.627, + "eval_samples_per_second": 5.738, + "step": 43800 + }, + { + "epoch": 38.33, + "learning_rate": 1.2699468085106383e-05, + "loss": 0.1006, + "step": 43810 + }, + { + "epoch": 38.34, + "learning_rate": 1.2632978723404254e-05, + "loss": 0.1246, + "step": 43820 + }, + { + "epoch": 38.35, + "learning_rate": 1.2566489361702127e-05, + "loss": 0.115, + "step": 43830 + }, + { + "epoch": 38.36, + "learning_rate": 1.2499999999999999e-05, + "loss": 0.1206, + "step": 43840 + }, + { + "epoch": 38.36, + "learning_rate": 1.2433510638297872e-05, + "loss": 0.1179, + "step": 43850 + }, + { + "epoch": 38.37, + "learning_rate": 1.2367021276595742e-05, + "loss": 0.1215, + "step": 43860 + }, + { + "epoch": 38.38, + "learning_rate": 1.2300531914893615e-05, + "loss": 0.1313, + "step": 43870 + }, + { + "epoch": 38.39, + "learning_rate": 1.2234042553191489e-05, + "loss": 0.1063, + "step": 43880 + }, + { + "epoch": 38.4, + "learning_rate": 1.216755319148936e-05, + "loss": 0.1281, + "step": 43890 + }, + { + "epoch": 38.41, + "learning_rate": 1.2101063829787233e-05, + "loss": 0.1057, + "step": 43900 + }, + { + "epoch": 38.42, + "learning_rate": 1.2034574468085105e-05, + "loss": 0.1118, + "step": 43910 + }, + { + "epoch": 38.43, + "learning_rate": 1.1968085106382978e-05, + "loss": 0.1376, + "step": 43920 + }, + { + "epoch": 38.43, + "learning_rate": 1.190159574468085e-05, + "loss": 0.0889, + "step": 43930 + }, + { + "epoch": 38.44, + "learning_rate": 1.1835106382978723e-05, + "loss": 0.1308, + "step": 43940 + }, + { + "epoch": 38.45, + "learning_rate": 1.1768617021276594e-05, + "loss": 0.1144, + "step": 43950 + }, + { + "epoch": 38.46, + "learning_rate": 1.1702127659574468e-05, + "loss": 0.1026, + "step": 43960 + }, + { + "epoch": 38.47, + "learning_rate": 1.163563829787234e-05, + "loss": 0.1661, + "step": 43970 + }, + { + "epoch": 38.48, + "learning_rate": 1.1569148936170213e-05, + "loss": 0.0962, + "step": 43980 + }, + { + "epoch": 38.49, + "learning_rate": 1.1502659574468086e-05, + "loss": 0.1378, + "step": 43990 + }, + { + "epoch": 38.49, + "learning_rate": 1.1436170212765956e-05, + "loss": 0.1306, + "step": 44000 + }, + { + "epoch": 38.5, + "learning_rate": 1.1369680851063829e-05, + "loss": 0.0855, + "step": 44010 + }, + { + "epoch": 38.51, + "learning_rate": 1.13031914893617e-05, + "loss": 0.1328, + "step": 44020 + }, + { + "epoch": 38.52, + "learning_rate": 1.1236702127659574e-05, + "loss": 0.1039, + "step": 44030 + }, + { + "epoch": 38.53, + "learning_rate": 1.1170212765957445e-05, + "loss": 0.1658, + "step": 44040 + }, + { + "epoch": 38.54, + "learning_rate": 1.1103723404255318e-05, + "loss": 0.1346, + "step": 44050 + }, + { + "epoch": 38.55, + "learning_rate": 1.103723404255319e-05, + "loss": 0.1297, + "step": 44060 + }, + { + "epoch": 38.56, + "learning_rate": 1.0970744680851063e-05, + "loss": 0.1272, + "step": 44070 + }, + { + "epoch": 38.56, + "learning_rate": 1.0904255319148935e-05, + "loss": 0.0881, + "step": 44080 + }, + { + "epoch": 38.57, + "learning_rate": 1.0837765957446808e-05, + "loss": 0.1505, + "step": 44090 + }, + { + "epoch": 38.58, + "learning_rate": 1.0771276595744681e-05, + "loss": 0.1409, + "step": 44100 + }, + { + "epoch": 38.59, + "learning_rate": 1.0704787234042553e-05, + "loss": 0.0737, + "step": 44110 + }, + { + "epoch": 38.6, + "learning_rate": 1.0638297872340426e-05, + "loss": 0.1263, + "step": 44120 + }, + { + "epoch": 38.61, + "learning_rate": 1.0571808510638296e-05, + "loss": 0.1251, + "step": 44130 + }, + { + "epoch": 38.62, + "learning_rate": 1.050531914893617e-05, + "loss": 0.142, + "step": 44140 + }, + { + "epoch": 38.63, + "learning_rate": 1.043882978723404e-05, + "loss": 0.1062, + "step": 44150 + }, + { + "epoch": 38.63, + "learning_rate": 1.0372340425531914e-05, + "loss": 0.1293, + "step": 44160 + }, + { + "epoch": 38.64, + "learning_rate": 1.0305851063829786e-05, + "loss": 0.1684, + "step": 44170 + }, + { + "epoch": 38.65, + "learning_rate": 1.0239361702127659e-05, + "loss": 0.1099, + "step": 44180 + }, + { + "epoch": 38.66, + "learning_rate": 1.017287234042553e-05, + "loss": 0.1235, + "step": 44190 + }, + { + "epoch": 38.67, + "learning_rate": 1.0106382978723404e-05, + "loss": 0.1046, + "step": 44200 + }, + { + "epoch": 38.68, + "learning_rate": 1.0039893617021277e-05, + "loss": 0.1521, + "step": 44210 + }, + { + "epoch": 38.69, + "learning_rate": 9.973404255319148e-06, + "loss": 0.1433, + "step": 44220 + }, + { + "epoch": 38.7, + "learning_rate": 9.906914893617022e-06, + "loss": 0.0979, + "step": 44230 + }, + { + "epoch": 38.7, + "learning_rate": 9.840425531914893e-06, + "loss": 0.1354, + "step": 44240 + }, + { + "epoch": 38.71, + "learning_rate": 9.773936170212766e-06, + "loss": 0.0895, + "step": 44250 + }, + { + "epoch": 38.72, + "learning_rate": 9.707446808510636e-06, + "loss": 0.1248, + "step": 44260 + }, + { + "epoch": 38.73, + "learning_rate": 9.64095744680851e-06, + "loss": 0.1424, + "step": 44270 + }, + { + "epoch": 38.74, + "learning_rate": 9.574468085106381e-06, + "loss": 0.1442, + "step": 44280 + }, + { + "epoch": 38.75, + "learning_rate": 9.507978723404254e-06, + "loss": 0.1443, + "step": 44290 + }, + { + "epoch": 38.76, + "learning_rate": 9.441489361702126e-06, + "loss": 0.1153, + "step": 44300 + }, + { + "epoch": 38.77, + "learning_rate": 9.375e-06, + "loss": 0.125, + "step": 44310 + }, + { + "epoch": 38.77, + "learning_rate": 9.30851063829787e-06, + "loss": 0.1187, + "step": 44320 + }, + { + "epoch": 38.78, + "learning_rate": 9.242021276595744e-06, + "loss": 0.07, + "step": 44330 + }, + { + "epoch": 38.79, + "learning_rate": 9.175531914893616e-06, + "loss": 0.1322, + "step": 44340 + }, + { + "epoch": 38.8, + "learning_rate": 9.109042553191489e-06, + "loss": 0.0856, + "step": 44350 + }, + { + "epoch": 38.81, + "learning_rate": 9.04255319148936e-06, + "loss": 0.0942, + "step": 44360 + }, + { + "epoch": 38.82, + "learning_rate": 8.976063829787234e-06, + "loss": 0.139, + "step": 44370 + }, + { + "epoch": 38.83, + "learning_rate": 8.909574468085105e-06, + "loss": 0.1209, + "step": 44380 + }, + { + "epoch": 38.84, + "learning_rate": 8.843085106382978e-06, + "loss": 0.1357, + "step": 44390 + }, + { + "epoch": 38.84, + "learning_rate": 8.77659574468085e-06, + "loss": 0.1148, + "step": 44400 + }, + { + "epoch": 38.84, + "eval_cer1": 0.23280780527328584, + "eval_cer2": 0.2152255947497949, + "eval_cer3": 0.19372754001960144, + "eval_cer4": 0.1973341060562156, + "eval_cer5": 0.2197027600849257, + "eval_loss": 0.9971761107444763, + "eval_runtime": 1545.9305, + "eval_samples_per_second": 5.666, + "step": 44400 + }, + { + "epoch": 38.85, + "learning_rate": 8.710106382978723e-06, + "loss": 0.1107, + "step": 44410 + }, + { + "epoch": 38.86, + "learning_rate": 8.643617021276595e-06, + "loss": 0.1444, + "step": 44420 + }, + { + "epoch": 38.87, + "learning_rate": 8.577127659574468e-06, + "loss": 0.1091, + "step": 44430 + }, + { + "epoch": 38.88, + "learning_rate": 8.51063829787234e-06, + "loss": 0.1231, + "step": 44440 + }, + { + "epoch": 38.89, + "learning_rate": 8.444148936170211e-06, + "loss": 0.104, + "step": 44450 + }, + { + "epoch": 38.9, + "learning_rate": 8.377659574468084e-06, + "loss": 0.1162, + "step": 44460 + }, + { + "epoch": 38.91, + "learning_rate": 8.311170212765956e-06, + "loss": 0.1644, + "step": 44470 + }, + { + "epoch": 38.91, + "learning_rate": 8.244680851063829e-06, + "loss": 0.0847, + "step": 44480 + }, + { + "epoch": 38.92, + "learning_rate": 8.178191489361702e-06, + "loss": 0.1391, + "step": 44490 + }, + { + "epoch": 38.93, + "learning_rate": 8.111702127659574e-06, + "loss": 0.0722, + "step": 44500 + }, + { + "epoch": 38.94, + "learning_rate": 8.045212765957445e-06, + "loss": 0.1239, + "step": 44510 + }, + { + "epoch": 38.95, + "learning_rate": 7.978723404255319e-06, + "loss": 0.1615, + "step": 44520 + }, + { + "epoch": 38.96, + "learning_rate": 7.91223404255319e-06, + "loss": 0.0797, + "step": 44530 + }, + { + "epoch": 38.97, + "learning_rate": 7.845744680851064e-06, + "loss": 0.1284, + "step": 44540 + }, + { + "epoch": 38.98, + "learning_rate": 7.779255319148935e-06, + "loss": 0.0877, + "step": 44550 + }, + { + "epoch": 38.98, + "learning_rate": 7.712765957446808e-06, + "loss": 0.1075, + "step": 44560 + }, + { + "epoch": 38.99, + "learning_rate": 7.64627659574468e-06, + "loss": 0.1408, + "step": 44570 + }, + { + "epoch": 39.0, + "learning_rate": 7.579787234042552e-06, + "loss": 0.1525, + "step": 44580 + }, + { + "epoch": 39.01, + "learning_rate": 7.5132978723404255e-06, + "loss": 0.1289, + "step": 44590 + }, + { + "epoch": 39.02, + "learning_rate": 7.446808510638298e-06, + "loss": 0.1055, + "step": 44600 + }, + { + "epoch": 39.03, + "learning_rate": 7.3803191489361695e-06, + "loss": 0.167, + "step": 44610 + }, + { + "epoch": 39.04, + "learning_rate": 7.313829787234042e-06, + "loss": 0.091, + "step": 44620 + }, + { + "epoch": 39.05, + "learning_rate": 7.247340425531914e-06, + "loss": 0.1064, + "step": 44630 + }, + { + "epoch": 39.06, + "learning_rate": 7.180851063829787e-06, + "loss": 0.1184, + "step": 44640 + }, + { + "epoch": 39.06, + "learning_rate": 7.114361702127659e-06, + "loss": 0.0808, + "step": 44650 + }, + { + "epoch": 39.07, + "learning_rate": 7.047872340425531e-06, + "loss": 0.1331, + "step": 44660 + }, + { + "epoch": 39.08, + "learning_rate": 6.981382978723403e-06, + "loss": 0.1058, + "step": 44670 + }, + { + "epoch": 39.09, + "learning_rate": 6.9148936170212754e-06, + "loss": 0.1137, + "step": 44680 + }, + { + "epoch": 39.1, + "learning_rate": 6.848404255319149e-06, + "loss": 0.1149, + "step": 44690 + }, + { + "epoch": 39.11, + "learning_rate": 6.781914893617021e-06, + "loss": 0.1043, + "step": 44700 + }, + { + "epoch": 39.12, + "learning_rate": 6.7154255319148935e-06, + "loss": 0.1516, + "step": 44710 + }, + { + "epoch": 39.13, + "learning_rate": 6.648936170212766e-06, + "loss": 0.1496, + "step": 44720 + }, + { + "epoch": 39.13, + "learning_rate": 6.5824468085106375e-06, + "loss": 0.1316, + "step": 44730 + }, + { + "epoch": 39.14, + "learning_rate": 6.51595744680851e-06, + "loss": 0.1079, + "step": 44740 + }, + { + "epoch": 39.15, + "learning_rate": 6.449468085106382e-06, + "loss": 0.108, + "step": 44750 + }, + { + "epoch": 39.16, + "learning_rate": 6.382978723404255e-06, + "loss": 0.1287, + "step": 44760 + }, + { + "epoch": 39.17, + "learning_rate": 6.316489361702127e-06, + "loss": 0.0844, + "step": 44770 + }, + { + "epoch": 39.18, + "learning_rate": 6.2499999999999995e-06, + "loss": 0.1874, + "step": 44780 + }, + { + "epoch": 39.19, + "learning_rate": 6.183510638297871e-06, + "loss": 0.1283, + "step": 44790 + }, + { + "epoch": 39.2, + "learning_rate": 6.117021276595744e-06, + "loss": 0.1002, + "step": 44800 + }, + { + "epoch": 39.2, + "learning_rate": 6.050531914893617e-06, + "loss": 0.1119, + "step": 44810 + }, + { + "epoch": 39.21, + "learning_rate": 5.984042553191489e-06, + "loss": 0.1132, + "step": 44820 + }, + { + "epoch": 39.22, + "learning_rate": 5.9175531914893615e-06, + "loss": 0.078, + "step": 44830 + }, + { + "epoch": 39.23, + "learning_rate": 5.851063829787234e-06, + "loss": 0.1296, + "step": 44840 + }, + { + "epoch": 39.24, + "learning_rate": 5.784574468085106e-06, + "loss": 0.1403, + "step": 44850 + }, + { + "epoch": 39.25, + "learning_rate": 5.718085106382978e-06, + "loss": 0.1594, + "step": 44860 + }, + { + "epoch": 39.26, + "learning_rate": 5.65159574468085e-06, + "loss": 0.0925, + "step": 44870 + }, + { + "epoch": 39.26, + "learning_rate": 5.585106382978723e-06, + "loss": 0.0862, + "step": 44880 + }, + { + "epoch": 39.27, + "learning_rate": 5.518617021276595e-06, + "loss": 0.1441, + "step": 44890 + }, + { + "epoch": 39.28, + "learning_rate": 5.452127659574467e-06, + "loss": 0.0903, + "step": 44900 + }, + { + "epoch": 39.29, + "learning_rate": 5.385638297872341e-06, + "loss": 0.1384, + "step": 44910 + }, + { + "epoch": 39.3, + "learning_rate": 5.319148936170213e-06, + "loss": 0.0934, + "step": 44920 + }, + { + "epoch": 39.31, + "learning_rate": 5.252659574468085e-06, + "loss": 0.1469, + "step": 44930 + }, + { + "epoch": 39.32, + "learning_rate": 5.186170212765957e-06, + "loss": 0.1163, + "step": 44940 + }, + { + "epoch": 39.33, + "learning_rate": 5.119680851063829e-06, + "loss": 0.0964, + "step": 44950 + }, + { + "epoch": 39.33, + "learning_rate": 5.053191489361702e-06, + "loss": 0.1217, + "step": 44960 + }, + { + "epoch": 39.34, + "learning_rate": 4.986702127659574e-06, + "loss": 0.1045, + "step": 44970 + }, + { + "epoch": 39.35, + "learning_rate": 4.920212765957447e-06, + "loss": 0.091, + "step": 44980 + }, + { + "epoch": 39.36, + "learning_rate": 4.853723404255318e-06, + "loss": 0.1472, + "step": 44990 + }, + { + "epoch": 39.37, + "learning_rate": 4.7872340425531906e-06, + "loss": 0.101, + "step": 45000 + }, + { + "epoch": 39.37, + "eval_cer1": 0.2319638094595051, + "eval_cer2": 0.21532403609515996, + "eval_cer3": 0.19372754001960144, + "eval_cer4": 0.19675456389452334, + "eval_cer5": 0.22140127388535033, + "eval_loss": 0.997524619102478, + "eval_runtime": 1508.5228, + "eval_samples_per_second": 5.807, + "step": 45000 + }, + { + "epoch": 39.38, + "learning_rate": 4.720744680851063e-06, + "loss": 0.1406, + "step": 45010 + }, + { + "epoch": 39.39, + "learning_rate": 4.654255319148935e-06, + "loss": 0.1025, + "step": 45020 + }, + { + "epoch": 39.4, + "learning_rate": 4.587765957446808e-06, + "loss": 0.1326, + "step": 45030 + }, + { + "epoch": 39.4, + "learning_rate": 4.52127659574468e-06, + "loss": 0.1187, + "step": 45040 + }, + { + "epoch": 39.41, + "learning_rate": 4.4547872340425526e-06, + "loss": 0.1037, + "step": 45050 + }, + { + "epoch": 39.42, + "learning_rate": 4.388297872340425e-06, + "loss": 0.1222, + "step": 45060 + }, + { + "epoch": 39.43, + "learning_rate": 4.321808510638297e-06, + "loss": 0.1087, + "step": 45070 + }, + { + "epoch": 39.44, + "learning_rate": 4.25531914893617e-06, + "loss": 0.1324, + "step": 45080 + }, + { + "epoch": 39.45, + "learning_rate": 4.188829787234042e-06, + "loss": 0.1203, + "step": 45090 + }, + { + "epoch": 39.46, + "learning_rate": 4.1223404255319146e-06, + "loss": 0.1337, + "step": 45100 + }, + { + "epoch": 39.47, + "learning_rate": 4.055851063829787e-06, + "loss": 0.1308, + "step": 45110 + }, + { + "epoch": 39.47, + "learning_rate": 3.989361702127659e-06, + "loss": 0.0758, + "step": 45120 + }, + { + "epoch": 39.48, + "learning_rate": 3.922872340425532e-06, + "loss": 0.1323, + "step": 45130 + }, + { + "epoch": 39.49, + "learning_rate": 3.856382978723404e-06, + "loss": 0.1132, + "step": 45140 + }, + { + "epoch": 39.5, + "learning_rate": 3.789893617021276e-06, + "loss": 0.1114, + "step": 45150 + }, + { + "epoch": 39.51, + "learning_rate": 3.723404255319149e-06, + "loss": 0.155, + "step": 45160 + }, + { + "epoch": 39.52, + "learning_rate": 3.656914893617021e-06, + "loss": 0.1053, + "step": 45170 + }, + { + "epoch": 39.53, + "learning_rate": 3.5904255319148933e-06, + "loss": 0.1569, + "step": 45180 + }, + { + "epoch": 39.54, + "learning_rate": 3.5239361702127653e-06, + "loss": 0.1222, + "step": 45190 + }, + { + "epoch": 39.54, + "learning_rate": 3.4574468085106377e-06, + "loss": 0.082, + "step": 45200 + }, + { + "epoch": 39.55, + "learning_rate": 3.3909574468085105e-06, + "loss": 0.1357, + "step": 45210 + }, + { + "epoch": 39.56, + "learning_rate": 3.324468085106383e-06, + "loss": 0.1036, + "step": 45220 + }, + { + "epoch": 39.57, + "learning_rate": 3.257978723404255e-06, + "loss": 0.0981, + "step": 45230 + }, + { + "epoch": 39.58, + "learning_rate": 3.1914893617021273e-06, + "loss": 0.1168, + "step": 45240 + }, + { + "epoch": 39.59, + "learning_rate": 3.1249999999999997e-06, + "loss": 0.0744, + "step": 45250 + }, + { + "epoch": 39.6, + "learning_rate": 3.058510638297872e-06, + "loss": 0.1455, + "step": 45260 + }, + { + "epoch": 39.61, + "learning_rate": 2.9920212765957445e-06, + "loss": 0.1381, + "step": 45270 + }, + { + "epoch": 39.61, + "learning_rate": 2.925531914893617e-06, + "loss": 0.1188, + "step": 45280 + }, + { + "epoch": 39.62, + "learning_rate": 2.859042553191489e-06, + "loss": 0.1167, + "step": 45290 + }, + { + "epoch": 39.63, + "learning_rate": 2.7925531914893613e-06, + "loss": 0.1172, + "step": 45300 + }, + { + "epoch": 39.64, + "learning_rate": 2.7260638297872337e-06, + "loss": 0.1058, + "step": 45310 + }, + { + "epoch": 39.65, + "learning_rate": 2.6595744680851065e-06, + "loss": 0.0801, + "step": 45320 + }, + { + "epoch": 39.66, + "learning_rate": 2.5930851063829785e-06, + "loss": 0.1102, + "step": 45330 + }, + { + "epoch": 39.67, + "learning_rate": 2.526595744680851e-06, + "loss": 0.1171, + "step": 45340 + }, + { + "epoch": 39.68, + "learning_rate": 2.4601063829787233e-06, + "loss": 0.1058, + "step": 45350 + }, + { + "epoch": 39.68, + "learning_rate": 2.3936170212765953e-06, + "loss": 0.1445, + "step": 45360 + }, + { + "epoch": 39.69, + "learning_rate": 2.3271276595744677e-06, + "loss": 0.1169, + "step": 45370 + }, + { + "epoch": 39.7, + "learning_rate": 2.26063829787234e-06, + "loss": 0.111, + "step": 45380 + }, + { + "epoch": 39.71, + "learning_rate": 2.1941489361702125e-06, + "loss": 0.1165, + "step": 45390 + }, + { + "epoch": 39.72, + "learning_rate": 2.127659574468085e-06, + "loss": 0.1212, + "step": 45400 + }, + { + "epoch": 39.73, + "learning_rate": 2.0611702127659573e-06, + "loss": 0.1413, + "step": 45410 + }, + { + "epoch": 39.74, + "learning_rate": 1.9946808510638297e-06, + "loss": 0.1318, + "step": 45420 + }, + { + "epoch": 39.75, + "learning_rate": 1.928191489361702e-06, + "loss": 0.1365, + "step": 45430 + }, + { + "epoch": 39.75, + "learning_rate": 1.8617021276595745e-06, + "loss": 0.1256, + "step": 45440 + }, + { + "epoch": 39.76, + "learning_rate": 1.7952127659574467e-06, + "loss": 0.1005, + "step": 45450 + }, + { + "epoch": 39.77, + "learning_rate": 1.7287234042553189e-06, + "loss": 0.1351, + "step": 45460 + }, + { + "epoch": 39.78, + "learning_rate": 1.6622340425531915e-06, + "loss": 0.1322, + "step": 45470 + }, + { + "epoch": 39.79, + "learning_rate": 1.5957446808510637e-06, + "loss": 0.1354, + "step": 45480 + }, + { + "epoch": 39.8, + "learning_rate": 1.529255319148936e-06, + "loss": 0.1178, + "step": 45490 + }, + { + "epoch": 39.81, + "learning_rate": 1.4627659574468085e-06, + "loss": 0.0833, + "step": 45500 + }, + { + "epoch": 39.82, + "learning_rate": 1.3962765957446807e-06, + "loss": 0.1427, + "step": 45510 + }, + { + "epoch": 39.82, + "learning_rate": 1.3297872340425533e-06, + "loss": 0.1157, + "step": 45520 + }, + { + "epoch": 39.83, + "learning_rate": 1.2632978723404255e-06, + "loss": 0.1085, + "step": 45530 + }, + { + "epoch": 39.84, + "learning_rate": 1.1968085106382976e-06, + "loss": 0.1455, + "step": 45540 + }, + { + "epoch": 39.85, + "learning_rate": 1.13031914893617e-06, + "loss": 0.0739, + "step": 45550 + }, + { + "epoch": 39.86, + "learning_rate": 1.0638297872340424e-06, + "loss": 0.1533, + "step": 45560 + }, + { + "epoch": 39.87, + "learning_rate": 9.973404255319148e-07, + "loss": 0.0906, + "step": 45570 + }, + { + "epoch": 39.88, + "learning_rate": 9.308510638297872e-07, + "loss": 0.1182, + "step": 45580 + }, + { + "epoch": 39.89, + "learning_rate": 8.643617021276594e-07, + "loss": 0.1603, + "step": 45590 + }, + { + "epoch": 39.89, + "learning_rate": 7.978723404255318e-07, + "loss": 0.1093, + "step": 45600 + }, + { + "epoch": 39.89, + "eval_cer1": 0.23250396678032478, + "eval_cer2": 0.21384741591468417, + "eval_cer3": 0.19333551127082652, + "eval_cer4": 0.19691554782832674, + "eval_cer5": 0.22148619957537155, + "eval_loss": 0.9972271919250488, + "eval_runtime": 1369.6838, + "eval_samples_per_second": 6.396, + "step": 45600 + }, + { + "epoch": 39.9, + "learning_rate": 7.313829787234042e-07, + "loss": 0.1321, + "step": 45610 + }, + { + "epoch": 39.91, + "learning_rate": 6.648936170212766e-07, + "loss": 0.1192, + "step": 45620 + }, + { + "epoch": 39.92, + "learning_rate": 5.984042553191488e-07, + "loss": 0.1085, + "step": 45630 + }, + { + "epoch": 39.93, + "learning_rate": 5.319148936170212e-07, + "loss": 0.115, + "step": 45640 + }, + { + "epoch": 39.94, + "learning_rate": 4.654255319148936e-07, + "loss": 0.0707, + "step": 45650 + }, + { + "epoch": 39.95, + "learning_rate": 3.989361702127659e-07, + "loss": 0.1043, + "step": 45660 + }, + { + "epoch": 39.96, + "learning_rate": 3.324468085106383e-07, + "loss": 0.128, + "step": 45670 + }, + { + "epoch": 39.96, + "learning_rate": 2.659574468085106e-07, + "loss": 0.0935, + "step": 45680 + }, + { + "epoch": 39.97, + "learning_rate": 1.9946808510638296e-07, + "loss": 0.0999, + "step": 45690 + }, + { + "epoch": 39.98, + "learning_rate": 1.329787234042553e-07, + "loss": 0.0846, + "step": 45700 } ], "max_steps": 45720, "num_train_epochs": 40, - "total_flos": 1.601241517283e+20, + "total_flos": 2.5343023234719593e+20, "trial_name": null, "trial_params": null }