{ "best_metric": null, "best_model_checkpoint": null, "epoch": 8.321388756171364, "global_step": 104500, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.04, "learning_rate": 1.9960000000000002e-05, "loss": 0.3401, "step": 500 }, { "epoch": 0.04, "eval_cer": 0.05505943280676956, "eval_loss": 0.23293745517730713, "eval_runtime": 964.5334, "eval_samples_per_second": 10.94, "eval_steps_per_second": 5.47, "eval_wer": 0.16114398009742228, "step": 500 }, { "epoch": 0.08, "learning_rate": 1.9960185111306155e-05, "loss": 0.3315, "step": 1000 }, { "epoch": 0.08, "eval_cer": 0.05545081745226068, "eval_loss": 0.2401716113090515, "eval_runtime": 950.9231, "eval_samples_per_second": 11.097, "eval_steps_per_second": 5.548, "eval_wer": 0.162095206238371, "step": 1000 }, { "epoch": 0.12, "learning_rate": 1.9920290433256203e-05, "loss": 0.3035, "step": 1500 }, { "epoch": 0.12, "eval_cer": 0.05505593830100624, "eval_loss": 0.23731189966201782, "eval_runtime": 951.7866, "eval_samples_per_second": 11.087, "eval_steps_per_second": 5.543, "eval_wer": 0.16098718457968347, "step": 1500 }, { "epoch": 0.16, "learning_rate": 1.9880395755206258e-05, "loss": 0.3333, "step": 2000 }, { "epoch": 0.16, "eval_cer": 0.05457893826431393, "eval_loss": 0.22870676219463348, "eval_runtime": 974.2674, "eval_samples_per_second": 10.831, "eval_steps_per_second": 5.415, "eval_wer": 0.15954466581648652, "step": 2000 }, { "epoch": 0.2, "learning_rate": 1.9840580866512408e-05, "loss": 0.3406, "step": 2500 }, { "epoch": 0.2, "eval_cer": 0.05494061961081689, "eval_loss": 0.23157823085784912, "eval_runtime": 942.0206, "eval_samples_per_second": 11.201, "eval_steps_per_second": 5.601, "eval_wer": 0.16144711809838397, "step": 2500 }, { "epoch": 0.24, "learning_rate": 1.9800686188462463e-05, "loss": 0.3232, "step": 3000 }, { "epoch": 0.24, "eval_cer": 0.05591034496013642, "eval_loss": 0.2290341705083847, "eval_runtime": 914.2178, "eval_samples_per_second": 11.542, "eval_steps_per_second": 5.771, "eval_wer": 0.16311960362093117, "step": 3000 }, { "epoch": 0.28, "learning_rate": 1.9760791510412514e-05, "loss": 0.3218, "step": 3500 }, { "epoch": 0.28, "eval_cer": 0.05532326799189974, "eval_loss": 0.22873252630233765, "eval_runtime": 913.382, "eval_samples_per_second": 11.553, "eval_steps_per_second": 5.776, "eval_wer": 0.1619384107206322, "step": 3500 }, { "epoch": 0.32, "learning_rate": 1.9720896832362562e-05, "loss": 0.3165, "step": 4000 }, { "epoch": 0.32, "eval_cer": 0.055456059210905656, "eval_loss": 0.2304326593875885, "eval_runtime": 931.5603, "eval_samples_per_second": 11.327, "eval_steps_per_second": 5.664, "eval_wer": 0.16228336085965755, "step": 4000 }, { "epoch": 0.36, "learning_rate": 1.9681081943668715e-05, "loss": 0.3485, "step": 4500 }, { "epoch": 0.36, "eval_cer": 0.05544732294649737, "eval_loss": 0.22790302336215973, "eval_runtime": 950.134, "eval_samples_per_second": 11.106, "eval_steps_per_second": 5.553, "eval_wer": 0.1616248196851546, "step": 4500 }, { "epoch": 0.4, "learning_rate": 1.964118726561877e-05, "loss": 0.3416, "step": 5000 }, { "epoch": 0.4, "eval_cer": 0.05489519103589382, "eval_loss": 0.23012946546077728, "eval_runtime": 933.9668, "eval_samples_per_second": 11.298, "eval_steps_per_second": 5.649, "eval_wer": 0.16180252127192524, "step": 5000 }, { "epoch": 0.44, "learning_rate": 1.960137237692492e-05, "loss": 0.3487, "step": 5500 }, { "epoch": 0.44, "eval_cer": 0.05520096029018376, "eval_loss": 0.22688831388950348, "eval_runtime": 943.4893, "eval_samples_per_second": 11.184, "eval_steps_per_second": 5.592, "eval_wer": 0.1605795162335626, "step": 5500 }, { "epoch": 0.48, "learning_rate": 1.956147769887497e-05, "loss": 0.3285, "step": 6000 }, { "epoch": 0.48, "eval_cer": 0.055174751496958906, "eval_loss": 0.22907914221286774, "eval_runtime": 918.4091, "eval_samples_per_second": 11.489, "eval_steps_per_second": 5.745, "eval_wer": 0.1609453724416198, "step": 6000 }, { "epoch": 0.52, "learning_rate": 1.9521583020825023e-05, "loss": 0.3293, "step": 6500 }, { "epoch": 0.52, "eval_cer": 0.055221927324763644, "eval_loss": 0.23320981860160828, "eval_runtime": 942.5174, "eval_samples_per_second": 11.196, "eval_steps_per_second": 5.598, "eval_wer": 0.16107080885581085, "step": 6500 }, { "epoch": 0.56, "learning_rate": 1.9481688342775075e-05, "loss": 0.3371, "step": 7000 }, { "epoch": 0.56, "eval_cer": 0.05506816907117784, "eval_loss": 0.23159052431583405, "eval_runtime": 934.7505, "eval_samples_per_second": 11.289, "eval_steps_per_second": 5.644, "eval_wer": 0.1610603558212949, "step": 7000 }, { "epoch": 0.6, "learning_rate": 1.944179366472513e-05, "loss": 0.3339, "step": 7500 }, { "epoch": 0.6, "eval_cer": 0.05462436683923701, "eval_loss": 0.23084835708141327, "eval_runtime": 938.542, "eval_samples_per_second": 11.243, "eval_steps_per_second": 5.621, "eval_wer": 0.16049589195743524, "step": 7500 }, { "epoch": 0.64, "learning_rate": 1.9401898986675178e-05, "loss": 0.3058, "step": 8000 }, { "epoch": 0.64, "eval_cer": 0.054107179986266594, "eval_loss": 0.23283512890338898, "eval_runtime": 952.8447, "eval_samples_per_second": 11.074, "eval_steps_per_second": 5.537, "eval_wer": 0.1582798486400602, "step": 8000 }, { "epoch": 0.68, "learning_rate": 1.936208409798133e-05, "loss": 0.3142, "step": 8500 }, { "epoch": 0.68, "eval_cer": 0.054398971217503284, "eval_loss": 0.2275152951478958, "eval_runtime": 925.1793, "eval_samples_per_second": 11.405, "eval_steps_per_second": 5.703, "eval_wer": 0.15972236740325715, "step": 8500 }, { "epoch": 0.72, "learning_rate": 1.9322189419931382e-05, "loss": 0.3026, "step": 9000 }, { "epoch": 0.72, "eval_cer": 0.054205026147639376, "eval_loss": 0.2291727066040039, "eval_runtime": 924.5764, "eval_samples_per_second": 11.413, "eval_steps_per_second": 5.706, "eval_wer": 0.15947149457487508, "step": 9000 }, { "epoch": 0.76, "learning_rate": 1.9282294741881434e-05, "loss": 0.3201, "step": 9500 }, { "epoch": 0.76, "eval_cer": 0.054220751423574284, "eval_loss": 0.2310110330581665, "eval_runtime": 943.6124, "eval_samples_per_second": 11.183, "eval_steps_per_second": 5.591, "eval_wer": 0.159220621746493, "step": 9500 }, { "epoch": 0.8, "learning_rate": 1.9242400063831485e-05, "loss": 0.3219, "step": 10000 }, { "epoch": 0.8, "eval_cer": 0.05398836679031393, "eval_loss": 0.23035095632076263, "eval_runtime": 936.4474, "eval_samples_per_second": 11.268, "eval_steps_per_second": 5.634, "eval_wer": 0.15835301988167164, "step": 10000 }, { "epoch": 0.84, "learning_rate": 1.9202505385781537e-05, "loss": 0.3295, "step": 10500 }, { "epoch": 0.84, "eval_cer": 0.05505419104812458, "eval_loss": 0.22920408844947815, "eval_runtime": 925.5202, "eval_samples_per_second": 11.401, "eval_steps_per_second": 5.701, "eval_wer": 0.16102899671774717, "step": 10500 }, { "epoch": 0.88, "learning_rate": 1.916269049708769e-05, "loss": 0.3436, "step": 11000 }, { "epoch": 0.88, "eval_cer": 0.0538520810655447, "eval_loss": 0.2316814512014389, "eval_runtime": 949.5795, "eval_samples_per_second": 11.112, "eval_steps_per_second": 5.556, "eval_wer": 0.1578617272594234, "step": 11000 }, { "epoch": 0.92, "learning_rate": 1.912279581903774e-05, "loss": 0.3104, "step": 11500 }, { "epoch": 0.92, "eval_cer": 0.05466804816127843, "eval_loss": 0.23170439898967743, "eval_runtime": 947.8382, "eval_samples_per_second": 11.133, "eval_steps_per_second": 5.566, "eval_wer": 0.15990006899002782, "step": 11500 }, { "epoch": 0.96, "learning_rate": 1.9082901140987793e-05, "loss": 0.3283, "step": 12000 }, { "epoch": 0.96, "eval_cer": 0.05422249867645594, "eval_loss": 0.22942642867565155, "eval_runtime": 929.578, "eval_samples_per_second": 11.351, "eval_steps_per_second": 5.676, "eval_wer": 0.15938787029874774, "step": 12000 }, { "epoch": 1.0, "learning_rate": 1.9043006462937845e-05, "loss": 0.3108, "step": 12500 }, { "epoch": 1.0, "eval_cer": 0.053904498651994405, "eval_loss": 0.2244606465101242, "eval_runtime": 919.5832, "eval_samples_per_second": 11.475, "eval_steps_per_second": 5.737, "eval_wer": 0.15835301988167164, "step": 12500 }, { "epoch": 1.04, "learning_rate": 1.9003111784887896e-05, "loss": 0.3195, "step": 13000 }, { "epoch": 1.04, "eval_cer": 0.0546977514602666, "eval_loss": 0.23177924752235413, "eval_runtime": 936.5823, "eval_samples_per_second": 11.266, "eval_steps_per_second": 5.633, "eval_wer": 0.15980599167938453, "step": 13000 }, { "epoch": 1.08, "learning_rate": 1.896329689619405e-05, "loss": 0.3458, "step": 13500 }, { "epoch": 1.08, "eval_cer": 0.05474318003518967, "eval_loss": 0.2328505516052246, "eval_runtime": 913.1325, "eval_samples_per_second": 11.556, "eval_steps_per_second": 5.778, "eval_wer": 0.1593251520916522, "step": 13500 }, { "epoch": 1.11, "learning_rate": 1.89234022181441e-05, "loss": 0.3019, "step": 14000 }, { "epoch": 1.11, "eval_cer": 0.05441644374631985, "eval_loss": 0.23426495492458344, "eval_runtime": 921.2679, "eval_samples_per_second": 11.454, "eval_steps_per_second": 5.727, "eval_wer": 0.1596387431271298, "step": 14000 }, { "epoch": 1.15, "learning_rate": 1.8883507540094152e-05, "loss": 0.3178, "step": 14500 }, { "epoch": 1.15, "eval_cer": 0.05391323491640269, "eval_loss": 0.22591577470302582, "eval_runtime": 899.54, "eval_samples_per_second": 11.73, "eval_steps_per_second": 5.865, "eval_wer": 0.15841573808876716, "step": 14500 }, { "epoch": 1.19, "learning_rate": 1.8843612862044204e-05, "loss": 0.2875, "step": 15000 }, { "epoch": 1.19, "eval_cer": 0.05423997120527251, "eval_loss": 0.2320357859134674, "eval_runtime": 917.8061, "eval_samples_per_second": 11.497, "eval_steps_per_second": 5.748, "eval_wer": 0.15887567160746766, "step": 15000 }, { "epoch": 1.23, "learning_rate": 1.880371818399426e-05, "loss": 0.3146, "step": 15500 }, { "epoch": 1.23, "eval_cer": 0.054225993182219254, "eval_loss": 0.23161908984184265, "eval_runtime": 924.5404, "eval_samples_per_second": 11.413, "eval_steps_per_second": 5.707, "eval_wer": 0.1600568645077666, "step": 15500 }, { "epoch": 1.27, "learning_rate": 1.8763823505944307e-05, "loss": 0.3026, "step": 16000 }, { "epoch": 1.27, "eval_cer": 0.055894619684201514, "eval_loss": 0.2382396012544632, "eval_runtime": 900.5773, "eval_samples_per_second": 11.717, "eval_steps_per_second": 5.858, "eval_wer": 0.16226245479062573, "step": 16000 }, { "epoch": 1.31, "learning_rate": 1.872392882789436e-05, "loss": 0.3248, "step": 16500 }, { "epoch": 1.31, "eval_cer": 0.05442168550496482, "eval_loss": 0.23420971632003784, "eval_runtime": 902.3765, "eval_samples_per_second": 11.694, "eval_steps_per_second": 5.847, "eval_wer": 0.15955511885100246, "step": 16500 }, { "epoch": 1.35, "learning_rate": 1.8684034149844413e-05, "loss": 0.3067, "step": 17000 }, { "epoch": 1.35, "eval_cer": 0.053754234904171916, "eval_loss": 0.22963067889213562, "eval_runtime": 895.93, "eval_samples_per_second": 11.778, "eval_steps_per_second": 5.889, "eval_wer": 0.158175318294901, "step": 17000 }, { "epoch": 1.39, "learning_rate": 1.8644219261150563e-05, "loss": 0.3009, "step": 17500 }, { "epoch": 1.39, "eval_cer": 0.05442518001072813, "eval_loss": 0.23200643062591553, "eval_runtime": 896.3694, "eval_samples_per_second": 11.772, "eval_steps_per_second": 5.886, "eval_wer": 0.15981644471390044, "step": 17500 }, { "epoch": 1.43, "learning_rate": 1.8604324583100618e-05, "loss": 0.3262, "step": 18000 }, { "epoch": 1.43, "eval_cer": 0.05472920201213642, "eval_loss": 0.23050285875797272, "eval_runtime": 908.5096, "eval_samples_per_second": 11.615, "eval_steps_per_second": 5.807, "eval_wer": 0.16033909643969643, "step": 18000 }, { "epoch": 1.47, "learning_rate": 1.8564429905050666e-05, "loss": 0.3152, "step": 18500 }, { "epoch": 1.47, "eval_cer": 0.05423123494086422, "eval_loss": 0.23030424118041992, "eval_runtime": 904.961, "eval_samples_per_second": 11.66, "eval_steps_per_second": 5.83, "eval_wer": 0.15819622436393285, "step": 18500 }, { "epoch": 1.51, "learning_rate": 1.852453522700072e-05, "loss": 0.3143, "step": 19000 }, { "epoch": 1.51, "eval_cer": 0.05423123494086422, "eval_loss": 0.22637102007865906, "eval_runtime": 915.5045, "eval_samples_per_second": 11.526, "eval_steps_per_second": 5.763, "eval_wer": 0.15950285367842285, "step": 19000 }, { "epoch": 1.55, "learning_rate": 1.848472033830687e-05, "loss": 0.3004, "step": 19500 }, { "epoch": 1.55, "eval_cer": 0.05468027893145003, "eval_loss": 0.22641883790493011, "eval_runtime": 935.8875, "eval_samples_per_second": 11.275, "eval_steps_per_second": 5.637, "eval_wer": 0.1609349194071039, "step": 19500 }, { "epoch": 1.59, "learning_rate": 1.8444825660256926e-05, "loss": 0.2804, "step": 20000 }, { "epoch": 1.59, "eval_cer": 0.054790355862994404, "eval_loss": 0.23191003501415253, "eval_runtime": 1043.7138, "eval_samples_per_second": 10.11, "eval_steps_per_second": 5.055, "eval_wer": 0.159743273472289, "step": 20000 }, { "epoch": 1.63, "learning_rate": 1.8404930982206974e-05, "loss": 0.2875, "step": 20500 }, { "epoch": 1.63, "eval_cer": 0.054765894322651214, "eval_loss": 0.23086883127689362, "eval_runtime": 1016.2119, "eval_samples_per_second": 10.384, "eval_steps_per_second": 5.192, "eval_wer": 0.15847845629586269, "step": 20500 }, { "epoch": 1.67, "learning_rate": 1.8365116093513127e-05, "loss": 0.3241, "step": 21000 }, { "epoch": 1.67, "eval_cer": 0.05488645477148553, "eval_loss": 0.23257198929786682, "eval_runtime": 1123.4321, "eval_samples_per_second": 9.393, "eval_steps_per_second": 4.696, "eval_wer": 0.15990006899002782, "step": 21000 }, { "epoch": 1.71, "learning_rate": 1.832522141546318e-05, "loss": 0.3233, "step": 21500 }, { "epoch": 1.71, "eval_cer": 0.053128718372538776, "eval_loss": 0.22576376795768738, "eval_runtime": 1100.6586, "eval_samples_per_second": 9.587, "eval_steps_per_second": 4.793, "eval_wer": 0.15670144042815629, "step": 21500 }, { "epoch": 1.75, "learning_rate": 1.828532673741323e-05, "loss": 0.3148, "step": 22000 }, { "epoch": 1.75, "eval_cer": 0.05433432286088198, "eval_loss": 0.2339024692773819, "eval_runtime": 1081.304, "eval_samples_per_second": 9.759, "eval_steps_per_second": 4.879, "eval_wer": 0.1599627871971233, "step": 22000 }, { "epoch": 1.79, "learning_rate": 1.824543205936328e-05, "loss": 0.3207, "step": 22500 }, { "epoch": 1.79, "eval_cer": 0.054479344850059494, "eval_loss": 0.23086592555046082, "eval_runtime": 1030.6142, "eval_samples_per_second": 10.239, "eval_steps_per_second": 5.119, "eval_wer": 0.15999414630067108, "step": 22500 }, { "epoch": 1.83, "learning_rate": 1.8205537381313333e-05, "loss": 0.2894, "step": 23000 }, { "epoch": 1.83, "eval_cer": 0.054685520690094996, "eval_loss": 0.23256057500839233, "eval_runtime": 1070.5285, "eval_samples_per_second": 9.857, "eval_steps_per_second": 4.928, "eval_wer": 0.16039136161227605, "step": 23000 }, { "epoch": 1.87, "learning_rate": 1.8165722492619486e-05, "loss": 0.3057, "step": 23500 }, { "epoch": 1.87, "eval_cer": 0.053551553569899726, "eval_loss": 0.22639597952365875, "eval_runtime": 1056.3324, "eval_samples_per_second": 9.989, "eval_steps_per_second": 4.995, "eval_wer": 0.15808124098425774, "step": 23500 }, { "epoch": 1.91, "learning_rate": 1.8125827814569538e-05, "loss": 0.3126, "step": 24000 }, { "epoch": 1.91, "eval_cer": 0.05350263048921333, "eval_loss": 0.2320026159286499, "eval_runtime": 1042.7739, "eval_samples_per_second": 10.119, "eval_steps_per_second": 5.06, "eval_wer": 0.158436644157799, "step": 24000 }, { "epoch": 1.95, "learning_rate": 1.808593313651959e-05, "loss": 0.3214, "step": 24500 }, { "epoch": 1.95, "eval_cer": 0.05516601523255062, "eval_loss": 0.23359209299087524, "eval_runtime": 1036.5856, "eval_samples_per_second": 10.18, "eval_steps_per_second": 5.09, "eval_wer": 0.1606317814061422, "step": 24500 }, { "epoch": 1.99, "learning_rate": 1.804603845846964e-05, "loss": 0.3016, "step": 25000 }, { "epoch": 1.99, "eval_cer": 0.053539322799728124, "eval_loss": 0.22656488418579102, "eval_runtime": 1063.4142, "eval_samples_per_second": 9.923, "eval_steps_per_second": 4.961, "eval_wer": 0.15769447870716868, "step": 25000 }, { "epoch": 2.03, "learning_rate": 1.8006143780419692e-05, "loss": 0.2943, "step": 25500 }, { "epoch": 2.03, "eval_cer": 0.05433082835511866, "eval_loss": 0.22971460223197937, "eval_runtime": 1032.208, "eval_samples_per_second": 10.223, "eval_steps_per_second": 5.111, "eval_wer": 0.16019275395647356, "step": 25500 }, { "epoch": 2.07, "learning_rate": 1.7966249102369747e-05, "loss": 0.2904, "step": 26000 }, { "epoch": 2.07, "eval_cer": 0.054390234953094994, "eval_loss": 0.2325425148010254, "eval_runtime": 1057.8159, "eval_samples_per_second": 9.975, "eval_steps_per_second": 4.988, "eval_wer": 0.15850981539941045, "step": 26000 }, { "epoch": 2.11, "learning_rate": 1.7926354424319795e-05, "loss": 0.3017, "step": 26500 }, { "epoch": 2.11, "eval_cer": 0.05451254265481097, "eval_loss": 0.22905828058719635, "eval_runtime": 1064.1914, "eval_samples_per_second": 9.916, "eval_steps_per_second": 4.958, "eval_wer": 0.15975372650680492, "step": 26500 }, { "epoch": 2.15, "learning_rate": 1.7886459746269847e-05, "loss": 0.2966, "step": 27000 }, { "epoch": 2.15, "eval_cer": 0.05473444377078139, "eval_loss": 0.23365609347820282, "eval_runtime": 1050.9505, "eval_samples_per_second": 10.04, "eval_steps_per_second": 5.02, "eval_wer": 0.16018230092195765, "step": 27000 }, { "epoch": 2.19, "learning_rate": 1.7846644857576e-05, "loss": 0.3251, "step": 27500 }, { "epoch": 2.19, "eval_cer": 0.05426967450426068, "eval_loss": 0.2257428914308548, "eval_runtime": 1060.4671, "eval_samples_per_second": 9.95, "eval_steps_per_second": 4.975, "eval_wer": 0.16054815713001486, "step": 27500 }, { "epoch": 2.23, "learning_rate": 1.780675017952605e-05, "loss": 0.3053, "step": 28000 }, { "epoch": 2.23, "eval_cer": 0.05410019097473996, "eval_loss": 0.23043210804462433, "eval_runtime": 1033.4582, "eval_samples_per_second": 10.21, "eval_steps_per_second": 5.105, "eval_wer": 0.1583843789852194, "step": 28000 }, { "epoch": 2.27, "learning_rate": 1.7766855501476103e-05, "loss": 0.3298, "step": 28500 }, { "epoch": 2.27, "eval_cer": 0.05580376253435536, "eval_loss": 0.22545896470546722, "eval_runtime": 914.35, "eval_samples_per_second": 11.54, "eval_steps_per_second": 5.77, "eval_wer": 0.16234607906675308, "step": 28500 }, { "epoch": 2.31, "learning_rate": 1.7726960823426155e-05, "loss": 0.2814, "step": 29000 }, { "epoch": 2.31, "eval_cer": 0.053995355801840554, "eval_loss": 0.23109014332294464, "eval_runtime": 905.8755, "eval_samples_per_second": 11.648, "eval_steps_per_second": 5.824, "eval_wer": 0.15831120774360796, "step": 29000 }, { "epoch": 2.35, "learning_rate": 1.7687145934732308e-05, "loss": 0.3215, "step": 29500 }, { "epoch": 2.35, "eval_cer": 0.05462611409211866, "eval_loss": 0.22737212479114532, "eval_runtime": 912.3862, "eval_samples_per_second": 11.565, "eval_steps_per_second": 5.783, "eval_wer": 0.15886521857295172, "step": 29500 }, { "epoch": 2.39, "learning_rate": 1.764725125668236e-05, "loss": 0.2922, "step": 30000 }, { "epoch": 2.39, "eval_cer": 0.054563212988379024, "eval_loss": 0.22737739980220795, "eval_runtime": 915.0652, "eval_samples_per_second": 11.531, "eval_steps_per_second": 5.766, "eval_wer": 0.15986870988648005, "step": 30000 }, { "epoch": 2.43, "learning_rate": 1.760735657863241e-05, "loss": 0.295, "step": 30500 }, { "epoch": 2.43, "eval_cer": 0.05397613602014233, "eval_loss": 0.22714464366436005, "eval_runtime": 930.602, "eval_samples_per_second": 11.339, "eval_steps_per_second": 5.669, "eval_wer": 0.15825894257102838, "step": 30500 }, { "epoch": 2.47, "learning_rate": 1.7567461900582462e-05, "loss": 0.2938, "step": 31000 }, { "epoch": 2.47, "eval_cer": 0.0541473668025447, "eval_loss": 0.22911103069782257, "eval_runtime": 908.336, "eval_samples_per_second": 11.617, "eval_steps_per_second": 5.808, "eval_wer": 0.15907427926327014, "step": 31000 }, { "epoch": 2.51, "learning_rate": 1.7527567222532514e-05, "loss": 0.3076, "step": 31500 }, { "epoch": 2.51, "eval_cer": 0.054402465723266596, "eval_loss": 0.2284567654132843, "eval_runtime": 902.124, "eval_samples_per_second": 11.697, "eval_steps_per_second": 5.848, "eval_wer": 0.1595864779545502, "step": 31500 }, { "epoch": 2.55, "learning_rate": 1.748767254448257e-05, "loss": 0.3023, "step": 32000 }, { "epoch": 2.55, "eval_cer": 0.05438149868868671, "eval_loss": 0.2315172702074051, "eval_runtime": 905.8123, "eval_samples_per_second": 11.649, "eval_steps_per_second": 5.825, "eval_wer": 0.16001505236970293, "step": 32000 }, { "epoch": 2.59, "learning_rate": 1.744777786643262e-05, "loss": 0.3005, "step": 32500 }, { "epoch": 2.59, "eval_cer": 0.05475366355247961, "eval_loss": 0.22995078563690186, "eval_runtime": 909.4081, "eval_samples_per_second": 11.603, "eval_steps_per_second": 5.802, "eval_wer": 0.1594192294022955, "step": 32500 }, { "epoch": 2.63, "learning_rate": 1.7407883188382672e-05, "loss": 0.3145, "step": 33000 }, { "epoch": 2.63, "eval_cer": 0.05403903712388198, "eval_loss": 0.23045602440834045, "eval_runtime": 898.147, "eval_samples_per_second": 11.749, "eval_steps_per_second": 5.874, "eval_wer": 0.15892793678004724, "step": 33000 }, { "epoch": 2.67, "learning_rate": 1.7367988510332723e-05, "loss": 0.3066, "step": 33500 }, { "epoch": 2.67, "eval_cer": 0.054526520677864225, "eval_loss": 0.23219020664691925, "eval_runtime": 905.3676, "eval_samples_per_second": 11.655, "eval_steps_per_second": 5.827, "eval_wer": 0.15857253360650597, "step": 33500 }, { "epoch": 2.71, "learning_rate": 1.7328093832282775e-05, "loss": 0.2937, "step": 34000 }, { "epoch": 2.71, "eval_cer": 0.052908564509450015, "eval_loss": 0.228409081697464, "eval_runtime": 907.6141, "eval_samples_per_second": 11.626, "eval_steps_per_second": 5.813, "eval_wer": 0.1561892417368762, "step": 34000 }, { "epoch": 2.75, "learning_rate": 1.7288278943588928e-05, "loss": 0.3055, "step": 34500 }, { "epoch": 2.75, "eval_cer": 0.05396390524997073, "eval_loss": 0.23174947500228882, "eval_runtime": 882.5566, "eval_samples_per_second": 11.956, "eval_steps_per_second": 5.978, "eval_wer": 0.15776764994878012, "step": 34500 }, { "epoch": 2.79, "learning_rate": 1.7248384265538976e-05, "loss": 0.305, "step": 35000 }, { "epoch": 2.79, "eval_cer": 0.05505593830100624, "eval_loss": 0.2276100516319275, "eval_runtime": 888.7434, "eval_samples_per_second": 11.873, "eval_steps_per_second": 5.936, "eval_wer": 0.16033909643969643, "step": 35000 }, { "epoch": 2.83, "learning_rate": 1.720856937684513e-05, "loss": 0.3103, "step": 35500 }, { "epoch": 2.83, "eval_cer": 0.05433607011376364, "eval_loss": 0.22940921783447266, "eval_runtime": 900.3729, "eval_samples_per_second": 11.72, "eval_steps_per_second": 5.86, "eval_wer": 0.1581648652603851, "step": 35500 }, { "epoch": 2.87, "learning_rate": 1.716867469879518e-05, "loss": 0.2993, "step": 36000 }, { "epoch": 2.87, "eval_cer": 0.054682026184331683, "eval_loss": 0.23304207623004913, "eval_runtime": 906.2924, "eval_samples_per_second": 11.643, "eval_steps_per_second": 5.822, "eval_wer": 0.15976417954132086, "step": 36000 }, { "epoch": 2.91, "learning_rate": 1.7128780020745236e-05, "loss": 0.3011, "step": 36500 }, { "epoch": 2.91, "eval_cer": 0.052677927129071316, "eval_loss": 0.22949661314487457, "eval_runtime": 922.484, "eval_samples_per_second": 11.439, "eval_steps_per_second": 5.719, "eval_wer": 0.1561892417368762, "step": 36500 }, { "epoch": 2.95, "learning_rate": 1.7088885342695284e-05, "loss": 0.2944, "step": 37000 }, { "epoch": 2.95, "eval_cer": 0.05484277344944411, "eval_loss": 0.23222215473651886, "eval_runtime": 903.8916, "eval_samples_per_second": 11.674, "eval_steps_per_second": 5.837, "eval_wer": 0.15936696422971589, "step": 37000 }, { "epoch": 2.99, "learning_rate": 1.704899066464534e-05, "loss": 0.3098, "step": 37500 }, { "epoch": 2.99, "eval_cer": 0.0542644327456157, "eval_loss": 0.23203817009925842, "eval_runtime": 910.7868, "eval_samples_per_second": 11.586, "eval_steps_per_second": 5.793, "eval_wer": 0.1576422135345891, "step": 37500 }, { "epoch": 3.03, "learning_rate": 1.700909598659539e-05, "loss": 0.3042, "step": 38000 }, { "epoch": 3.03, "eval_cer": 0.0534554546614086, "eval_loss": 0.22991453111171722, "eval_runtime": 907.0893, "eval_samples_per_second": 11.633, "eval_steps_per_second": 5.816, "eval_wer": 0.15791399243200302, "step": 38000 }, { "epoch": 3.07, "learning_rate": 1.6969201308545442e-05, "loss": 0.2866, "step": 38500 }, { "epoch": 3.07, "eval_cer": 0.05340653158072221, "eval_loss": 0.2294275462627411, "eval_runtime": 902.7096, "eval_samples_per_second": 11.689, "eval_steps_per_second": 5.845, "eval_wer": 0.15704639056718164, "step": 38500 }, { "epoch": 3.11, "learning_rate": 1.6929386419851592e-05, "loss": 0.2957, "step": 39000 }, { "epoch": 3.11, "eval_cer": 0.05404253162964529, "eval_loss": 0.2295570820569992, "eval_runtime": 912.5312, "eval_samples_per_second": 11.563, "eval_steps_per_second": 5.782, "eval_wer": 0.15921016871197707, "step": 39000 }, { "epoch": 3.15, "learning_rate": 1.6889491741801643e-05, "loss": 0.3086, "step": 39500 }, { "epoch": 3.15, "eval_cer": 0.052947004072846464, "eval_loss": 0.22821466624736786, "eval_runtime": 904.495, "eval_samples_per_second": 11.666, "eval_steps_per_second": 5.833, "eval_wer": 0.15652373884138565, "step": 39500 }, { "epoch": 3.19, "learning_rate": 1.6849597063751698e-05, "loss": 0.3051, "step": 40000 }, { "epoch": 3.19, "eval_cer": 0.05373850962823701, "eval_loss": 0.23392616212368011, "eval_runtime": 907.2245, "eval_samples_per_second": 11.631, "eval_steps_per_second": 5.816, "eval_wer": 0.15729726339556374, "step": 40000 }, { "epoch": 3.23, "learning_rate": 1.680970238570175e-05, "loss": 0.2968, "step": 40500 }, { "epoch": 3.23, "eval_cer": 0.052592311737870136, "eval_loss": 0.22787103056907654, "eval_runtime": 886.2434, "eval_samples_per_second": 11.906, "eval_steps_per_second": 5.953, "eval_wer": 0.15359688917692807, "step": 40500 }, { "epoch": 3.26, "learning_rate": 1.67698077076518e-05, "loss": 0.3064, "step": 41000 }, { "epoch": 3.26, "eval_cer": 0.053928960192337595, "eval_loss": 0.22640632092952728, "eval_runtime": 893.134, "eval_samples_per_second": 11.815, "eval_steps_per_second": 5.907, "eval_wer": 0.15839483201973534, "step": 41000 }, { "epoch": 3.3, "learning_rate": 1.6729913029601853e-05, "loss": 0.2945, "step": 41500 }, { "epoch": 3.3, "eval_cer": 0.053990114043195585, "eval_loss": 0.2269200086593628, "eval_runtime": 897.6935, "eval_samples_per_second": 11.755, "eval_steps_per_second": 5.877, "eval_wer": 0.15750632408588214, "step": 41500 }, { "epoch": 3.34, "learning_rate": 1.6690018351551904e-05, "loss": 0.3054, "step": 42000 }, { "epoch": 3.34, "eval_cer": 0.05332441069528434, "eval_loss": 0.23121361434459686, "eval_runtime": 891.0698, "eval_samples_per_second": 11.842, "eval_steps_per_second": 5.921, "eval_wer": 0.15614742959881253, "step": 42000 }, { "epoch": 3.38, "learning_rate": 1.6650123673501956e-05, "loss": 0.2968, "step": 42500 }, { "epoch": 3.38, "eval_cer": 0.053640663466864226, "eval_loss": 0.22707530856132507, "eval_runtime": 893.1267, "eval_samples_per_second": 11.815, "eval_steps_per_second": 5.907, "eval_wer": 0.15787218029393932, "step": 42500 }, { "epoch": 3.42, "learning_rate": 1.661022899545201e-05, "loss": 0.3076, "step": 43000 }, { "epoch": 3.42, "eval_cer": 0.05363367445533759, "eval_loss": 0.22719860076904297, "eval_runtime": 884.4414, "eval_samples_per_second": 11.931, "eval_steps_per_second": 5.965, "eval_wer": 0.15708820270524534, "step": 43000 }, { "epoch": 3.46, "learning_rate": 1.657049389611426e-05, "loss": 0.3085, "step": 43500 }, { "epoch": 3.46, "eval_cer": 0.054032048112355346, "eval_loss": 0.22836348414421082, "eval_runtime": 899.2209, "eval_samples_per_second": 11.735, "eval_steps_per_second": 5.867, "eval_wer": 0.15824848953651244, "step": 43500 }, { "epoch": 3.5, "learning_rate": 1.653059921806431e-05, "loss": 0.2953, "step": 44000 }, { "epoch": 3.5, "eval_cer": 0.05415086130830801, "eval_loss": 0.23102371394634247, "eval_runtime": 903.7149, "eval_samples_per_second": 11.676, "eval_steps_per_second": 5.838, "eval_wer": 0.1580707879497418, "step": 44000 }, { "epoch": 3.54, "learning_rate": 1.6490704540014365e-05, "loss": 0.2847, "step": 44500 }, { "epoch": 3.54, "eval_cer": 0.05441993825208316, "eval_loss": 0.23333939909934998, "eval_runtime": 916.0284, "eval_samples_per_second": 11.519, "eval_steps_per_second": 5.76, "eval_wer": 0.15811260008780548, "step": 44500 }, { "epoch": 3.58, "learning_rate": 1.6450809861964417e-05, "loss": 0.2769, "step": 45000 }, { "epoch": 3.58, "eval_cer": 0.053523597523793216, "eval_loss": 0.22939017415046692, "eval_runtime": 901.6619, "eval_samples_per_second": 11.703, "eval_steps_per_second": 5.851, "eval_wer": 0.1558651976668827, "step": 45000 }, { "epoch": 3.62, "learning_rate": 1.6410915183914465e-05, "loss": 0.3033, "step": 45500 }, { "epoch": 3.62, "eval_cer": 0.05366687226008907, "eval_loss": 0.22338353097438812, "eval_runtime": 915.4355, "eval_samples_per_second": 11.527, "eval_steps_per_second": 5.763, "eval_wer": 0.15741224677523885, "step": 45500 }, { "epoch": 3.66, "learning_rate": 1.637102050586452e-05, "loss": 0.2844, "step": 46000 }, { "epoch": 3.66, "eval_cer": 0.05305009199286422, "eval_loss": 0.22461895644664764, "eval_runtime": 913.8136, "eval_samples_per_second": 11.547, "eval_steps_per_second": 5.774, "eval_wer": 0.15634603725461502, "step": 46000 }, { "epoch": 3.7, "learning_rate": 1.633112582781457e-05, "loss": 0.3141, "step": 46500 }, { "epoch": 3.7, "eval_cer": 0.05363367445533759, "eval_loss": 0.23098349571228027, "eval_runtime": 946.9043, "eval_samples_per_second": 11.144, "eval_steps_per_second": 5.572, "eval_wer": 0.15681642380783142, "step": 46500 }, { "epoch": 3.74, "learning_rate": 1.6291310939120724e-05, "loss": 0.2894, "step": 47000 }, { "epoch": 3.74, "eval_cer": 0.054661059149751806, "eval_loss": 0.23053082823753357, "eval_runtime": 940.905, "eval_samples_per_second": 11.215, "eval_steps_per_second": 5.607, "eval_wer": 0.16014048878389398, "step": 47000 }, { "epoch": 3.78, "learning_rate": 1.6251416261070773e-05, "loss": 0.3119, "step": 47500 }, { "epoch": 3.78, "eval_cer": 0.05410543273338494, "eval_loss": 0.2325323075056076, "eval_runtime": 925.0513, "eval_samples_per_second": 11.407, "eval_steps_per_second": 5.703, "eval_wer": 0.15784082119039158, "step": 47500 }, { "epoch": 3.82, "learning_rate": 1.6211521583020827e-05, "loss": 0.3031, "step": 48000 }, { "epoch": 3.82, "eval_cer": 0.05328771838476955, "eval_loss": 0.22975291311740875, "eval_runtime": 925.8474, "eval_samples_per_second": 11.397, "eval_steps_per_second": 5.699, "eval_wer": 0.15668053435912446, "step": 48000 }, { "epoch": 3.86, "learning_rate": 1.617162690497088e-05, "loss": 0.2883, "step": 48500 }, { "epoch": 3.86, "eval_cer": 0.05370007006484055, "eval_loss": 0.22732804715633392, "eval_runtime": 1115.9674, "eval_samples_per_second": 9.455, "eval_steps_per_second": 4.728, "eval_wer": 0.15818577132941694, "step": 48500 }, { "epoch": 3.9, "learning_rate": 1.613173222692093e-05, "loss": 0.3044, "step": 49000 }, { "epoch": 3.9, "eval_cer": 0.053820630513674875, "eval_loss": 0.230909526348114, "eval_runtime": 1093.0332, "eval_samples_per_second": 9.654, "eval_steps_per_second": 4.827, "eval_wer": 0.15783036815587564, "step": 49000 }, { "epoch": 3.94, "learning_rate": 1.6091837548870982e-05, "loss": 0.2802, "step": 49500 }, { "epoch": 3.94, "eval_cer": 0.053707059076367185, "eval_loss": 0.23501825332641602, "eval_runtime": 939.4078, "eval_samples_per_second": 11.233, "eval_steps_per_second": 5.616, "eval_wer": 0.1580707879497418, "step": 49500 }, { "epoch": 3.98, "learning_rate": 1.6051942870821034e-05, "loss": 0.3047, "step": 50000 }, { "epoch": 3.98, "eval_cer": 0.05406349866422517, "eval_loss": 0.2330075204372406, "eval_runtime": 924.6444, "eval_samples_per_second": 11.412, "eval_steps_per_second": 5.706, "eval_wer": 0.15756904229297766, "step": 50000 }, { "epoch": 4.02, "learning_rate": 1.6012048192771085e-05, "loss": 0.2947, "step": 50500 }, { "epoch": 4.02, "eval_cer": 0.05417881735441452, "eval_loss": 0.22912316024303436, "eval_runtime": 927.7361, "eval_samples_per_second": 11.374, "eval_steps_per_second": 5.687, "eval_wer": 0.15802897581167813, "step": 50500 }, { "epoch": 4.06, "learning_rate": 1.5972233304077238e-05, "loss": 0.2842, "step": 51000 }, { "epoch": 4.06, "eval_cer": 0.05391323491640269, "eval_loss": 0.2270590364933014, "eval_runtime": 939.0751, "eval_samples_per_second": 11.237, "eval_steps_per_second": 5.618, "eval_wer": 0.15742269980975476, "step": 51000 }, { "epoch": 4.1, "learning_rate": 1.593233862602729e-05, "loss": 0.2807, "step": 51500 }, { "epoch": 4.1, "eval_cer": 0.05416309207847961, "eval_loss": 0.23343749344348907, "eval_runtime": 928.4697, "eval_samples_per_second": 11.365, "eval_steps_per_second": 5.682, "eval_wer": 0.15750632408588214, "step": 51500 }, { "epoch": 4.14, "learning_rate": 1.589252373733344e-05, "loss": 0.2736, "step": 52000 }, { "epoch": 4.14, "eval_cer": 0.05329994915494114, "eval_loss": 0.2331331968307495, "eval_runtime": 1015.9505, "eval_samples_per_second": 10.386, "eval_steps_per_second": 5.193, "eval_wer": 0.15667008132460852, "step": 52000 }, { "epoch": 4.18, "learning_rate": 1.5852629059283494e-05, "loss": 0.2977, "step": 52500 }, { "epoch": 4.18, "eval_cer": 0.05435004813681689, "eval_loss": 0.22801466286182404, "eval_runtime": 991.652, "eval_samples_per_second": 10.641, "eval_steps_per_second": 5.32, "eval_wer": 0.1582798486400602, "step": 52500 }, { "epoch": 4.22, "learning_rate": 1.5812734381233546e-05, "loss": 0.3093, "step": 53000 }, { "epoch": 4.22, "eval_cer": 0.05384683930689973, "eval_loss": 0.2338476926088333, "eval_runtime": 972.8304, "eval_samples_per_second": 10.847, "eval_steps_per_second": 5.423, "eval_wer": 0.15704639056718164, "step": 53000 }, { "epoch": 4.26, "learning_rate": 1.5772839703183594e-05, "loss": 0.2835, "step": 53500 }, { "epoch": 4.26, "eval_cer": 0.053495641477686706, "eval_loss": 0.23169097304344177, "eval_runtime": 1058.4118, "eval_samples_per_second": 9.97, "eval_steps_per_second": 4.985, "eval_wer": 0.1573808876716911, "step": 53500 }, { "epoch": 4.3, "learning_rate": 1.573294502513365e-05, "loss": 0.2934, "step": 54000 }, { "epoch": 4.3, "eval_cer": 0.053934201950982565, "eval_loss": 0.23185814917087555, "eval_runtime": 1059.1095, "eval_samples_per_second": 9.963, "eval_steps_per_second": 4.982, "eval_wer": 0.15761085443104134, "step": 54000 }, { "epoch": 4.34, "learning_rate": 1.56930503470837e-05, "loss": 0.2744, "step": 54500 }, { "epoch": 4.34, "eval_cer": 0.05386431183571629, "eval_loss": 0.23005205392837524, "eval_runtime": 1012.8884, "eval_samples_per_second": 10.418, "eval_steps_per_second": 5.209, "eval_wer": 0.1580707879497418, "step": 54500 }, { "epoch": 4.38, "learning_rate": 1.5653155669033752e-05, "loss": 0.2903, "step": 55000 }, { "epoch": 4.38, "eval_cer": 0.05332441069528434, "eval_loss": 0.22401565313339233, "eval_runtime": 1009.2863, "eval_samples_per_second": 10.455, "eval_steps_per_second": 5.227, "eval_wer": 0.15702548449814982, "step": 55000 }, { "epoch": 4.42, "learning_rate": 1.5613260990983804e-05, "loss": 0.2866, "step": 55500 }, { "epoch": 4.42, "eval_cer": 0.05411067449202991, "eval_loss": 0.23450933396816254, "eval_runtime": 1009.3103, "eval_samples_per_second": 10.455, "eval_steps_per_second": 5.227, "eval_wer": 0.15835301988167164, "step": 55500 }, { "epoch": 4.46, "learning_rate": 1.5573366312933855e-05, "loss": 0.2764, "step": 56000 }, { "epoch": 4.46, "eval_cer": 0.05301689418811274, "eval_loss": 0.2333006113767624, "eval_runtime": 982.7778, "eval_samples_per_second": 10.737, "eval_steps_per_second": 5.368, "eval_wer": 0.15660736311751303, "step": 56000 }, { "epoch": 4.5, "learning_rate": 1.5533551424240008e-05, "loss": 0.3075, "step": 56500 }, { "epoch": 4.5, "eval_cer": 0.0538398502953731, "eval_loss": 0.22900772094726562, "eval_runtime": 969.2813, "eval_samples_per_second": 10.886, "eval_steps_per_second": 5.443, "eval_wer": 0.1587397821587607, "step": 56500 }, { "epoch": 4.54, "learning_rate": 1.549365674619006e-05, "loss": 0.2838, "step": 57000 }, { "epoch": 4.54, "eval_cer": 0.05381189424926659, "eval_loss": 0.23882387578487396, "eval_runtime": 1031.107, "eval_samples_per_second": 10.234, "eval_steps_per_second": 5.117, "eval_wer": 0.1572240921539523, "step": 57000 }, { "epoch": 4.58, "learning_rate": 1.545376206814011e-05, "loss": 0.3018, "step": 57500 }, { "epoch": 4.58, "eval_cer": 0.053486905213278424, "eval_loss": 0.23316600918769836, "eval_runtime": 975.4161, "eval_samples_per_second": 10.818, "eval_steps_per_second": 5.409, "eval_wer": 0.15625195994397173, "step": 57500 }, { "epoch": 4.62, "learning_rate": 1.5413867390090163e-05, "loss": 0.2785, "step": 58000 }, { "epoch": 4.62, "eval_cer": 0.054060004158461857, "eval_loss": 0.23457208275794983, "eval_runtime": 1012.462, "eval_samples_per_second": 10.422, "eval_steps_per_second": 5.211, "eval_wer": 0.15756904229297766, "step": 58000 }, { "epoch": 4.66, "learning_rate": 1.5374052501396316e-05, "loss": 0.3107, "step": 58500 }, { "epoch": 4.66, "eval_cer": 0.052777520543325754, "eval_loss": 0.22570756077766418, "eval_runtime": 1008.8834, "eval_samples_per_second": 10.459, "eval_steps_per_second": 5.23, "eval_wer": 0.15601154015010557, "step": 58500 }, { "epoch": 4.7, "learning_rate": 1.5334157823346368e-05, "loss": 0.3028, "step": 59000 }, { "epoch": 4.7, "eval_cer": 0.054101938227621625, "eval_loss": 0.23060066998004913, "eval_runtime": 1028.987, "eval_samples_per_second": 10.255, "eval_steps_per_second": 5.127, "eval_wer": 0.15910563836681788, "step": 59000 }, { "epoch": 4.74, "learning_rate": 1.529426314529642e-05, "loss": 0.3106, "step": 59500 }, { "epoch": 4.74, "eval_cer": 0.054463619574124586, "eval_loss": 0.23061639070510864, "eval_runtime": 955.5647, "eval_samples_per_second": 11.043, "eval_steps_per_second": 5.521, "eval_wer": 0.15960738402358204, "step": 59500 }, { "epoch": 4.78, "learning_rate": 1.525436846724647e-05, "loss": 0.2894, "step": 60000 }, { "epoch": 4.78, "eval_cer": 0.053415267845130496, "eval_loss": 0.23042044043540955, "eval_runtime": 908.3665, "eval_samples_per_second": 11.616, "eval_steps_per_second": 5.808, "eval_wer": 0.1562833190475195, "step": 60000 }, { "epoch": 4.82, "learning_rate": 1.5214473789196522e-05, "loss": 0.2754, "step": 60500 }, { "epoch": 4.82, "eval_cer": 0.05379966347909499, "eval_loss": 0.23432183265686035, "eval_runtime": 1022.0559, "eval_samples_per_second": 10.324, "eval_steps_per_second": 5.162, "eval_wer": 0.1567537056007359, "step": 60500 }, { "epoch": 4.86, "learning_rate": 1.5174579111146575e-05, "loss": 0.3196, "step": 61000 }, { "epoch": 4.86, "eval_cer": 0.054460125068361266, "eval_loss": 0.22781531512737274, "eval_runtime": 1006.3856, "eval_samples_per_second": 10.485, "eval_steps_per_second": 5.243, "eval_wer": 0.15841573808876716, "step": 61000 }, { "epoch": 4.9, "learning_rate": 1.5134684433096627e-05, "loss": 0.3011, "step": 61500 }, { "epoch": 4.9, "eval_cer": 0.05315317991288197, "eval_loss": 0.2283407747745514, "eval_runtime": 1025.3718, "eval_samples_per_second": 10.291, "eval_steps_per_second": 5.145, "eval_wer": 0.15667008132460852, "step": 61500 }, { "epoch": 4.94, "learning_rate": 1.5094789755046677e-05, "loss": 0.2888, "step": 62000 }, { "epoch": 4.94, "eval_cer": 0.05300466341794114, "eval_loss": 0.2278449833393097, "eval_runtime": 1036.1869, "eval_samples_per_second": 10.183, "eval_steps_per_second": 5.092, "eval_wer": 0.15573976125269165, "step": 62000 }, { "epoch": 4.98, "learning_rate": 1.505497486635283e-05, "loss": 0.3007, "step": 62500 }, { "epoch": 4.98, "eval_cer": 0.05329121289053286, "eval_loss": 0.23174849152565002, "eval_runtime": 1016.9601, "eval_samples_per_second": 10.376, "eval_steps_per_second": 5.188, "eval_wer": 0.15661781615202894, "step": 62500 }, { "epoch": 5.02, "learning_rate": 1.5015159977658981e-05, "loss": 0.2913, "step": 63000 }, { "epoch": 5.02, "eval_cer": 0.05368958654755061, "eval_loss": 0.22989778220653534, "eval_runtime": 1001.4101, "eval_samples_per_second": 10.537, "eval_steps_per_second": 5.269, "eval_wer": 0.1568582359458951, "step": 63000 }, { "epoch": 5.06, "learning_rate": 1.4975265299609034e-05, "loss": 0.2951, "step": 63500 }, { "epoch": 5.06, "eval_cer": 0.05276004801450919, "eval_loss": 0.22874189913272858, "eval_runtime": 1029.0957, "eval_samples_per_second": 10.254, "eval_steps_per_second": 5.127, "eval_wer": 0.15457947442142453, "step": 63500 }, { "epoch": 5.1, "learning_rate": 1.4935370621559084e-05, "loss": 0.2914, "step": 64000 }, { "epoch": 5.1, "eval_cer": 0.05322656453391156, "eval_loss": 0.2295147180557251, "eval_runtime": 1064.5011, "eval_samples_per_second": 9.913, "eval_steps_per_second": 4.956, "eval_wer": 0.15624150690945582, "step": 64000 }, { "epoch": 5.14, "learning_rate": 1.4895475943509138e-05, "loss": 0.2698, "step": 64500 }, { "epoch": 5.14, "eval_cer": 0.05335760850003582, "eval_loss": 0.23344850540161133, "eval_runtime": 1016.5089, "eval_samples_per_second": 10.381, "eval_steps_per_second": 5.19, "eval_wer": 0.15601154015010557, "step": 64500 }, { "epoch": 5.18, "learning_rate": 1.4855581265459189e-05, "loss": 0.3092, "step": 65000 }, { "epoch": 5.18, "eval_cer": 0.053848586559781385, "eval_loss": 0.22819994390010834, "eval_runtime": 1014.9268, "eval_samples_per_second": 10.397, "eval_steps_per_second": 5.198, "eval_wer": 0.15716137394685678, "step": 65000 }, { "epoch": 5.22, "learning_rate": 1.4815686587409242e-05, "loss": 0.2626, "step": 65500 }, { "epoch": 5.22, "eval_cer": 0.05425919098697073, "eval_loss": 0.23320025205612183, "eval_runtime": 1004.3012, "eval_samples_per_second": 10.507, "eval_steps_per_second": 5.253, "eval_wer": 0.15773629084523236, "step": 65500 }, { "epoch": 5.26, "learning_rate": 1.4775791909359292e-05, "loss": 0.292, "step": 66000 }, { "epoch": 5.26, "eval_cer": 0.053600476650586114, "eval_loss": 0.2286536544561386, "eval_runtime": 1059.7099, "eval_samples_per_second": 9.957, "eval_steps_per_second": 4.979, "eval_wer": 0.1566596282900926, "step": 66000 }, { "epoch": 5.3, "learning_rate": 1.4735897231309344e-05, "loss": 0.2876, "step": 66500 }, { "epoch": 5.3, "eval_cer": 0.05356902609871629, "eval_loss": 0.23624327778816223, "eval_runtime": 1087.8499, "eval_samples_per_second": 9.7, "eval_steps_per_second": 4.85, "eval_wer": 0.1569732193255702, "step": 66500 }, { "epoch": 5.34, "learning_rate": 1.4696082342615497e-05, "loss": 0.3083, "step": 67000 }, { "epoch": 5.34, "eval_cer": 0.05395516898556245, "eval_loss": 0.22930724918842316, "eval_runtime": 1060.9006, "eval_samples_per_second": 9.946, "eval_steps_per_second": 4.973, "eval_wer": 0.15801852277716222, "step": 67000 }, { "epoch": 5.38, "learning_rate": 1.4656187664565548e-05, "loss": 0.2829, "step": 67500 }, { "epoch": 5.38, "eval_cer": 0.052884102969106825, "eval_loss": 0.23014146089553833, "eval_runtime": 982.6766, "eval_samples_per_second": 10.738, "eval_steps_per_second": 5.369, "eval_wer": 0.15458992745594047, "step": 67500 }, { "epoch": 5.41, "learning_rate": 1.4616372775871698e-05, "loss": 0.3064, "step": 68000 }, { "epoch": 5.41, "eval_cer": 0.05366337775432576, "eval_loss": 0.2316119372844696, "eval_runtime": 995.6763, "eval_samples_per_second": 10.598, "eval_steps_per_second": 5.299, "eval_wer": 0.15700457842911797, "step": 68000 }, { "epoch": 5.45, "learning_rate": 1.4576478097821751e-05, "loss": 0.2968, "step": 68500 }, { "epoch": 5.45, "eval_cer": 0.05196854245911865, "eval_loss": 0.22566300630569458, "eval_runtime": 999.0896, "eval_samples_per_second": 10.562, "eval_steps_per_second": 5.281, "eval_wer": 0.1545585683523927, "step": 68500 }, { "epoch": 5.49, "learning_rate": 1.4536583419771803e-05, "loss": 0.2924, "step": 69000 }, { "epoch": 5.49, "eval_cer": 0.05315317991288197, "eval_loss": 0.2279421091079712, "eval_runtime": 995.0687, "eval_samples_per_second": 10.604, "eval_steps_per_second": 5.302, "eval_wer": 0.15660736311751303, "step": 69000 }, { "epoch": 5.53, "learning_rate": 1.4496688741721856e-05, "loss": 0.2837, "step": 69500 }, { "epoch": 5.53, "eval_cer": 0.05344147663835534, "eval_loss": 0.23239023983478546, "eval_runtime": 1002.0877, "eval_samples_per_second": 10.53, "eval_steps_per_second": 5.265, "eval_wer": 0.15640875546171054, "step": 69500 }, { "epoch": 5.57, "learning_rate": 1.4456794063671908e-05, "loss": 0.2757, "step": 70000 }, { "epoch": 5.57, "eval_cer": 0.053209092005094986, "eval_loss": 0.22870585322380066, "eval_runtime": 987.89, "eval_samples_per_second": 10.681, "eval_steps_per_second": 5.341, "eval_wer": 0.15694186022202244, "step": 70000 }, { "epoch": 5.61, "learning_rate": 1.4416979174978059e-05, "loss": 0.2933, "step": 70500 }, { "epoch": 5.61, "eval_cer": 0.052419333702586106, "eval_loss": 0.2281671166419983, "eval_runtime": 1014.9291, "eval_samples_per_second": 10.397, "eval_steps_per_second": 5.198, "eval_wer": 0.15453766228336085, "step": 70500 }, { "epoch": 5.65, "learning_rate": 1.437708449692811e-05, "loss": 0.2837, "step": 71000 }, { "epoch": 5.65, "eval_cer": 0.053895762387586116, "eval_loss": 0.23612989485263824, "eval_runtime": 1011.556, "eval_samples_per_second": 10.431, "eval_steps_per_second": 5.216, "eval_wer": 0.15788263332845526, "step": 71000 }, { "epoch": 5.69, "learning_rate": 1.4337189818878164e-05, "loss": 0.2926, "step": 71500 }, { "epoch": 5.69, "eval_cer": 0.0533785755346157, "eval_loss": 0.2293144315481186, "eval_runtime": 973.6724, "eval_samples_per_second": 10.837, "eval_steps_per_second": 5.419, "eval_wer": 0.15773629084523236, "step": 71500 }, { "epoch": 5.73, "learning_rate": 1.4297295140828215e-05, "loss": 0.2864, "step": 72000 }, { "epoch": 5.73, "eval_cer": 0.053410026086485526, "eval_loss": 0.2307540327310562, "eval_runtime": 1005.1235, "eval_samples_per_second": 10.498, "eval_steps_per_second": 5.249, "eval_wer": 0.15692095415299062, "step": 72000 }, { "epoch": 5.77, "learning_rate": 1.4257400462778265e-05, "loss": 0.2682, "step": 72500 }, { "epoch": 5.77, "eval_cer": 0.05274082823281096, "eval_loss": 0.22183704376220703, "eval_runtime": 994.7947, "eval_samples_per_second": 10.607, "eval_steps_per_second": 5.304, "eval_wer": 0.15527982773399118, "step": 72500 }, { "epoch": 5.81, "learning_rate": 1.4217505784728318e-05, "loss": 0.2841, "step": 73000 }, { "epoch": 5.81, "eval_cer": 0.05319860848780505, "eval_loss": 0.22810408473014832, "eval_runtime": 997.7636, "eval_samples_per_second": 10.576, "eval_steps_per_second": 5.288, "eval_wer": 0.1560742583572011, "step": 73000 }, { "epoch": 5.85, "learning_rate": 1.417769089603447e-05, "loss": 0.2783, "step": 73500 }, { "epoch": 5.85, "eval_cer": 0.05318113595898848, "eval_loss": 0.2253616899251938, "eval_runtime": 993.1265, "eval_samples_per_second": 10.625, "eval_steps_per_second": 5.313, "eval_wer": 0.15653419187590156, "step": 73500 }, { "epoch": 5.89, "learning_rate": 1.4137796217984523e-05, "loss": 0.2764, "step": 74000 }, { "epoch": 5.89, "eval_cer": 0.053308685419349425, "eval_loss": 0.2277914136648178, "eval_runtime": 995.9704, "eval_samples_per_second": 10.595, "eval_steps_per_second": 5.297, "eval_wer": 0.15622060084042397, "step": 74000 }, { "epoch": 5.93, "learning_rate": 1.4097901539934573e-05, "loss": 0.2846, "step": 74500 }, { "epoch": 5.93, "eval_cer": 0.05289109198063345, "eval_loss": 0.22751808166503906, "eval_runtime": 1009.4915, "eval_samples_per_second": 10.453, "eval_steps_per_second": 5.226, "eval_wer": 0.1557502142872076, "step": 74500 }, { "epoch": 5.97, "learning_rate": 1.4058006861884626e-05, "loss": 0.2837, "step": 75000 }, { "epoch": 5.97, "eval_cer": 0.05339430081055061, "eval_loss": 0.22733652591705322, "eval_runtime": 1005.1836, "eval_samples_per_second": 10.498, "eval_steps_per_second": 5.249, "eval_wer": 0.15630422511655134, "step": 75000 }, { "epoch": 6.01, "learning_rate": 1.4018112183834678e-05, "loss": 0.295, "step": 75500 }, { "epoch": 6.01, "eval_cer": 0.053111245843722205, "eval_loss": 0.23248015344142914, "eval_runtime": 979.3989, "eval_samples_per_second": 10.774, "eval_steps_per_second": 5.387, "eval_wer": 0.1561787887023603, "step": 75500 }, { "epoch": 6.05, "learning_rate": 1.397821750578473e-05, "loss": 0.2799, "step": 76000 }, { "epoch": 6.05, "eval_cer": 0.05339954256919558, "eval_loss": 0.227718323469162, "eval_runtime": 1033.6163, "eval_samples_per_second": 10.209, "eval_steps_per_second": 5.104, "eval_wer": 0.15693140718750653, "step": 76000 }, { "epoch": 6.09, "learning_rate": 1.393832282773478e-05, "loss": 0.2626, "step": 76500 }, { "epoch": 6.09, "eval_cer": 0.05273209196840268, "eval_loss": 0.23209738731384277, "eval_runtime": 1100.8278, "eval_samples_per_second": 9.586, "eval_steps_per_second": 4.793, "eval_wer": 0.15478853511174293, "step": 76500 }, { "epoch": 6.13, "learning_rate": 1.3898428149684832e-05, "loss": 0.2951, "step": 77000 }, { "epoch": 6.13, "eval_cer": 0.0537105535821305, "eval_loss": 0.2339087873697281, "eval_runtime": 990.6062, "eval_samples_per_second": 10.652, "eval_steps_per_second": 5.326, "eval_wer": 0.1574854180168503, "step": 77000 }, { "epoch": 6.17, "learning_rate": 1.3858533471634885e-05, "loss": 0.2836, "step": 77500 }, { "epoch": 6.17, "eval_cer": 0.053375081028852384, "eval_loss": 0.2342662364244461, "eval_runtime": 1011.222, "eval_samples_per_second": 10.435, "eval_steps_per_second": 5.217, "eval_wer": 0.15747496498233438, "step": 77500 }, { "epoch": 6.21, "learning_rate": 1.3818718582941037e-05, "loss": 0.292, "step": 78000 }, { "epoch": 6.21, "eval_cer": 0.05331567443087606, "eval_loss": 0.23277445137500763, "eval_runtime": 1002.9949, "eval_samples_per_second": 10.52, "eval_steps_per_second": 5.26, "eval_wer": 0.1565550979449334, "step": 78000 }, { "epoch": 6.25, "learning_rate": 1.3778903694247188e-05, "loss": 0.2941, "step": 78500 }, { "epoch": 6.25, "eval_cer": 0.0527233557039944, "eval_loss": 0.23166391253471375, "eval_runtime": 987.0345, "eval_samples_per_second": 10.691, "eval_steps_per_second": 5.345, "eval_wer": 0.15485125331883845, "step": 78500 }, { "epoch": 6.29, "learning_rate": 1.373900901619724e-05, "loss": 0.2889, "step": 79000 }, { "epoch": 6.29, "eval_cer": 0.05313745463694706, "eval_loss": 0.22406452894210815, "eval_runtime": 1003.3137, "eval_samples_per_second": 10.517, "eval_steps_per_second": 5.259, "eval_wer": 0.15667008132460852, "step": 79000 }, { "epoch": 6.33, "learning_rate": 1.3699114338147293e-05, "loss": 0.276, "step": 79500 }, { "epoch": 6.33, "eval_cer": 0.05304310298133759, "eval_loss": 0.2285362333059311, "eval_runtime": 1000.5197, "eval_samples_per_second": 10.547, "eval_steps_per_second": 5.273, "eval_wer": 0.15591746283946228, "step": 79500 }, { "epoch": 6.37, "learning_rate": 1.3659219660097345e-05, "loss": 0.2725, "step": 80000 }, { "epoch": 6.37, "eval_cer": 0.05252941063413049, "eval_loss": 0.22845245897769928, "eval_runtime": 1007.5295, "eval_samples_per_second": 10.473, "eval_steps_per_second": 5.237, "eval_wer": 0.15441222586916983, "step": 80000 }, { "epoch": 6.41, "learning_rate": 1.3619404771403494e-05, "loss": 0.3079, "step": 80500 }, { "epoch": 6.41, "eval_cer": 0.0528404216470654, "eval_loss": 0.22764278948307037, "eval_runtime": 1022.7476, "eval_samples_per_second": 10.317, "eval_steps_per_second": 5.159, "eval_wer": 0.15559341876946878, "step": 80500 }, { "epoch": 6.45, "learning_rate": 1.3579510093353548e-05, "loss": 0.2872, "step": 81000 }, { "epoch": 6.45, "eval_cer": 0.05274606999145593, "eval_loss": 0.22662149369716644, "eval_runtime": 993.8039, "eval_samples_per_second": 10.618, "eval_steps_per_second": 5.309, "eval_wer": 0.15533209290657077, "step": 81000 }, { "epoch": 6.49, "learning_rate": 1.3539615415303599e-05, "loss": 0.2759, "step": 81500 }, { "epoch": 6.49, "eval_cer": 0.052761795267390846, "eval_loss": 0.22488127648830414, "eval_runtime": 1001.1627, "eval_samples_per_second": 10.54, "eval_steps_per_second": 5.27, "eval_wer": 0.15532163987205486, "step": 81500 }, { "epoch": 6.53, "learning_rate": 1.3499720737253652e-05, "loss": 0.2799, "step": 82000 }, { "epoch": 6.53, "eval_cer": 0.053640663466864226, "eval_loss": 0.23271960020065308, "eval_runtime": 981.0803, "eval_samples_per_second": 10.755, "eval_steps_per_second": 5.378, "eval_wer": 0.15670144042815629, "step": 82000 }, { "epoch": 6.57, "learning_rate": 1.3459826059203702e-05, "loss": 0.2838, "step": 82500 }, { "epoch": 6.57, "eval_cer": 0.053139201889828715, "eval_loss": 0.22912931442260742, "eval_runtime": 1016.4192, "eval_samples_per_second": 10.382, "eval_steps_per_second": 5.191, "eval_wer": 0.15532163987205486, "step": 82500 }, { "epoch": 6.61, "learning_rate": 1.3419931381153755e-05, "loss": 0.2843, "step": 83000 }, { "epoch": 6.61, "eval_cer": 0.053375081028852384, "eval_loss": 0.2322521209716797, "eval_runtime": 992.6032, "eval_samples_per_second": 10.631, "eval_steps_per_second": 5.315, "eval_wer": 0.1552380155959275, "step": 83000 }, { "epoch": 6.65, "learning_rate": 1.3380036703103807e-05, "loss": 0.2594, "step": 83500 }, { "epoch": 6.65, "eval_cer": 0.052249850173065396, "eval_loss": 0.22961102426052094, "eval_runtime": 1004.8962, "eval_samples_per_second": 10.501, "eval_steps_per_second": 5.25, "eval_wer": 0.15491397152593397, "step": 83500 }, { "epoch": 6.69, "learning_rate": 1.334014202505386e-05, "loss": 0.2977, "step": 84000 }, { "epoch": 6.69, "eval_cer": 0.0527635425202725, "eval_loss": 0.22668838500976562, "eval_runtime": 1013.6978, "eval_samples_per_second": 10.409, "eval_steps_per_second": 5.205, "eval_wer": 0.15500804883657726, "step": 84000 }, { "epoch": 6.73, "learning_rate": 1.3300247347003912e-05, "loss": 0.2839, "step": 84500 }, { "epoch": 6.73, "eval_cer": 0.05319860848780505, "eval_loss": 0.23399870097637177, "eval_runtime": 974.964, "eval_samples_per_second": 10.823, "eval_steps_per_second": 5.411, "eval_wer": 0.15662826918654485, "step": 84500 }, { "epoch": 6.77, "learning_rate": 1.3260352668953961e-05, "loss": 0.2793, "step": 85000 }, { "epoch": 6.77, "eval_cer": 0.05322656453391156, "eval_loss": 0.23137907683849335, "eval_runtime": 1005.324, "eval_samples_per_second": 10.496, "eval_steps_per_second": 5.248, "eval_wer": 0.15626241297848764, "step": 85000 }, { "epoch": 6.81, "learning_rate": 1.3220457990904015e-05, "loss": 0.2904, "step": 85500 }, { "epoch": 6.81, "eval_cer": 0.0526220150368583, "eval_loss": 0.23123595118522644, "eval_runtime": 994.7751, "eval_samples_per_second": 10.607, "eval_steps_per_second": 5.304, "eval_wer": 0.15501850187109317, "step": 85500 }, { "epoch": 6.85, "learning_rate": 1.3180563312854066e-05, "loss": 0.2876, "step": 86000 }, { "epoch": 6.85, "eval_cer": 0.05300466341794114, "eval_loss": 0.2295524775981903, "eval_runtime": 991.0961, "eval_samples_per_second": 10.647, "eval_steps_per_second": 5.323, "eval_wer": 0.1548198942152907, "step": 86000 }, { "epoch": 6.89, "learning_rate": 1.314074842416022e-05, "loss": 0.2837, "step": 86500 }, { "epoch": 6.89, "eval_cer": 0.05278450955485239, "eval_loss": 0.23204663395881653, "eval_runtime": 982.9191, "eval_samples_per_second": 10.735, "eval_steps_per_second": 5.368, "eval_wer": 0.15546798235527773, "step": 86500 }, { "epoch": 6.93, "learning_rate": 1.310085374611027e-05, "loss": 0.2883, "step": 87000 }, { "epoch": 6.93, "eval_cer": 0.05388527887029618, "eval_loss": 0.23330089449882507, "eval_runtime": 1005.5183, "eval_samples_per_second": 10.494, "eval_steps_per_second": 5.247, "eval_wer": 0.15745405891330252, "step": 87000 }, { "epoch": 6.97, "learning_rate": 1.306095906806032e-05, "loss": 0.2999, "step": 87500 }, { "epoch": 6.97, "eval_cer": 0.05274082823281096, "eval_loss": 0.22357943654060364, "eval_runtime": 991.3811, "eval_samples_per_second": 10.644, "eval_steps_per_second": 5.322, "eval_wer": 0.15510212614722055, "step": 87500 }, { "epoch": 7.01, "learning_rate": 1.3021064390010374e-05, "loss": 0.2851, "step": 88000 }, { "epoch": 7.01, "eval_cer": 0.05307630078608907, "eval_loss": 0.23096595704555511, "eval_runtime": 1013.0612, "eval_samples_per_second": 10.416, "eval_steps_per_second": 5.208, "eval_wer": 0.15626241297848764, "step": 88000 }, { "epoch": 7.05, "learning_rate": 1.2981169711960426e-05, "loss": 0.2818, "step": 88500 }, { "epoch": 7.05, "eval_cer": 0.05257833371481688, "eval_loss": 0.23177887499332428, "eval_runtime": 969.6339, "eval_samples_per_second": 10.882, "eval_steps_per_second": 5.441, "eval_wer": 0.1553425459410867, "step": 88500 }, { "epoch": 7.09, "learning_rate": 1.2941434612622677e-05, "loss": 0.2967, "step": 89000 }, { "epoch": 7.09, "eval_cer": 0.053834608536728126, "eval_loss": 0.23280788958072662, "eval_runtime": 980.771, "eval_samples_per_second": 10.759, "eval_steps_per_second": 5.379, "eval_wer": 0.15621014780590806, "step": 89000 }, { "epoch": 7.13, "learning_rate": 1.2901539934572728e-05, "loss": 0.2811, "step": 89500 }, { "epoch": 7.13, "eval_cer": 0.05324403706272812, "eval_loss": 0.22902736067771912, "eval_runtime": 1013.5591, "eval_samples_per_second": 10.411, "eval_steps_per_second": 5.205, "eval_wer": 0.1564401145652583, "step": 89500 }, { "epoch": 7.17, "learning_rate": 1.2861645256522782e-05, "loss": 0.2796, "step": 90000 }, { "epoch": 7.17, "eval_cer": 0.05300466341794114, "eval_loss": 0.22609573602676392, "eval_runtime": 972.0883, "eval_samples_per_second": 10.855, "eval_steps_per_second": 5.427, "eval_wer": 0.15550979449334143, "step": 90000 }, { "epoch": 7.21, "learning_rate": 1.2821830367828933e-05, "loss": 0.2643, "step": 90500 }, { "epoch": 7.21, "eval_cer": 0.0533785755346157, "eval_loss": 0.2270972579717636, "eval_runtime": 1011.007, "eval_samples_per_second": 10.437, "eval_steps_per_second": 5.219, "eval_wer": 0.1563983024271946, "step": 90500 }, { "epoch": 7.25, "learning_rate": 1.2781935689778983e-05, "loss": 0.2724, "step": 91000 }, { "epoch": 7.25, "eval_cer": 0.05331043267223109, "eval_loss": 0.2323487550020218, "eval_runtime": 1008.5634, "eval_samples_per_second": 10.462, "eval_steps_per_second": 5.231, "eval_wer": 0.15645056759977422, "step": 91000 }, { "epoch": 7.29, "learning_rate": 1.2742041011729036e-05, "loss": 0.2993, "step": 91500 }, { "epoch": 7.29, "eval_cer": 0.05329296014341452, "eval_loss": 0.22676041722297668, "eval_runtime": 997.9884, "eval_samples_per_second": 10.573, "eval_steps_per_second": 5.287, "eval_wer": 0.15522756256141157, "step": 91500 }, { "epoch": 7.33, "learning_rate": 1.2702146333679088e-05, "loss": 0.2751, "step": 92000 }, { "epoch": 7.33, "eval_cer": 0.05339954256919558, "eval_loss": 0.22875265777111053, "eval_runtime": 1016.6429, "eval_samples_per_second": 10.379, "eval_steps_per_second": 5.19, "eval_wer": 0.15630422511655134, "step": 92000 }, { "epoch": 7.37, "learning_rate": 1.2662251655629141e-05, "loss": 0.2854, "step": 92500 }, { "epoch": 7.37, "eval_cer": 0.05395342173268079, "eval_loss": 0.23149354755878448, "eval_runtime": 1016.6463, "eval_samples_per_second": 10.379, "eval_steps_per_second": 5.19, "eval_wer": 0.15708820270524534, "step": 92500 }, { "epoch": 7.41, "learning_rate": 1.262235697757919e-05, "loss": 0.29, "step": 93000 }, { "epoch": 7.41, "eval_cer": 0.053205597499331674, "eval_loss": 0.22764912247657776, "eval_runtime": 992.1449, "eval_samples_per_second": 10.636, "eval_steps_per_second": 5.318, "eval_wer": 0.15562477787301654, "step": 93000 }, { "epoch": 7.45, "learning_rate": 1.2582462299529244e-05, "loss": 0.2712, "step": 93500 }, { "epoch": 7.45, "eval_cer": 0.05297845462471629, "eval_loss": 0.235035240650177, "eval_runtime": 998.0334, "eval_samples_per_second": 10.573, "eval_steps_per_second": 5.286, "eval_wer": 0.15616833566784438, "step": 93500 }, { "epoch": 7.49, "learning_rate": 1.2542567621479295e-05, "loss": 0.2841, "step": 94000 }, { "epoch": 7.49, "eval_cer": 0.05259056448498848, "eval_loss": 0.2267538160085678, "eval_runtime": 1011.9601, "eval_samples_per_second": 10.427, "eval_steps_per_second": 5.214, "eval_wer": 0.1547571760081952, "step": 94000 }, { "epoch": 7.53, "learning_rate": 1.2502672943429349e-05, "loss": 0.2762, "step": 94500 }, { "epoch": 7.53, "eval_cer": 0.05283692714130209, "eval_loss": 0.2273728996515274, "eval_runtime": 1023.2923, "eval_samples_per_second": 10.312, "eval_steps_per_second": 5.156, "eval_wer": 0.15531118683753894, "step": 94500 }, { "epoch": 7.56, "learning_rate": 1.24627782653794e-05, "loss": 0.2644, "step": 95000 }, { "epoch": 7.56, "eval_cer": 0.053640663466864226, "eval_loss": 0.23487049341201782, "eval_runtime": 975.0457, "eval_samples_per_second": 10.822, "eval_steps_per_second": 5.411, "eval_wer": 0.15825894257102838, "step": 95000 }, { "epoch": 7.6, "learning_rate": 1.242288358732945e-05, "loss": 0.2605, "step": 95500 }, { "epoch": 7.6, "eval_cer": 0.05368783929466896, "eval_loss": 0.23216651380062103, "eval_runtime": 1017.8333, "eval_samples_per_second": 10.367, "eval_steps_per_second": 5.184, "eval_wer": 0.15798716367361446, "step": 95500 }, { "epoch": 7.64, "learning_rate": 1.2382988909279503e-05, "loss": 0.2777, "step": 96000 }, { "epoch": 7.64, "eval_cer": 0.05315842167152694, "eval_loss": 0.23125576972961426, "eval_runtime": 1011.4981, "eval_samples_per_second": 10.432, "eval_steps_per_second": 5.216, "eval_wer": 0.15590700980494637, "step": 96000 }, { "epoch": 7.68, "learning_rate": 1.2343174020585655e-05, "loss": 0.2859, "step": 96500 }, { "epoch": 7.68, "eval_cer": 0.053002916165059484, "eval_loss": 0.22942064702510834, "eval_runtime": 1024.1009, "eval_samples_per_second": 10.304, "eval_steps_per_second": 5.152, "eval_wer": 0.15512303221625237, "step": 96500 }, { "epoch": 7.72, "learning_rate": 1.2303279342535708e-05, "loss": 0.2538, "step": 97000 }, { "epoch": 7.72, "eval_cer": 0.053937696456745884, "eval_loss": 0.23439116775989532, "eval_runtime": 1004.398, "eval_samples_per_second": 10.506, "eval_steps_per_second": 5.253, "eval_wer": 0.15724499822298413, "step": 97000 }, { "epoch": 7.76, "learning_rate": 1.2263384664485758e-05, "loss": 0.271, "step": 97500 }, { "epoch": 7.76, "eval_cer": 0.053871300847242926, "eval_loss": 0.23197893798351288, "eval_runtime": 1022.2159, "eval_samples_per_second": 10.323, "eval_steps_per_second": 5.161, "eval_wer": 0.1566491752555767, "step": 97500 }, { "epoch": 7.8, "learning_rate": 1.2223569775791911e-05, "loss": 0.2818, "step": 98000 }, { "epoch": 7.8, "eval_cer": 0.052466509530390844, "eval_loss": 0.22931723296642303, "eval_runtime": 1006.4602, "eval_samples_per_second": 10.484, "eval_steps_per_second": 5.242, "eval_wer": 0.15418225910981959, "step": 98000 }, { "epoch": 7.84, "learning_rate": 1.2183675097741962e-05, "loss": 0.2734, "step": 98500 }, { "epoch": 7.84, "eval_cer": 0.053212586510858306, "eval_loss": 0.22494953870773315, "eval_runtime": 995.2729, "eval_samples_per_second": 10.602, "eval_steps_per_second": 5.301, "eval_wer": 0.1569732193255702, "step": 98500 }, { "epoch": 7.88, "learning_rate": 1.2143780419692016e-05, "loss": 0.2803, "step": 99000 }, { "epoch": 7.88, "eval_cer": 0.05317065244169854, "eval_loss": 0.23138034343719482, "eval_runtime": 1015.8371, "eval_samples_per_second": 10.387, "eval_steps_per_second": 5.194, "eval_wer": 0.15510212614722055, "step": 99000 }, { "epoch": 7.92, "learning_rate": 1.2103885741642065e-05, "loss": 0.2718, "step": 99500 }, { "epoch": 7.92, "eval_cer": 0.05306232276303582, "eval_loss": 0.233502596616745, "eval_runtime": 1022.6702, "eval_samples_per_second": 10.318, "eval_steps_per_second": 5.159, "eval_wer": 0.15613697656429662, "step": 99500 }, { "epoch": 7.96, "learning_rate": 1.2063991063592117e-05, "loss": 0.2955, "step": 100000 }, { "epoch": 7.96, "eval_cer": 0.05277926779620741, "eval_loss": 0.22855418920516968, "eval_runtime": 991.7786, "eval_samples_per_second": 10.639, "eval_steps_per_second": 5.32, "eval_wer": 0.15492442456044989, "step": 100000 }, { "epoch": 8.0, "learning_rate": 1.202409638554217e-05, "loss": 0.2842, "step": 100500 }, { "epoch": 8.0, "eval_cer": 0.05253989415142043, "eval_loss": 0.22677482664585114, "eval_runtime": 995.1219, "eval_samples_per_second": 10.604, "eval_steps_per_second": 5.302, "eval_wer": 0.1556665900110802, "step": 100500 }, { "epoch": 8.04, "learning_rate": 1.1984201707492222e-05, "loss": 0.2815, "step": 101000 }, { "epoch": 8.04, "eval_cer": 0.053106004085077235, "eval_loss": 0.23340827226638794, "eval_runtime": 1020.4782, "eval_samples_per_second": 10.34, "eval_steps_per_second": 5.17, "eval_wer": 0.1560742583572011, "step": 101000 }, { "epoch": 8.08, "learning_rate": 1.1944307029442273e-05, "loss": 0.2691, "step": 101500 }, { "epoch": 8.08, "eval_cer": 0.05241758644970445, "eval_loss": 0.23170696198940277, "eval_runtime": 1016.9098, "eval_samples_per_second": 10.377, "eval_steps_per_second": 5.188, "eval_wer": 0.15385821503982605, "step": 101500 }, { "epoch": 8.12, "learning_rate": 1.1904412351392325e-05, "loss": 0.2653, "step": 102000 }, { "epoch": 8.12, "eval_cer": 0.053289465637651204, "eval_loss": 0.23294131457805634, "eval_runtime": 995.0594, "eval_samples_per_second": 10.604, "eval_steps_per_second": 5.302, "eval_wer": 0.1556665900110802, "step": 102000 }, { "epoch": 8.16, "learning_rate": 1.1864517673342378e-05, "loss": 0.2666, "step": 102500 }, { "epoch": 8.16, "eval_cer": 0.05316890518881688, "eval_loss": 0.23137402534484863, "eval_runtime": 1018.3921, "eval_samples_per_second": 10.361, "eval_steps_per_second": 5.181, "eval_wer": 0.15641920849622645, "step": 102500 }, { "epoch": 8.2, "learning_rate": 1.182462299529243e-05, "loss": 0.2502, "step": 103000 }, { "epoch": 8.2, "eval_cer": 0.052225388632722206, "eval_loss": 0.22777153551578522, "eval_runtime": 1019.8931, "eval_samples_per_second": 10.346, "eval_steps_per_second": 5.173, "eval_wer": 0.1537641377291828, "step": 103000 }, { "epoch": 8.24, "learning_rate": 1.178472831724248e-05, "loss": 0.2625, "step": 103500 }, { "epoch": 8.24, "eval_cer": 0.05278276230197072, "eval_loss": 0.23133881390094757, "eval_runtime": 1004.6555, "eval_samples_per_second": 10.503, "eval_steps_per_second": 5.252, "eval_wer": 0.15499759580206135, "step": 103500 }, { "epoch": 8.28, "learning_rate": 1.1744913428548633e-05, "loss": 0.2779, "step": 104000 }, { "epoch": 8.28, "eval_cer": 0.05239312490936126, "eval_loss": 0.22765225172042847, "eval_runtime": 1054.7994, "eval_samples_per_second": 10.004, "eval_steps_per_second": 5.002, "eval_wer": 0.15512303221625237, "step": 104000 }, { "epoch": 8.32, "learning_rate": 1.1705018750498684e-05, "loss": 0.2815, "step": 104500 }, { "epoch": 8.32, "eval_cer": 0.05215025675881096, "eval_loss": 0.22691141068935394, "eval_runtime": 1019.8114, "eval_samples_per_second": 10.347, "eval_steps_per_second": 5.174, "eval_wer": 0.15538435807915038, "step": 104500 } ], "max_steps": 251160, "num_train_epochs": 20, "total_flos": 5.975247917634884e+19, "trial_name": null, "trial_params": null }