diff --git "a/trainer_state.json" "b/trainer_state.json" --- "a/trainer_state.json" +++ "b/trainer_state.json" @@ -1,8 +1,8 @@ { - "best_metric": 0.09579244742265228, - "best_model_checkpoint": "./wav2vec2-large-xlsr-53-german-cv9/checkpoint-117381", - "epoch": 32.999859451862264, - "global_step": 117381, + "best_metric": 0.09092025712063107, + "best_model_checkpoint": "./wav2vec2-large-xlsr-53-german-cv9/checkpoint-160065", + "epoch": 44.999859451862264, + "global_step": 160065, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, @@ -23775,11 +23775,8657 @@ "eval_steps_per_second": 0.79, "eval_wer": 0.09579244742265228, "step": 117381 + }, + { + "epoch": 33.0, + "learning_rate": 3.780089338706151e-05, + "loss": 0.0576, + "step": 117390 + }, + { + "epoch": 33.01, + "learning_rate": 3.778215100115578e-05, + "loss": 0.0484, + "step": 117420 + }, + { + "epoch": 33.02, + "learning_rate": 3.776340861525006e-05, + "loss": 0.0556, + "step": 117450 + }, + { + "epoch": 33.03, + "learning_rate": 3.774466622934433e-05, + "loss": 0.0565, + "step": 117480 + }, + { + "epoch": 33.04, + "learning_rate": 3.772592384343861e-05, + "loss": 0.0475, + "step": 117510 + }, + { + "epoch": 33.04, + "learning_rate": 3.770718145753288e-05, + "loss": 0.0623, + "step": 117540 + }, + { + "epoch": 33.05, + "learning_rate": 3.768843907162715e-05, + "loss": 0.052, + "step": 117570 + }, + { + "epoch": 33.06, + "learning_rate": 3.766969668572143e-05, + "loss": 0.0606, + "step": 117600 + }, + { + "epoch": 33.07, + "learning_rate": 3.76509542998157e-05, + "loss": 0.0558, + "step": 117630 + }, + { + "epoch": 33.08, + "learning_rate": 3.763221191390998e-05, + "loss": 0.0525, + "step": 117660 + }, + { + "epoch": 33.09, + "learning_rate": 3.761346952800425e-05, + "loss": 0.0605, + "step": 117690 + }, + { + "epoch": 33.1, + "learning_rate": 3.759472714209853e-05, + "loss": 0.0482, + "step": 117720 + }, + { + "epoch": 33.1, + "learning_rate": 3.75759847561928e-05, + "loss": 0.0554, + "step": 117750 + }, + { + "epoch": 33.11, + "learning_rate": 3.755724237028707e-05, + "loss": 0.0519, + "step": 117780 + }, + { + "epoch": 33.12, + "learning_rate": 3.753849998438135e-05, + "loss": 0.0496, + "step": 117810 + }, + { + "epoch": 33.13, + "learning_rate": 3.751975759847562e-05, + "loss": 0.0607, + "step": 117840 + }, + { + "epoch": 33.14, + "learning_rate": 3.75010152125699e-05, + "loss": 0.0513, + "step": 117870 + }, + { + "epoch": 33.15, + "learning_rate": 3.748227282666417e-05, + "loss": 0.056, + "step": 117900 + }, + { + "epoch": 33.15, + "learning_rate": 3.7463530440758446e-05, + "loss": 0.0586, + "step": 117930 + }, + { + "epoch": 33.16, + "learning_rate": 3.744478805485272e-05, + "loss": 0.0506, + "step": 117960 + }, + { + "epoch": 33.17, + "learning_rate": 3.742604566894699e-05, + "loss": 0.059, + "step": 117990 + }, + { + "epoch": 33.18, + "learning_rate": 3.740730328304127e-05, + "loss": 0.055, + "step": 118020 + }, + { + "epoch": 33.19, + "learning_rate": 3.7388560897135536e-05, + "loss": 0.0578, + "step": 118050 + }, + { + "epoch": 33.2, + "learning_rate": 3.736981851122982e-05, + "loss": 0.0612, + "step": 118080 + }, + { + "epoch": 33.2, + "learning_rate": 3.735107612532409e-05, + "loss": 0.0525, + "step": 118110 + }, + { + "epoch": 33.21, + "learning_rate": 3.7332333739418365e-05, + "loss": 0.0556, + "step": 118140 + }, + { + "epoch": 33.22, + "learning_rate": 3.731359135351264e-05, + "loss": 0.0512, + "step": 118170 + }, + { + "epoch": 33.23, + "learning_rate": 3.729484896760691e-05, + "loss": 0.0612, + "step": 118200 + }, + { + "epoch": 33.24, + "learning_rate": 3.727610658170119e-05, + "loss": 0.0602, + "step": 118230 + }, + { + "epoch": 33.25, + "learning_rate": 3.7257364195795455e-05, + "loss": 0.0498, + "step": 118260 + }, + { + "epoch": 33.26, + "learning_rate": 3.7238621809889736e-05, + "loss": 0.0594, + "step": 118290 + }, + { + "epoch": 33.26, + "learning_rate": 3.721987942398401e-05, + "loss": 0.051, + "step": 118320 + }, + { + "epoch": 33.27, + "learning_rate": 3.7201137038078285e-05, + "loss": 0.0534, + "step": 118350 + }, + { + "epoch": 33.28, + "learning_rate": 3.718239465217256e-05, + "loss": 0.0567, + "step": 118380 + }, + { + "epoch": 33.29, + "learning_rate": 3.7163652266266826e-05, + "loss": 0.0535, + "step": 118410 + }, + { + "epoch": 33.3, + "learning_rate": 3.714490988036111e-05, + "loss": 0.0621, + "step": 118440 + }, + { + "epoch": 33.31, + "learning_rate": 3.7126167494455375e-05, + "loss": 0.0524, + "step": 118470 + }, + { + "epoch": 33.31, + "learning_rate": 3.7107425108549656e-05, + "loss": 0.0539, + "step": 118500 + }, + { + "epoch": 33.32, + "learning_rate": 3.708868272264393e-05, + "loss": 0.058, + "step": 118530 + }, + { + "epoch": 33.33, + "learning_rate": 3.7069940336738204e-05, + "loss": 0.0535, + "step": 118560 + }, + { + "epoch": 33.34, + "learning_rate": 3.705119795083248e-05, + "loss": 0.0625, + "step": 118590 + }, + { + "epoch": 33.35, + "learning_rate": 3.703245556492675e-05, + "loss": 0.0491, + "step": 118620 + }, + { + "epoch": 33.36, + "learning_rate": 3.7013713179021027e-05, + "loss": 0.0542, + "step": 118650 + }, + { + "epoch": 33.37, + "learning_rate": 3.6994970793115294e-05, + "loss": 0.06, + "step": 118680 + }, + { + "epoch": 33.37, + "learning_rate": 3.6976228407209575e-05, + "loss": 0.0484, + "step": 118710 + }, + { + "epoch": 33.38, + "learning_rate": 3.695748602130385e-05, + "loss": 0.0597, + "step": 118740 + }, + { + "epoch": 33.39, + "learning_rate": 3.693874363539812e-05, + "loss": 0.0514, + "step": 118770 + }, + { + "epoch": 33.4, + "learning_rate": 3.69200012494924e-05, + "loss": 0.0573, + "step": 118800 + }, + { + "epoch": 33.41, + "learning_rate": 3.690125886358667e-05, + "loss": 0.0574, + "step": 118830 + }, + { + "epoch": 33.42, + "learning_rate": 3.6882516477680946e-05, + "loss": 0.0553, + "step": 118860 + }, + { + "epoch": 33.42, + "learning_rate": 3.686377409177521e-05, + "loss": 0.0586, + "step": 118890 + }, + { + "epoch": 33.43, + "learning_rate": 3.6845031705869494e-05, + "loss": 0.0507, + "step": 118920 + }, + { + "epoch": 33.44, + "learning_rate": 3.682628931996376e-05, + "loss": 0.0559, + "step": 118950 + }, + { + "epoch": 33.45, + "learning_rate": 3.680754693405804e-05, + "loss": 0.0596, + "step": 118980 + }, + { + "epoch": 33.46, + "learning_rate": 3.678880454815232e-05, + "loss": 0.051, + "step": 119010 + }, + { + "epoch": 33.47, + "learning_rate": 3.677006216224659e-05, + "loss": 0.0614, + "step": 119040 + }, + { + "epoch": 33.47, + "learning_rate": 3.6751319776340865e-05, + "loss": 0.0499, + "step": 119070 + }, + { + "epoch": 33.48, + "learning_rate": 3.673257739043513e-05, + "loss": 0.0544, + "step": 119100 + }, + { + "epoch": 33.49, + "learning_rate": 3.6713835004529414e-05, + "loss": 0.0557, + "step": 119130 + }, + { + "epoch": 33.5, + "learning_rate": 3.669509261862368e-05, + "loss": 0.0507, + "step": 119160 + }, + { + "epoch": 33.51, + "learning_rate": 3.667635023271796e-05, + "loss": 0.058, + "step": 119190 + }, + { + "epoch": 33.52, + "learning_rate": 3.6657607846812236e-05, + "loss": 0.0533, + "step": 119220 + }, + { + "epoch": 33.53, + "learning_rate": 3.663886546090651e-05, + "loss": 0.0547, + "step": 119250 + }, + { + "epoch": 33.53, + "learning_rate": 3.6620123075000785e-05, + "loss": 0.0555, + "step": 119280 + }, + { + "epoch": 33.54, + "learning_rate": 3.660138068909505e-05, + "loss": 0.0506, + "step": 119310 + }, + { + "epoch": 33.55, + "learning_rate": 3.658263830318933e-05, + "loss": 0.0586, + "step": 119340 + }, + { + "epoch": 33.56, + "learning_rate": 3.65638959172836e-05, + "loss": 0.0534, + "step": 119370 + }, + { + "epoch": 33.57, + "learning_rate": 3.654515353137788e-05, + "loss": 0.0563, + "step": 119400 + }, + { + "epoch": 33.58, + "learning_rate": 3.6526411145472156e-05, + "loss": 0.0581, + "step": 119430 + }, + { + "epoch": 33.58, + "learning_rate": 3.650766875956643e-05, + "loss": 0.052, + "step": 119460 + }, + { + "epoch": 33.59, + "learning_rate": 3.6488926373660704e-05, + "loss": 0.0591, + "step": 119490 + }, + { + "epoch": 33.6, + "learning_rate": 3.647018398775497e-05, + "loss": 0.0501, + "step": 119520 + }, + { + "epoch": 33.61, + "learning_rate": 3.645144160184925e-05, + "loss": 0.0555, + "step": 119550 + }, + { + "epoch": 33.62, + "learning_rate": 3.643269921594352e-05, + "loss": 0.0541, + "step": 119580 + }, + { + "epoch": 33.63, + "learning_rate": 3.64139568300378e-05, + "loss": 0.0505, + "step": 119610 + }, + { + "epoch": 33.63, + "learning_rate": 3.6395214444132075e-05, + "loss": 0.058, + "step": 119640 + }, + { + "epoch": 33.64, + "learning_rate": 3.637647205822635e-05, + "loss": 0.0494, + "step": 119670 + }, + { + "epoch": 33.65, + "learning_rate": 3.635772967232062e-05, + "loss": 0.0568, + "step": 119700 + }, + { + "epoch": 33.66, + "learning_rate": 3.633898728641489e-05, + "loss": 0.0581, + "step": 119730 + }, + { + "epoch": 33.67, + "learning_rate": 3.632024490050917e-05, + "loss": 0.0507, + "step": 119760 + }, + { + "epoch": 33.68, + "learning_rate": 3.630150251460344e-05, + "loss": 0.0595, + "step": 119790 + }, + { + "epoch": 33.69, + "learning_rate": 3.628276012869772e-05, + "loss": 0.0476, + "step": 119820 + }, + { + "epoch": 33.69, + "learning_rate": 3.626464248898885e-05, + "loss": 0.0534, + "step": 119850 + }, + { + "epoch": 33.7, + "learning_rate": 3.624590010308312e-05, + "loss": 0.0571, + "step": 119880 + }, + { + "epoch": 33.71, + "learning_rate": 3.6227157717177396e-05, + "loss": 0.0502, + "step": 119910 + }, + { + "epoch": 33.72, + "learning_rate": 3.620841533127167e-05, + "loss": 0.059, + "step": 119940 + }, + { + "epoch": 33.73, + "learning_rate": 3.618967294536595e-05, + "loss": 0.0532, + "step": 119970 + }, + { + "epoch": 33.74, + "learning_rate": 3.617093055946022e-05, + "loss": 0.055, + "step": 120000 + }, + { + "epoch": 33.74, + "learning_rate": 3.61521881735545e-05, + "loss": 0.0539, + "step": 120030 + }, + { + "epoch": 33.75, + "learning_rate": 3.613344578764877e-05, + "loss": 0.0505, + "step": 120060 + }, + { + "epoch": 33.76, + "learning_rate": 3.611470340174304e-05, + "loss": 0.0575, + "step": 120090 + }, + { + "epoch": 33.77, + "learning_rate": 3.6095961015837315e-05, + "loss": 0.0489, + "step": 120120 + }, + { + "epoch": 33.78, + "learning_rate": 3.607721862993159e-05, + "loss": 0.0555, + "step": 120150 + }, + { + "epoch": 33.79, + "learning_rate": 3.605847624402587e-05, + "loss": 0.0545, + "step": 120180 + }, + { + "epoch": 33.8, + "learning_rate": 3.603973385812014e-05, + "loss": 0.0513, + "step": 120210 + }, + { + "epoch": 33.8, + "learning_rate": 3.602099147221442e-05, + "loss": 0.0551, + "step": 120240 + }, + { + "epoch": 33.81, + "learning_rate": 3.6002249086308686e-05, + "loss": 0.0509, + "step": 120270 + }, + { + "epoch": 33.82, + "learning_rate": 3.598350670040296e-05, + "loss": 0.0545, + "step": 120300 + }, + { + "epoch": 33.83, + "learning_rate": 3.5964764314497234e-05, + "loss": 0.0566, + "step": 120330 + }, + { + "epoch": 33.84, + "learning_rate": 3.594602192859151e-05, + "loss": 0.0523, + "step": 120360 + }, + { + "epoch": 33.85, + "learning_rate": 3.592727954268579e-05, + "loss": 0.0609, + "step": 120390 + }, + { + "epoch": 33.85, + "learning_rate": 3.590853715678006e-05, + "loss": 0.0493, + "step": 120420 + }, + { + "epoch": 33.86, + "learning_rate": 3.588979477087434e-05, + "loss": 0.0535, + "step": 120450 + }, + { + "epoch": 33.87, + "learning_rate": 3.5871052384968605e-05, + "loss": 0.055, + "step": 120480 + }, + { + "epoch": 33.88, + "learning_rate": 3.585230999906288e-05, + "loss": 0.0506, + "step": 120510 + }, + { + "epoch": 33.89, + "learning_rate": 3.5833567613157154e-05, + "loss": 0.0584, + "step": 120540 + }, + { + "epoch": 33.9, + "learning_rate": 3.581482522725143e-05, + "loss": 0.0548, + "step": 120570 + }, + { + "epoch": 33.9, + "learning_rate": 3.579608284134571e-05, + "loss": 0.0544, + "step": 120600 + }, + { + "epoch": 33.91, + "learning_rate": 3.5777340455439976e-05, + "loss": 0.0563, + "step": 120630 + }, + { + "epoch": 33.92, + "learning_rate": 3.575859806953426e-05, + "loss": 0.0506, + "step": 120660 + }, + { + "epoch": 33.93, + "learning_rate": 3.5739855683628525e-05, + "loss": 0.058, + "step": 120690 + }, + { + "epoch": 33.94, + "learning_rate": 3.5721113297722806e-05, + "loss": 0.052, + "step": 120720 + }, + { + "epoch": 33.95, + "learning_rate": 3.570237091181707e-05, + "loss": 0.0533, + "step": 120750 + }, + { + "epoch": 33.96, + "learning_rate": 3.568362852591135e-05, + "loss": 0.0572, + "step": 120780 + }, + { + "epoch": 33.96, + "learning_rate": 3.566488614000563e-05, + "loss": 0.051, + "step": 120810 + }, + { + "epoch": 33.97, + "learning_rate": 3.5646143754099896e-05, + "loss": 0.057, + "step": 120840 + }, + { + "epoch": 33.98, + "learning_rate": 3.562740136819418e-05, + "loss": 0.0518, + "step": 120870 + }, + { + "epoch": 33.99, + "learning_rate": 3.5608658982288444e-05, + "loss": 0.0561, + "step": 120900 + }, + { + "epoch": 34.0, + "learning_rate": 3.5589916596382725e-05, + "loss": 0.0601, + "step": 120930 + }, + { + "epoch": 34.0, + "eval_loss": 0.10950275510549545, + "eval_runtime": 635.2492, + "eval_samples_per_second": 25.239, + "eval_steps_per_second": 0.79, + "eval_wer": 0.09571738566729901, + "step": 120938 + }, + { + "epoch": 34.01, + "learning_rate": 3.557117421047699e-05, + "loss": 0.0525, + "step": 120960 + }, + { + "epoch": 34.01, + "learning_rate": 3.555243182457127e-05, + "loss": 0.0614, + "step": 120990 + }, + { + "epoch": 34.02, + "learning_rate": 3.553368943866555e-05, + "loss": 0.0447, + "step": 121020 + }, + { + "epoch": 34.03, + "learning_rate": 3.5514947052759815e-05, + "loss": 0.0569, + "step": 121050 + }, + { + "epoch": 34.04, + "learning_rate": 3.5496204666854096e-05, + "loss": 0.0538, + "step": 121080 + }, + { + "epoch": 34.05, + "learning_rate": 3.5477462280948363e-05, + "loss": 0.0549, + "step": 121110 + }, + { + "epoch": 34.06, + "learning_rate": 3.5458719895042644e-05, + "loss": 0.0593, + "step": 121140 + }, + { + "epoch": 34.07, + "learning_rate": 3.543997750913691e-05, + "loss": 0.0482, + "step": 121170 + }, + { + "epoch": 34.07, + "learning_rate": 3.5421235123231186e-05, + "loss": 0.0544, + "step": 121200 + }, + { + "epoch": 34.08, + "learning_rate": 3.540249273732547e-05, + "loss": 0.0528, + "step": 121230 + }, + { + "epoch": 34.09, + "learning_rate": 3.5384375097616594e-05, + "loss": 0.0516, + "step": 121260 + }, + { + "epoch": 34.1, + "learning_rate": 3.536563271171087e-05, + "loss": 0.0591, + "step": 121290 + }, + { + "epoch": 34.11, + "learning_rate": 3.534689032580514e-05, + "loss": 0.0459, + "step": 121320 + }, + { + "epoch": 34.12, + "learning_rate": 3.532814793989942e-05, + "loss": 0.0567, + "step": 121350 + }, + { + "epoch": 34.12, + "learning_rate": 3.530940555399369e-05, + "loss": 0.0522, + "step": 121380 + }, + { + "epoch": 34.13, + "learning_rate": 3.5290663168087965e-05, + "loss": 0.0501, + "step": 121410 + }, + { + "epoch": 34.14, + "learning_rate": 3.527192078218224e-05, + "loss": 0.0632, + "step": 121440 + }, + { + "epoch": 34.15, + "learning_rate": 3.5253178396276514e-05, + "loss": 0.0473, + "step": 121470 + }, + { + "epoch": 34.16, + "learning_rate": 3.523443601037079e-05, + "loss": 0.0553, + "step": 121500 + }, + { + "epoch": 34.17, + "learning_rate": 3.521569362446506e-05, + "loss": 0.0531, + "step": 121530 + }, + { + "epoch": 34.17, + "learning_rate": 3.5196951238559336e-05, + "loss": 0.0493, + "step": 121560 + }, + { + "epoch": 34.18, + "learning_rate": 3.517820885265361e-05, + "loss": 0.0607, + "step": 121590 + }, + { + "epoch": 34.19, + "learning_rate": 3.5159466466747885e-05, + "loss": 0.0467, + "step": 121620 + }, + { + "epoch": 34.2, + "learning_rate": 3.514072408084216e-05, + "loss": 0.0601, + "step": 121650 + }, + { + "epoch": 34.21, + "learning_rate": 3.512198169493643e-05, + "loss": 0.0513, + "step": 121680 + }, + { + "epoch": 34.22, + "learning_rate": 3.510323930903071e-05, + "loss": 0.0575, + "step": 121710 + }, + { + "epoch": 34.23, + "learning_rate": 3.508449692312498e-05, + "loss": 0.0582, + "step": 121740 + }, + { + "epoch": 34.23, + "learning_rate": 3.5065754537219256e-05, + "loss": 0.049, + "step": 121770 + }, + { + "epoch": 34.24, + "learning_rate": 3.504701215131353e-05, + "loss": 0.0564, + "step": 121800 + }, + { + "epoch": 34.25, + "learning_rate": 3.5028269765407804e-05, + "loss": 0.0527, + "step": 121830 + }, + { + "epoch": 34.26, + "learning_rate": 3.500952737950208e-05, + "loss": 0.0562, + "step": 121860 + }, + { + "epoch": 34.27, + "learning_rate": 3.499078499359635e-05, + "loss": 0.0583, + "step": 121890 + }, + { + "epoch": 34.28, + "learning_rate": 3.4972042607690627e-05, + "loss": 0.0485, + "step": 121920 + }, + { + "epoch": 34.28, + "learning_rate": 3.49533002217849e-05, + "loss": 0.0616, + "step": 121950 + }, + { + "epoch": 34.29, + "learning_rate": 3.4934557835879175e-05, + "loss": 0.0513, + "step": 121980 + }, + { + "epoch": 34.3, + "learning_rate": 3.491581544997345e-05, + "loss": 0.0533, + "step": 122010 + }, + { + "epoch": 34.31, + "learning_rate": 3.489707306406772e-05, + "loss": 0.0566, + "step": 122040 + }, + { + "epoch": 34.32, + "learning_rate": 3.4878330678162e-05, + "loss": 0.0512, + "step": 122070 + }, + { + "epoch": 34.33, + "learning_rate": 3.485958829225627e-05, + "loss": 0.0535, + "step": 122100 + }, + { + "epoch": 34.34, + "learning_rate": 3.4840845906350546e-05, + "loss": 0.0539, + "step": 122130 + }, + { + "epoch": 34.34, + "learning_rate": 3.482210352044482e-05, + "loss": 0.0538, + "step": 122160 + }, + { + "epoch": 34.35, + "learning_rate": 3.4803361134539094e-05, + "loss": 0.06, + "step": 122190 + }, + { + "epoch": 34.36, + "learning_rate": 3.478461874863337e-05, + "loss": 0.0489, + "step": 122220 + }, + { + "epoch": 34.37, + "learning_rate": 3.476587636272764e-05, + "loss": 0.0573, + "step": 122250 + }, + { + "epoch": 34.38, + "learning_rate": 3.474713397682192e-05, + "loss": 0.0505, + "step": 122280 + }, + { + "epoch": 34.39, + "learning_rate": 3.472839159091619e-05, + "loss": 0.0542, + "step": 122310 + }, + { + "epoch": 34.39, + "learning_rate": 3.4709649205010465e-05, + "loss": 0.0562, + "step": 122340 + }, + { + "epoch": 34.4, + "learning_rate": 3.469090681910474e-05, + "loss": 0.0482, + "step": 122370 + }, + { + "epoch": 34.41, + "learning_rate": 3.4672164433199014e-05, + "loss": 0.0562, + "step": 122400 + }, + { + "epoch": 34.42, + "learning_rate": 3.465342204729329e-05, + "loss": 0.0532, + "step": 122430 + }, + { + "epoch": 34.43, + "learning_rate": 3.463467966138756e-05, + "loss": 0.0506, + "step": 122460 + }, + { + "epoch": 34.44, + "learning_rate": 3.4615937275481836e-05, + "loss": 0.057, + "step": 122490 + }, + { + "epoch": 34.44, + "learning_rate": 3.459719488957611e-05, + "loss": 0.0466, + "step": 122520 + }, + { + "epoch": 34.45, + "learning_rate": 3.4578452503670385e-05, + "loss": 0.0542, + "step": 122550 + }, + { + "epoch": 34.46, + "learning_rate": 3.455971011776466e-05, + "loss": 0.0504, + "step": 122580 + }, + { + "epoch": 34.47, + "learning_rate": 3.454096773185894e-05, + "loss": 0.0561, + "step": 122610 + }, + { + "epoch": 34.48, + "learning_rate": 3.452222534595321e-05, + "loss": 0.0599, + "step": 122640 + }, + { + "epoch": 34.49, + "learning_rate": 3.450348296004748e-05, + "loss": 0.0469, + "step": 122670 + }, + { + "epoch": 34.5, + "learning_rate": 3.4484740574141756e-05, + "loss": 0.0622, + "step": 122700 + }, + { + "epoch": 34.5, + "learning_rate": 3.446599818823603e-05, + "loss": 0.0502, + "step": 122730 + }, + { + "epoch": 34.51, + "learning_rate": 3.4447255802330304e-05, + "loss": 0.0536, + "step": 122760 + }, + { + "epoch": 34.52, + "learning_rate": 3.442851341642458e-05, + "loss": 0.0596, + "step": 122790 + }, + { + "epoch": 34.53, + "learning_rate": 3.440977103051886e-05, + "loss": 0.0467, + "step": 122820 + }, + { + "epoch": 34.54, + "learning_rate": 3.4391028644613127e-05, + "loss": 0.0559, + "step": 122850 + }, + { + "epoch": 34.55, + "learning_rate": 3.43722862587074e-05, + "loss": 0.0514, + "step": 122880 + }, + { + "epoch": 34.55, + "learning_rate": 3.4353543872801675e-05, + "loss": 0.0558, + "step": 122910 + }, + { + "epoch": 34.56, + "learning_rate": 3.433480148689595e-05, + "loss": 0.0592, + "step": 122940 + }, + { + "epoch": 34.57, + "learning_rate": 3.431605910099022e-05, + "loss": 0.0479, + "step": 122970 + }, + { + "epoch": 34.58, + "learning_rate": 3.42973167150845e-05, + "loss": 0.0578, + "step": 123000 + }, + { + "epoch": 34.59, + "learning_rate": 3.427857432917878e-05, + "loss": 0.0474, + "step": 123030 + }, + { + "epoch": 34.6, + "learning_rate": 3.4259831943273046e-05, + "loss": 0.0556, + "step": 123060 + }, + { + "epoch": 34.6, + "learning_rate": 3.424108955736732e-05, + "loss": 0.058, + "step": 123090 + }, + { + "epoch": 34.61, + "learning_rate": 3.4222347171461594e-05, + "loss": 0.0469, + "step": 123120 + }, + { + "epoch": 34.62, + "learning_rate": 3.420360478555587e-05, + "loss": 0.0545, + "step": 123150 + }, + { + "epoch": 34.63, + "learning_rate": 3.418486239965014e-05, + "loss": 0.0528, + "step": 123180 + }, + { + "epoch": 34.64, + "learning_rate": 3.416612001374442e-05, + "loss": 0.0531, + "step": 123210 + }, + { + "epoch": 34.65, + "learning_rate": 3.41473776278387e-05, + "loss": 0.0593, + "step": 123240 + }, + { + "epoch": 34.66, + "learning_rate": 3.4128635241932965e-05, + "loss": 0.0467, + "step": 123270 + }, + { + "epoch": 34.66, + "learning_rate": 3.410989285602724e-05, + "loss": 0.0529, + "step": 123300 + }, + { + "epoch": 34.67, + "learning_rate": 3.4091150470121514e-05, + "loss": 0.0527, + "step": 123330 + }, + { + "epoch": 34.68, + "learning_rate": 3.407240808421579e-05, + "loss": 0.0528, + "step": 123360 + }, + { + "epoch": 34.69, + "learning_rate": 3.405366569831006e-05, + "loss": 0.0558, + "step": 123390 + }, + { + "epoch": 34.7, + "learning_rate": 3.4034923312404336e-05, + "loss": 0.0483, + "step": 123420 + }, + { + "epoch": 34.71, + "learning_rate": 3.401618092649862e-05, + "loss": 0.0568, + "step": 123450 + }, + { + "epoch": 34.71, + "learning_rate": 3.3997438540592885e-05, + "loss": 0.0524, + "step": 123480 + }, + { + "epoch": 34.72, + "learning_rate": 3.397869615468716e-05, + "loss": 0.0526, + "step": 123510 + }, + { + "epoch": 34.73, + "learning_rate": 3.395995376878143e-05, + "loss": 0.0546, + "step": 123540 + }, + { + "epoch": 34.74, + "learning_rate": 3.394121138287571e-05, + "loss": 0.0473, + "step": 123570 + }, + { + "epoch": 34.75, + "learning_rate": 3.392246899696998e-05, + "loss": 0.0563, + "step": 123600 + }, + { + "epoch": 34.76, + "learning_rate": 3.3903726611064255e-05, + "loss": 0.0476, + "step": 123630 + }, + { + "epoch": 34.77, + "learning_rate": 3.3884984225158536e-05, + "loss": 0.0573, + "step": 123660 + }, + { + "epoch": 34.77, + "learning_rate": 3.3866241839252804e-05, + "loss": 0.0584, + "step": 123690 + }, + { + "epoch": 34.78, + "learning_rate": 3.384749945334708e-05, + "loss": 0.0471, + "step": 123720 + }, + { + "epoch": 34.79, + "learning_rate": 3.382875706744135e-05, + "loss": 0.0556, + "step": 123750 + }, + { + "epoch": 34.8, + "learning_rate": 3.3810014681535626e-05, + "loss": 0.0508, + "step": 123780 + }, + { + "epoch": 34.81, + "learning_rate": 3.37912722956299e-05, + "loss": 0.0536, + "step": 123810 + }, + { + "epoch": 34.82, + "learning_rate": 3.3772529909724175e-05, + "loss": 0.054, + "step": 123840 + }, + { + "epoch": 34.82, + "learning_rate": 3.3753787523818456e-05, + "loss": 0.0491, + "step": 123870 + }, + { + "epoch": 34.83, + "learning_rate": 3.373504513791272e-05, + "loss": 0.0532, + "step": 123900 + }, + { + "epoch": 34.84, + "learning_rate": 3.3716302752007e-05, + "loss": 0.0492, + "step": 123930 + }, + { + "epoch": 34.85, + "learning_rate": 3.369756036610127e-05, + "loss": 0.0552, + "step": 123960 + }, + { + "epoch": 34.86, + "learning_rate": 3.3678817980195546e-05, + "loss": 0.0559, + "step": 123990 + }, + { + "epoch": 34.87, + "learning_rate": 3.366007559428982e-05, + "loss": 0.0514, + "step": 124020 + }, + { + "epoch": 34.87, + "learning_rate": 3.3641333208384094e-05, + "loss": 0.0558, + "step": 124050 + }, + { + "epoch": 34.88, + "learning_rate": 3.362259082247837e-05, + "loss": 0.0529, + "step": 124080 + }, + { + "epoch": 34.89, + "learning_rate": 3.360384843657264e-05, + "loss": 0.0521, + "step": 124110 + }, + { + "epoch": 34.9, + "learning_rate": 3.3585106050666923e-05, + "loss": 0.0606, + "step": 124140 + }, + { + "epoch": 34.91, + "learning_rate": 3.356636366476119e-05, + "loss": 0.0464, + "step": 124170 + }, + { + "epoch": 34.92, + "learning_rate": 3.3547621278855465e-05, + "loss": 0.0572, + "step": 124200 + }, + { + "epoch": 34.93, + "learning_rate": 3.352887889294974e-05, + "loss": 0.0559, + "step": 124230 + }, + { + "epoch": 34.93, + "learning_rate": 3.3510136507044013e-05, + "loss": 0.0524, + "step": 124260 + }, + { + "epoch": 34.94, + "learning_rate": 3.349139412113829e-05, + "loss": 0.0585, + "step": 124290 + }, + { + "epoch": 34.95, + "learning_rate": 3.347265173523256e-05, + "loss": 0.0487, + "step": 124320 + }, + { + "epoch": 34.96, + "learning_rate": 3.345390934932684e-05, + "loss": 0.0549, + "step": 124350 + }, + { + "epoch": 34.97, + "learning_rate": 3.343516696342111e-05, + "loss": 0.0525, + "step": 124380 + }, + { + "epoch": 34.98, + "learning_rate": 3.3416424577515384e-05, + "loss": 0.0541, + "step": 124410 + }, + { + "epoch": 34.98, + "learning_rate": 3.339768219160966e-05, + "loss": 0.0587, + "step": 124440 + }, + { + "epoch": 34.99, + "learning_rate": 3.337893980570393e-05, + "loss": 0.0508, + "step": 124470 + }, + { + "epoch": 35.0, + "eval_loss": 0.10791715979576111, + "eval_runtime": 635.3837, + "eval_samples_per_second": 25.234, + "eval_steps_per_second": 0.79, + "eval_wer": 0.09728685873377642, + "step": 124495 + }, + { + "epoch": 35.0, + "learning_rate": 3.336019741979821e-05, + "loss": 0.0613, + "step": 124500 + }, + { + "epoch": 35.01, + "learning_rate": 3.334145503389248e-05, + "loss": 0.0491, + "step": 124530 + }, + { + "epoch": 35.02, + "learning_rate": 3.332271264798676e-05, + "loss": 0.0526, + "step": 124560 + }, + { + "epoch": 35.03, + "learning_rate": 3.330397026208103e-05, + "loss": 0.0505, + "step": 124590 + }, + { + "epoch": 35.04, + "learning_rate": 3.3285227876175304e-05, + "loss": 0.0519, + "step": 124620 + }, + { + "epoch": 35.04, + "learning_rate": 3.326648549026958e-05, + "loss": 0.0557, + "step": 124650 + }, + { + "epoch": 35.05, + "learning_rate": 3.324774310436385e-05, + "loss": 0.0465, + "step": 124680 + }, + { + "epoch": 35.06, + "learning_rate": 3.3229000718458126e-05, + "loss": 0.0514, + "step": 124710 + }, + { + "epoch": 35.07, + "learning_rate": 3.32102583325524e-05, + "loss": 0.0523, + "step": 124740 + }, + { + "epoch": 35.08, + "learning_rate": 3.319151594664668e-05, + "loss": 0.05, + "step": 124770 + }, + { + "epoch": 35.09, + "learning_rate": 3.317277356074095e-05, + "loss": 0.0573, + "step": 124800 + }, + { + "epoch": 35.09, + "learning_rate": 3.315403117483522e-05, + "loss": 0.048, + "step": 124830 + }, + { + "epoch": 35.1, + "learning_rate": 3.31352887889295e-05, + "loss": 0.0539, + "step": 124860 + }, + { + "epoch": 35.11, + "learning_rate": 3.311654640302377e-05, + "loss": 0.0501, + "step": 124890 + }, + { + "epoch": 35.12, + "learning_rate": 3.3097804017118046e-05, + "loss": 0.0518, + "step": 124920 + }, + { + "epoch": 35.13, + "learning_rate": 3.307906163121232e-05, + "loss": 0.0587, + "step": 124950 + }, + { + "epoch": 35.14, + "learning_rate": 3.30603192453066e-05, + "loss": 0.0495, + "step": 124980 + }, + { + "epoch": 35.14, + "learning_rate": 3.304157685940087e-05, + "loss": 0.054, + "step": 125010 + }, + { + "epoch": 35.15, + "learning_rate": 3.302283447349514e-05, + "loss": 0.0556, + "step": 125040 + }, + { + "epoch": 35.16, + "learning_rate": 3.300409208758942e-05, + "loss": 0.0485, + "step": 125070 + }, + { + "epoch": 35.17, + "learning_rate": 3.298534970168369e-05, + "loss": 0.056, + "step": 125100 + }, + { + "epoch": 35.18, + "learning_rate": 3.2966607315777965e-05, + "loss": 0.0501, + "step": 125130 + }, + { + "epoch": 35.19, + "learning_rate": 3.294786492987224e-05, + "loss": 0.0544, + "step": 125160 + }, + { + "epoch": 35.2, + "learning_rate": 3.292912254396652e-05, + "loss": 0.0548, + "step": 125190 + }, + { + "epoch": 35.2, + "learning_rate": 3.291038015806079e-05, + "loss": 0.0523, + "step": 125220 + }, + { + "epoch": 35.21, + "learning_rate": 3.289163777215506e-05, + "loss": 0.0596, + "step": 125250 + }, + { + "epoch": 35.22, + "learning_rate": 3.2872895386249336e-05, + "loss": 0.0477, + "step": 125280 + }, + { + "epoch": 35.23, + "learning_rate": 3.285415300034361e-05, + "loss": 0.0563, + "step": 125310 + }, + { + "epoch": 35.24, + "learning_rate": 3.2835410614437884e-05, + "loss": 0.0558, + "step": 125340 + }, + { + "epoch": 35.25, + "learning_rate": 3.281666822853216e-05, + "loss": 0.051, + "step": 125370 + }, + { + "epoch": 35.25, + "learning_rate": 3.279792584262644e-05, + "loss": 0.0586, + "step": 125400 + }, + { + "epoch": 35.26, + "learning_rate": 3.277918345672071e-05, + "loss": 0.0507, + "step": 125430 + }, + { + "epoch": 35.27, + "learning_rate": 3.276106581701184e-05, + "loss": 0.0542, + "step": 125460 + }, + { + "epoch": 35.28, + "learning_rate": 3.2742323431106115e-05, + "loss": 0.0501, + "step": 125490 + }, + { + "epoch": 35.29, + "learning_rate": 3.272358104520039e-05, + "loss": 0.0515, + "step": 125520 + }, + { + "epoch": 35.3, + "learning_rate": 3.2704838659294664e-05, + "loss": 0.0591, + "step": 125550 + }, + { + "epoch": 35.3, + "learning_rate": 3.268609627338894e-05, + "loss": 0.0469, + "step": 125580 + }, + { + "epoch": 35.31, + "learning_rate": 3.266735388748321e-05, + "loss": 0.0545, + "step": 125610 + }, + { + "epoch": 35.32, + "learning_rate": 3.2648611501577486e-05, + "loss": 0.051, + "step": 125640 + }, + { + "epoch": 35.33, + "learning_rate": 3.262986911567176e-05, + "loss": 0.048, + "step": 125670 + }, + { + "epoch": 35.34, + "learning_rate": 3.2611126729766035e-05, + "loss": 0.0577, + "step": 125700 + }, + { + "epoch": 35.35, + "learning_rate": 3.259238434386031e-05, + "loss": 0.0468, + "step": 125730 + }, + { + "epoch": 35.36, + "learning_rate": 3.257364195795458e-05, + "loss": 0.0567, + "step": 125760 + }, + { + "epoch": 35.36, + "learning_rate": 3.255489957204886e-05, + "loss": 0.0479, + "step": 125790 + }, + { + "epoch": 35.37, + "learning_rate": 3.253615718614313e-05, + "loss": 0.0543, + "step": 125820 + }, + { + "epoch": 35.38, + "learning_rate": 3.2517414800237406e-05, + "loss": 0.0594, + "step": 125850 + }, + { + "epoch": 35.39, + "learning_rate": 3.249867241433168e-05, + "loss": 0.0472, + "step": 125880 + }, + { + "epoch": 35.4, + "learning_rate": 3.2479930028425954e-05, + "loss": 0.0585, + "step": 125910 + }, + { + "epoch": 35.41, + "learning_rate": 3.246118764252023e-05, + "loss": 0.0516, + "step": 125940 + }, + { + "epoch": 35.41, + "learning_rate": 3.24424452566145e-05, + "loss": 0.0497, + "step": 125970 + }, + { + "epoch": 35.42, + "learning_rate": 3.2423702870708777e-05, + "loss": 0.0578, + "step": 126000 + }, + { + "epoch": 35.43, + "learning_rate": 3.240496048480305e-05, + "loss": 0.049, + "step": 126030 + }, + { + "epoch": 35.44, + "learning_rate": 3.2386218098897325e-05, + "loss": 0.0557, + "step": 126060 + }, + { + "epoch": 35.45, + "learning_rate": 3.23674757129916e-05, + "loss": 0.0499, + "step": 126090 + }, + { + "epoch": 35.46, + "learning_rate": 3.234873332708587e-05, + "loss": 0.0504, + "step": 126120 + }, + { + "epoch": 35.47, + "learning_rate": 3.232999094118015e-05, + "loss": 0.0612, + "step": 126150 + }, + { + "epoch": 35.47, + "learning_rate": 3.231124855527442e-05, + "loss": 0.0474, + "step": 126180 + }, + { + "epoch": 35.48, + "learning_rate": 3.2292506169368696e-05, + "loss": 0.0541, + "step": 126210 + }, + { + "epoch": 35.49, + "learning_rate": 3.227376378346297e-05, + "loss": 0.0512, + "step": 126240 + }, + { + "epoch": 35.5, + "learning_rate": 3.2255021397557244e-05, + "loss": 0.0511, + "step": 126270 + }, + { + "epoch": 35.51, + "learning_rate": 3.223627901165152e-05, + "loss": 0.0544, + "step": 126300 + }, + { + "epoch": 35.52, + "learning_rate": 3.221753662574579e-05, + "loss": 0.0462, + "step": 126330 + }, + { + "epoch": 35.52, + "learning_rate": 3.219879423984007e-05, + "loss": 0.0594, + "step": 126360 + }, + { + "epoch": 35.53, + "learning_rate": 3.218005185393434e-05, + "loss": 0.0557, + "step": 126390 + }, + { + "epoch": 35.54, + "learning_rate": 3.2161309468028615e-05, + "loss": 0.0517, + "step": 126420 + }, + { + "epoch": 35.55, + "learning_rate": 3.214256708212289e-05, + "loss": 0.0592, + "step": 126450 + }, + { + "epoch": 35.56, + "learning_rate": 3.2123824696217164e-05, + "loss": 0.0457, + "step": 126480 + }, + { + "epoch": 35.57, + "learning_rate": 3.210508231031144e-05, + "loss": 0.054, + "step": 126510 + }, + { + "epoch": 35.57, + "learning_rate": 3.208633992440571e-05, + "loss": 0.0495, + "step": 126540 + }, + { + "epoch": 35.58, + "learning_rate": 3.2067597538499986e-05, + "loss": 0.0472, + "step": 126570 + }, + { + "epoch": 35.59, + "learning_rate": 3.204885515259426e-05, + "loss": 0.0593, + "step": 126600 + }, + { + "epoch": 35.6, + "learning_rate": 3.2030112766688535e-05, + "loss": 0.0498, + "step": 126630 + }, + { + "epoch": 35.61, + "learning_rate": 3.201137038078281e-05, + "loss": 0.0544, + "step": 126660 + }, + { + "epoch": 35.62, + "learning_rate": 3.199262799487708e-05, + "loss": 0.051, + "step": 126690 + }, + { + "epoch": 35.63, + "learning_rate": 3.197388560897136e-05, + "loss": 0.0507, + "step": 126720 + }, + { + "epoch": 35.63, + "learning_rate": 3.195514322306563e-05, + "loss": 0.0566, + "step": 126750 + }, + { + "epoch": 35.64, + "learning_rate": 3.1936400837159906e-05, + "loss": 0.048, + "step": 126780 + }, + { + "epoch": 35.65, + "learning_rate": 3.191765845125418e-05, + "loss": 0.0525, + "step": 126810 + }, + { + "epoch": 35.66, + "learning_rate": 3.1898916065348454e-05, + "loss": 0.0537, + "step": 126840 + }, + { + "epoch": 35.67, + "learning_rate": 3.188017367944273e-05, + "loss": 0.0509, + "step": 126870 + }, + { + "epoch": 35.68, + "learning_rate": 3.1861431293537e-05, + "loss": 0.059, + "step": 126900 + }, + { + "epoch": 35.68, + "learning_rate": 3.1842688907631276e-05, + "loss": 0.0465, + "step": 126930 + }, + { + "epoch": 35.69, + "learning_rate": 3.182394652172555e-05, + "loss": 0.0535, + "step": 126960 + }, + { + "epoch": 35.7, + "learning_rate": 3.1805204135819825e-05, + "loss": 0.0535, + "step": 126990 + }, + { + "epoch": 35.71, + "learning_rate": 3.17864617499141e-05, + "loss": 0.052, + "step": 127020 + }, + { + "epoch": 35.72, + "learning_rate": 3.176771936400837e-05, + "loss": 0.0586, + "step": 127050 + }, + { + "epoch": 35.73, + "learning_rate": 3.174897697810265e-05, + "loss": 0.0485, + "step": 127080 + }, + { + "epoch": 35.74, + "learning_rate": 3.173023459219692e-05, + "loss": 0.0526, + "step": 127110 + }, + { + "epoch": 35.74, + "learning_rate": 3.1711492206291196e-05, + "loss": 0.0541, + "step": 127140 + }, + { + "epoch": 35.75, + "learning_rate": 3.169274982038547e-05, + "loss": 0.0537, + "step": 127170 + }, + { + "epoch": 35.76, + "learning_rate": 3.1674007434479744e-05, + "loss": 0.0619, + "step": 127200 + }, + { + "epoch": 35.77, + "learning_rate": 3.165526504857402e-05, + "loss": 0.0483, + "step": 127230 + }, + { + "epoch": 35.78, + "learning_rate": 3.163652266266829e-05, + "loss": 0.0515, + "step": 127260 + }, + { + "epoch": 35.79, + "learning_rate": 3.161778027676257e-05, + "loss": 0.0516, + "step": 127290 + }, + { + "epoch": 35.79, + "learning_rate": 3.159903789085684e-05, + "loss": 0.0503, + "step": 127320 + }, + { + "epoch": 35.8, + "learning_rate": 3.1580295504951115e-05, + "loss": 0.0573, + "step": 127350 + }, + { + "epoch": 35.81, + "learning_rate": 3.156155311904539e-05, + "loss": 0.0476, + "step": 127380 + }, + { + "epoch": 35.82, + "learning_rate": 3.1542810733139664e-05, + "loss": 0.0542, + "step": 127410 + }, + { + "epoch": 35.83, + "learning_rate": 3.152406834723394e-05, + "loss": 0.0506, + "step": 127440 + }, + { + "epoch": 35.84, + "learning_rate": 3.150532596132821e-05, + "loss": 0.0494, + "step": 127470 + }, + { + "epoch": 35.84, + "learning_rate": 3.1486583575422486e-05, + "loss": 0.0598, + "step": 127500 + }, + { + "epoch": 35.85, + "learning_rate": 3.146784118951676e-05, + "loss": 0.0495, + "step": 127530 + }, + { + "epoch": 35.86, + "learning_rate": 3.1449098803611034e-05, + "loss": 0.0522, + "step": 127560 + }, + { + "epoch": 35.87, + "learning_rate": 3.143035641770531e-05, + "loss": 0.0537, + "step": 127590 + }, + { + "epoch": 35.88, + "learning_rate": 3.141161403179958e-05, + "loss": 0.0524, + "step": 127620 + }, + { + "epoch": 35.89, + "learning_rate": 3.139287164589386e-05, + "loss": 0.0604, + "step": 127650 + }, + { + "epoch": 35.9, + "learning_rate": 3.137412925998813e-05, + "loss": 0.0468, + "step": 127680 + }, + { + "epoch": 35.9, + "learning_rate": 3.1355386874082405e-05, + "loss": 0.058, + "step": 127710 + }, + { + "epoch": 35.91, + "learning_rate": 3.133664448817668e-05, + "loss": 0.053, + "step": 127740 + }, + { + "epoch": 35.92, + "learning_rate": 3.1317902102270954e-05, + "loss": 0.0507, + "step": 127770 + }, + { + "epoch": 35.93, + "learning_rate": 3.129915971636523e-05, + "loss": 0.0529, + "step": 127800 + }, + { + "epoch": 35.94, + "learning_rate": 3.12804173304595e-05, + "loss": 0.046, + "step": 127830 + }, + { + "epoch": 35.95, + "learning_rate": 3.1261674944553776e-05, + "loss": 0.0518, + "step": 127860 + }, + { + "epoch": 35.95, + "learning_rate": 3.124293255864805e-05, + "loss": 0.0546, + "step": 127890 + }, + { + "epoch": 35.96, + "learning_rate": 3.1224190172742325e-05, + "loss": 0.0536, + "step": 127920 + }, + { + "epoch": 35.97, + "learning_rate": 3.12054477868366e-05, + "loss": 0.0564, + "step": 127950 + }, + { + "epoch": 35.98, + "learning_rate": 3.118670540093087e-05, + "loss": 0.0501, + "step": 127980 + }, + { + "epoch": 35.99, + "learning_rate": 3.116796301502515e-05, + "loss": 0.0528, + "step": 128010 + }, + { + "epoch": 36.0, + "learning_rate": 3.114922062911942e-05, + "loss": 0.0526, + "step": 128040 + }, + { + "epoch": 36.0, + "eval_loss": 0.10677393525838852, + "eval_runtime": 635.8282, + "eval_samples_per_second": 25.216, + "eval_steps_per_second": 0.79, + "eval_wer": 0.09673413126253873, + "step": 128052 + }, + { + "epoch": 36.01, + "learning_rate": 3.1130478243213696e-05, + "loss": 0.0513, + "step": 128070 + }, + { + "epoch": 36.01, + "learning_rate": 3.111173585730797e-05, + "loss": 0.0532, + "step": 128100 + }, + { + "epoch": 36.02, + "learning_rate": 3.1092993471402244e-05, + "loss": 0.0461, + "step": 128130 + }, + { + "epoch": 36.03, + "learning_rate": 3.107425108549652e-05, + "loss": 0.0604, + "step": 128160 + }, + { + "epoch": 36.04, + "learning_rate": 3.105550869959079e-05, + "loss": 0.0484, + "step": 128190 + }, + { + "epoch": 36.05, + "learning_rate": 3.103676631368507e-05, + "loss": 0.0542, + "step": 128220 + }, + { + "epoch": 36.06, + "learning_rate": 3.101802392777934e-05, + "loss": 0.0546, + "step": 128250 + }, + { + "epoch": 36.06, + "learning_rate": 3.0999281541873615e-05, + "loss": 0.0495, + "step": 128280 + }, + { + "epoch": 36.07, + "learning_rate": 3.098053915596789e-05, + "loss": 0.0558, + "step": 128310 + }, + { + "epoch": 36.08, + "learning_rate": 3.0961796770062163e-05, + "loss": 0.0449, + "step": 128340 + }, + { + "epoch": 36.09, + "learning_rate": 3.094305438415644e-05, + "loss": 0.0524, + "step": 128370 + }, + { + "epoch": 36.1, + "learning_rate": 3.092431199825071e-05, + "loss": 0.0563, + "step": 128400 + }, + { + "epoch": 36.11, + "learning_rate": 3.0905569612344986e-05, + "loss": 0.0479, + "step": 128430 + }, + { + "epoch": 36.11, + "learning_rate": 3.088682722643926e-05, + "loss": 0.0533, + "step": 128460 + }, + { + "epoch": 36.12, + "learning_rate": 3.0868084840533534e-05, + "loss": 0.0508, + "step": 128490 + }, + { + "epoch": 36.13, + "learning_rate": 3.084934245462781e-05, + "loss": 0.0524, + "step": 128520 + }, + { + "epoch": 36.14, + "learning_rate": 3.083060006872208e-05, + "loss": 0.051, + "step": 128550 + }, + { + "epoch": 36.15, + "learning_rate": 3.081185768281636e-05, + "loss": 0.0497, + "step": 128580 + }, + { + "epoch": 36.16, + "learning_rate": 3.079311529691063e-05, + "loss": 0.0569, + "step": 128610 + }, + { + "epoch": 36.17, + "learning_rate": 3.0774372911004905e-05, + "loss": 0.0478, + "step": 128640 + }, + { + "epoch": 36.17, + "learning_rate": 3.075563052509918e-05, + "loss": 0.0478, + "step": 128670 + }, + { + "epoch": 36.18, + "learning_rate": 3.0736888139193454e-05, + "loss": 0.0542, + "step": 128700 + }, + { + "epoch": 36.19, + "learning_rate": 3.071814575328773e-05, + "loss": 0.0496, + "step": 128730 + }, + { + "epoch": 36.2, + "learning_rate": 3.0699403367382e-05, + "loss": 0.0602, + "step": 128760 + }, + { + "epoch": 36.21, + "learning_rate": 3.0680660981476276e-05, + "loss": 0.049, + "step": 128790 + }, + { + "epoch": 36.22, + "learning_rate": 3.066191859557055e-05, + "loss": 0.0547, + "step": 128820 + }, + { + "epoch": 36.22, + "learning_rate": 3.0643176209664825e-05, + "loss": 0.0498, + "step": 128850 + }, + { + "epoch": 36.23, + "learning_rate": 3.06244338237591e-05, + "loss": 0.0482, + "step": 128880 + }, + { + "epoch": 36.24, + "learning_rate": 3.060569143785337e-05, + "loss": 0.0574, + "step": 128910 + }, + { + "epoch": 36.25, + "learning_rate": 3.058694905194765e-05, + "loss": 0.047, + "step": 128940 + }, + { + "epoch": 36.26, + "learning_rate": 3.056820666604192e-05, + "loss": 0.0539, + "step": 128970 + }, + { + "epoch": 36.27, + "learning_rate": 3.0549464280136196e-05, + "loss": 0.0493, + "step": 129000 + }, + { + "epoch": 36.27, + "learning_rate": 3.053072189423047e-05, + "loss": 0.0476, + "step": 129030 + }, + { + "epoch": 36.28, + "learning_rate": 3.0511979508324744e-05, + "loss": 0.0553, + "step": 129060 + }, + { + "epoch": 36.29, + "learning_rate": 3.0493237122419015e-05, + "loss": 0.0472, + "step": 129090 + }, + { + "epoch": 36.3, + "learning_rate": 3.0474494736513292e-05, + "loss": 0.0503, + "step": 129120 + }, + { + "epoch": 36.31, + "learning_rate": 3.045575235060757e-05, + "loss": 0.0538, + "step": 129150 + }, + { + "epoch": 36.32, + "learning_rate": 3.043700996470184e-05, + "loss": 0.0469, + "step": 129180 + }, + { + "epoch": 36.33, + "learning_rate": 3.041826757879612e-05, + "loss": 0.056, + "step": 129210 + }, + { + "epoch": 36.33, + "learning_rate": 3.039952519289039e-05, + "loss": 0.0484, + "step": 129240 + }, + { + "epoch": 36.34, + "learning_rate": 3.0380782806984663e-05, + "loss": 0.0519, + "step": 129270 + }, + { + "epoch": 36.35, + "learning_rate": 3.0362040421078934e-05, + "loss": 0.0566, + "step": 129300 + }, + { + "epoch": 36.36, + "learning_rate": 3.0343298035173212e-05, + "loss": 0.0472, + "step": 129330 + }, + { + "epoch": 36.37, + "learning_rate": 3.032455564926749e-05, + "loss": 0.057, + "step": 129360 + }, + { + "epoch": 36.38, + "learning_rate": 3.030581326336176e-05, + "loss": 0.0478, + "step": 129390 + }, + { + "epoch": 36.38, + "learning_rate": 3.0287070877456038e-05, + "loss": 0.0531, + "step": 129420 + }, + { + "epoch": 36.39, + "learning_rate": 3.0268953237747165e-05, + "loss": 0.055, + "step": 129450 + }, + { + "epoch": 36.4, + "learning_rate": 3.0250210851841443e-05, + "loss": 0.0496, + "step": 129480 + }, + { + "epoch": 36.41, + "learning_rate": 3.0231468465935713e-05, + "loss": 0.0548, + "step": 129510 + }, + { + "epoch": 36.42, + "learning_rate": 3.021272608002999e-05, + "loss": 0.0471, + "step": 129540 + }, + { + "epoch": 36.43, + "learning_rate": 3.0193983694124262e-05, + "loss": 0.0549, + "step": 129570 + }, + { + "epoch": 36.44, + "learning_rate": 3.017524130821854e-05, + "loss": 0.0539, + "step": 129600 + }, + { + "epoch": 36.44, + "learning_rate": 3.015649892231281e-05, + "loss": 0.0463, + "step": 129630 + }, + { + "epoch": 36.45, + "learning_rate": 3.0137756536407084e-05, + "loss": 0.0532, + "step": 129660 + }, + { + "epoch": 36.46, + "learning_rate": 3.0119014150501362e-05, + "loss": 0.0468, + "step": 129690 + }, + { + "epoch": 36.47, + "learning_rate": 3.0100271764595633e-05, + "loss": 0.0515, + "step": 129720 + }, + { + "epoch": 36.48, + "learning_rate": 3.008152937868991e-05, + "loss": 0.0571, + "step": 129750 + }, + { + "epoch": 36.49, + "learning_rate": 3.006278699278418e-05, + "loss": 0.0492, + "step": 129780 + }, + { + "epoch": 36.49, + "learning_rate": 3.004404460687846e-05, + "loss": 0.0551, + "step": 129810 + }, + { + "epoch": 36.5, + "learning_rate": 3.002530222097273e-05, + "loss": 0.0451, + "step": 129840 + }, + { + "epoch": 36.51, + "learning_rate": 3.0006559835067004e-05, + "loss": 0.0528, + "step": 129870 + }, + { + "epoch": 36.52, + "learning_rate": 2.998781744916128e-05, + "loss": 0.0566, + "step": 129900 + }, + { + "epoch": 36.53, + "learning_rate": 2.9969075063255552e-05, + "loss": 0.0464, + "step": 129930 + }, + { + "epoch": 36.54, + "learning_rate": 2.995033267734983e-05, + "loss": 0.0537, + "step": 129960 + }, + { + "epoch": 36.54, + "learning_rate": 2.99315902914441e-05, + "loss": 0.0489, + "step": 129990 + }, + { + "epoch": 36.55, + "learning_rate": 2.9912847905538378e-05, + "loss": 0.0522, + "step": 130020 + }, + { + "epoch": 36.56, + "learning_rate": 2.989410551963265e-05, + "loss": 0.0513, + "step": 130050 + }, + { + "epoch": 36.57, + "learning_rate": 2.9875363133726923e-05, + "loss": 0.0464, + "step": 130080 + }, + { + "epoch": 36.58, + "learning_rate": 2.98566207478212e-05, + "loss": 0.0558, + "step": 130110 + }, + { + "epoch": 36.59, + "learning_rate": 2.983787836191547e-05, + "loss": 0.0463, + "step": 130140 + }, + { + "epoch": 36.6, + "learning_rate": 2.981913597600975e-05, + "loss": 0.0536, + "step": 130170 + }, + { + "epoch": 36.6, + "learning_rate": 2.980039359010402e-05, + "loss": 0.0517, + "step": 130200 + }, + { + "epoch": 36.61, + "learning_rate": 2.9781651204198297e-05, + "loss": 0.049, + "step": 130230 + }, + { + "epoch": 36.62, + "learning_rate": 2.9762908818292568e-05, + "loss": 0.0582, + "step": 130260 + }, + { + "epoch": 36.63, + "learning_rate": 2.9744166432386842e-05, + "loss": 0.0475, + "step": 130290 + }, + { + "epoch": 36.64, + "learning_rate": 2.972542404648112e-05, + "loss": 0.0558, + "step": 130320 + }, + { + "epoch": 36.65, + "learning_rate": 2.970668166057539e-05, + "loss": 0.0496, + "step": 130350 + }, + { + "epoch": 36.65, + "learning_rate": 2.968793927466967e-05, + "loss": 0.0515, + "step": 130380 + }, + { + "epoch": 36.66, + "learning_rate": 2.966919688876394e-05, + "loss": 0.0581, + "step": 130410 + }, + { + "epoch": 36.67, + "learning_rate": 2.9650454502858217e-05, + "loss": 0.048, + "step": 130440 + }, + { + "epoch": 36.68, + "learning_rate": 2.9631712116952488e-05, + "loss": 0.0519, + "step": 130470 + }, + { + "epoch": 36.69, + "learning_rate": 2.9612969731046765e-05, + "loss": 0.048, + "step": 130500 + }, + { + "epoch": 36.7, + "learning_rate": 2.959422734514104e-05, + "loss": 0.0496, + "step": 130530 + }, + { + "epoch": 36.7, + "learning_rate": 2.957548495923531e-05, + "loss": 0.0532, + "step": 130560 + }, + { + "epoch": 36.71, + "learning_rate": 2.9556742573329588e-05, + "loss": 0.0505, + "step": 130590 + }, + { + "epoch": 36.72, + "learning_rate": 2.953800018742386e-05, + "loss": 0.0524, + "step": 130620 + }, + { + "epoch": 36.73, + "learning_rate": 2.9519257801518136e-05, + "loss": 0.052, + "step": 130650 + }, + { + "epoch": 36.74, + "learning_rate": 2.9500515415612407e-05, + "loss": 0.0498, + "step": 130680 + }, + { + "epoch": 36.75, + "learning_rate": 2.9481773029706685e-05, + "loss": 0.0565, + "step": 130710 + }, + { + "epoch": 36.76, + "learning_rate": 2.946303064380096e-05, + "loss": 0.0473, + "step": 130740 + }, + { + "epoch": 36.76, + "learning_rate": 2.944428825789523e-05, + "loss": 0.0503, + "step": 130770 + }, + { + "epoch": 36.77, + "learning_rate": 2.9425545871989507e-05, + "loss": 0.0535, + "step": 130800 + }, + { + "epoch": 36.78, + "learning_rate": 2.9406803486083778e-05, + "loss": 0.0491, + "step": 130830 + }, + { + "epoch": 36.79, + "learning_rate": 2.9388061100178055e-05, + "loss": 0.0521, + "step": 130860 + }, + { + "epoch": 36.8, + "learning_rate": 2.9369318714272326e-05, + "loss": 0.0443, + "step": 130890 + }, + { + "epoch": 36.81, + "learning_rate": 2.9350576328366604e-05, + "loss": 0.0538, + "step": 130920 + }, + { + "epoch": 36.81, + "learning_rate": 2.9331833942460878e-05, + "loss": 0.0522, + "step": 130950 + }, + { + "epoch": 36.82, + "learning_rate": 2.931309155655515e-05, + "loss": 0.0501, + "step": 130980 + }, + { + "epoch": 36.83, + "learning_rate": 2.9294349170649426e-05, + "loss": 0.0568, + "step": 131010 + }, + { + "epoch": 36.84, + "learning_rate": 2.9275606784743697e-05, + "loss": 0.0475, + "step": 131040 + }, + { + "epoch": 36.85, + "learning_rate": 2.9256864398837975e-05, + "loss": 0.0505, + "step": 131070 + }, + { + "epoch": 36.86, + "learning_rate": 2.9238746759129106e-05, + "loss": 0.0537, + "step": 131100 + }, + { + "epoch": 36.87, + "learning_rate": 2.922000437322338e-05, + "loss": 0.0494, + "step": 131130 + }, + { + "epoch": 36.87, + "learning_rate": 2.920126198731765e-05, + "loss": 0.0543, + "step": 131160 + }, + { + "epoch": 36.88, + "learning_rate": 2.9182519601411928e-05, + "loss": 0.0461, + "step": 131190 + }, + { + "epoch": 36.89, + "learning_rate": 2.91637772155062e-05, + "loss": 0.0523, + "step": 131220 + }, + { + "epoch": 36.9, + "learning_rate": 2.9145034829600477e-05, + "loss": 0.0496, + "step": 131250 + }, + { + "epoch": 36.91, + "learning_rate": 2.9126292443694754e-05, + "loss": 0.0478, + "step": 131280 + }, + { + "epoch": 36.92, + "learning_rate": 2.9107550057789025e-05, + "loss": 0.054, + "step": 131310 + }, + { + "epoch": 36.92, + "learning_rate": 2.90888076718833e-05, + "loss": 0.0467, + "step": 131340 + }, + { + "epoch": 36.93, + "learning_rate": 2.907006528597757e-05, + "loss": 0.0542, + "step": 131370 + }, + { + "epoch": 36.94, + "learning_rate": 2.9051322900071848e-05, + "loss": 0.0543, + "step": 131400 + }, + { + "epoch": 36.95, + "learning_rate": 2.903258051416612e-05, + "loss": 0.0491, + "step": 131430 + }, + { + "epoch": 36.96, + "learning_rate": 2.9013838128260396e-05, + "loss": 0.0573, + "step": 131460 + }, + { + "epoch": 36.97, + "learning_rate": 2.8995095742354673e-05, + "loss": 0.0478, + "step": 131490 + }, + { + "epoch": 36.97, + "learning_rate": 2.8976353356448944e-05, + "loss": 0.0549, + "step": 131520 + }, + { + "epoch": 36.98, + "learning_rate": 2.895761097054322e-05, + "loss": 0.0558, + "step": 131550 + }, + { + "epoch": 36.99, + "learning_rate": 2.893886858463749e-05, + "loss": 0.0487, + "step": 131580 + }, + { + "epoch": 37.0, + "eval_loss": 0.10814538598060608, + "eval_runtime": 637.0458, + "eval_samples_per_second": 25.168, + "eval_steps_per_second": 0.788, + "eval_wer": 0.09662495052747942, + "step": 131609 + }, + { + "epoch": 37.0, + "learning_rate": 2.8920126198731767e-05, + "loss": 0.0589, + "step": 131610 + }, + { + "epoch": 37.01, + "learning_rate": 2.8901383812826038e-05, + "loss": 0.0479, + "step": 131640 + }, + { + "epoch": 37.02, + "learning_rate": 2.8882641426920315e-05, + "loss": 0.0533, + "step": 131670 + }, + { + "epoch": 37.03, + "learning_rate": 2.8863899041014593e-05, + "loss": 0.0463, + "step": 131700 + }, + { + "epoch": 37.03, + "learning_rate": 2.8845156655108864e-05, + "loss": 0.048, + "step": 131730 + }, + { + "epoch": 37.04, + "learning_rate": 2.8826414269203138e-05, + "loss": 0.0577, + "step": 131760 + }, + { + "epoch": 37.05, + "learning_rate": 2.880767188329741e-05, + "loss": 0.0447, + "step": 131790 + }, + { + "epoch": 37.06, + "learning_rate": 2.8788929497391686e-05, + "loss": 0.0561, + "step": 131820 + }, + { + "epoch": 37.07, + "learning_rate": 2.8770187111485957e-05, + "loss": 0.0476, + "step": 131850 + }, + { + "epoch": 37.08, + "learning_rate": 2.8751444725580235e-05, + "loss": 0.0488, + "step": 131880 + }, + { + "epoch": 37.08, + "learning_rate": 2.8732702339674512e-05, + "loss": 0.0553, + "step": 131910 + }, + { + "epoch": 37.09, + "learning_rate": 2.8713959953768783e-05, + "loss": 0.0465, + "step": 131940 + }, + { + "epoch": 37.1, + "learning_rate": 2.8695217567863057e-05, + "loss": 0.054, + "step": 131970 + }, + { + "epoch": 37.11, + "learning_rate": 2.8676475181957328e-05, + "loss": 0.0475, + "step": 132000 + }, + { + "epoch": 37.12, + "learning_rate": 2.8657732796051606e-05, + "loss": 0.0514, + "step": 132030 + }, + { + "epoch": 37.13, + "learning_rate": 2.8638990410145876e-05, + "loss": 0.0529, + "step": 132060 + }, + { + "epoch": 37.14, + "learning_rate": 2.8620248024240154e-05, + "loss": 0.0458, + "step": 132090 + }, + { + "epoch": 37.14, + "learning_rate": 2.860150563833443e-05, + "loss": 0.0527, + "step": 132120 + }, + { + "epoch": 37.15, + "learning_rate": 2.8582763252428702e-05, + "loss": 0.0462, + "step": 132150 + }, + { + "epoch": 37.16, + "learning_rate": 2.8564020866522976e-05, + "loss": 0.0492, + "step": 132180 + }, + { + "epoch": 37.17, + "learning_rate": 2.854527848061725e-05, + "loss": 0.0535, + "step": 132210 + }, + { + "epoch": 37.18, + "learning_rate": 2.8526536094711525e-05, + "loss": 0.047, + "step": 132240 + }, + { + "epoch": 37.19, + "learning_rate": 2.8507793708805796e-05, + "loss": 0.0499, + "step": 132270 + }, + { + "epoch": 37.19, + "learning_rate": 2.8489051322900073e-05, + "loss": 0.0492, + "step": 132300 + }, + { + "epoch": 37.2, + "learning_rate": 2.847030893699435e-05, + "loss": 0.0496, + "step": 132330 + }, + { + "epoch": 37.21, + "learning_rate": 2.845156655108862e-05, + "loss": 0.053, + "step": 132360 + }, + { + "epoch": 37.22, + "learning_rate": 2.8432824165182896e-05, + "loss": 0.0445, + "step": 132390 + }, + { + "epoch": 37.23, + "learning_rate": 2.841408177927717e-05, + "loss": 0.054, + "step": 132420 + }, + { + "epoch": 37.24, + "learning_rate": 2.8395339393371444e-05, + "loss": 0.0484, + "step": 132450 + }, + { + "epoch": 37.24, + "learning_rate": 2.8376597007465715e-05, + "loss": 0.0499, + "step": 132480 + }, + { + "epoch": 37.25, + "learning_rate": 2.8357854621559993e-05, + "loss": 0.0586, + "step": 132510 + }, + { + "epoch": 37.26, + "learning_rate": 2.833911223565427e-05, + "loss": 0.0434, + "step": 132540 + }, + { + "epoch": 37.27, + "learning_rate": 2.832036984974854e-05, + "loss": 0.0539, + "step": 132570 + }, + { + "epoch": 37.28, + "learning_rate": 2.830162746384282e-05, + "loss": 0.0495, + "step": 132600 + }, + { + "epoch": 37.29, + "learning_rate": 2.828288507793709e-05, + "loss": 0.0525, + "step": 132630 + }, + { + "epoch": 37.3, + "learning_rate": 2.8264142692031364e-05, + "loss": 0.0548, + "step": 132660 + }, + { + "epoch": 37.3, + "learning_rate": 2.8245400306125634e-05, + "loss": 0.0429, + "step": 132690 + }, + { + "epoch": 37.31, + "learning_rate": 2.8226657920219912e-05, + "loss": 0.0552, + "step": 132720 + }, + { + "epoch": 37.32, + "learning_rate": 2.820791553431419e-05, + "loss": 0.0485, + "step": 132750 + }, + { + "epoch": 37.33, + "learning_rate": 2.818917314840846e-05, + "loss": 0.0488, + "step": 132780 + }, + { + "epoch": 37.34, + "learning_rate": 2.8170430762502738e-05, + "loss": 0.0592, + "step": 132810 + }, + { + "epoch": 37.35, + "learning_rate": 2.815168837659701e-05, + "loss": 0.0448, + "step": 132840 + }, + { + "epoch": 37.35, + "learning_rate": 2.8132945990691283e-05, + "loss": 0.0562, + "step": 132870 + }, + { + "epoch": 37.36, + "learning_rate": 2.8114203604785554e-05, + "loss": 0.0467, + "step": 132900 + }, + { + "epoch": 37.37, + "learning_rate": 2.809546121887983e-05, + "loss": 0.0519, + "step": 132930 + }, + { + "epoch": 37.38, + "learning_rate": 2.807671883297411e-05, + "loss": 0.0532, + "step": 132960 + }, + { + "epoch": 37.39, + "learning_rate": 2.805797644706838e-05, + "loss": 0.0442, + "step": 132990 + }, + { + "epoch": 37.4, + "learning_rate": 2.8039234061162657e-05, + "loss": 0.052, + "step": 133020 + }, + { + "epoch": 37.41, + "learning_rate": 2.8020491675256928e-05, + "loss": 0.0474, + "step": 133050 + }, + { + "epoch": 37.41, + "learning_rate": 2.8001749289351202e-05, + "loss": 0.0509, + "step": 133080 + }, + { + "epoch": 37.42, + "learning_rate": 2.7983006903445473e-05, + "loss": 0.0553, + "step": 133110 + }, + { + "epoch": 37.43, + "learning_rate": 2.796426451753975e-05, + "loss": 0.0439, + "step": 133140 + }, + { + "epoch": 37.44, + "learning_rate": 2.794614687783088e-05, + "loss": 0.0561, + "step": 133170 + }, + { + "epoch": 37.45, + "learning_rate": 2.792740449192516e-05, + "loss": 0.0503, + "step": 133200 + }, + { + "epoch": 37.46, + "learning_rate": 2.790866210601943e-05, + "loss": 0.0514, + "step": 133230 + }, + { + "epoch": 37.46, + "learning_rate": 2.7889919720113704e-05, + "loss": 0.0523, + "step": 133260 + }, + { + "epoch": 37.47, + "learning_rate": 2.787117733420798e-05, + "loss": 0.044, + "step": 133290 + }, + { + "epoch": 37.48, + "learning_rate": 2.7852434948302252e-05, + "loss": 0.052, + "step": 133320 + }, + { + "epoch": 37.49, + "learning_rate": 2.783369256239653e-05, + "loss": 0.0482, + "step": 133350 + }, + { + "epoch": 37.5, + "learning_rate": 2.78149501764908e-05, + "loss": 0.0521, + "step": 133380 + }, + { + "epoch": 37.51, + "learning_rate": 2.7796207790585078e-05, + "loss": 0.054, + "step": 133410 + }, + { + "epoch": 37.51, + "learning_rate": 2.777746540467935e-05, + "loss": 0.0438, + "step": 133440 + }, + { + "epoch": 37.52, + "learning_rate": 2.7758723018773623e-05, + "loss": 0.055, + "step": 133470 + }, + { + "epoch": 37.53, + "learning_rate": 2.77399806328679e-05, + "loss": 0.0471, + "step": 133500 + }, + { + "epoch": 37.54, + "learning_rate": 2.772123824696217e-05, + "loss": 0.0511, + "step": 133530 + }, + { + "epoch": 37.55, + "learning_rate": 2.770249586105645e-05, + "loss": 0.0517, + "step": 133560 + }, + { + "epoch": 37.56, + "learning_rate": 2.768375347515072e-05, + "loss": 0.0432, + "step": 133590 + }, + { + "epoch": 37.57, + "learning_rate": 2.7665011089244998e-05, + "loss": 0.0514, + "step": 133620 + }, + { + "epoch": 37.57, + "learning_rate": 2.764626870333927e-05, + "loss": 0.0469, + "step": 133650 + }, + { + "epoch": 37.58, + "learning_rate": 2.7627526317433543e-05, + "loss": 0.0526, + "step": 133680 + }, + { + "epoch": 37.59, + "learning_rate": 2.760878393152782e-05, + "loss": 0.0558, + "step": 133710 + }, + { + "epoch": 37.6, + "learning_rate": 2.759004154562209e-05, + "loss": 0.0444, + "step": 133740 + }, + { + "epoch": 37.61, + "learning_rate": 2.757129915971637e-05, + "loss": 0.0545, + "step": 133770 + }, + { + "epoch": 37.62, + "learning_rate": 2.755255677381064e-05, + "loss": 0.0502, + "step": 133800 + }, + { + "epoch": 37.62, + "learning_rate": 2.7533814387904917e-05, + "loss": 0.0506, + "step": 133830 + }, + { + "epoch": 37.63, + "learning_rate": 2.7515072001999188e-05, + "loss": 0.0556, + "step": 133860 + }, + { + "epoch": 37.64, + "learning_rate": 2.7496329616093462e-05, + "loss": 0.0459, + "step": 133890 + }, + { + "epoch": 37.65, + "learning_rate": 2.747758723018774e-05, + "loss": 0.0527, + "step": 133920 + }, + { + "epoch": 37.66, + "learning_rate": 2.745884484428201e-05, + "loss": 0.0477, + "step": 133950 + }, + { + "epoch": 37.67, + "learning_rate": 2.7440102458376288e-05, + "loss": 0.0496, + "step": 133980 + }, + { + "epoch": 37.67, + "learning_rate": 2.742136007247056e-05, + "loss": 0.0527, + "step": 134010 + }, + { + "epoch": 37.68, + "learning_rate": 2.7402617686564836e-05, + "loss": 0.0431, + "step": 134040 + }, + { + "epoch": 37.69, + "learning_rate": 2.7383875300659107e-05, + "loss": 0.0526, + "step": 134070 + }, + { + "epoch": 37.7, + "learning_rate": 2.7365132914753385e-05, + "loss": 0.0458, + "step": 134100 + }, + { + "epoch": 37.71, + "learning_rate": 2.734639052884766e-05, + "loss": 0.052, + "step": 134130 + }, + { + "epoch": 37.72, + "learning_rate": 2.732764814294193e-05, + "loss": 0.0559, + "step": 134160 + }, + { + "epoch": 37.73, + "learning_rate": 2.7308905757036207e-05, + "loss": 0.045, + "step": 134190 + }, + { + "epoch": 37.73, + "learning_rate": 2.7290163371130478e-05, + "loss": 0.0549, + "step": 134220 + }, + { + "epoch": 37.74, + "learning_rate": 2.7271420985224756e-05, + "loss": 0.0464, + "step": 134250 + }, + { + "epoch": 37.75, + "learning_rate": 2.7252678599319026e-05, + "loss": 0.054, + "step": 134280 + }, + { + "epoch": 37.76, + "learning_rate": 2.7233936213413304e-05, + "loss": 0.0567, + "step": 134310 + }, + { + "epoch": 37.77, + "learning_rate": 2.7215193827507578e-05, + "loss": 0.0458, + "step": 134340 + }, + { + "epoch": 37.78, + "learning_rate": 2.719645144160185e-05, + "loss": 0.0567, + "step": 134370 + }, + { + "epoch": 37.78, + "learning_rate": 2.7177709055696127e-05, + "loss": 0.0451, + "step": 134400 + }, + { + "epoch": 37.79, + "learning_rate": 2.7158966669790397e-05, + "loss": 0.0499, + "step": 134430 + }, + { + "epoch": 37.8, + "learning_rate": 2.7140224283884675e-05, + "loss": 0.0555, + "step": 134460 + }, + { + "epoch": 37.81, + "learning_rate": 2.7121481897978946e-05, + "loss": 0.0448, + "step": 134490 + }, + { + "epoch": 37.82, + "learning_rate": 2.7102739512073223e-05, + "loss": 0.0525, + "step": 134520 + }, + { + "epoch": 37.83, + "learning_rate": 2.7083997126167498e-05, + "loss": 0.0479, + "step": 134550 + }, + { + "epoch": 37.84, + "learning_rate": 2.706525474026177e-05, + "loss": 0.0523, + "step": 134580 + }, + { + "epoch": 37.84, + "learning_rate": 2.7046512354356046e-05, + "loss": 0.0534, + "step": 134610 + }, + { + "epoch": 37.85, + "learning_rate": 2.7027769968450317e-05, + "loss": 0.0463, + "step": 134640 + }, + { + "epoch": 37.86, + "learning_rate": 2.7009027582544594e-05, + "loss": 0.054, + "step": 134670 + }, + { + "epoch": 37.87, + "learning_rate": 2.6990285196638865e-05, + "loss": 0.0463, + "step": 134700 + }, + { + "epoch": 37.88, + "learning_rate": 2.6971542810733143e-05, + "loss": 0.0491, + "step": 134730 + }, + { + "epoch": 37.89, + "learning_rate": 2.6952800424827413e-05, + "loss": 0.0543, + "step": 134760 + }, + { + "epoch": 37.89, + "learning_rate": 2.6934058038921688e-05, + "loss": 0.043, + "step": 134790 + }, + { + "epoch": 37.9, + "learning_rate": 2.6915315653015965e-05, + "loss": 0.0539, + "step": 134820 + }, + { + "epoch": 37.91, + "learning_rate": 2.6896573267110236e-05, + "loss": 0.0457, + "step": 134850 + }, + { + "epoch": 37.92, + "learning_rate": 2.6877830881204514e-05, + "loss": 0.054, + "step": 134880 + }, + { + "epoch": 37.93, + "learning_rate": 2.6859088495298784e-05, + "loss": 0.053, + "step": 134910 + }, + { + "epoch": 37.94, + "learning_rate": 2.6840346109393062e-05, + "loss": 0.0456, + "step": 134940 + }, + { + "epoch": 37.94, + "learning_rate": 2.6821603723487333e-05, + "loss": 0.0602, + "step": 134970 + }, + { + "epoch": 37.95, + "learning_rate": 2.6802861337581607e-05, + "loss": 0.0468, + "step": 135000 + }, + { + "epoch": 37.96, + "learning_rate": 2.6784118951675885e-05, + "loss": 0.0524, + "step": 135030 + }, + { + "epoch": 37.97, + "learning_rate": 2.6765376565770155e-05, + "loss": 0.0577, + "step": 135060 + }, + { + "epoch": 37.98, + "learning_rate": 2.6746634179864433e-05, + "loss": 0.0447, + "step": 135090 + }, + { + "epoch": 37.99, + "learning_rate": 2.6727891793958704e-05, + "loss": 0.0546, + "step": 135120 + }, + { + "epoch": 38.0, + "learning_rate": 2.670914940805298e-05, + "loss": 0.0495, + "step": 135150 + }, + { + "epoch": 38.0, + "eval_loss": 0.1098802462220192, + "eval_runtime": 637.127, + "eval_samples_per_second": 25.165, + "eval_steps_per_second": 0.788, + "eval_wer": 0.09562867632006332, + "step": 135166 + }, + { + "epoch": 38.0, + "learning_rate": 2.6690407022147252e-05, + "loss": 0.052, + "step": 135180 + }, + { + "epoch": 38.01, + "learning_rate": 2.6671664636241526e-05, + "loss": 0.049, + "step": 135210 + }, + { + "epoch": 38.02, + "learning_rate": 2.6652922250335804e-05, + "loss": 0.0482, + "step": 135240 + }, + { + "epoch": 38.03, + "learning_rate": 2.6634179864430075e-05, + "loss": 0.0553, + "step": 135270 + }, + { + "epoch": 38.04, + "learning_rate": 2.6615437478524352e-05, + "loss": 0.0441, + "step": 135300 + }, + { + "epoch": 38.05, + "learning_rate": 2.6596695092618623e-05, + "loss": 0.0528, + "step": 135330 + }, + { + "epoch": 38.05, + "learning_rate": 2.65779527067129e-05, + "loss": 0.051, + "step": 135360 + }, + { + "epoch": 38.06, + "learning_rate": 2.655921032080717e-05, + "loss": 0.052, + "step": 135390 + }, + { + "epoch": 38.07, + "learning_rate": 2.6540467934901446e-05, + "loss": 0.0558, + "step": 135420 + }, + { + "epoch": 38.08, + "learning_rate": 2.6521725548995723e-05, + "loss": 0.0429, + "step": 135450 + }, + { + "epoch": 38.09, + "learning_rate": 2.6502983163089994e-05, + "loss": 0.0495, + "step": 135480 + }, + { + "epoch": 38.1, + "learning_rate": 2.648424077718427e-05, + "loss": 0.0512, + "step": 135510 + }, + { + "epoch": 38.11, + "learning_rate": 2.6465498391278542e-05, + "loss": 0.0514, + "step": 135540 + }, + { + "epoch": 38.11, + "learning_rate": 2.644675600537282e-05, + "loss": 0.0523, + "step": 135570 + }, + { + "epoch": 38.12, + "learning_rate": 2.642801361946709e-05, + "loss": 0.0454, + "step": 135600 + }, + { + "epoch": 38.13, + "learning_rate": 2.640927123356137e-05, + "loss": 0.0533, + "step": 135630 + }, + { + "epoch": 38.14, + "learning_rate": 2.6390528847655643e-05, + "loss": 0.0502, + "step": 135660 + }, + { + "epoch": 38.15, + "learning_rate": 2.6371786461749913e-05, + "loss": 0.0519, + "step": 135690 + }, + { + "epoch": 38.16, + "learning_rate": 2.635304407584419e-05, + "loss": 0.0581, + "step": 135720 + }, + { + "epoch": 38.16, + "learning_rate": 2.6334301689938462e-05, + "loss": 0.046, + "step": 135750 + }, + { + "epoch": 38.17, + "learning_rate": 2.631555930403274e-05, + "loss": 0.0523, + "step": 135780 + }, + { + "epoch": 38.18, + "learning_rate": 2.629681691812701e-05, + "loss": 0.0493, + "step": 135810 + }, + { + "epoch": 38.19, + "learning_rate": 2.6278074532221288e-05, + "loss": 0.049, + "step": 135840 + }, + { + "epoch": 38.2, + "learning_rate": 2.6259332146315562e-05, + "loss": 0.0556, + "step": 135870 + }, + { + "epoch": 38.21, + "learning_rate": 2.6240589760409833e-05, + "loss": 0.0444, + "step": 135900 + }, + { + "epoch": 38.21, + "learning_rate": 2.622184737450411e-05, + "loss": 0.0517, + "step": 135930 + }, + { + "epoch": 38.22, + "learning_rate": 2.620310498859838e-05, + "loss": 0.047, + "step": 135960 + }, + { + "epoch": 38.23, + "learning_rate": 2.618436260269266e-05, + "loss": 0.051, + "step": 135990 + }, + { + "epoch": 38.24, + "learning_rate": 2.616562021678693e-05, + "loss": 0.0575, + "step": 136020 + }, + { + "epoch": 38.25, + "learning_rate": 2.6146877830881207e-05, + "loss": 0.0442, + "step": 136050 + }, + { + "epoch": 38.26, + "learning_rate": 2.612813544497548e-05, + "loss": 0.0539, + "step": 136080 + }, + { + "epoch": 38.27, + "learning_rate": 2.6109393059069752e-05, + "loss": 0.0468, + "step": 136110 + }, + { + "epoch": 38.27, + "learning_rate": 2.609065067316403e-05, + "loss": 0.0506, + "step": 136140 + }, + { + "epoch": 38.28, + "learning_rate": 2.60719082872583e-05, + "loss": 0.0533, + "step": 136170 + }, + { + "epoch": 38.29, + "learning_rate": 2.6053165901352578e-05, + "loss": 0.0438, + "step": 136200 + }, + { + "epoch": 38.3, + "learning_rate": 2.603442351544685e-05, + "loss": 0.052, + "step": 136230 + }, + { + "epoch": 38.31, + "learning_rate": 2.6015681129541126e-05, + "loss": 0.048, + "step": 136260 + }, + { + "epoch": 38.32, + "learning_rate": 2.59969387436354e-05, + "loss": 0.0481, + "step": 136290 + }, + { + "epoch": 38.32, + "learning_rate": 2.597819635772967e-05, + "loss": 0.0495, + "step": 136320 + }, + { + "epoch": 38.33, + "learning_rate": 2.595945397182395e-05, + "loss": 0.0414, + "step": 136350 + }, + { + "epoch": 38.34, + "learning_rate": 2.594071158591822e-05, + "loss": 0.0542, + "step": 136380 + }, + { + "epoch": 38.35, + "learning_rate": 2.5921969200012497e-05, + "loss": 0.0479, + "step": 136410 + }, + { + "epoch": 38.36, + "learning_rate": 2.5903226814106768e-05, + "loss": 0.0471, + "step": 136440 + }, + { + "epoch": 38.37, + "learning_rate": 2.5884484428201046e-05, + "loss": 0.0562, + "step": 136470 + }, + { + "epoch": 38.37, + "learning_rate": 2.586574204229532e-05, + "loss": 0.0458, + "step": 136500 + }, + { + "epoch": 38.38, + "learning_rate": 2.584699965638959e-05, + "loss": 0.054, + "step": 136530 + }, + { + "epoch": 38.39, + "learning_rate": 2.582825727048387e-05, + "loss": 0.0503, + "step": 136560 + }, + { + "epoch": 38.4, + "learning_rate": 2.580951488457814e-05, + "loss": 0.0487, + "step": 136590 + }, + { + "epoch": 38.41, + "learning_rate": 2.5790772498672417e-05, + "loss": 0.051, + "step": 136620 + }, + { + "epoch": 38.42, + "learning_rate": 2.5772030112766688e-05, + "loss": 0.0447, + "step": 136650 + }, + { + "epoch": 38.43, + "learning_rate": 2.5753287726860965e-05, + "loss": 0.056, + "step": 136680 + }, + { + "epoch": 38.43, + "learning_rate": 2.573454534095524e-05, + "loss": 0.051, + "step": 136710 + }, + { + "epoch": 38.44, + "learning_rate": 2.571580295504951e-05, + "loss": 0.0496, + "step": 136740 + }, + { + "epoch": 38.45, + "learning_rate": 2.5697060569143788e-05, + "loss": 0.0507, + "step": 136770 + }, + { + "epoch": 38.46, + "learning_rate": 2.567831818323806e-05, + "loss": 0.044, + "step": 136800 + }, + { + "epoch": 38.47, + "learning_rate": 2.5659575797332336e-05, + "loss": 0.0494, + "step": 136830 + }, + { + "epoch": 38.48, + "learning_rate": 2.5640833411426607e-05, + "loss": 0.0449, + "step": 136860 + }, + { + "epoch": 38.48, + "learning_rate": 2.5622091025520884e-05, + "loss": 0.0472, + "step": 136890 + }, + { + "epoch": 38.49, + "learning_rate": 2.560334863961516e-05, + "loss": 0.0534, + "step": 136920 + }, + { + "epoch": 38.5, + "learning_rate": 2.558460625370943e-05, + "loss": 0.0444, + "step": 136950 + }, + { + "epoch": 38.51, + "learning_rate": 2.5565863867803707e-05, + "loss": 0.0541, + "step": 136980 + }, + { + "epoch": 38.52, + "learning_rate": 2.5547121481897978e-05, + "loss": 0.0465, + "step": 137010 + }, + { + "epoch": 38.53, + "learning_rate": 2.5528379095992255e-05, + "loss": 0.05, + "step": 137040 + }, + { + "epoch": 38.54, + "learning_rate": 2.5509636710086526e-05, + "loss": 0.0532, + "step": 137070 + }, + { + "epoch": 38.54, + "learning_rate": 2.5490894324180804e-05, + "loss": 0.0436, + "step": 137100 + }, + { + "epoch": 38.55, + "learning_rate": 2.5472151938275078e-05, + "loss": 0.0514, + "step": 137130 + }, + { + "epoch": 38.56, + "learning_rate": 2.5453409552369352e-05, + "loss": 0.0508, + "step": 137160 + }, + { + "epoch": 38.57, + "learning_rate": 2.5434667166463626e-05, + "loss": 0.0493, + "step": 137190 + }, + { + "epoch": 38.58, + "learning_rate": 2.5415924780557897e-05, + "loss": 0.05, + "step": 137220 + }, + { + "epoch": 38.59, + "learning_rate": 2.5397182394652175e-05, + "loss": 0.0418, + "step": 137250 + }, + { + "epoch": 38.59, + "learning_rate": 2.5378440008746446e-05, + "loss": 0.0512, + "step": 137280 + }, + { + "epoch": 38.6, + "learning_rate": 2.5359697622840723e-05, + "loss": 0.0473, + "step": 137310 + }, + { + "epoch": 38.61, + "learning_rate": 2.5340955236934997e-05, + "loss": 0.0474, + "step": 137340 + }, + { + "epoch": 38.62, + "learning_rate": 2.532221285102927e-05, + "loss": 0.0537, + "step": 137370 + }, + { + "epoch": 38.63, + "learning_rate": 2.5303470465123546e-05, + "loss": 0.0508, + "step": 137400 + }, + { + "epoch": 38.64, + "learning_rate": 2.5284728079217816e-05, + "loss": 0.0531, + "step": 137430 + }, + { + "epoch": 38.64, + "learning_rate": 2.5265985693312094e-05, + "loss": 0.049, + "step": 137460 + }, + { + "epoch": 38.65, + "learning_rate": 2.5247243307406365e-05, + "loss": 0.0497, + "step": 137490 + }, + { + "epoch": 38.66, + "learning_rate": 2.5228500921500642e-05, + "loss": 0.0526, + "step": 137520 + }, + { + "epoch": 38.67, + "learning_rate": 2.520975853559492e-05, + "loss": 0.0469, + "step": 137550 + }, + { + "epoch": 38.68, + "learning_rate": 2.519101614968919e-05, + "loss": 0.0548, + "step": 137580 + }, + { + "epoch": 38.69, + "learning_rate": 2.5172273763783465e-05, + "loss": 0.048, + "step": 137610 + }, + { + "epoch": 38.7, + "learning_rate": 2.5153531377877736e-05, + "loss": 0.0488, + "step": 137640 + }, + { + "epoch": 38.7, + "learning_rate": 2.5134788991972013e-05, + "loss": 0.0507, + "step": 137670 + }, + { + "epoch": 38.71, + "learning_rate": 2.5116046606066284e-05, + "loss": 0.0436, + "step": 137700 + }, + { + "epoch": 38.72, + "learning_rate": 2.5097304220160562e-05, + "loss": 0.05, + "step": 137730 + }, + { + "epoch": 38.73, + "learning_rate": 2.507856183425484e-05, + "loss": 0.0472, + "step": 137760 + }, + { + "epoch": 38.74, + "learning_rate": 2.505981944834911e-05, + "loss": 0.0484, + "step": 137790 + }, + { + "epoch": 38.75, + "learning_rate": 2.5041077062443384e-05, + "loss": 0.0549, + "step": 137820 + }, + { + "epoch": 38.75, + "learning_rate": 2.5022334676537655e-05, + "loss": 0.0427, + "step": 137850 + }, + { + "epoch": 38.76, + "learning_rate": 2.5003592290631933e-05, + "loss": 0.049, + "step": 137880 + }, + { + "epoch": 38.77, + "learning_rate": 2.4984849904726207e-05, + "loss": 0.0511, + "step": 137910 + }, + { + "epoch": 38.78, + "learning_rate": 2.496610751882048e-05, + "loss": 0.0531, + "step": 137940 + }, + { + "epoch": 38.79, + "learning_rate": 2.4947365132914755e-05, + "loss": 0.0552, + "step": 137970 + }, + { + "epoch": 38.8, + "learning_rate": 2.492862274700903e-05, + "loss": 0.0423, + "step": 138000 + }, + { + "epoch": 38.81, + "learning_rate": 2.4909880361103304e-05, + "loss": 0.0531, + "step": 138030 + }, + { + "epoch": 38.81, + "learning_rate": 2.4891137975197574e-05, + "loss": 0.0495, + "step": 138060 + }, + { + "epoch": 38.82, + "learning_rate": 2.4872395589291852e-05, + "loss": 0.0525, + "step": 138090 + }, + { + "epoch": 38.83, + "learning_rate": 2.4853653203386126e-05, + "loss": 0.0569, + "step": 138120 + }, + { + "epoch": 38.84, + "learning_rate": 2.48349108174804e-05, + "loss": 0.0427, + "step": 138150 + }, + { + "epoch": 38.85, + "learning_rate": 2.4816168431574675e-05, + "loss": 0.0517, + "step": 138180 + }, + { + "epoch": 38.86, + "learning_rate": 2.479742604566895e-05, + "loss": 0.0502, + "step": 138210 + }, + { + "epoch": 38.86, + "learning_rate": 2.4778683659763223e-05, + "loss": 0.0503, + "step": 138240 + }, + { + "epoch": 38.87, + "learning_rate": 2.4759941273857494e-05, + "loss": 0.0548, + "step": 138270 + }, + { + "epoch": 38.88, + "learning_rate": 2.474119888795177e-05, + "loss": 0.0434, + "step": 138300 + }, + { + "epoch": 38.89, + "learning_rate": 2.4722456502046046e-05, + "loss": 0.0521, + "step": 138330 + }, + { + "epoch": 38.9, + "learning_rate": 2.470371411614032e-05, + "loss": 0.0496, + "step": 138360 + }, + { + "epoch": 38.91, + "learning_rate": 2.4684971730234594e-05, + "loss": 0.0475, + "step": 138390 + }, + { + "epoch": 38.91, + "learning_rate": 2.4666229344328868e-05, + "loss": 0.0546, + "step": 138420 + }, + { + "epoch": 38.92, + "learning_rate": 2.4647486958423142e-05, + "loss": 0.0424, + "step": 138450 + }, + { + "epoch": 38.93, + "learning_rate": 2.4628744572517417e-05, + "loss": 0.049, + "step": 138480 + }, + { + "epoch": 38.94, + "learning_rate": 2.461000218661169e-05, + "loss": 0.0477, + "step": 138510 + }, + { + "epoch": 38.95, + "learning_rate": 2.4591259800705965e-05, + "loss": 0.049, + "step": 138540 + }, + { + "epoch": 38.96, + "learning_rate": 2.457251741480024e-05, + "loss": 0.0525, + "step": 138570 + }, + { + "epoch": 38.97, + "learning_rate": 2.4553775028894513e-05, + "loss": 0.0475, + "step": 138600 + }, + { + "epoch": 38.97, + "learning_rate": 2.4535032642988787e-05, + "loss": 0.0506, + "step": 138630 + }, + { + "epoch": 38.98, + "learning_rate": 2.451629025708306e-05, + "loss": 0.0492, + "step": 138660 + }, + { + "epoch": 38.99, + "learning_rate": 2.4497547871177336e-05, + "loss": 0.0504, + "step": 138690 + }, + { + "epoch": 39.0, + "learning_rate": 2.447880548527161e-05, + "loss": 0.0528, + "step": 138720 + }, + { + "epoch": 39.0, + "eval_loss": 0.10912308096885681, + "eval_runtime": 638.8233, + "eval_samples_per_second": 25.098, + "eval_steps_per_second": 0.786, + "eval_wer": 0.09225772112510748, + "step": 138723 + }, + { + "epoch": 39.01, + "learning_rate": 2.4460063099365884e-05, + "loss": 0.0436, + "step": 138750 + }, + { + "epoch": 39.02, + "learning_rate": 2.444132071346016e-05, + "loss": 0.0513, + "step": 138780 + }, + { + "epoch": 39.02, + "learning_rate": 2.4422578327554433e-05, + "loss": 0.0455, + "step": 138810 + }, + { + "epoch": 39.03, + "learning_rate": 2.4403835941648707e-05, + "loss": 0.0498, + "step": 138840 + }, + { + "epoch": 39.04, + "learning_rate": 2.438509355574298e-05, + "loss": 0.0536, + "step": 138870 + }, + { + "epoch": 39.05, + "learning_rate": 2.4366351169837255e-05, + "loss": 0.0494, + "step": 138900 + }, + { + "epoch": 39.06, + "learning_rate": 2.434760878393153e-05, + "loss": 0.0533, + "step": 138930 + }, + { + "epoch": 39.07, + "learning_rate": 2.4328866398025804e-05, + "loss": 0.0448, + "step": 138960 + }, + { + "epoch": 39.08, + "learning_rate": 2.4310124012120078e-05, + "loss": 0.0487, + "step": 138990 + }, + { + "epoch": 39.08, + "learning_rate": 2.4291381626214352e-05, + "loss": 0.0519, + "step": 139020 + }, + { + "epoch": 39.09, + "learning_rate": 2.4272639240308626e-05, + "loss": 0.0456, + "step": 139050 + }, + { + "epoch": 39.1, + "learning_rate": 2.42538968544029e-05, + "loss": 0.0544, + "step": 139080 + }, + { + "epoch": 39.11, + "learning_rate": 2.4235154468497175e-05, + "loss": 0.0442, + "step": 139110 + }, + { + "epoch": 39.12, + "learning_rate": 2.4216412082591445e-05, + "loss": 0.0504, + "step": 139140 + }, + { + "epoch": 39.13, + "learning_rate": 2.4197669696685723e-05, + "loss": 0.0515, + "step": 139170 + }, + { + "epoch": 39.13, + "learning_rate": 2.4178927310779997e-05, + "loss": 0.048, + "step": 139200 + }, + { + "epoch": 39.14, + "learning_rate": 2.4160809671071128e-05, + "loss": 0.0524, + "step": 139230 + }, + { + "epoch": 39.15, + "learning_rate": 2.4142067285165405e-05, + "loss": 0.0433, + "step": 139260 + }, + { + "epoch": 39.16, + "learning_rate": 2.4123324899259676e-05, + "loss": 0.0522, + "step": 139290 + }, + { + "epoch": 39.17, + "learning_rate": 2.410458251335395e-05, + "loss": 0.0488, + "step": 139320 + }, + { + "epoch": 39.18, + "learning_rate": 2.4085840127448225e-05, + "loss": 0.0492, + "step": 139350 + }, + { + "epoch": 39.18, + "learning_rate": 2.40670977415425e-05, + "loss": 0.0539, + "step": 139380 + }, + { + "epoch": 39.19, + "learning_rate": 2.4048355355636773e-05, + "loss": 0.0471, + "step": 139410 + }, + { + "epoch": 39.2, + "learning_rate": 2.4029612969731047e-05, + "loss": 0.0495, + "step": 139440 + }, + { + "epoch": 39.21, + "learning_rate": 2.4010870583825325e-05, + "loss": 0.0476, + "step": 139470 + }, + { + "epoch": 39.22, + "learning_rate": 2.3992128197919596e-05, + "loss": 0.0442, + "step": 139500 + }, + { + "epoch": 39.23, + "learning_rate": 2.3974010558210726e-05, + "loss": 0.056, + "step": 139530 + }, + { + "epoch": 39.24, + "learning_rate": 2.3955268172305e-05, + "loss": 0.0435, + "step": 139560 + }, + { + "epoch": 39.24, + "learning_rate": 2.3936525786399278e-05, + "loss": 0.0481, + "step": 139590 + }, + { + "epoch": 39.25, + "learning_rate": 2.3917783400493552e-05, + "loss": 0.0475, + "step": 139620 + }, + { + "epoch": 39.26, + "learning_rate": 2.3899041014587827e-05, + "loss": 0.046, + "step": 139650 + }, + { + "epoch": 39.27, + "learning_rate": 2.3880298628682097e-05, + "loss": 0.0509, + "step": 139680 + }, + { + "epoch": 39.28, + "learning_rate": 2.386155624277637e-05, + "loss": 0.0425, + "step": 139710 + }, + { + "epoch": 39.29, + "learning_rate": 2.3842813856870646e-05, + "loss": 0.0489, + "step": 139740 + }, + { + "epoch": 39.29, + "learning_rate": 2.382407147096492e-05, + "loss": 0.0473, + "step": 139770 + }, + { + "epoch": 39.3, + "learning_rate": 2.3805329085059198e-05, + "loss": 0.0466, + "step": 139800 + }, + { + "epoch": 39.31, + "learning_rate": 2.3786586699153472e-05, + "loss": 0.0507, + "step": 139830 + }, + { + "epoch": 39.32, + "learning_rate": 2.3767844313247746e-05, + "loss": 0.0441, + "step": 139860 + }, + { + "epoch": 39.33, + "learning_rate": 2.374910192734202e-05, + "loss": 0.0471, + "step": 139890 + }, + { + "epoch": 39.34, + "learning_rate": 2.373035954143629e-05, + "loss": 0.0481, + "step": 139920 + }, + { + "epoch": 39.34, + "learning_rate": 2.3711617155530565e-05, + "loss": 0.0456, + "step": 139950 + }, + { + "epoch": 39.35, + "learning_rate": 2.369287476962484e-05, + "loss": 0.051, + "step": 139980 + }, + { + "epoch": 39.36, + "learning_rate": 2.3674757129915974e-05, + "loss": 0.0442, + "step": 140010 + }, + { + "epoch": 39.37, + "learning_rate": 2.3656014744010248e-05, + "loss": 0.0502, + "step": 140040 + }, + { + "epoch": 39.38, + "learning_rate": 2.3637272358104522e-05, + "loss": 0.0486, + "step": 140070 + }, + { + "epoch": 39.39, + "learning_rate": 2.3618529972198793e-05, + "loss": 0.0443, + "step": 140100 + }, + { + "epoch": 39.4, + "learning_rate": 2.359978758629307e-05, + "loss": 0.0518, + "step": 140130 + }, + { + "epoch": 39.4, + "learning_rate": 2.3581045200387344e-05, + "loss": 0.0425, + "step": 140160 + }, + { + "epoch": 39.41, + "learning_rate": 2.356230281448162e-05, + "loss": 0.0484, + "step": 140190 + }, + { + "epoch": 39.42, + "learning_rate": 2.3543560428575893e-05, + "loss": 0.0488, + "step": 140220 + }, + { + "epoch": 39.43, + "learning_rate": 2.3524818042670167e-05, + "loss": 0.0442, + "step": 140250 + }, + { + "epoch": 39.44, + "learning_rate": 2.350607565676444e-05, + "loss": 0.0506, + "step": 140280 + }, + { + "epoch": 39.45, + "learning_rate": 2.3487333270858712e-05, + "loss": 0.0439, + "step": 140310 + }, + { + "epoch": 39.45, + "learning_rate": 2.346859088495299e-05, + "loss": 0.0493, + "step": 140340 + }, + { + "epoch": 39.46, + "learning_rate": 2.3449848499047264e-05, + "loss": 0.0473, + "step": 140370 + }, + { + "epoch": 39.47, + "learning_rate": 2.3431106113141538e-05, + "loss": 0.0457, + "step": 140400 + }, + { + "epoch": 39.48, + "learning_rate": 2.3412363727235812e-05, + "loss": 0.0582, + "step": 140430 + }, + { + "epoch": 39.49, + "learning_rate": 2.3393621341330086e-05, + "loss": 0.0452, + "step": 140460 + }, + { + "epoch": 39.5, + "learning_rate": 2.337487895542436e-05, + "loss": 0.0515, + "step": 140490 + }, + { + "epoch": 39.51, + "learning_rate": 2.335613656951863e-05, + "loss": 0.0503, + "step": 140520 + }, + { + "epoch": 39.51, + "learning_rate": 2.333739418361291e-05, + "loss": 0.0451, + "step": 140550 + }, + { + "epoch": 39.52, + "learning_rate": 2.3318651797707183e-05, + "loss": 0.0513, + "step": 140580 + }, + { + "epoch": 39.53, + "learning_rate": 2.3299909411801457e-05, + "loss": 0.0424, + "step": 140610 + }, + { + "epoch": 39.54, + "learning_rate": 2.328116702589573e-05, + "loss": 0.0492, + "step": 140640 + }, + { + "epoch": 39.55, + "learning_rate": 2.3262424639990006e-05, + "loss": 0.0483, + "step": 140670 + }, + { + "epoch": 39.56, + "learning_rate": 2.324368225408428e-05, + "loss": 0.0481, + "step": 140700 + }, + { + "epoch": 39.56, + "learning_rate": 2.322493986817855e-05, + "loss": 0.0511, + "step": 140730 + }, + { + "epoch": 39.57, + "learning_rate": 2.3206197482272828e-05, + "loss": 0.0433, + "step": 140760 + }, + { + "epoch": 39.58, + "learning_rate": 2.3187455096367102e-05, + "loss": 0.0507, + "step": 140790 + }, + { + "epoch": 39.59, + "learning_rate": 2.3168712710461377e-05, + "loss": 0.0484, + "step": 140820 + }, + { + "epoch": 39.6, + "learning_rate": 2.314997032455565e-05, + "loss": 0.0444, + "step": 140850 + }, + { + "epoch": 39.61, + "learning_rate": 2.3131227938649925e-05, + "loss": 0.0502, + "step": 140880 + }, + { + "epoch": 39.61, + "learning_rate": 2.31124855527442e-05, + "loss": 0.0455, + "step": 140910 + }, + { + "epoch": 39.62, + "learning_rate": 2.3093743166838473e-05, + "loss": 0.0492, + "step": 140940 + }, + { + "epoch": 39.63, + "learning_rate": 2.3075000780932748e-05, + "loss": 0.0495, + "step": 140970 + }, + { + "epoch": 39.64, + "learning_rate": 2.3056258395027022e-05, + "loss": 0.0457, + "step": 141000 + }, + { + "epoch": 39.65, + "learning_rate": 2.3037516009121296e-05, + "loss": 0.0528, + "step": 141030 + }, + { + "epoch": 39.66, + "learning_rate": 2.301877362321557e-05, + "loss": 0.0445, + "step": 141060 + }, + { + "epoch": 39.67, + "learning_rate": 2.3000031237309844e-05, + "loss": 0.0516, + "step": 141090 + }, + { + "epoch": 39.67, + "learning_rate": 2.298128885140412e-05, + "loss": 0.0505, + "step": 141120 + }, + { + "epoch": 39.68, + "learning_rate": 2.2962546465498393e-05, + "loss": 0.0474, + "step": 141150 + }, + { + "epoch": 39.69, + "learning_rate": 2.2943804079592667e-05, + "loss": 0.053, + "step": 141180 + }, + { + "epoch": 39.7, + "learning_rate": 2.292506169368694e-05, + "loss": 0.0444, + "step": 141210 + }, + { + "epoch": 39.71, + "learning_rate": 2.2906319307781215e-05, + "loss": 0.0514, + "step": 141240 + }, + { + "epoch": 39.72, + "learning_rate": 2.288757692187549e-05, + "loss": 0.0473, + "step": 141270 + }, + { + "epoch": 39.72, + "learning_rate": 2.2868834535969764e-05, + "loss": 0.0458, + "step": 141300 + }, + { + "epoch": 39.73, + "learning_rate": 2.2850092150064038e-05, + "loss": 0.0488, + "step": 141330 + }, + { + "epoch": 39.74, + "learning_rate": 2.2831349764158312e-05, + "loss": 0.0445, + "step": 141360 + }, + { + "epoch": 39.75, + "learning_rate": 2.2812607378252586e-05, + "loss": 0.0499, + "step": 141390 + }, + { + "epoch": 39.76, + "learning_rate": 2.279386499234686e-05, + "loss": 0.0468, + "step": 141420 + }, + { + "epoch": 39.77, + "learning_rate": 2.2775122606441135e-05, + "loss": 0.0469, + "step": 141450 + }, + { + "epoch": 39.77, + "learning_rate": 2.275638022053541e-05, + "loss": 0.051, + "step": 141480 + }, + { + "epoch": 39.78, + "learning_rate": 2.2737637834629683e-05, + "loss": 0.0447, + "step": 141510 + }, + { + "epoch": 39.79, + "learning_rate": 2.2718895448723957e-05, + "loss": 0.0507, + "step": 141540 + }, + { + "epoch": 39.8, + "learning_rate": 2.270015306281823e-05, + "loss": 0.0491, + "step": 141570 + }, + { + "epoch": 39.81, + "learning_rate": 2.2681410676912506e-05, + "loss": 0.0457, + "step": 141600 + }, + { + "epoch": 39.82, + "learning_rate": 2.266266829100678e-05, + "loss": 0.0533, + "step": 141630 + }, + { + "epoch": 39.83, + "learning_rate": 2.2643925905101054e-05, + "loss": 0.0461, + "step": 141660 + }, + { + "epoch": 39.83, + "learning_rate": 2.2625183519195328e-05, + "loss": 0.0498, + "step": 141690 + }, + { + "epoch": 39.84, + "learning_rate": 2.2606441133289602e-05, + "loss": 0.0464, + "step": 141720 + }, + { + "epoch": 39.85, + "learning_rate": 2.2587698747383877e-05, + "loss": 0.0485, + "step": 141750 + }, + { + "epoch": 39.86, + "learning_rate": 2.256895636147815e-05, + "loss": 0.0518, + "step": 141780 + }, + { + "epoch": 39.87, + "learning_rate": 2.2550213975572425e-05, + "loss": 0.0455, + "step": 141810 + }, + { + "epoch": 39.88, + "learning_rate": 2.25314715896667e-05, + "loss": 0.0485, + "step": 141840 + }, + { + "epoch": 39.88, + "learning_rate": 2.2512729203760973e-05, + "loss": 0.0484, + "step": 141870 + }, + { + "epoch": 39.89, + "learning_rate": 2.2493986817855248e-05, + "loss": 0.0443, + "step": 141900 + }, + { + "epoch": 39.9, + "learning_rate": 2.2475244431949522e-05, + "loss": 0.0533, + "step": 141930 + }, + { + "epoch": 39.91, + "learning_rate": 2.2456502046043796e-05, + "loss": 0.0425, + "step": 141960 + }, + { + "epoch": 39.92, + "learning_rate": 2.243775966013807e-05, + "loss": 0.0512, + "step": 141990 + }, + { + "epoch": 39.93, + "learning_rate": 2.2419017274232344e-05, + "loss": 0.048, + "step": 142020 + }, + { + "epoch": 39.94, + "learning_rate": 2.240027488832662e-05, + "loss": 0.0449, + "step": 142050 + }, + { + "epoch": 39.94, + "learning_rate": 2.2381532502420893e-05, + "loss": 0.0504, + "step": 142080 + }, + { + "epoch": 39.95, + "learning_rate": 2.2362790116515167e-05, + "loss": 0.046, + "step": 142110 + }, + { + "epoch": 39.96, + "learning_rate": 2.234404773060944e-05, + "loss": 0.0503, + "step": 142140 + }, + { + "epoch": 39.97, + "learning_rate": 2.2325305344703715e-05, + "loss": 0.048, + "step": 142170 + }, + { + "epoch": 39.98, + "learning_rate": 2.230656295879799e-05, + "loss": 0.0443, + "step": 142200 + }, + { + "epoch": 39.99, + "learning_rate": 2.2287820572892264e-05, + "loss": 0.0524, + "step": 142230 + }, + { + "epoch": 39.99, + "learning_rate": 2.2269078186986538e-05, + "loss": 0.0439, + "step": 142260 + }, + { + "epoch": 40.0, + "eval_loss": 0.11113700270652771, + "eval_runtime": 639.3379, + "eval_samples_per_second": 25.078, + "eval_steps_per_second": 0.785, + "eval_wer": 0.09283774378011, + "step": 142280 + }, + { + "epoch": 40.0, + "learning_rate": 2.2250335801080812e-05, + "loss": 0.0503, + "step": 142290 + }, + { + "epoch": 40.01, + "learning_rate": 2.2231593415175086e-05, + "loss": 0.0457, + "step": 142320 + }, + { + "epoch": 40.02, + "learning_rate": 2.221285102926936e-05, + "loss": 0.0462, + "step": 142350 + }, + { + "epoch": 40.03, + "learning_rate": 2.2194108643363635e-05, + "loss": 0.0556, + "step": 142380 + }, + { + "epoch": 40.04, + "learning_rate": 2.217536625745791e-05, + "loss": 0.0438, + "step": 142410 + }, + { + "epoch": 40.04, + "learning_rate": 2.2156623871552183e-05, + "loss": 0.0529, + "step": 142440 + }, + { + "epoch": 40.05, + "learning_rate": 2.2137881485646457e-05, + "loss": 0.0455, + "step": 142470 + }, + { + "epoch": 40.06, + "learning_rate": 2.211913909974073e-05, + "loss": 0.0481, + "step": 142500 + }, + { + "epoch": 40.07, + "learning_rate": 2.2100396713835006e-05, + "loss": 0.0507, + "step": 142530 + }, + { + "epoch": 40.08, + "learning_rate": 2.208165432792928e-05, + "loss": 0.0408, + "step": 142560 + }, + { + "epoch": 40.09, + "learning_rate": 2.2062911942023554e-05, + "loss": 0.0499, + "step": 142590 + }, + { + "epoch": 40.1, + "learning_rate": 2.2044169556117828e-05, + "loss": 0.047, + "step": 142620 + }, + { + "epoch": 40.1, + "learning_rate": 2.2025427170212102e-05, + "loss": 0.0508, + "step": 142650 + }, + { + "epoch": 40.11, + "learning_rate": 2.2006684784306376e-05, + "loss": 0.0545, + "step": 142680 + }, + { + "epoch": 40.12, + "learning_rate": 2.198794239840065e-05, + "loss": 0.0441, + "step": 142710 + }, + { + "epoch": 40.13, + "learning_rate": 2.1969200012494925e-05, + "loss": 0.0481, + "step": 142740 + }, + { + "epoch": 40.14, + "learning_rate": 2.19504576265892e-05, + "loss": 0.0413, + "step": 142770 + }, + { + "epoch": 40.15, + "learning_rate": 2.1931715240683473e-05, + "loss": 0.0474, + "step": 142800 + }, + { + "epoch": 40.15, + "learning_rate": 2.1912972854777747e-05, + "loss": 0.0528, + "step": 142830 + }, + { + "epoch": 40.16, + "learning_rate": 2.189423046887202e-05, + "loss": 0.0418, + "step": 142860 + }, + { + "epoch": 40.17, + "learning_rate": 2.1875488082966296e-05, + "loss": 0.052, + "step": 142890 + }, + { + "epoch": 40.18, + "learning_rate": 2.185674569706057e-05, + "loss": 0.046, + "step": 142920 + }, + { + "epoch": 40.19, + "learning_rate": 2.1838003311154844e-05, + "loss": 0.051, + "step": 142950 + }, + { + "epoch": 40.2, + "learning_rate": 2.181926092524912e-05, + "loss": 0.0523, + "step": 142980 + }, + { + "epoch": 40.21, + "learning_rate": 2.1800518539343393e-05, + "loss": 0.0429, + "step": 143010 + }, + { + "epoch": 40.21, + "learning_rate": 2.1781776153437667e-05, + "loss": 0.0557, + "step": 143040 + }, + { + "epoch": 40.22, + "learning_rate": 2.176303376753194e-05, + "loss": 0.0443, + "step": 143070 + }, + { + "epoch": 40.23, + "learning_rate": 2.1744291381626215e-05, + "loss": 0.0497, + "step": 143100 + }, + { + "epoch": 40.24, + "learning_rate": 2.172554899572049e-05, + "loss": 0.0501, + "step": 143130 + }, + { + "epoch": 40.25, + "learning_rate": 2.1706806609814764e-05, + "loss": 0.0427, + "step": 143160 + }, + { + "epoch": 40.26, + "learning_rate": 2.1688064223909038e-05, + "loss": 0.0508, + "step": 143190 + }, + { + "epoch": 40.26, + "learning_rate": 2.1669321838003312e-05, + "loss": 0.0432, + "step": 143220 + }, + { + "epoch": 40.27, + "learning_rate": 2.1650579452097586e-05, + "loss": 0.0461, + "step": 143250 + }, + { + "epoch": 40.28, + "learning_rate": 2.163183706619186e-05, + "loss": 0.0521, + "step": 143280 + }, + { + "epoch": 40.29, + "learning_rate": 2.1613094680286134e-05, + "loss": 0.0412, + "step": 143310 + }, + { + "epoch": 40.3, + "learning_rate": 2.159435229438041e-05, + "loss": 0.0514, + "step": 143340 + }, + { + "epoch": 40.31, + "learning_rate": 2.1575609908474683e-05, + "loss": 0.0456, + "step": 143370 + }, + { + "epoch": 40.31, + "learning_rate": 2.1556867522568957e-05, + "loss": 0.0478, + "step": 143400 + }, + { + "epoch": 40.32, + "learning_rate": 2.153812513666323e-05, + "loss": 0.0549, + "step": 143430 + }, + { + "epoch": 40.33, + "learning_rate": 2.1519382750757505e-05, + "loss": 0.0435, + "step": 143460 + }, + { + "epoch": 40.34, + "learning_rate": 2.150064036485178e-05, + "loss": 0.0512, + "step": 143490 + }, + { + "epoch": 40.35, + "learning_rate": 2.1481897978946054e-05, + "loss": 0.0442, + "step": 143520 + }, + { + "epoch": 40.36, + "learning_rate": 2.1463155593040328e-05, + "loss": 0.0485, + "step": 143550 + }, + { + "epoch": 40.37, + "learning_rate": 2.1444413207134602e-05, + "loss": 0.0531, + "step": 143580 + }, + { + "epoch": 40.37, + "learning_rate": 2.1425670821228876e-05, + "loss": 0.0427, + "step": 143610 + }, + { + "epoch": 40.38, + "learning_rate": 2.140692843532315e-05, + "loss": 0.0512, + "step": 143640 + }, + { + "epoch": 40.39, + "learning_rate": 2.1388186049417425e-05, + "loss": 0.0457, + "step": 143670 + }, + { + "epoch": 40.4, + "learning_rate": 2.13694436635117e-05, + "loss": 0.0507, + "step": 143700 + }, + { + "epoch": 40.41, + "learning_rate": 2.1350701277605973e-05, + "loss": 0.0557, + "step": 143730 + }, + { + "epoch": 40.42, + "learning_rate": 2.1331958891700247e-05, + "loss": 0.0413, + "step": 143760 + }, + { + "epoch": 40.42, + "learning_rate": 2.131321650579452e-05, + "loss": 0.0532, + "step": 143790 + }, + { + "epoch": 40.43, + "learning_rate": 2.1294474119888796e-05, + "loss": 0.0416, + "step": 143820 + }, + { + "epoch": 40.44, + "learning_rate": 2.127573173398307e-05, + "loss": 0.0473, + "step": 143850 + }, + { + "epoch": 40.45, + "learning_rate": 2.1256989348077344e-05, + "loss": 0.0498, + "step": 143880 + }, + { + "epoch": 40.46, + "learning_rate": 2.1238246962171618e-05, + "loss": 0.0436, + "step": 143910 + }, + { + "epoch": 40.47, + "learning_rate": 2.1219504576265892e-05, + "loss": 0.0515, + "step": 143940 + }, + { + "epoch": 40.48, + "learning_rate": 2.1200762190360167e-05, + "loss": 0.0457, + "step": 143970 + }, + { + "epoch": 40.48, + "learning_rate": 2.118201980445444e-05, + "loss": 0.0488, + "step": 144000 + }, + { + "epoch": 40.49, + "learning_rate": 2.1163277418548715e-05, + "loss": 0.0554, + "step": 144030 + }, + { + "epoch": 40.5, + "learning_rate": 2.114453503264299e-05, + "loss": 0.0446, + "step": 144060 + }, + { + "epoch": 40.51, + "learning_rate": 2.1125792646737263e-05, + "loss": 0.0502, + "step": 144090 + }, + { + "epoch": 40.52, + "learning_rate": 2.1107050260831538e-05, + "loss": 0.044, + "step": 144120 + }, + { + "epoch": 40.53, + "learning_rate": 2.1088307874925812e-05, + "loss": 0.0516, + "step": 144150 + }, + { + "epoch": 40.53, + "learning_rate": 2.106956548902009e-05, + "loss": 0.051, + "step": 144180 + }, + { + "epoch": 40.54, + "learning_rate": 2.105082310311436e-05, + "loss": 0.0438, + "step": 144210 + }, + { + "epoch": 40.55, + "learning_rate": 2.1032080717208634e-05, + "loss": 0.0522, + "step": 144240 + }, + { + "epoch": 40.56, + "learning_rate": 2.101333833130291e-05, + "loss": 0.0459, + "step": 144270 + }, + { + "epoch": 40.57, + "learning_rate": 2.0995220691594043e-05, + "loss": 0.0482, + "step": 144300 + }, + { + "epoch": 40.58, + "learning_rate": 2.0976478305688317e-05, + "loss": 0.0515, + "step": 144330 + }, + { + "epoch": 40.58, + "learning_rate": 2.095773591978259e-05, + "loss": 0.0426, + "step": 144360 + }, + { + "epoch": 40.59, + "learning_rate": 2.0938993533876862e-05, + "loss": 0.0516, + "step": 144390 + }, + { + "epoch": 40.6, + "learning_rate": 2.0920251147971136e-05, + "loss": 0.0457, + "step": 144420 + }, + { + "epoch": 40.61, + "learning_rate": 2.090150876206541e-05, + "loss": 0.0468, + "step": 144450 + }, + { + "epoch": 40.62, + "learning_rate": 2.0882766376159685e-05, + "loss": 0.0532, + "step": 144480 + }, + { + "epoch": 40.63, + "learning_rate": 2.0864023990253962e-05, + "loss": 0.0425, + "step": 144510 + }, + { + "epoch": 40.64, + "learning_rate": 2.0845281604348236e-05, + "loss": 0.0508, + "step": 144540 + }, + { + "epoch": 40.64, + "learning_rate": 2.082653921844251e-05, + "loss": 0.0456, + "step": 144570 + }, + { + "epoch": 40.65, + "learning_rate": 2.080779683253678e-05, + "loss": 0.0467, + "step": 144600 + }, + { + "epoch": 40.66, + "learning_rate": 2.0789054446631055e-05, + "loss": 0.0505, + "step": 144630 + }, + { + "epoch": 40.67, + "learning_rate": 2.077031206072533e-05, + "loss": 0.0424, + "step": 144660 + }, + { + "epoch": 40.68, + "learning_rate": 2.0751569674819604e-05, + "loss": 0.0491, + "step": 144690 + }, + { + "epoch": 40.69, + "learning_rate": 2.073282728891388e-05, + "loss": 0.0431, + "step": 144720 + }, + { + "epoch": 40.69, + "learning_rate": 2.0714084903008156e-05, + "loss": 0.0458, + "step": 144750 + }, + { + "epoch": 40.7, + "learning_rate": 2.069534251710243e-05, + "loss": 0.0513, + "step": 144780 + }, + { + "epoch": 40.71, + "learning_rate": 2.06766001311967e-05, + "loss": 0.041, + "step": 144810 + }, + { + "epoch": 40.72, + "learning_rate": 2.0657857745290975e-05, + "loss": 0.0546, + "step": 144840 + }, + { + "epoch": 40.73, + "learning_rate": 2.063911535938525e-05, + "loss": 0.0447, + "step": 144870 + }, + { + "epoch": 40.74, + "learning_rate": 2.0620372973479523e-05, + "loss": 0.0511, + "step": 144900 + }, + { + "epoch": 40.74, + "learning_rate": 2.06016305875738e-05, + "loss": 0.0482, + "step": 144930 + }, + { + "epoch": 40.75, + "learning_rate": 2.0582888201668075e-05, + "loss": 0.0414, + "step": 144960 + }, + { + "epoch": 40.76, + "learning_rate": 2.056414581576235e-05, + "loss": 0.0523, + "step": 144990 + }, + { + "epoch": 40.77, + "learning_rate": 2.0545403429856623e-05, + "loss": 0.0448, + "step": 145020 + }, + { + "epoch": 40.78, + "learning_rate": 2.0526661043950894e-05, + "loss": 0.0475, + "step": 145050 + }, + { + "epoch": 40.79, + "learning_rate": 2.050791865804517e-05, + "loss": 0.054, + "step": 145080 + }, + { + "epoch": 40.8, + "learning_rate": 2.0489176272139443e-05, + "loss": 0.0422, + "step": 145110 + }, + { + "epoch": 40.8, + "learning_rate": 2.047043388623372e-05, + "loss": 0.0482, + "step": 145140 + }, + { + "epoch": 40.81, + "learning_rate": 2.0451691500327994e-05, + "loss": 0.0455, + "step": 145170 + }, + { + "epoch": 40.82, + "learning_rate": 2.043294911442227e-05, + "loss": 0.0511, + "step": 145200 + }, + { + "epoch": 40.83, + "learning_rate": 2.0414206728516543e-05, + "loss": 0.0521, + "step": 145230 + }, + { + "epoch": 40.84, + "learning_rate": 2.0395464342610814e-05, + "loss": 0.0433, + "step": 145260 + }, + { + "epoch": 40.85, + "learning_rate": 2.0376721956705088e-05, + "loss": 0.0507, + "step": 145290 + }, + { + "epoch": 40.85, + "learning_rate": 2.0357979570799362e-05, + "loss": 0.0464, + "step": 145320 + }, + { + "epoch": 40.86, + "learning_rate": 2.033923718489364e-05, + "loss": 0.0489, + "step": 145350 + }, + { + "epoch": 40.87, + "learning_rate": 2.0320494798987914e-05, + "loss": 0.0514, + "step": 145380 + }, + { + "epoch": 40.88, + "learning_rate": 2.0301752413082188e-05, + "loss": 0.0415, + "step": 145410 + }, + { + "epoch": 40.89, + "learning_rate": 2.0283010027176462e-05, + "loss": 0.0503, + "step": 145440 + }, + { + "epoch": 40.9, + "learning_rate": 2.0264267641270733e-05, + "loss": 0.0423, + "step": 145470 + }, + { + "epoch": 40.91, + "learning_rate": 2.0245525255365007e-05, + "loss": 0.046, + "step": 145500 + }, + { + "epoch": 40.91, + "learning_rate": 2.022678286945928e-05, + "loss": 0.0506, + "step": 145530 + }, + { + "epoch": 40.92, + "learning_rate": 2.020804048355356e-05, + "loss": 0.0412, + "step": 145560 + }, + { + "epoch": 40.93, + "learning_rate": 2.0189298097647833e-05, + "loss": 0.0478, + "step": 145590 + }, + { + "epoch": 40.94, + "learning_rate": 2.0170555711742107e-05, + "loss": 0.0421, + "step": 145620 + }, + { + "epoch": 40.95, + "learning_rate": 2.015181332583638e-05, + "loss": 0.0475, + "step": 145650 + }, + { + "epoch": 40.96, + "learning_rate": 2.0133070939930652e-05, + "loss": 0.0545, + "step": 145680 + }, + { + "epoch": 40.96, + "learning_rate": 2.0114328554024926e-05, + "loss": 0.0397, + "step": 145710 + }, + { + "epoch": 40.97, + "learning_rate": 2.00955861681192e-05, + "loss": 0.0521, + "step": 145740 + }, + { + "epoch": 40.98, + "learning_rate": 2.0076843782213478e-05, + "loss": 0.0468, + "step": 145770 + }, + { + "epoch": 40.99, + "learning_rate": 2.0058101396307752e-05, + "loss": 0.0452, + "step": 145800 + }, + { + "epoch": 41.0, + "learning_rate": 2.0039359010402027e-05, + "loss": 0.0467, + "step": 145830 + }, + { + "epoch": 41.0, + "eval_loss": 0.11312602460384369, + "eval_runtime": 638.4663, + "eval_samples_per_second": 25.112, + "eval_steps_per_second": 0.786, + "eval_wer": 0.0942707409277633, + "step": 145837 + }, + { + "epoch": 41.01, + "learning_rate": 2.00206166244963e-05, + "loss": 0.0413, + "step": 145860 + }, + { + "epoch": 41.01, + "learning_rate": 2.0001874238590575e-05, + "loss": 0.0531, + "step": 145890 + }, + { + "epoch": 41.02, + "learning_rate": 1.9983131852684846e-05, + "loss": 0.0386, + "step": 145920 + }, + { + "epoch": 41.03, + "learning_rate": 1.996438946677912e-05, + "loss": 0.052, + "step": 145950 + }, + { + "epoch": 41.04, + "learning_rate": 1.9945647080873397e-05, + "loss": 0.045, + "step": 145980 + }, + { + "epoch": 41.05, + "learning_rate": 1.992690469496767e-05, + "loss": 0.0489, + "step": 146010 + }, + { + "epoch": 41.06, + "learning_rate": 1.9908162309061946e-05, + "loss": 0.0522, + "step": 146040 + }, + { + "epoch": 41.07, + "learning_rate": 1.988941992315622e-05, + "loss": 0.0404, + "step": 146070 + }, + { + "epoch": 41.07, + "learning_rate": 1.9870677537250494e-05, + "loss": 0.0487, + "step": 146100 + }, + { + "epoch": 41.08, + "learning_rate": 1.9851935151344765e-05, + "loss": 0.0445, + "step": 146130 + }, + { + "epoch": 41.09, + "learning_rate": 1.983319276543904e-05, + "loss": 0.0485, + "step": 146160 + }, + { + "epoch": 41.1, + "learning_rate": 1.9814450379533313e-05, + "loss": 0.0515, + "step": 146190 + }, + { + "epoch": 41.11, + "learning_rate": 1.979570799362759e-05, + "loss": 0.0427, + "step": 146220 + }, + { + "epoch": 41.12, + "learning_rate": 1.9776965607721865e-05, + "loss": 0.0506, + "step": 146250 + }, + { + "epoch": 41.12, + "learning_rate": 1.975822322181614e-05, + "loss": 0.0434, + "step": 146280 + }, + { + "epoch": 41.13, + "learning_rate": 1.9739480835910414e-05, + "loss": 0.0502, + "step": 146310 + }, + { + "epoch": 41.14, + "learning_rate": 1.9720738450004684e-05, + "loss": 0.0519, + "step": 146340 + }, + { + "epoch": 41.15, + "learning_rate": 1.970199606409896e-05, + "loss": 0.0417, + "step": 146370 + }, + { + "epoch": 41.16, + "learning_rate": 1.9683253678193233e-05, + "loss": 0.0464, + "step": 146400 + }, + { + "epoch": 41.17, + "learning_rate": 1.966451129228751e-05, + "loss": 0.0434, + "step": 146430 + }, + { + "epoch": 41.18, + "learning_rate": 1.9645768906381785e-05, + "loss": 0.0471, + "step": 146460 + }, + { + "epoch": 41.18, + "learning_rate": 1.962702652047606e-05, + "loss": 0.0537, + "step": 146490 + }, + { + "epoch": 41.19, + "learning_rate": 1.9608284134570333e-05, + "loss": 0.0401, + "step": 146520 + }, + { + "epoch": 41.2, + "learning_rate": 1.9590166494861464e-05, + "loss": 0.0486, + "step": 146550 + }, + { + "epoch": 41.21, + "learning_rate": 1.9571424108955738e-05, + "loss": 0.0462, + "step": 146580 + }, + { + "epoch": 41.22, + "learning_rate": 1.9552681723050012e-05, + "loss": 0.0493, + "step": 146610 + }, + { + "epoch": 41.23, + "learning_rate": 1.9533939337144286e-05, + "loss": 0.0523, + "step": 146640 + }, + { + "epoch": 41.23, + "learning_rate": 1.951519695123856e-05, + "loss": 0.0411, + "step": 146670 + }, + { + "epoch": 41.24, + "learning_rate": 1.9496454565332835e-05, + "loss": 0.0496, + "step": 146700 + }, + { + "epoch": 41.25, + "learning_rate": 1.947771217942711e-05, + "loss": 0.0441, + "step": 146730 + }, + { + "epoch": 41.26, + "learning_rate": 1.9458969793521383e-05, + "loss": 0.0498, + "step": 146760 + }, + { + "epoch": 41.27, + "learning_rate": 1.9440227407615657e-05, + "loss": 0.0515, + "step": 146790 + }, + { + "epoch": 41.28, + "learning_rate": 1.942148502170993e-05, + "loss": 0.0423, + "step": 146820 + }, + { + "epoch": 41.28, + "learning_rate": 1.9402742635804206e-05, + "loss": 0.0516, + "step": 146850 + }, + { + "epoch": 41.29, + "learning_rate": 1.938400024989848e-05, + "loss": 0.0434, + "step": 146880 + }, + { + "epoch": 41.3, + "learning_rate": 1.9365257863992754e-05, + "loss": 0.0443, + "step": 146910 + }, + { + "epoch": 41.31, + "learning_rate": 1.9346515478087028e-05, + "loss": 0.0485, + "step": 146940 + }, + { + "epoch": 41.32, + "learning_rate": 1.9327773092181302e-05, + "loss": 0.04, + "step": 146970 + }, + { + "epoch": 41.33, + "learning_rate": 1.9309030706275577e-05, + "loss": 0.0501, + "step": 147000 + }, + { + "epoch": 41.34, + "learning_rate": 1.929028832036985e-05, + "loss": 0.044, + "step": 147030 + }, + { + "epoch": 41.34, + "learning_rate": 1.9271545934464125e-05, + "loss": 0.0485, + "step": 147060 + }, + { + "epoch": 41.35, + "learning_rate": 1.92528035485584e-05, + "loss": 0.0517, + "step": 147090 + }, + { + "epoch": 41.36, + "learning_rate": 1.9234061162652673e-05, + "loss": 0.0399, + "step": 147120 + }, + { + "epoch": 41.37, + "learning_rate": 1.9215318776746948e-05, + "loss": 0.0464, + "step": 147150 + }, + { + "epoch": 41.38, + "learning_rate": 1.9196576390841222e-05, + "loss": 0.0431, + "step": 147180 + }, + { + "epoch": 41.39, + "learning_rate": 1.9177834004935496e-05, + "loss": 0.0474, + "step": 147210 + }, + { + "epoch": 41.39, + "learning_rate": 1.915909161902977e-05, + "loss": 0.0512, + "step": 147240 + }, + { + "epoch": 41.4, + "learning_rate": 1.9140349233124044e-05, + "loss": 0.0411, + "step": 147270 + }, + { + "epoch": 41.41, + "learning_rate": 1.912160684721832e-05, + "loss": 0.0512, + "step": 147300 + }, + { + "epoch": 41.42, + "learning_rate": 1.9102864461312593e-05, + "loss": 0.0447, + "step": 147330 + }, + { + "epoch": 41.43, + "learning_rate": 1.9084122075406867e-05, + "loss": 0.0464, + "step": 147360 + }, + { + "epoch": 41.44, + "learning_rate": 1.906537968950114e-05, + "loss": 0.0502, + "step": 147390 + }, + { + "epoch": 41.44, + "learning_rate": 1.9046637303595415e-05, + "loss": 0.0453, + "step": 147420 + }, + { + "epoch": 41.45, + "learning_rate": 1.902789491768969e-05, + "loss": 0.0513, + "step": 147450 + }, + { + "epoch": 41.46, + "learning_rate": 1.9009152531783964e-05, + "loss": 0.0459, + "step": 147480 + }, + { + "epoch": 41.47, + "learning_rate": 1.8990410145878238e-05, + "loss": 0.0495, + "step": 147510 + }, + { + "epoch": 41.48, + "learning_rate": 1.8971667759972512e-05, + "loss": 0.0525, + "step": 147540 + }, + { + "epoch": 41.49, + "learning_rate": 1.8952925374066786e-05, + "loss": 0.0421, + "step": 147570 + }, + { + "epoch": 41.5, + "learning_rate": 1.893418298816106e-05, + "loss": 0.0518, + "step": 147600 + }, + { + "epoch": 41.5, + "learning_rate": 1.8915440602255335e-05, + "loss": 0.0475, + "step": 147630 + }, + { + "epoch": 41.51, + "learning_rate": 1.889669821634961e-05, + "loss": 0.0458, + "step": 147660 + }, + { + "epoch": 41.52, + "learning_rate": 1.8877955830443883e-05, + "loss": 0.0468, + "step": 147690 + }, + { + "epoch": 41.53, + "learning_rate": 1.8859213444538157e-05, + "loss": 0.0425, + "step": 147720 + }, + { + "epoch": 41.54, + "learning_rate": 1.884047105863243e-05, + "loss": 0.0476, + "step": 147750 + }, + { + "epoch": 41.55, + "learning_rate": 1.8821728672726706e-05, + "loss": 0.0477, + "step": 147780 + }, + { + "epoch": 41.55, + "learning_rate": 1.880298628682098e-05, + "loss": 0.0452, + "step": 147810 + }, + { + "epoch": 41.56, + "learning_rate": 1.8784243900915254e-05, + "loss": 0.0555, + "step": 147840 + }, + { + "epoch": 41.57, + "learning_rate": 1.8765501515009528e-05, + "loss": 0.0411, + "step": 147870 + }, + { + "epoch": 41.58, + "learning_rate": 1.8746759129103802e-05, + "loss": 0.0509, + "step": 147900 + }, + { + "epoch": 41.59, + "learning_rate": 1.8728016743198076e-05, + "loss": 0.0476, + "step": 147930 + }, + { + "epoch": 41.6, + "learning_rate": 1.870927435729235e-05, + "loss": 0.0464, + "step": 147960 + }, + { + "epoch": 41.61, + "learning_rate": 1.8690531971386625e-05, + "loss": 0.0508, + "step": 147990 + }, + { + "epoch": 41.61, + "learning_rate": 1.86717895854809e-05, + "loss": 0.0404, + "step": 148020 + }, + { + "epoch": 41.62, + "learning_rate": 1.8653047199575173e-05, + "loss": 0.0501, + "step": 148050 + }, + { + "epoch": 41.63, + "learning_rate": 1.8634304813669447e-05, + "loss": 0.0441, + "step": 148080 + }, + { + "epoch": 41.64, + "learning_rate": 1.861556242776372e-05, + "loss": 0.0497, + "step": 148110 + }, + { + "epoch": 41.65, + "learning_rate": 1.8596820041857996e-05, + "loss": 0.0502, + "step": 148140 + }, + { + "epoch": 41.66, + "learning_rate": 1.857807765595227e-05, + "loss": 0.0446, + "step": 148170 + }, + { + "epoch": 41.66, + "learning_rate": 1.8559335270046544e-05, + "loss": 0.0494, + "step": 148200 + }, + { + "epoch": 41.67, + "learning_rate": 1.854059288414082e-05, + "loss": 0.046, + "step": 148230 + }, + { + "epoch": 41.68, + "learning_rate": 1.8521850498235093e-05, + "loss": 0.0496, + "step": 148260 + }, + { + "epoch": 41.69, + "learning_rate": 1.8503108112329367e-05, + "loss": 0.0507, + "step": 148290 + }, + { + "epoch": 41.7, + "learning_rate": 1.848436572642364e-05, + "loss": 0.0428, + "step": 148320 + }, + { + "epoch": 41.71, + "learning_rate": 1.8465623340517915e-05, + "loss": 0.0497, + "step": 148350 + }, + { + "epoch": 41.71, + "learning_rate": 1.844688095461219e-05, + "loss": 0.0442, + "step": 148380 + }, + { + "epoch": 41.72, + "learning_rate": 1.8428138568706464e-05, + "loss": 0.046, + "step": 148410 + }, + { + "epoch": 41.73, + "learning_rate": 1.8409396182800738e-05, + "loss": 0.0528, + "step": 148440 + }, + { + "epoch": 41.74, + "learning_rate": 1.8390653796895012e-05, + "loss": 0.0437, + "step": 148470 + }, + { + "epoch": 41.75, + "learning_rate": 1.8371911410989286e-05, + "loss": 0.0488, + "step": 148500 + }, + { + "epoch": 41.76, + "learning_rate": 1.835316902508356e-05, + "loss": 0.0432, + "step": 148530 + }, + { + "epoch": 41.77, + "learning_rate": 1.8334426639177834e-05, + "loss": 0.0449, + "step": 148560 + }, + { + "epoch": 41.77, + "learning_rate": 1.831568425327211e-05, + "loss": 0.0497, + "step": 148590 + }, + { + "epoch": 41.78, + "learning_rate": 1.8296941867366383e-05, + "loss": 0.0405, + "step": 148620 + }, + { + "epoch": 41.79, + "learning_rate": 1.827819948146066e-05, + "loss": 0.0477, + "step": 148650 + }, + { + "epoch": 41.8, + "learning_rate": 1.825945709555493e-05, + "loss": 0.0475, + "step": 148680 + }, + { + "epoch": 41.81, + "learning_rate": 1.8240714709649205e-05, + "loss": 0.0458, + "step": 148710 + }, + { + "epoch": 41.82, + "learning_rate": 1.8222597069940336e-05, + "loss": 0.0518, + "step": 148740 + }, + { + "epoch": 41.82, + "learning_rate": 1.8203854684034614e-05, + "loss": 0.0404, + "step": 148770 + }, + { + "epoch": 41.83, + "learning_rate": 1.8185112298128888e-05, + "loss": 0.0518, + "step": 148800 + }, + { + "epoch": 41.84, + "learning_rate": 1.8166369912223162e-05, + "loss": 0.0473, + "step": 148830 + }, + { + "epoch": 41.85, + "learning_rate": 1.8147627526317433e-05, + "loss": 0.0467, + "step": 148860 + }, + { + "epoch": 41.86, + "learning_rate": 1.8128885140411707e-05, + "loss": 0.0526, + "step": 148890 + }, + { + "epoch": 41.87, + "learning_rate": 1.811014275450598e-05, + "loss": 0.0419, + "step": 148920 + }, + { + "epoch": 41.88, + "learning_rate": 1.8091400368600256e-05, + "loss": 0.0469, + "step": 148950 + }, + { + "epoch": 41.88, + "learning_rate": 1.8072657982694533e-05, + "loss": 0.0447, + "step": 148980 + }, + { + "epoch": 41.89, + "learning_rate": 1.8053915596788807e-05, + "loss": 0.0468, + "step": 149010 + }, + { + "epoch": 41.9, + "learning_rate": 1.803517321088308e-05, + "loss": 0.0538, + "step": 149040 + }, + { + "epoch": 41.91, + "learning_rate": 1.8016430824977352e-05, + "loss": 0.0428, + "step": 149070 + }, + { + "epoch": 41.92, + "learning_rate": 1.7997688439071627e-05, + "loss": 0.0545, + "step": 149100 + }, + { + "epoch": 41.93, + "learning_rate": 1.79789460531659e-05, + "loss": 0.0454, + "step": 149130 + }, + { + "epoch": 41.93, + "learning_rate": 1.7960203667260175e-05, + "loss": 0.0485, + "step": 149160 + }, + { + "epoch": 41.94, + "learning_rate": 1.7941461281354453e-05, + "loss": 0.0502, + "step": 149190 + }, + { + "epoch": 41.95, + "learning_rate": 1.7922718895448727e-05, + "loss": 0.0414, + "step": 149220 + }, + { + "epoch": 41.96, + "learning_rate": 1.7903976509543e-05, + "loss": 0.0513, + "step": 149250 + }, + { + "epoch": 41.97, + "learning_rate": 1.788523412363727e-05, + "loss": 0.045, + "step": 149280 + }, + { + "epoch": 41.98, + "learning_rate": 1.7866491737731546e-05, + "loss": 0.0451, + "step": 149310 + }, + { + "epoch": 41.98, + "learning_rate": 1.784774935182582e-05, + "loss": 0.0508, + "step": 149340 + }, + { + "epoch": 41.99, + "learning_rate": 1.7829006965920094e-05, + "loss": 0.0407, + "step": 149370 + }, + { + "epoch": 42.0, + "eval_loss": 0.11148813366889954, + "eval_runtime": 636.4424, + "eval_samples_per_second": 25.192, + "eval_steps_per_second": 0.789, + "eval_wer": 0.09436627407094018, + "step": 149394 + }, + { + "epoch": 42.0, + "learning_rate": 1.781088932621123e-05, + "loss": 0.0539, + "step": 149400 + }, + { + "epoch": 42.01, + "learning_rate": 1.7792146940305503e-05, + "loss": 0.0409, + "step": 149430 + }, + { + "epoch": 42.02, + "learning_rate": 1.7773404554399773e-05, + "loss": 0.048, + "step": 149460 + }, + { + "epoch": 42.03, + "learning_rate": 1.7754662168494048e-05, + "loss": 0.0473, + "step": 149490 + }, + { + "epoch": 42.04, + "learning_rate": 1.7735919782588325e-05, + "loss": 0.0433, + "step": 149520 + }, + { + "epoch": 42.04, + "learning_rate": 1.77171773966826e-05, + "loss": 0.052, + "step": 149550 + }, + { + "epoch": 42.05, + "learning_rate": 1.7698435010776874e-05, + "loss": 0.0433, + "step": 149580 + }, + { + "epoch": 42.06, + "learning_rate": 1.7679692624871148e-05, + "loss": 0.0482, + "step": 149610 + }, + { + "epoch": 42.07, + "learning_rate": 1.7660950238965422e-05, + "loss": 0.0459, + "step": 149640 + }, + { + "epoch": 42.08, + "learning_rate": 1.7642207853059696e-05, + "loss": 0.0441, + "step": 149670 + }, + { + "epoch": 42.09, + "learning_rate": 1.7623465467153967e-05, + "loss": 0.0496, + "step": 149700 + }, + { + "epoch": 42.09, + "learning_rate": 1.7604723081248245e-05, + "loss": 0.0389, + "step": 149730 + }, + { + "epoch": 42.1, + "learning_rate": 1.758598069534252e-05, + "loss": 0.053, + "step": 149760 + }, + { + "epoch": 42.11, + "learning_rate": 1.7567238309436793e-05, + "loss": 0.0473, + "step": 149790 + }, + { + "epoch": 42.12, + "learning_rate": 1.7548495923531067e-05, + "loss": 0.0428, + "step": 149820 + }, + { + "epoch": 42.13, + "learning_rate": 1.752975353762534e-05, + "loss": 0.0514, + "step": 149850 + }, + { + "epoch": 42.14, + "learning_rate": 1.7511011151719616e-05, + "loss": 0.0408, + "step": 149880 + }, + { + "epoch": 42.15, + "learning_rate": 1.7492268765813886e-05, + "loss": 0.0472, + "step": 149910 + }, + { + "epoch": 42.15, + "learning_rate": 1.7473526379908164e-05, + "loss": 0.0492, + "step": 149940 + }, + { + "epoch": 42.16, + "learning_rate": 1.7454783994002438e-05, + "loss": 0.0426, + "step": 149970 + }, + { + "epoch": 42.17, + "learning_rate": 1.7436041608096712e-05, + "loss": 0.0493, + "step": 150000 + }, + { + "epoch": 42.18, + "learning_rate": 1.7417299222190986e-05, + "loss": 0.0446, + "step": 150030 + }, + { + "epoch": 42.19, + "learning_rate": 1.739855683628526e-05, + "loss": 0.0493, + "step": 150060 + }, + { + "epoch": 42.2, + "learning_rate": 1.7379814450379535e-05, + "loss": 0.0479, + "step": 150090 + }, + { + "epoch": 42.2, + "learning_rate": 1.7361072064473806e-05, + "loss": 0.0453, + "step": 150120 + }, + { + "epoch": 42.21, + "learning_rate": 1.7342329678568083e-05, + "loss": 0.0462, + "step": 150150 + }, + { + "epoch": 42.22, + "learning_rate": 1.7323587292662357e-05, + "loss": 0.0405, + "step": 150180 + }, + { + "epoch": 42.23, + "learning_rate": 1.730484490675663e-05, + "loss": 0.0468, + "step": 150210 + }, + { + "epoch": 42.24, + "learning_rate": 1.7286102520850906e-05, + "loss": 0.0468, + "step": 150240 + }, + { + "epoch": 42.25, + "learning_rate": 1.726736013494518e-05, + "loss": 0.0441, + "step": 150270 + }, + { + "epoch": 42.25, + "learning_rate": 1.7248617749039454e-05, + "loss": 0.052, + "step": 150300 + }, + { + "epoch": 42.26, + "learning_rate": 1.722987536313373e-05, + "loss": 0.0412, + "step": 150330 + }, + { + "epoch": 42.27, + "learning_rate": 1.7211132977228003e-05, + "loss": 0.0487, + "step": 150360 + }, + { + "epoch": 42.28, + "learning_rate": 1.7192390591322277e-05, + "loss": 0.0435, + "step": 150390 + }, + { + "epoch": 42.29, + "learning_rate": 1.717364820541655e-05, + "loss": 0.0477, + "step": 150420 + }, + { + "epoch": 42.3, + "learning_rate": 1.7154905819510825e-05, + "loss": 0.0489, + "step": 150450 + }, + { + "epoch": 42.31, + "learning_rate": 1.71361634336051e-05, + "loss": 0.0396, + "step": 150480 + }, + { + "epoch": 42.31, + "learning_rate": 1.7117421047699374e-05, + "loss": 0.0493, + "step": 150510 + }, + { + "epoch": 42.32, + "learning_rate": 1.7098678661793648e-05, + "loss": 0.0462, + "step": 150540 + }, + { + "epoch": 42.33, + "learning_rate": 1.707993627588792e-05, + "loss": 0.0435, + "step": 150570 + }, + { + "epoch": 42.34, + "learning_rate": 1.7061193889982196e-05, + "loss": 0.0469, + "step": 150600 + }, + { + "epoch": 42.35, + "learning_rate": 1.704245150407647e-05, + "loss": 0.0437, + "step": 150630 + }, + { + "epoch": 42.36, + "learning_rate": 1.7023709118170744e-05, + "loss": 0.0497, + "step": 150660 + }, + { + "epoch": 42.36, + "learning_rate": 1.700496673226502e-05, + "loss": 0.046, + "step": 150690 + }, + { + "epoch": 42.37, + "learning_rate": 1.6986224346359293e-05, + "loss": 0.0441, + "step": 150720 + }, + { + "epoch": 42.38, + "learning_rate": 1.6967481960453567e-05, + "loss": 0.0489, + "step": 150750 + }, + { + "epoch": 42.39, + "learning_rate": 1.6948739574547838e-05, + "loss": 0.0424, + "step": 150780 + }, + { + "epoch": 42.4, + "learning_rate": 1.6929997188642115e-05, + "loss": 0.0485, + "step": 150810 + }, + { + "epoch": 42.41, + "learning_rate": 1.691125480273639e-05, + "loss": 0.0467, + "step": 150840 + }, + { + "epoch": 42.41, + "learning_rate": 1.6892512416830664e-05, + "loss": 0.0445, + "step": 150870 + }, + { + "epoch": 42.42, + "learning_rate": 1.6873770030924938e-05, + "loss": 0.0545, + "step": 150900 + }, + { + "epoch": 42.43, + "learning_rate": 1.6855027645019212e-05, + "loss": 0.0424, + "step": 150930 + }, + { + "epoch": 42.44, + "learning_rate": 1.6836285259113486e-05, + "loss": 0.0482, + "step": 150960 + }, + { + "epoch": 42.45, + "learning_rate": 1.681754287320776e-05, + "loss": 0.0488, + "step": 150990 + }, + { + "epoch": 42.46, + "learning_rate": 1.6798800487302035e-05, + "loss": 0.0445, + "step": 151020 + }, + { + "epoch": 42.47, + "learning_rate": 1.678005810139631e-05, + "loss": 0.0499, + "step": 151050 + }, + { + "epoch": 42.47, + "learning_rate": 1.6761315715490583e-05, + "loss": 0.0422, + "step": 151080 + }, + { + "epoch": 42.48, + "learning_rate": 1.6742573329584857e-05, + "loss": 0.0489, + "step": 151110 + }, + { + "epoch": 42.49, + "learning_rate": 1.672383094367913e-05, + "loss": 0.0473, + "step": 151140 + }, + { + "epoch": 42.5, + "learning_rate": 1.6705088557773406e-05, + "loss": 0.0437, + "step": 151170 + }, + { + "epoch": 42.51, + "learning_rate": 1.668634617186768e-05, + "loss": 0.051, + "step": 151200 + }, + { + "epoch": 42.52, + "learning_rate": 1.6667603785961954e-05, + "loss": 0.0397, + "step": 151230 + }, + { + "epoch": 42.52, + "learning_rate": 1.6648861400056228e-05, + "loss": 0.0487, + "step": 151260 + }, + { + "epoch": 42.53, + "learning_rate": 1.6630119014150502e-05, + "loss": 0.0448, + "step": 151290 + }, + { + "epoch": 42.54, + "learning_rate": 1.6611376628244777e-05, + "loss": 0.0438, + "step": 151320 + }, + { + "epoch": 42.55, + "learning_rate": 1.659263424233905e-05, + "loss": 0.0492, + "step": 151350 + }, + { + "epoch": 42.56, + "learning_rate": 1.6573891856433325e-05, + "loss": 0.043, + "step": 151380 + }, + { + "epoch": 42.57, + "learning_rate": 1.65551494705276e-05, + "loss": 0.0486, + "step": 151410 + }, + { + "epoch": 42.58, + "learning_rate": 1.6536407084621873e-05, + "loss": 0.0469, + "step": 151440 + }, + { + "epoch": 42.58, + "learning_rate": 1.6517664698716148e-05, + "loss": 0.0445, + "step": 151470 + }, + { + "epoch": 42.59, + "learning_rate": 1.6498922312810422e-05, + "loss": 0.0519, + "step": 151500 + }, + { + "epoch": 42.6, + "learning_rate": 1.6480179926904696e-05, + "loss": 0.0429, + "step": 151530 + }, + { + "epoch": 42.61, + "learning_rate": 1.646206228719583e-05, + "loss": 0.0501, + "step": 151560 + }, + { + "epoch": 42.62, + "learning_rate": 1.64433199012901e-05, + "loss": 0.0467, + "step": 151590 + }, + { + "epoch": 42.63, + "learning_rate": 1.6424577515384375e-05, + "loss": 0.0463, + "step": 151620 + }, + { + "epoch": 42.63, + "learning_rate": 1.640583512947865e-05, + "loss": 0.0507, + "step": 151650 + }, + { + "epoch": 42.64, + "learning_rate": 1.6387092743572924e-05, + "loss": 0.0424, + "step": 151680 + }, + { + "epoch": 42.65, + "learning_rate": 1.6368350357667198e-05, + "loss": 0.0499, + "step": 151710 + }, + { + "epoch": 42.66, + "learning_rate": 1.6349607971761472e-05, + "loss": 0.0477, + "step": 151740 + }, + { + "epoch": 42.67, + "learning_rate": 1.633086558585575e-05, + "loss": 0.0471, + "step": 151770 + }, + { + "epoch": 42.68, + "learning_rate": 1.631212319995002e-05, + "loss": 0.0508, + "step": 151800 + }, + { + "epoch": 42.68, + "learning_rate": 1.6293380814044295e-05, + "loss": 0.044, + "step": 151830 + }, + { + "epoch": 42.69, + "learning_rate": 1.627463842813857e-05, + "loss": 0.0477, + "step": 151860 + }, + { + "epoch": 42.7, + "learning_rate": 1.6255896042232843e-05, + "loss": 0.0462, + "step": 151890 + }, + { + "epoch": 42.71, + "learning_rate": 1.6237153656327117e-05, + "loss": 0.0474, + "step": 151920 + }, + { + "epoch": 42.72, + "learning_rate": 1.621841127042139e-05, + "loss": 0.0489, + "step": 151950 + }, + { + "epoch": 42.73, + "learning_rate": 1.619966888451567e-05, + "loss": 0.04, + "step": 151980 + }, + { + "epoch": 42.74, + "learning_rate": 1.618092649860994e-05, + "loss": 0.0465, + "step": 152010 + }, + { + "epoch": 42.74, + "learning_rate": 1.6162184112704214e-05, + "loss": 0.0474, + "step": 152040 + }, + { + "epoch": 42.75, + "learning_rate": 1.6143441726798488e-05, + "loss": 0.0441, + "step": 152070 + }, + { + "epoch": 42.76, + "learning_rate": 1.6124699340892762e-05, + "loss": 0.0519, + "step": 152100 + }, + { + "epoch": 42.77, + "learning_rate": 1.6105956954987036e-05, + "loss": 0.039, + "step": 152130 + }, + { + "epoch": 42.78, + "learning_rate": 1.608721456908131e-05, + "loss": 0.0451, + "step": 152160 + }, + { + "epoch": 42.79, + "learning_rate": 1.6068472183175588e-05, + "loss": 0.0458, + "step": 152190 + }, + { + "epoch": 42.79, + "learning_rate": 1.604972979726986e-05, + "loss": 0.044, + "step": 152220 + }, + { + "epoch": 42.8, + "learning_rate": 1.6030987411364133e-05, + "loss": 0.0516, + "step": 152250 + }, + { + "epoch": 42.81, + "learning_rate": 1.6012245025458407e-05, + "loss": 0.041, + "step": 152280 + }, + { + "epoch": 42.82, + "learning_rate": 1.599350263955268e-05, + "loss": 0.0461, + "step": 152310 + }, + { + "epoch": 42.83, + "learning_rate": 1.5974760253646956e-05, + "loss": 0.0438, + "step": 152340 + }, + { + "epoch": 42.84, + "learning_rate": 1.595601786774123e-05, + "loss": 0.0424, + "step": 152370 + }, + { + "epoch": 42.84, + "learning_rate": 1.5937275481835508e-05, + "loss": 0.0495, + "step": 152400 + }, + { + "epoch": 42.85, + "learning_rate": 1.5918533095929782e-05, + "loss": 0.0437, + "step": 152430 + }, + { + "epoch": 42.86, + "learning_rate": 1.5899790710024053e-05, + "loss": 0.046, + "step": 152460 + }, + { + "epoch": 42.87, + "learning_rate": 1.5881048324118327e-05, + "loss": 0.0459, + "step": 152490 + }, + { + "epoch": 42.88, + "learning_rate": 1.58623059382126e-05, + "loss": 0.044, + "step": 152520 + }, + { + "epoch": 42.89, + "learning_rate": 1.5843563552306875e-05, + "loss": 0.0482, + "step": 152550 + }, + { + "epoch": 42.9, + "learning_rate": 1.582482116640115e-05, + "loss": 0.0415, + "step": 152580 + }, + { + "epoch": 42.9, + "learning_rate": 1.5806078780495427e-05, + "loss": 0.0499, + "step": 152610 + }, + { + "epoch": 42.91, + "learning_rate": 1.57873363945897e-05, + "loss": 0.0453, + "step": 152640 + }, + { + "epoch": 42.92, + "learning_rate": 1.5768594008683972e-05, + "loss": 0.0447, + "step": 152670 + }, + { + "epoch": 42.93, + "learning_rate": 1.5749851622778246e-05, + "loss": 0.0506, + "step": 152700 + }, + { + "epoch": 42.94, + "learning_rate": 1.573110923687252e-05, + "loss": 0.0413, + "step": 152730 + }, + { + "epoch": 42.95, + "learning_rate": 1.5712366850966794e-05, + "loss": 0.0484, + "step": 152760 + }, + { + "epoch": 42.95, + "learning_rate": 1.569362446506107e-05, + "loss": 0.0472, + "step": 152790 + }, + { + "epoch": 42.96, + "learning_rate": 1.5674882079155346e-05, + "loss": 0.0463, + "step": 152820 + }, + { + "epoch": 42.97, + "learning_rate": 1.565613969324962e-05, + "loss": 0.0486, + "step": 152850 + }, + { + "epoch": 42.98, + "learning_rate": 1.563739730734389e-05, + "loss": 0.0416, + "step": 152880 + }, + { + "epoch": 42.99, + "learning_rate": 1.5618654921438165e-05, + "loss": 0.0505, + "step": 152910 + }, + { + "epoch": 43.0, + "learning_rate": 1.559991253553244e-05, + "loss": 0.046, + "step": 152940 + }, + { + "epoch": 43.0, + "eval_loss": 0.11060696840286255, + "eval_runtime": 639.3277, + "eval_samples_per_second": 25.078, + "eval_steps_per_second": 0.785, + "eval_wer": 0.09347918059858339, + "step": 152951 + }, + { + "epoch": 43.01, + "learning_rate": 1.5581170149626714e-05, + "loss": 0.0466, + "step": 152970 + }, + { + "epoch": 43.01, + "learning_rate": 1.5562427763720988e-05, + "loss": 0.0497, + "step": 153000 + }, + { + "epoch": 43.02, + "learning_rate": 1.5543685377815266e-05, + "loss": 0.0419, + "step": 153030 + }, + { + "epoch": 43.03, + "learning_rate": 1.552494299190954e-05, + "loss": 0.0468, + "step": 153060 + }, + { + "epoch": 43.04, + "learning_rate": 1.5506200606003814e-05, + "loss": 0.0441, + "step": 153090 + }, + { + "epoch": 43.05, + "learning_rate": 1.5487458220098085e-05, + "loss": 0.0452, + "step": 153120 + }, + { + "epoch": 43.06, + "learning_rate": 1.546871583419236e-05, + "loss": 0.0439, + "step": 153150 + }, + { + "epoch": 43.06, + "learning_rate": 1.5449973448286633e-05, + "loss": 0.0423, + "step": 153180 + }, + { + "epoch": 43.07, + "learning_rate": 1.5431231062380907e-05, + "loss": 0.0489, + "step": 153210 + }, + { + "epoch": 43.08, + "learning_rate": 1.541248867647518e-05, + "loss": 0.0438, + "step": 153240 + }, + { + "epoch": 43.09, + "learning_rate": 1.539374629056946e-05, + "loss": 0.0439, + "step": 153270 + }, + { + "epoch": 43.1, + "learning_rate": 1.5375003904663733e-05, + "loss": 0.0492, + "step": 153300 + }, + { + "epoch": 43.11, + "learning_rate": 1.5356261518758004e-05, + "loss": 0.0436, + "step": 153330 + }, + { + "epoch": 43.11, + "learning_rate": 1.5337519132852278e-05, + "loss": 0.05, + "step": 153360 + }, + { + "epoch": 43.12, + "learning_rate": 1.5318776746946552e-05, + "loss": 0.042, + "step": 153390 + }, + { + "epoch": 43.13, + "learning_rate": 1.5300034361040827e-05, + "loss": 0.0491, + "step": 153420 + }, + { + "epoch": 43.14, + "learning_rate": 1.52812919751351e-05, + "loss": 0.0476, + "step": 153450 + }, + { + "epoch": 43.15, + "learning_rate": 1.526254958922938e-05, + "loss": 0.0406, + "step": 153480 + }, + { + "epoch": 43.16, + "learning_rate": 1.5243807203323651e-05, + "loss": 0.0474, + "step": 153510 + }, + { + "epoch": 43.17, + "learning_rate": 1.5225064817417925e-05, + "loss": 0.0413, + "step": 153540 + }, + { + "epoch": 43.17, + "learning_rate": 1.52063224315122e-05, + "loss": 0.0467, + "step": 153570 + }, + { + "epoch": 43.18, + "learning_rate": 1.5187580045606473e-05, + "loss": 0.0462, + "step": 153600 + }, + { + "epoch": 43.19, + "learning_rate": 1.5168837659700746e-05, + "loss": 0.0437, + "step": 153630 + }, + { + "epoch": 43.2, + "learning_rate": 1.515009527379502e-05, + "loss": 0.0502, + "step": 153660 + }, + { + "epoch": 43.21, + "learning_rate": 1.5131352887889296e-05, + "loss": 0.0437, + "step": 153690 + }, + { + "epoch": 43.22, + "learning_rate": 1.511261050198357e-05, + "loss": 0.0472, + "step": 153720 + }, + { + "epoch": 43.22, + "learning_rate": 1.5093868116077844e-05, + "loss": 0.0489, + "step": 153750 + }, + { + "epoch": 43.23, + "learning_rate": 1.5075125730172119e-05, + "loss": 0.0416, + "step": 153780 + }, + { + "epoch": 43.24, + "learning_rate": 1.5056383344266393e-05, + "loss": 0.049, + "step": 153810 + }, + { + "epoch": 43.25, + "learning_rate": 1.5037640958360665e-05, + "loss": 0.0433, + "step": 153840 + }, + { + "epoch": 43.26, + "learning_rate": 1.501889857245494e-05, + "loss": 0.0456, + "step": 153870 + }, + { + "epoch": 43.27, + "learning_rate": 1.5000156186549217e-05, + "loss": 0.0471, + "step": 153900 + }, + { + "epoch": 43.28, + "learning_rate": 1.498141380064349e-05, + "loss": 0.0421, + "step": 153930 + }, + { + "epoch": 43.28, + "learning_rate": 1.4962671414737764e-05, + "loss": 0.0486, + "step": 153960 + }, + { + "epoch": 43.29, + "learning_rate": 1.4943929028832038e-05, + "loss": 0.0429, + "step": 153990 + }, + { + "epoch": 43.3, + "learning_rate": 1.4925186642926312e-05, + "loss": 0.0475, + "step": 154020 + }, + { + "epoch": 43.31, + "learning_rate": 1.4906444257020585e-05, + "loss": 0.0498, + "step": 154050 + }, + { + "epoch": 43.32, + "learning_rate": 1.4887701871114859e-05, + "loss": 0.0424, + "step": 154080 + }, + { + "epoch": 43.33, + "learning_rate": 1.4868959485209136e-05, + "loss": 0.0492, + "step": 154110 + }, + { + "epoch": 43.33, + "learning_rate": 1.4850217099303409e-05, + "loss": 0.0445, + "step": 154140 + }, + { + "epoch": 43.34, + "learning_rate": 1.4831474713397683e-05, + "loss": 0.0498, + "step": 154170 + }, + { + "epoch": 43.35, + "learning_rate": 1.4812732327491957e-05, + "loss": 0.048, + "step": 154200 + }, + { + "epoch": 43.36, + "learning_rate": 1.4793989941586231e-05, + "loss": 0.0453, + "step": 154230 + }, + { + "epoch": 43.37, + "learning_rate": 1.4775247555680504e-05, + "loss": 0.0503, + "step": 154260 + }, + { + "epoch": 43.38, + "learning_rate": 1.4756505169774778e-05, + "loss": 0.0425, + "step": 154290 + }, + { + "epoch": 43.38, + "learning_rate": 1.4737762783869056e-05, + "loss": 0.0438, + "step": 154320 + }, + { + "epoch": 43.39, + "learning_rate": 1.4719020397963328e-05, + "loss": 0.0476, + "step": 154350 + }, + { + "epoch": 43.4, + "learning_rate": 1.4700278012057602e-05, + "loss": 0.0442, + "step": 154380 + }, + { + "epoch": 43.41, + "learning_rate": 1.4681535626151877e-05, + "loss": 0.0491, + "step": 154410 + }, + { + "epoch": 43.42, + "learning_rate": 1.466279324024615e-05, + "loss": 0.0404, + "step": 154440 + }, + { + "epoch": 43.43, + "learning_rate": 1.4644050854340425e-05, + "loss": 0.0502, + "step": 154470 + }, + { + "epoch": 43.44, + "learning_rate": 1.4625308468434698e-05, + "loss": 0.0447, + "step": 154500 + }, + { + "epoch": 43.44, + "learning_rate": 1.4606566082528975e-05, + "loss": 0.039, + "step": 154530 + }, + { + "epoch": 43.45, + "learning_rate": 1.458782369662325e-05, + "loss": 0.0487, + "step": 154560 + }, + { + "epoch": 43.46, + "learning_rate": 1.4569081310717522e-05, + "loss": 0.0406, + "step": 154590 + }, + { + "epoch": 43.47, + "learning_rate": 1.4550338924811796e-05, + "loss": 0.0464, + "step": 154620 + }, + { + "epoch": 43.48, + "learning_rate": 1.453159653890607e-05, + "loss": 0.0462, + "step": 154650 + }, + { + "epoch": 43.49, + "learning_rate": 1.4512854153000344e-05, + "loss": 0.0448, + "step": 154680 + }, + { + "epoch": 43.49, + "learning_rate": 1.4494111767094617e-05, + "loss": 0.0487, + "step": 154710 + }, + { + "epoch": 43.5, + "learning_rate": 1.4475369381188894e-05, + "loss": 0.041, + "step": 154740 + }, + { + "epoch": 43.51, + "learning_rate": 1.4456626995283169e-05, + "loss": 0.0486, + "step": 154770 + }, + { + "epoch": 43.52, + "learning_rate": 1.4437884609377441e-05, + "loss": 0.0459, + "step": 154800 + }, + { + "epoch": 43.53, + "learning_rate": 1.4419142223471715e-05, + "loss": 0.0438, + "step": 154830 + }, + { + "epoch": 43.54, + "learning_rate": 1.440039983756599e-05, + "loss": 0.0474, + "step": 154860 + }, + { + "epoch": 43.55, + "learning_rate": 1.4381657451660264e-05, + "loss": 0.0424, + "step": 154890 + }, + { + "epoch": 43.55, + "learning_rate": 1.4362915065754536e-05, + "loss": 0.044, + "step": 154920 + }, + { + "epoch": 43.56, + "learning_rate": 1.434417267984881e-05, + "loss": 0.047, + "step": 154950 + }, + { + "epoch": 43.57, + "learning_rate": 1.4325430293943088e-05, + "loss": 0.04, + "step": 154980 + }, + { + "epoch": 43.58, + "learning_rate": 1.430668790803736e-05, + "loss": 0.0476, + "step": 155010 + }, + { + "epoch": 43.59, + "learning_rate": 1.4287945522131635e-05, + "loss": 0.0435, + "step": 155040 + }, + { + "epoch": 43.6, + "learning_rate": 1.4269203136225909e-05, + "loss": 0.0465, + "step": 155070 + }, + { + "epoch": 43.6, + "learning_rate": 1.4250460750320183e-05, + "loss": 0.0462, + "step": 155100 + }, + { + "epoch": 43.61, + "learning_rate": 1.4231718364414457e-05, + "loss": 0.042, + "step": 155130 + }, + { + "epoch": 43.62, + "learning_rate": 1.421297597850873e-05, + "loss": 0.048, + "step": 155160 + }, + { + "epoch": 43.63, + "learning_rate": 1.4194233592603007e-05, + "loss": 0.0421, + "step": 155190 + }, + { + "epoch": 43.64, + "learning_rate": 1.417549120669728e-05, + "loss": 0.0489, + "step": 155220 + }, + { + "epoch": 43.65, + "learning_rate": 1.4156748820791554e-05, + "loss": 0.0486, + "step": 155250 + }, + { + "epoch": 43.65, + "learning_rate": 1.4138006434885828e-05, + "loss": 0.0413, + "step": 155280 + }, + { + "epoch": 43.66, + "learning_rate": 1.4119264048980102e-05, + "loss": 0.0502, + "step": 155310 + }, + { + "epoch": 43.67, + "learning_rate": 1.4100521663074377e-05, + "loss": 0.0429, + "step": 155340 + }, + { + "epoch": 43.68, + "learning_rate": 1.4081779277168649e-05, + "loss": 0.0465, + "step": 155370 + }, + { + "epoch": 43.69, + "learning_rate": 1.4063036891262927e-05, + "loss": 0.0493, + "step": 155400 + }, + { + "epoch": 43.7, + "learning_rate": 1.40442945053572e-05, + "loss": 0.0422, + "step": 155430 + }, + { + "epoch": 43.71, + "learning_rate": 1.4025552119451473e-05, + "loss": 0.0508, + "step": 155460 + }, + { + "epoch": 43.71, + "learning_rate": 1.4006809733545747e-05, + "loss": 0.0429, + "step": 155490 + }, + { + "epoch": 43.72, + "learning_rate": 1.3988067347640022e-05, + "loss": 0.0441, + "step": 155520 + }, + { + "epoch": 43.73, + "learning_rate": 1.3969324961734296e-05, + "loss": 0.0482, + "step": 155550 + }, + { + "epoch": 43.74, + "learning_rate": 1.3950582575828568e-05, + "loss": 0.0426, + "step": 155580 + }, + { + "epoch": 43.75, + "learning_rate": 1.3931840189922846e-05, + "loss": 0.0465, + "step": 155610 + }, + { + "epoch": 43.76, + "learning_rate": 1.391309780401712e-05, + "loss": 0.0429, + "step": 155640 + }, + { + "epoch": 43.76, + "learning_rate": 1.3894355418111393e-05, + "loss": 0.0439, + "step": 155670 + }, + { + "epoch": 43.77, + "learning_rate": 1.3875613032205667e-05, + "loss": 0.0464, + "step": 155700 + }, + { + "epoch": 43.78, + "learning_rate": 1.3856870646299941e-05, + "loss": 0.0428, + "step": 155730 + }, + { + "epoch": 43.79, + "learning_rate": 1.3838128260394215e-05, + "loss": 0.0453, + "step": 155760 + }, + { + "epoch": 43.8, + "learning_rate": 1.3819385874488488e-05, + "loss": 0.0443, + "step": 155790 + }, + { + "epoch": 43.81, + "learning_rate": 1.3800643488582765e-05, + "loss": 0.0434, + "step": 155820 + }, + { + "epoch": 43.81, + "learning_rate": 1.378190110267704e-05, + "loss": 0.0427, + "step": 155850 + }, + { + "epoch": 43.82, + "learning_rate": 1.3763158716771312e-05, + "loss": 0.0423, + "step": 155880 + }, + { + "epoch": 43.83, + "learning_rate": 1.3744416330865586e-05, + "loss": 0.0473, + "step": 155910 + }, + { + "epoch": 43.84, + "learning_rate": 1.372567394495986e-05, + "loss": 0.0414, + "step": 155940 + }, + { + "epoch": 43.85, + "learning_rate": 1.3706931559054135e-05, + "loss": 0.0451, + "step": 155970 + }, + { + "epoch": 43.86, + "learning_rate": 1.3688189173148409e-05, + "loss": 0.0461, + "step": 156000 + }, + { + "epoch": 43.87, + "learning_rate": 1.3669446787242685e-05, + "loss": 0.0423, + "step": 156030 + }, + { + "epoch": 43.87, + "learning_rate": 1.3650704401336959e-05, + "loss": 0.0471, + "step": 156060 + }, + { + "epoch": 43.88, + "learning_rate": 1.3632586761628088e-05, + "loss": 0.0435, + "step": 156090 + }, + { + "epoch": 43.89, + "learning_rate": 1.3613844375722362e-05, + "loss": 0.0454, + "step": 156120 + }, + { + "epoch": 43.9, + "learning_rate": 1.3595101989816638e-05, + "loss": 0.0468, + "step": 156150 + }, + { + "epoch": 43.91, + "learning_rate": 1.3576359603910912e-05, + "loss": 0.0399, + "step": 156180 + }, + { + "epoch": 43.92, + "learning_rate": 1.3557617218005186e-05, + "loss": 0.0487, + "step": 156210 + }, + { + "epoch": 43.92, + "learning_rate": 1.353887483209946e-05, + "loss": 0.0442, + "step": 156240 + }, + { + "epoch": 43.93, + "learning_rate": 1.3520132446193735e-05, + "loss": 0.046, + "step": 156270 + }, + { + "epoch": 43.94, + "learning_rate": 1.3501390060288007e-05, + "loss": 0.0476, + "step": 156300 + }, + { + "epoch": 43.95, + "learning_rate": 1.3482647674382281e-05, + "loss": 0.0397, + "step": 156330 + }, + { + "epoch": 43.96, + "learning_rate": 1.3463905288476559e-05, + "loss": 0.0529, + "step": 156360 + }, + { + "epoch": 43.97, + "learning_rate": 1.3445162902570832e-05, + "loss": 0.0414, + "step": 156390 + }, + { + "epoch": 43.98, + "learning_rate": 1.3426420516665106e-05, + "loss": 0.0452, + "step": 156420 + }, + { + "epoch": 43.98, + "learning_rate": 1.340767813075938e-05, + "loss": 0.0467, + "step": 156450 + }, + { + "epoch": 43.99, + "learning_rate": 1.3388935744853654e-05, + "loss": 0.0447, + "step": 156480 + }, + { + "epoch": 44.0, + "eval_loss": 0.10826382040977478, + "eval_runtime": 640.1758, + "eval_samples_per_second": 25.045, + "eval_steps_per_second": 0.784, + "eval_wer": 0.09191653132804717, + "step": 156508 + }, + { + "epoch": 44.0, + "learning_rate": 1.3370193358947927e-05, + "loss": 0.0516, + "step": 156510 + }, + { + "epoch": 44.01, + "learning_rate": 1.33514509730422e-05, + "loss": 0.0367, + "step": 156540 + }, + { + "epoch": 44.02, + "learning_rate": 1.3332708587136478e-05, + "loss": 0.0511, + "step": 156570 + }, + { + "epoch": 44.03, + "learning_rate": 1.3313966201230751e-05, + "loss": 0.0436, + "step": 156600 + }, + { + "epoch": 44.03, + "learning_rate": 1.3295223815325025e-05, + "loss": 0.0452, + "step": 156630 + }, + { + "epoch": 44.04, + "learning_rate": 1.32764814294193e-05, + "loss": 0.0485, + "step": 156660 + }, + { + "epoch": 44.05, + "learning_rate": 1.3257739043513573e-05, + "loss": 0.0371, + "step": 156690 + }, + { + "epoch": 44.06, + "learning_rate": 1.3238996657607846e-05, + "loss": 0.0472, + "step": 156720 + }, + { + "epoch": 44.07, + "learning_rate": 1.322025427170212e-05, + "loss": 0.0421, + "step": 156750 + }, + { + "epoch": 44.08, + "learning_rate": 1.3201511885796398e-05, + "loss": 0.0452, + "step": 156780 + }, + { + "epoch": 44.08, + "learning_rate": 1.318276949989067e-05, + "loss": 0.049, + "step": 156810 + }, + { + "epoch": 44.09, + "learning_rate": 1.3164027113984944e-05, + "loss": 0.0384, + "step": 156840 + }, + { + "epoch": 44.1, + "learning_rate": 1.3145284728079219e-05, + "loss": 0.0447, + "step": 156870 + }, + { + "epoch": 44.11, + "learning_rate": 1.3126542342173493e-05, + "loss": 0.044, + "step": 156900 + }, + { + "epoch": 44.12, + "learning_rate": 1.3107799956267767e-05, + "loss": 0.0461, + "step": 156930 + }, + { + "epoch": 44.13, + "learning_rate": 1.308905757036204e-05, + "loss": 0.0471, + "step": 156960 + }, + { + "epoch": 44.14, + "learning_rate": 1.3070315184456317e-05, + "loss": 0.0404, + "step": 156990 + }, + { + "epoch": 44.14, + "learning_rate": 1.305157279855059e-05, + "loss": 0.0466, + "step": 157020 + }, + { + "epoch": 44.15, + "learning_rate": 1.3032830412644864e-05, + "loss": 0.0443, + "step": 157050 + }, + { + "epoch": 44.16, + "learning_rate": 1.3014088026739138e-05, + "loss": 0.0435, + "step": 157080 + }, + { + "epoch": 44.17, + "learning_rate": 1.2995345640833412e-05, + "loss": 0.0477, + "step": 157110 + }, + { + "epoch": 44.18, + "learning_rate": 1.2976603254927686e-05, + "loss": 0.0364, + "step": 157140 + }, + { + "epoch": 44.19, + "learning_rate": 1.2957860869021959e-05, + "loss": 0.049, + "step": 157170 + }, + { + "epoch": 44.19, + "learning_rate": 1.2939118483116236e-05, + "loss": 0.0432, + "step": 157200 + }, + { + "epoch": 44.2, + "learning_rate": 1.292037609721051e-05, + "loss": 0.0476, + "step": 157230 + }, + { + "epoch": 44.21, + "learning_rate": 1.2901633711304783e-05, + "loss": 0.051, + "step": 157260 + }, + { + "epoch": 44.22, + "learning_rate": 1.2882891325399057e-05, + "loss": 0.042, + "step": 157290 + }, + { + "epoch": 44.23, + "learning_rate": 1.2864148939493331e-05, + "loss": 0.0464, + "step": 157320 + }, + { + "epoch": 44.24, + "learning_rate": 1.2845406553587606e-05, + "loss": 0.0425, + "step": 157350 + }, + { + "epoch": 44.25, + "learning_rate": 1.2826664167681878e-05, + "loss": 0.0463, + "step": 157380 + }, + { + "epoch": 44.25, + "learning_rate": 1.2807921781776156e-05, + "loss": 0.0507, + "step": 157410 + }, + { + "epoch": 44.26, + "learning_rate": 1.278917939587043e-05, + "loss": 0.0378, + "step": 157440 + }, + { + "epoch": 44.27, + "learning_rate": 1.2770437009964702e-05, + "loss": 0.0477, + "step": 157470 + }, + { + "epoch": 44.28, + "learning_rate": 1.2751694624058977e-05, + "loss": 0.0433, + "step": 157500 + }, + { + "epoch": 44.29, + "learning_rate": 1.273295223815325e-05, + "loss": 0.0446, + "step": 157530 + }, + { + "epoch": 44.3, + "learning_rate": 1.2714209852247525e-05, + "loss": 0.0527, + "step": 157560 + }, + { + "epoch": 44.3, + "learning_rate": 1.2695467466341797e-05, + "loss": 0.0397, + "step": 157590 + }, + { + "epoch": 44.31, + "learning_rate": 1.2676725080436072e-05, + "loss": 0.0475, + "step": 157620 + }, + { + "epoch": 44.32, + "learning_rate": 1.265798269453035e-05, + "loss": 0.0446, + "step": 157650 + }, + { + "epoch": 44.33, + "learning_rate": 1.2639240308624622e-05, + "loss": 0.0479, + "step": 157680 + }, + { + "epoch": 44.34, + "learning_rate": 1.2620497922718896e-05, + "loss": 0.0489, + "step": 157710 + }, + { + "epoch": 44.35, + "learning_rate": 1.260175553681317e-05, + "loss": 0.0411, + "step": 157740 + }, + { + "epoch": 44.35, + "learning_rate": 1.2583013150907444e-05, + "loss": 0.0474, + "step": 157770 + }, + { + "epoch": 44.36, + "learning_rate": 1.2564270765001718e-05, + "loss": 0.0416, + "step": 157800 + }, + { + "epoch": 44.37, + "learning_rate": 1.2545528379095991e-05, + "loss": 0.0452, + "step": 157830 + }, + { + "epoch": 44.38, + "learning_rate": 1.2526785993190269e-05, + "loss": 0.0491, + "step": 157860 + }, + { + "epoch": 44.39, + "learning_rate": 1.2508043607284543e-05, + "loss": 0.0395, + "step": 157890 + }, + { + "epoch": 44.4, + "learning_rate": 1.2489301221378815e-05, + "loss": 0.0451, + "step": 157920 + }, + { + "epoch": 44.41, + "learning_rate": 1.247055883547309e-05, + "loss": 0.0436, + "step": 157950 + }, + { + "epoch": 44.41, + "learning_rate": 1.2451816449567364e-05, + "loss": 0.0451, + "step": 157980 + }, + { + "epoch": 44.42, + "learning_rate": 1.2433074063661638e-05, + "loss": 0.0506, + "step": 158010 + }, + { + "epoch": 44.43, + "learning_rate": 1.2414331677755912e-05, + "loss": 0.0404, + "step": 158040 + }, + { + "epoch": 44.44, + "learning_rate": 1.2395589291850186e-05, + "loss": 0.0471, + "step": 158070 + }, + { + "epoch": 44.45, + "learning_rate": 1.237684690594446e-05, + "loss": 0.0426, + "step": 158100 + }, + { + "epoch": 44.46, + "learning_rate": 1.2358104520038735e-05, + "loss": 0.0452, + "step": 158130 + }, + { + "epoch": 44.46, + "learning_rate": 1.2339362134133009e-05, + "loss": 0.0475, + "step": 158160 + }, + { + "epoch": 44.47, + "learning_rate": 1.2320619748227283e-05, + "loss": 0.0385, + "step": 158190 + }, + { + "epoch": 44.48, + "learning_rate": 1.2301877362321559e-05, + "loss": 0.05, + "step": 158220 + }, + { + "epoch": 44.49, + "learning_rate": 1.2283134976415831e-05, + "loss": 0.0444, + "step": 158250 + }, + { + "epoch": 44.5, + "learning_rate": 1.2264392590510106e-05, + "loss": 0.0439, + "step": 158280 + }, + { + "epoch": 44.51, + "learning_rate": 1.224565020460438e-05, + "loss": 0.0497, + "step": 158310 + }, + { + "epoch": 44.51, + "learning_rate": 1.2226907818698654e-05, + "loss": 0.0392, + "step": 158340 + }, + { + "epoch": 44.52, + "learning_rate": 1.2208165432792928e-05, + "loss": 0.0483, + "step": 158370 + }, + { + "epoch": 44.53, + "learning_rate": 1.2189423046887202e-05, + "loss": 0.0432, + "step": 158400 + }, + { + "epoch": 44.54, + "learning_rate": 1.2170680660981478e-05, + "loss": 0.0439, + "step": 158430 + }, + { + "epoch": 44.55, + "learning_rate": 1.215193827507575e-05, + "loss": 0.0471, + "step": 158460 + }, + { + "epoch": 44.56, + "learning_rate": 1.2133195889170025e-05, + "loss": 0.0387, + "step": 158490 + }, + { + "epoch": 44.57, + "learning_rate": 1.2114453503264299e-05, + "loss": 0.0441, + "step": 158520 + }, + { + "epoch": 44.57, + "learning_rate": 1.2095711117358573e-05, + "loss": 0.0428, + "step": 158550 + }, + { + "epoch": 44.58, + "learning_rate": 1.2076968731452847e-05, + "loss": 0.0413, + "step": 158580 + }, + { + "epoch": 44.59, + "learning_rate": 1.2058226345547122e-05, + "loss": 0.0464, + "step": 158610 + }, + { + "epoch": 44.6, + "learning_rate": 1.2039483959641398e-05, + "loss": 0.04, + "step": 158640 + }, + { + "epoch": 44.61, + "learning_rate": 1.202074157373567e-05, + "loss": 0.0488, + "step": 158670 + }, + { + "epoch": 44.62, + "learning_rate": 1.2001999187829944e-05, + "loss": 0.0424, + "step": 158700 + }, + { + "epoch": 44.62, + "learning_rate": 1.1983256801924218e-05, + "loss": 0.0408, + "step": 158730 + }, + { + "epoch": 44.63, + "learning_rate": 1.1964514416018494e-05, + "loss": 0.0476, + "step": 158760 + }, + { + "epoch": 44.64, + "learning_rate": 1.1945772030112767e-05, + "loss": 0.0405, + "step": 158790 + }, + { + "epoch": 44.65, + "learning_rate": 1.1927029644207041e-05, + "loss": 0.0491, + "step": 158820 + }, + { + "epoch": 44.66, + "learning_rate": 1.1908287258301315e-05, + "loss": 0.0407, + "step": 158850 + }, + { + "epoch": 44.67, + "learning_rate": 1.188954487239559e-05, + "loss": 0.045, + "step": 158880 + }, + { + "epoch": 44.68, + "learning_rate": 1.1870802486489864e-05, + "loss": 0.0477, + "step": 158910 + }, + { + "epoch": 44.68, + "learning_rate": 1.1852060100584138e-05, + "loss": 0.04, + "step": 158940 + }, + { + "epoch": 44.69, + "learning_rate": 1.1833317714678414e-05, + "loss": 0.0465, + "step": 158970 + }, + { + "epoch": 44.7, + "learning_rate": 1.1814575328772686e-05, + "loss": 0.0441, + "step": 159000 + }, + { + "epoch": 44.71, + "learning_rate": 1.179583294286696e-05, + "loss": 0.0468, + "step": 159030 + }, + { + "epoch": 44.72, + "learning_rate": 1.1777090556961234e-05, + "loss": 0.0484, + "step": 159060 + }, + { + "epoch": 44.73, + "learning_rate": 1.175834817105551e-05, + "loss": 0.0381, + "step": 159090 + }, + { + "epoch": 44.73, + "learning_rate": 1.1739605785149783e-05, + "loss": 0.0469, + "step": 159120 + }, + { + "epoch": 44.74, + "learning_rate": 1.1720863399244057e-05, + "loss": 0.043, + "step": 159150 + }, + { + "epoch": 44.75, + "learning_rate": 1.1702121013338333e-05, + "loss": 0.0463, + "step": 159180 + }, + { + "epoch": 44.76, + "learning_rate": 1.1683378627432605e-05, + "loss": 0.0472, + "step": 159210 + }, + { + "epoch": 44.77, + "learning_rate": 1.166463624152688e-05, + "loss": 0.0415, + "step": 159240 + }, + { + "epoch": 44.78, + "learning_rate": 1.1645893855621154e-05, + "loss": 0.051, + "step": 159270 + }, + { + "epoch": 44.78, + "learning_rate": 1.162715146971543e-05, + "loss": 0.0413, + "step": 159300 + }, + { + "epoch": 44.79, + "learning_rate": 1.1608409083809702e-05, + "loss": 0.0423, + "step": 159330 + }, + { + "epoch": 44.8, + "learning_rate": 1.1589666697903976e-05, + "loss": 0.0487, + "step": 159360 + }, + { + "epoch": 44.81, + "learning_rate": 1.1570924311998252e-05, + "loss": 0.0401, + "step": 159390 + }, + { + "epoch": 44.82, + "learning_rate": 1.1552181926092526e-05, + "loss": 0.0482, + "step": 159420 + }, + { + "epoch": 44.83, + "learning_rate": 1.1533439540186799e-05, + "loss": 0.0414, + "step": 159450 + }, + { + "epoch": 44.84, + "learning_rate": 1.1514697154281073e-05, + "loss": 0.0461, + "step": 159480 + }, + { + "epoch": 44.84, + "learning_rate": 1.1496579514572206e-05, + "loss": 0.0478, + "step": 159510 + }, + { + "epoch": 44.85, + "learning_rate": 1.147783712866648e-05, + "loss": 0.0363, + "step": 159540 + }, + { + "epoch": 44.86, + "learning_rate": 1.1459094742760754e-05, + "loss": 0.0434, + "step": 159570 + }, + { + "epoch": 44.87, + "learning_rate": 1.1440352356855028e-05, + "loss": 0.0419, + "step": 159600 + }, + { + "epoch": 44.88, + "learning_rate": 1.1421609970949302e-05, + "loss": 0.0468, + "step": 159630 + }, + { + "epoch": 44.89, + "learning_rate": 1.1402867585043577e-05, + "loss": 0.0493, + "step": 159660 + }, + { + "epoch": 44.89, + "learning_rate": 1.138412519913785e-05, + "loss": 0.0406, + "step": 159690 + }, + { + "epoch": 44.9, + "learning_rate": 1.1365382813232125e-05, + "loss": 0.0461, + "step": 159720 + }, + { + "epoch": 44.91, + "learning_rate": 1.13466404273264e-05, + "loss": 0.0432, + "step": 159750 + }, + { + "epoch": 44.92, + "learning_rate": 1.1327898041420673e-05, + "loss": 0.0423, + "step": 159780 + }, + { + "epoch": 44.93, + "learning_rate": 1.1309155655514948e-05, + "loss": 0.0472, + "step": 159810 + }, + { + "epoch": 44.94, + "learning_rate": 1.1290413269609222e-05, + "loss": 0.0405, + "step": 159840 + }, + { + "epoch": 44.95, + "learning_rate": 1.1271670883703496e-05, + "loss": 0.0463, + "step": 159870 + }, + { + "epoch": 44.95, + "learning_rate": 1.125292849779777e-05, + "loss": 0.0435, + "step": 159900 + }, + { + "epoch": 44.96, + "learning_rate": 1.1234186111892044e-05, + "loss": 0.045, + "step": 159930 + }, + { + "epoch": 44.97, + "learning_rate": 1.1215443725986319e-05, + "loss": 0.0495, + "step": 159960 + }, + { + "epoch": 44.98, + "learning_rate": 1.1196701340080593e-05, + "loss": 0.0389, + "step": 159990 + }, + { + "epoch": 44.99, + "learning_rate": 1.1177958954174867e-05, + "loss": 0.0469, + "step": 160020 + }, + { + "epoch": 45.0, + "learning_rate": 1.1159216568269141e-05, + "loss": 0.0434, + "step": 160050 + }, + { + "epoch": 45.0, + "eval_loss": 0.10925392806529999, + "eval_runtime": 640.2824, + "eval_samples_per_second": 25.041, + "eval_steps_per_second": 0.784, + "eval_wer": 0.09092025712063107, + "step": 160065 } ], "max_steps": 177850, "num_train_epochs": 50, - "total_flos": 2.5993382597195276e+21, + "total_flos": 3.5445415622885476e+21, "trial_name": null, "trial_params": null }