diff --git "a/trainer_state.json" "b/trainer_state.json" new file mode 100644--- /dev/null +++ "b/trainer_state.json" @@ -0,0 +1,11470 @@ +{ + "best_metric": 24.71689240755159, + "best_model_checkpoint": "output_dir_run_2/checkpoint-42000", + "epoch": 1.834423353006859, + "global_step": 46000, + "is_hyper_param_search": false, + "is_local_process_zero": true, + "is_world_process_zero": true, + "log_history": [ + { + "epoch": 0.0, + "learning_rate": 4.4e-07, + "loss": 3.8256, + "step": 25 + }, + { + "epoch": 0.0, + "learning_rate": 9.200000000000001e-07, + "loss": 3.5128, + "step": 50 + }, + { + "epoch": 0.0, + "learning_rate": 1.42e-06, + "loss": 2.8953, + "step": 75 + }, + { + "epoch": 0.0, + "learning_rate": 1.9200000000000003e-06, + "loss": 2.3779, + "step": 100 + }, + { + "epoch": 0.0, + "learning_rate": 2.42e-06, + "loss": 2.065, + "step": 125 + }, + { + "epoch": 0.01, + "learning_rate": 2.92e-06, + "loss": 1.8663, + "step": 150 + }, + { + "epoch": 0.01, + "learning_rate": 3.4200000000000007e-06, + "loss": 1.6813, + "step": 175 + }, + { + "epoch": 0.01, + "learning_rate": 3.920000000000001e-06, + "loss": 1.6136, + "step": 200 + }, + { + "epoch": 0.01, + "learning_rate": 4.42e-06, + "loss": 1.5066, + "step": 225 + }, + { + "epoch": 0.01, + "learning_rate": 4.92e-06, + "loss": 1.3971, + "step": 250 + }, + { + "epoch": 0.01, + "learning_rate": 5.420000000000001e-06, + "loss": 1.3437, + "step": 275 + }, + { + "epoch": 0.01, + "learning_rate": 5.92e-06, + "loss": 1.2227, + "step": 300 + }, + { + "epoch": 0.01, + "learning_rate": 6.42e-06, + "loss": 1.2204, + "step": 325 + }, + { + "epoch": 0.01, + "learning_rate": 6.92e-06, + "loss": 1.1546, + "step": 350 + }, + { + "epoch": 0.01, + "learning_rate": 7.420000000000001e-06, + "loss": 1.1521, + "step": 375 + }, + { + "epoch": 0.02, + "learning_rate": 7.92e-06, + "loss": 1.0848, + "step": 400 + }, + { + "epoch": 0.02, + "learning_rate": 8.42e-06, + "loss": 1.0626, + "step": 425 + }, + { + "epoch": 0.02, + "learning_rate": 8.920000000000001e-06, + "loss": 1.0112, + "step": 450 + }, + { + "epoch": 0.02, + "learning_rate": 9.42e-06, + "loss": 0.988, + "step": 475 + }, + { + "epoch": 0.02, + "learning_rate": 9.920000000000002e-06, + "loss": 0.9656, + "step": 500 + }, + { + "epoch": 0.02, + "learning_rate": 9.99957957957958e-06, + "loss": 0.9418, + "step": 525 + }, + { + "epoch": 0.02, + "learning_rate": 9.99907907907908e-06, + "loss": 0.9225, + "step": 550 + }, + { + "epoch": 0.02, + "learning_rate": 9.99857857857858e-06, + "loss": 0.9479, + "step": 575 + }, + { + "epoch": 0.02, + "learning_rate": 9.998078078078079e-06, + "loss": 0.8927, + "step": 600 + }, + { + "epoch": 0.02, + "learning_rate": 9.997577577577578e-06, + "loss": 0.8688, + "step": 625 + }, + { + "epoch": 0.03, + "learning_rate": 9.997077077077078e-06, + "loss": 0.8846, + "step": 650 + }, + { + "epoch": 0.03, + "learning_rate": 9.996576576576577e-06, + "loss": 0.8514, + "step": 675 + }, + { + "epoch": 0.03, + "learning_rate": 9.996076076076076e-06, + "loss": 0.8254, + "step": 700 + }, + { + "epoch": 0.03, + "learning_rate": 9.995575575575577e-06, + "loss": 0.8167, + "step": 725 + }, + { + "epoch": 0.03, + "learning_rate": 9.995075075075076e-06, + "loss": 0.7695, + "step": 750 + }, + { + "epoch": 0.03, + "learning_rate": 9.994574574574576e-06, + "loss": 0.8109, + "step": 775 + }, + { + "epoch": 0.03, + "learning_rate": 9.994074074074075e-06, + "loss": 0.7718, + "step": 800 + }, + { + "epoch": 0.03, + "learning_rate": 9.993573573573574e-06, + "loss": 0.7937, + "step": 825 + }, + { + "epoch": 0.03, + "learning_rate": 9.993073073073074e-06, + "loss": 0.7566, + "step": 850 + }, + { + "epoch": 0.03, + "learning_rate": 9.992572572572573e-06, + "loss": 0.7627, + "step": 875 + }, + { + "epoch": 0.04, + "learning_rate": 9.992072072072074e-06, + "loss": 0.7564, + "step": 900 + }, + { + "epoch": 0.04, + "learning_rate": 9.991571571571572e-06, + "loss": 0.766, + "step": 925 + }, + { + "epoch": 0.04, + "learning_rate": 9.991071071071073e-06, + "loss": 0.7255, + "step": 950 + }, + { + "epoch": 0.04, + "learning_rate": 9.990570570570572e-06, + "loss": 0.7385, + "step": 975 + }, + { + "epoch": 0.04, + "learning_rate": 9.990070070070071e-06, + "loss": 0.7455, + "step": 1000 + }, + { + "epoch": 0.04, + "eval_loss": 0.9031199216842651, + "eval_runtime": 2867.5101, + "eval_samples_per_second": 5.654, + "eval_steps_per_second": 0.142, + "eval_wer": 58.282005226601704, + "step": 1000 + }, + { + "epoch": 0.04, + "learning_rate": 9.98956956956957e-06, + "loss": 0.7141, + "step": 1025 + }, + { + "epoch": 0.04, + "learning_rate": 9.98906906906907e-06, + "loss": 0.7036, + "step": 1050 + }, + { + "epoch": 0.04, + "learning_rate": 9.988568568568569e-06, + "loss": 0.7157, + "step": 1075 + }, + { + "epoch": 0.04, + "learning_rate": 9.988068068068068e-06, + "loss": 0.7362, + "step": 1100 + }, + { + "epoch": 0.04, + "learning_rate": 9.98756756756757e-06, + "loss": 0.7134, + "step": 1125 + }, + { + "epoch": 0.05, + "learning_rate": 9.987067067067067e-06, + "loss": 0.6704, + "step": 1150 + }, + { + "epoch": 0.05, + "learning_rate": 9.986566566566568e-06, + "loss": 0.6907, + "step": 1175 + }, + { + "epoch": 0.05, + "learning_rate": 9.986066066066067e-06, + "loss": 0.6851, + "step": 1200 + }, + { + "epoch": 0.05, + "learning_rate": 9.985565565565567e-06, + "loss": 0.7214, + "step": 1225 + }, + { + "epoch": 0.05, + "learning_rate": 9.985065065065066e-06, + "loss": 0.6876, + "step": 1250 + }, + { + "epoch": 0.05, + "learning_rate": 9.984564564564565e-06, + "loss": 0.6627, + "step": 1275 + }, + { + "epoch": 0.05, + "learning_rate": 9.984064064064064e-06, + "loss": 0.6739, + "step": 1300 + }, + { + "epoch": 0.05, + "learning_rate": 9.983563563563564e-06, + "loss": 0.6629, + "step": 1325 + }, + { + "epoch": 0.05, + "learning_rate": 9.983063063063065e-06, + "loss": 0.6493, + "step": 1350 + }, + { + "epoch": 0.05, + "learning_rate": 9.982562562562564e-06, + "loss": 0.6512, + "step": 1375 + }, + { + "epoch": 0.06, + "learning_rate": 9.982062062062063e-06, + "loss": 0.6481, + "step": 1400 + }, + { + "epoch": 0.06, + "learning_rate": 9.981561561561563e-06, + "loss": 0.6459, + "step": 1425 + }, + { + "epoch": 0.06, + "learning_rate": 9.981061061061062e-06, + "loss": 0.643, + "step": 1450 + }, + { + "epoch": 0.06, + "learning_rate": 9.980560560560561e-06, + "loss": 0.6344, + "step": 1475 + }, + { + "epoch": 0.06, + "learning_rate": 9.98006006006006e-06, + "loss": 0.6312, + "step": 1500 + }, + { + "epoch": 0.06, + "learning_rate": 9.979559559559561e-06, + "loss": 0.6587, + "step": 1525 + }, + { + "epoch": 0.06, + "learning_rate": 9.979059059059059e-06, + "loss": 0.6156, + "step": 1550 + }, + { + "epoch": 0.06, + "learning_rate": 9.97855855855856e-06, + "loss": 0.64, + "step": 1575 + }, + { + "epoch": 0.06, + "learning_rate": 9.97805805805806e-06, + "loss": 0.5947, + "step": 1600 + }, + { + "epoch": 0.06, + "learning_rate": 9.977557557557559e-06, + "loss": 0.6496, + "step": 1625 + }, + { + "epoch": 0.07, + "learning_rate": 9.977057057057058e-06, + "loss": 0.6434, + "step": 1650 + }, + { + "epoch": 0.07, + "learning_rate": 9.976556556556557e-06, + "loss": 0.5917, + "step": 1675 + }, + { + "epoch": 0.07, + "learning_rate": 9.976056056056057e-06, + "loss": 0.6057, + "step": 1700 + }, + { + "epoch": 0.07, + "learning_rate": 9.975555555555556e-06, + "loss": 0.6132, + "step": 1725 + }, + { + "epoch": 0.07, + "learning_rate": 9.975055055055057e-06, + "loss": 0.5929, + "step": 1750 + }, + { + "epoch": 0.07, + "learning_rate": 9.974554554554554e-06, + "loss": 0.6166, + "step": 1775 + }, + { + "epoch": 0.07, + "learning_rate": 9.974054054054055e-06, + "loss": 0.5866, + "step": 1800 + }, + { + "epoch": 0.07, + "learning_rate": 9.973553553553555e-06, + "loss": 0.6123, + "step": 1825 + }, + { + "epoch": 0.07, + "learning_rate": 9.973053053053054e-06, + "loss": 0.594, + "step": 1850 + }, + { + "epoch": 0.07, + "learning_rate": 9.972552552552553e-06, + "loss": 0.5949, + "step": 1875 + }, + { + "epoch": 0.08, + "learning_rate": 9.972052052052053e-06, + "loss": 0.5862, + "step": 1900 + }, + { + "epoch": 0.08, + "learning_rate": 9.971551551551552e-06, + "loss": 0.609, + "step": 1925 + }, + { + "epoch": 0.08, + "learning_rate": 9.971051051051051e-06, + "loss": 0.5688, + "step": 1950 + }, + { + "epoch": 0.08, + "learning_rate": 9.970550550550552e-06, + "loss": 0.592, + "step": 1975 + }, + { + "epoch": 0.08, + "learning_rate": 9.970050050050052e-06, + "loss": 0.5906, + "step": 2000 + }, + { + "epoch": 0.08, + "eval_loss": 0.7455159425735474, + "eval_runtime": 3054.18, + "eval_samples_per_second": 5.308, + "eval_steps_per_second": 0.133, + "eval_wer": 50.6001341340261, + "step": 2000 + }, + { + "epoch": 0.08, + "learning_rate": 9.96954954954955e-06, + "loss": 0.5755, + "step": 2025 + }, + { + "epoch": 0.08, + "learning_rate": 9.96904904904905e-06, + "loss": 0.5761, + "step": 2050 + }, + { + "epoch": 0.08, + "learning_rate": 9.96854854854855e-06, + "loss": 0.5832, + "step": 2075 + }, + { + "epoch": 0.08, + "learning_rate": 9.968048048048049e-06, + "loss": 0.5661, + "step": 2100 + }, + { + "epoch": 0.08, + "learning_rate": 9.967547547547548e-06, + "loss": 0.5906, + "step": 2125 + }, + { + "epoch": 0.09, + "learning_rate": 9.967047047047049e-06, + "loss": 0.5769, + "step": 2150 + }, + { + "epoch": 0.09, + "learning_rate": 9.966546546546547e-06, + "loss": 0.5491, + "step": 2175 + }, + { + "epoch": 0.09, + "learning_rate": 9.966046046046048e-06, + "loss": 0.5794, + "step": 2200 + }, + { + "epoch": 0.09, + "learning_rate": 9.965545545545547e-06, + "loss": 0.5319, + "step": 2225 + }, + { + "epoch": 0.09, + "learning_rate": 9.965045045045044e-06, + "loss": 0.5656, + "step": 2250 + }, + { + "epoch": 0.09, + "learning_rate": 9.964544544544545e-06, + "loss": 0.5714, + "step": 2275 + }, + { + "epoch": 0.09, + "learning_rate": 9.964044044044045e-06, + "loss": 0.5667, + "step": 2300 + }, + { + "epoch": 0.09, + "learning_rate": 9.963543543543544e-06, + "loss": 0.5628, + "step": 2325 + }, + { + "epoch": 0.09, + "learning_rate": 9.963043043043043e-06, + "loss": 0.5816, + "step": 2350 + }, + { + "epoch": 0.09, + "learning_rate": 9.962542542542544e-06, + "loss": 0.5713, + "step": 2375 + }, + { + "epoch": 0.1, + "learning_rate": 9.962042042042042e-06, + "loss": 0.5513, + "step": 2400 + }, + { + "epoch": 0.1, + "learning_rate": 9.961541541541543e-06, + "loss": 0.5416, + "step": 2425 + }, + { + "epoch": 0.1, + "learning_rate": 9.961041041041042e-06, + "loss": 0.5273, + "step": 2450 + }, + { + "epoch": 0.1, + "learning_rate": 9.960540540540542e-06, + "loss": 0.5414, + "step": 2475 + }, + { + "epoch": 0.1, + "learning_rate": 9.960040040040041e-06, + "loss": 0.5454, + "step": 2500 + }, + { + "epoch": 0.1, + "learning_rate": 9.95953953953954e-06, + "loss": 0.5335, + "step": 2525 + }, + { + "epoch": 0.1, + "learning_rate": 9.95903903903904e-06, + "loss": 0.538, + "step": 2550 + }, + { + "epoch": 0.1, + "learning_rate": 9.958538538538539e-06, + "loss": 0.5275, + "step": 2575 + }, + { + "epoch": 0.1, + "learning_rate": 9.95803803803804e-06, + "loss": 0.541, + "step": 2600 + }, + { + "epoch": 0.1, + "learning_rate": 9.957537537537539e-06, + "loss": 0.5653, + "step": 2625 + }, + { + "epoch": 0.11, + "learning_rate": 9.957037037037038e-06, + "loss": 0.5407, + "step": 2650 + }, + { + "epoch": 0.11, + "learning_rate": 9.956536536536538e-06, + "loss": 0.5508, + "step": 2675 + }, + { + "epoch": 0.11, + "learning_rate": 9.956036036036037e-06, + "loss": 0.507, + "step": 2700 + }, + { + "epoch": 0.11, + "learning_rate": 9.955535535535536e-06, + "loss": 0.5289, + "step": 2725 + }, + { + "epoch": 0.11, + "learning_rate": 9.955035035035036e-06, + "loss": 0.543, + "step": 2750 + }, + { + "epoch": 0.11, + "learning_rate": 9.954534534534537e-06, + "loss": 0.5489, + "step": 2775 + }, + { + "epoch": 0.11, + "learning_rate": 9.954034034034034e-06, + "loss": 0.5433, + "step": 2800 + }, + { + "epoch": 0.11, + "learning_rate": 9.953533533533535e-06, + "loss": 0.5372, + "step": 2825 + }, + { + "epoch": 0.11, + "learning_rate": 9.953033033033034e-06, + "loss": 0.5397, + "step": 2850 + }, + { + "epoch": 0.11, + "learning_rate": 9.952532532532532e-06, + "loss": 0.5429, + "step": 2875 + }, + { + "epoch": 0.12, + "learning_rate": 9.952032032032033e-06, + "loss": 0.5178, + "step": 2900 + }, + { + "epoch": 0.12, + "learning_rate": 9.951531531531532e-06, + "loss": 0.5426, + "step": 2925 + }, + { + "epoch": 0.12, + "learning_rate": 9.951031031031032e-06, + "loss": 0.5301, + "step": 2950 + }, + { + "epoch": 0.12, + "learning_rate": 9.950530530530531e-06, + "loss": 0.5113, + "step": 2975 + }, + { + "epoch": 0.12, + "learning_rate": 9.950030030030032e-06, + "loss": 0.5015, + "step": 3000 + }, + { + "epoch": 0.12, + "eval_loss": 0.6700246334075928, + "eval_runtime": 2829.2547, + "eval_samples_per_second": 5.73, + "eval_steps_per_second": 0.144, + "eval_wer": 45.80060283223225, + "step": 3000 + }, + { + "epoch": 0.12, + "learning_rate": 9.94952952952953e-06, + "loss": 0.5075, + "step": 3025 + }, + { + "epoch": 0.12, + "learning_rate": 9.94902902902903e-06, + "loss": 0.548, + "step": 3050 + }, + { + "epoch": 0.12, + "learning_rate": 9.94852852852853e-06, + "loss": 0.5221, + "step": 3075 + }, + { + "epoch": 0.12, + "learning_rate": 9.948028028028029e-06, + "loss": 0.5108, + "step": 3100 + }, + { + "epoch": 0.12, + "learning_rate": 9.947527527527528e-06, + "loss": 0.4792, + "step": 3125 + }, + { + "epoch": 0.13, + "learning_rate": 9.947027027027028e-06, + "loss": 0.4993, + "step": 3150 + }, + { + "epoch": 0.13, + "learning_rate": 9.946526526526527e-06, + "loss": 0.5159, + "step": 3175 + }, + { + "epoch": 0.13, + "learning_rate": 9.946026026026026e-06, + "loss": 0.4948, + "step": 3200 + }, + { + "epoch": 0.13, + "learning_rate": 9.945525525525527e-06, + "loss": 0.527, + "step": 3225 + }, + { + "epoch": 0.13, + "learning_rate": 9.945025025025027e-06, + "loss": 0.4831, + "step": 3250 + }, + { + "epoch": 0.13, + "learning_rate": 9.944524524524526e-06, + "loss": 0.5106, + "step": 3275 + }, + { + "epoch": 0.13, + "learning_rate": 9.944024024024025e-06, + "loss": 0.5323, + "step": 3300 + }, + { + "epoch": 0.13, + "learning_rate": 9.943523523523524e-06, + "loss": 0.502, + "step": 3325 + }, + { + "epoch": 0.13, + "learning_rate": 9.943023023023024e-06, + "loss": 0.495, + "step": 3350 + }, + { + "epoch": 0.13, + "learning_rate": 9.942522522522523e-06, + "loss": 0.519, + "step": 3375 + }, + { + "epoch": 0.14, + "learning_rate": 9.942022022022022e-06, + "loss": 0.5351, + "step": 3400 + }, + { + "epoch": 0.14, + "learning_rate": 9.941521521521522e-06, + "loss": 0.4833, + "step": 3425 + }, + { + "epoch": 0.14, + "learning_rate": 9.941021021021023e-06, + "loss": 0.5227, + "step": 3450 + }, + { + "epoch": 0.14, + "learning_rate": 9.940520520520522e-06, + "loss": 0.4969, + "step": 3475 + }, + { + "epoch": 0.14, + "learning_rate": 9.94002002002002e-06, + "loss": 0.5103, + "step": 3500 + }, + { + "epoch": 0.14, + "learning_rate": 9.93951951951952e-06, + "loss": 0.5109, + "step": 3525 + }, + { + "epoch": 0.14, + "learning_rate": 9.93901901901902e-06, + "loss": 0.5228, + "step": 3550 + }, + { + "epoch": 0.14, + "learning_rate": 9.938518518518519e-06, + "loss": 0.4983, + "step": 3575 + }, + { + "epoch": 0.14, + "learning_rate": 9.938018018018018e-06, + "loss": 0.4873, + "step": 3600 + }, + { + "epoch": 0.14, + "learning_rate": 9.93751751751752e-06, + "loss": 0.4955, + "step": 3625 + }, + { + "epoch": 0.15, + "learning_rate": 9.937017017017017e-06, + "loss": 0.5064, + "step": 3650 + }, + { + "epoch": 0.15, + "learning_rate": 9.936516516516518e-06, + "loss": 0.506, + "step": 3675 + }, + { + "epoch": 0.15, + "learning_rate": 9.936016016016017e-06, + "loss": 0.483, + "step": 3700 + }, + { + "epoch": 0.15, + "learning_rate": 9.935515515515517e-06, + "loss": 0.4931, + "step": 3725 + }, + { + "epoch": 0.15, + "learning_rate": 9.935015015015016e-06, + "loss": 0.4854, + "step": 3750 + }, + { + "epoch": 0.15, + "learning_rate": 9.934514514514515e-06, + "loss": 0.4697, + "step": 3775 + }, + { + "epoch": 0.15, + "learning_rate": 9.934014014014014e-06, + "loss": 0.5078, + "step": 3800 + }, + { + "epoch": 0.15, + "learning_rate": 9.933513513513514e-06, + "loss": 0.4759, + "step": 3825 + }, + { + "epoch": 0.15, + "learning_rate": 9.933013013013015e-06, + "loss": 0.5202, + "step": 3850 + }, + { + "epoch": 0.15, + "learning_rate": 9.932512512512514e-06, + "loss": 0.4633, + "step": 3875 + }, + { + "epoch": 0.16, + "learning_rate": 9.932012012012013e-06, + "loss": 0.4947, + "step": 3900 + }, + { + "epoch": 0.16, + "learning_rate": 9.931511511511513e-06, + "loss": 0.4952, + "step": 3925 + }, + { + "epoch": 0.16, + "learning_rate": 9.931011011011012e-06, + "loss": 0.4768, + "step": 3950 + }, + { + "epoch": 0.16, + "learning_rate": 9.930510510510511e-06, + "loss": 0.485, + "step": 3975 + }, + { + "epoch": 0.16, + "learning_rate": 9.93001001001001e-06, + "loss": 0.4855, + "step": 4000 + }, + { + "epoch": 0.16, + "eval_loss": 0.6402216553688049, + "eval_runtime": 2763.3301, + "eval_samples_per_second": 5.867, + "eval_steps_per_second": 0.147, + "eval_wer": 41.90377810840188, + "step": 4000 + }, + { + "epoch": 0.16, + "learning_rate": 9.92950950950951e-06, + "loss": 0.4653, + "step": 4025 + }, + { + "epoch": 0.16, + "learning_rate": 9.929009009009009e-06, + "loss": 0.4994, + "step": 4050 + }, + { + "epoch": 0.16, + "learning_rate": 9.92850850850851e-06, + "loss": 0.4641, + "step": 4075 + }, + { + "epoch": 0.16, + "learning_rate": 9.92800800800801e-06, + "loss": 0.4851, + "step": 4100 + }, + { + "epoch": 0.16, + "learning_rate": 9.927507507507507e-06, + "loss": 0.489, + "step": 4125 + }, + { + "epoch": 0.17, + "learning_rate": 9.927007007007008e-06, + "loss": 0.4881, + "step": 4150 + }, + { + "epoch": 0.17, + "learning_rate": 9.926506506506507e-06, + "loss": 0.4975, + "step": 4175 + }, + { + "epoch": 0.17, + "learning_rate": 9.926006006006007e-06, + "loss": 0.4785, + "step": 4200 + }, + { + "epoch": 0.17, + "learning_rate": 9.925505505505506e-06, + "loss": 0.4689, + "step": 4225 + }, + { + "epoch": 0.17, + "learning_rate": 9.925005005005007e-06, + "loss": 0.4688, + "step": 4250 + }, + { + "epoch": 0.17, + "learning_rate": 9.924504504504505e-06, + "loss": 0.4842, + "step": 4275 + }, + { + "epoch": 0.17, + "learning_rate": 9.924004004004006e-06, + "loss": 0.462, + "step": 4300 + }, + { + "epoch": 0.17, + "learning_rate": 9.923503503503505e-06, + "loss": 0.4674, + "step": 4325 + }, + { + "epoch": 0.17, + "learning_rate": 9.923003003003004e-06, + "loss": 0.4632, + "step": 4350 + }, + { + "epoch": 0.17, + "learning_rate": 9.922502502502503e-06, + "loss": 0.4618, + "step": 4375 + }, + { + "epoch": 0.18, + "learning_rate": 9.922002002002003e-06, + "loss": 0.4655, + "step": 4400 + }, + { + "epoch": 0.18, + "learning_rate": 9.921501501501502e-06, + "loss": 0.4557, + "step": 4425 + }, + { + "epoch": 0.18, + "learning_rate": 9.921001001001001e-06, + "loss": 0.4549, + "step": 4450 + }, + { + "epoch": 0.18, + "learning_rate": 9.920500500500502e-06, + "loss": 0.4757, + "step": 4475 + }, + { + "epoch": 0.18, + "learning_rate": 9.920000000000002e-06, + "loss": 0.4501, + "step": 4500 + }, + { + "epoch": 0.18, + "learning_rate": 9.919499499499501e-06, + "loss": 0.4789, + "step": 4525 + }, + { + "epoch": 0.18, + "learning_rate": 9.918998998999e-06, + "loss": 0.4768, + "step": 4550 + }, + { + "epoch": 0.18, + "learning_rate": 9.9184984984985e-06, + "loss": 0.4799, + "step": 4575 + }, + { + "epoch": 0.18, + "learning_rate": 9.917997997997999e-06, + "loss": 0.4648, + "step": 4600 + }, + { + "epoch": 0.18, + "learning_rate": 9.917497497497498e-06, + "loss": 0.4671, + "step": 4625 + }, + { + "epoch": 0.19, + "learning_rate": 9.916996996996997e-06, + "loss": 0.4672, + "step": 4650 + }, + { + "epoch": 0.19, + "learning_rate": 9.916496496496497e-06, + "loss": 0.4664, + "step": 4675 + }, + { + "epoch": 0.19, + "learning_rate": 9.915995995995998e-06, + "loss": 0.4769, + "step": 4700 + }, + { + "epoch": 0.19, + "learning_rate": 9.915495495495497e-06, + "loss": 0.4828, + "step": 4725 + }, + { + "epoch": 0.19, + "learning_rate": 9.914994994994995e-06, + "loss": 0.4648, + "step": 4750 + }, + { + "epoch": 0.19, + "learning_rate": 9.914494494494496e-06, + "loss": 0.4501, + "step": 4775 + }, + { + "epoch": 0.19, + "learning_rate": 9.913993993993995e-06, + "loss": 0.4638, + "step": 4800 + }, + { + "epoch": 0.19, + "learning_rate": 9.913493493493494e-06, + "loss": 0.463, + "step": 4825 + }, + { + "epoch": 0.19, + "learning_rate": 9.912992992992993e-06, + "loss": 0.4759, + "step": 4850 + }, + { + "epoch": 0.19, + "learning_rate": 9.912492492492494e-06, + "loss": 0.4967, + "step": 4875 + }, + { + "epoch": 0.2, + "learning_rate": 9.911991991991992e-06, + "loss": 0.4483, + "step": 4900 + }, + { + "epoch": 0.2, + "learning_rate": 9.911491491491493e-06, + "loss": 0.4514, + "step": 4925 + }, + { + "epoch": 0.2, + "learning_rate": 9.910990990990992e-06, + "loss": 0.482, + "step": 4950 + }, + { + "epoch": 0.2, + "learning_rate": 9.910490490490492e-06, + "loss": 0.4439, + "step": 4975 + }, + { + "epoch": 0.2, + "learning_rate": 9.909989989989991e-06, + "loss": 0.4379, + "step": 5000 + }, + { + "epoch": 0.2, + "eval_loss": 0.6058462858200073, + "eval_runtime": 2619.0085, + "eval_samples_per_second": 6.191, + "eval_steps_per_second": 0.155, + "eval_wer": 38.43171113389505, + "step": 5000 + }, + { + "epoch": 0.2, + "learning_rate": 9.90948948948949e-06, + "loss": 0.4567, + "step": 5025 + }, + { + "epoch": 0.2, + "learning_rate": 9.90898898898899e-06, + "loss": 0.4506, + "step": 5050 + }, + { + "epoch": 0.2, + "learning_rate": 9.908488488488489e-06, + "loss": 0.4717, + "step": 5075 + }, + { + "epoch": 0.2, + "learning_rate": 9.90798798798799e-06, + "loss": 0.4775, + "step": 5100 + }, + { + "epoch": 0.2, + "learning_rate": 9.907487487487487e-06, + "loss": 0.4344, + "step": 5125 + }, + { + "epoch": 0.21, + "learning_rate": 9.906986986986987e-06, + "loss": 0.4462, + "step": 5150 + }, + { + "epoch": 0.21, + "learning_rate": 9.906486486486488e-06, + "loss": 0.4492, + "step": 5175 + }, + { + "epoch": 0.21, + "learning_rate": 9.905985985985987e-06, + "loss": 0.4532, + "step": 5200 + }, + { + "epoch": 0.21, + "learning_rate": 9.905485485485486e-06, + "loss": 0.4595, + "step": 5225 + }, + { + "epoch": 0.21, + "learning_rate": 9.904984984984986e-06, + "loss": 0.4369, + "step": 5250 + }, + { + "epoch": 0.21, + "learning_rate": 9.904484484484485e-06, + "loss": 0.4668, + "step": 5275 + }, + { + "epoch": 0.21, + "learning_rate": 9.903983983983984e-06, + "loss": 0.4507, + "step": 5300 + }, + { + "epoch": 0.21, + "learning_rate": 9.903483483483485e-06, + "loss": 0.4438, + "step": 5325 + }, + { + "epoch": 0.21, + "learning_rate": 9.902982982982984e-06, + "loss": 0.4679, + "step": 5350 + }, + { + "epoch": 0.21, + "learning_rate": 9.902482482482482e-06, + "loss": 0.468, + "step": 5375 + }, + { + "epoch": 0.22, + "learning_rate": 9.901981981981983e-06, + "loss": 0.4502, + "step": 5400 + }, + { + "epoch": 0.22, + "learning_rate": 9.901481481481482e-06, + "loss": 0.4319, + "step": 5425 + }, + { + "epoch": 0.22, + "learning_rate": 9.900980980980982e-06, + "loss": 0.4799, + "step": 5450 + }, + { + "epoch": 0.22, + "learning_rate": 9.900480480480481e-06, + "loss": 0.4553, + "step": 5475 + }, + { + "epoch": 0.22, + "learning_rate": 9.899979979979982e-06, + "loss": 0.4309, + "step": 5500 + }, + { + "epoch": 0.22, + "learning_rate": 9.89947947947948e-06, + "loss": 0.4385, + "step": 5525 + }, + { + "epoch": 0.22, + "learning_rate": 9.89897897897898e-06, + "loss": 0.431, + "step": 5550 + }, + { + "epoch": 0.22, + "learning_rate": 9.89847847847848e-06, + "loss": 0.4478, + "step": 5575 + }, + { + "epoch": 0.22, + "learning_rate": 9.897977977977979e-06, + "loss": 0.4379, + "step": 5600 + }, + { + "epoch": 0.22, + "learning_rate": 9.897477477477478e-06, + "loss": 0.4334, + "step": 5625 + }, + { + "epoch": 0.23, + "learning_rate": 9.896976976976978e-06, + "loss": 0.4542, + "step": 5650 + }, + { + "epoch": 0.23, + "learning_rate": 9.896476476476477e-06, + "loss": 0.4454, + "step": 5675 + }, + { + "epoch": 0.23, + "learning_rate": 9.895975975975976e-06, + "loss": 0.4519, + "step": 5700 + }, + { + "epoch": 0.23, + "learning_rate": 9.895475475475477e-06, + "loss": 0.4625, + "step": 5725 + }, + { + "epoch": 0.23, + "learning_rate": 9.894974974974975e-06, + "loss": 0.4361, + "step": 5750 + }, + { + "epoch": 0.23, + "learning_rate": 9.894474474474474e-06, + "loss": 0.4305, + "step": 5775 + }, + { + "epoch": 0.23, + "learning_rate": 9.893973973973975e-06, + "loss": 0.4558, + "step": 5800 + }, + { + "epoch": 0.23, + "learning_rate": 9.893473473473475e-06, + "loss": 0.4554, + "step": 5825 + }, + { + "epoch": 0.23, + "learning_rate": 9.892972972972974e-06, + "loss": 0.4562, + "step": 5850 + }, + { + "epoch": 0.23, + "learning_rate": 9.892472472472473e-06, + "loss": 0.4378, + "step": 5875 + }, + { + "epoch": 0.24, + "learning_rate": 9.891971971971972e-06, + "loss": 0.464, + "step": 5900 + }, + { + "epoch": 0.24, + "learning_rate": 9.891471471471472e-06, + "loss": 0.4279, + "step": 5925 + }, + { + "epoch": 0.24, + "learning_rate": 9.890970970970973e-06, + "loss": 0.4414, + "step": 5950 + }, + { + "epoch": 0.24, + "learning_rate": 9.890470470470472e-06, + "loss": 0.4537, + "step": 5975 + }, + { + "epoch": 0.24, + "learning_rate": 9.88996996996997e-06, + "loss": 0.4399, + "step": 6000 + }, + { + "epoch": 0.24, + "eval_loss": 0.5941766500473022, + "eval_runtime": 2644.5549, + "eval_samples_per_second": 6.131, + "eval_steps_per_second": 0.154, + "eval_wer": 37.588362716907824, + "step": 6000 + }, + { + "epoch": 0.24, + "learning_rate": 9.88946946946947e-06, + "loss": 0.4419, + "step": 6025 + }, + { + "epoch": 0.24, + "learning_rate": 9.88896896896897e-06, + "loss": 0.4219, + "step": 6050 + }, + { + "epoch": 0.24, + "learning_rate": 9.88846846846847e-06, + "loss": 0.4271, + "step": 6075 + }, + { + "epoch": 0.24, + "learning_rate": 9.887967967967968e-06, + "loss": 0.4565, + "step": 6100 + }, + { + "epoch": 0.24, + "learning_rate": 9.88746746746747e-06, + "loss": 0.4588, + "step": 6125 + }, + { + "epoch": 0.25, + "learning_rate": 9.886966966966967e-06, + "loss": 0.4384, + "step": 6150 + }, + { + "epoch": 0.25, + "learning_rate": 9.886466466466468e-06, + "loss": 0.4341, + "step": 6175 + }, + { + "epoch": 0.25, + "learning_rate": 9.885965965965967e-06, + "loss": 0.4302, + "step": 6200 + }, + { + "epoch": 0.25, + "learning_rate": 9.885465465465467e-06, + "loss": 0.4307, + "step": 6225 + }, + { + "epoch": 0.25, + "learning_rate": 9.884964964964966e-06, + "loss": 0.4634, + "step": 6250 + }, + { + "epoch": 0.25, + "learning_rate": 9.884464464464465e-06, + "loss": 0.4374, + "step": 6275 + }, + { + "epoch": 0.25, + "learning_rate": 9.883963963963965e-06, + "loss": 0.4352, + "step": 6300 + }, + { + "epoch": 0.25, + "learning_rate": 9.883463463463464e-06, + "loss": 0.4376, + "step": 6325 + }, + { + "epoch": 0.25, + "learning_rate": 9.882962962962965e-06, + "loss": 0.4284, + "step": 6350 + }, + { + "epoch": 0.25, + "learning_rate": 9.882462462462462e-06, + "loss": 0.4143, + "step": 6375 + }, + { + "epoch": 0.26, + "learning_rate": 9.881961961961962e-06, + "loss": 0.4286, + "step": 6400 + }, + { + "epoch": 0.26, + "learning_rate": 9.881461461461463e-06, + "loss": 0.4358, + "step": 6425 + }, + { + "epoch": 0.26, + "learning_rate": 9.880960960960962e-06, + "loss": 0.4306, + "step": 6450 + }, + { + "epoch": 0.26, + "learning_rate": 9.880460460460461e-06, + "loss": 0.4357, + "step": 6475 + }, + { + "epoch": 0.26, + "learning_rate": 9.87995995995996e-06, + "loss": 0.4344, + "step": 6500 + }, + { + "epoch": 0.26, + "learning_rate": 9.87945945945946e-06, + "loss": 0.4508, + "step": 6525 + }, + { + "epoch": 0.26, + "learning_rate": 9.87895895895896e-06, + "loss": 0.441, + "step": 6550 + }, + { + "epoch": 0.26, + "learning_rate": 9.87845845845846e-06, + "loss": 0.419, + "step": 6575 + }, + { + "epoch": 0.26, + "learning_rate": 9.87795795795796e-06, + "loss": 0.4221, + "step": 6600 + }, + { + "epoch": 0.26, + "learning_rate": 9.877457457457457e-06, + "loss": 0.4288, + "step": 6625 + }, + { + "epoch": 0.27, + "learning_rate": 9.876956956956958e-06, + "loss": 0.4288, + "step": 6650 + }, + { + "epoch": 0.27, + "learning_rate": 9.876456456456457e-06, + "loss": 0.4314, + "step": 6675 + }, + { + "epoch": 0.27, + "learning_rate": 9.875955955955957e-06, + "loss": 0.4138, + "step": 6700 + }, + { + "epoch": 0.27, + "learning_rate": 9.875455455455456e-06, + "loss": 0.4291, + "step": 6725 + }, + { + "epoch": 0.27, + "learning_rate": 9.874954954954957e-06, + "loss": 0.4446, + "step": 6750 + }, + { + "epoch": 0.27, + "learning_rate": 9.874454454454455e-06, + "loss": 0.4153, + "step": 6775 + }, + { + "epoch": 0.27, + "learning_rate": 9.873953953953956e-06, + "loss": 0.4325, + "step": 6800 + }, + { + "epoch": 0.27, + "learning_rate": 9.873453453453455e-06, + "loss": 0.4158, + "step": 6825 + }, + { + "epoch": 0.27, + "learning_rate": 9.872952952952952e-06, + "loss": 0.4248, + "step": 6850 + }, + { + "epoch": 0.27, + "learning_rate": 9.872452452452453e-06, + "loss": 0.4221, + "step": 6875 + }, + { + "epoch": 0.28, + "learning_rate": 9.871951951951953e-06, + "loss": 0.4206, + "step": 6900 + }, + { + "epoch": 0.28, + "learning_rate": 9.871451451451452e-06, + "loss": 0.4173, + "step": 6925 + }, + { + "epoch": 0.28, + "learning_rate": 9.870950950950951e-06, + "loss": 0.4285, + "step": 6950 + }, + { + "epoch": 0.28, + "learning_rate": 9.870450450450452e-06, + "loss": 0.4102, + "step": 6975 + }, + { + "epoch": 0.28, + "learning_rate": 9.86994994994995e-06, + "loss": 0.4335, + "step": 7000 + }, + { + "epoch": 0.28, + "eval_loss": 0.5607422590255737, + "eval_runtime": 2701.8903, + "eval_samples_per_second": 6.001, + "eval_steps_per_second": 0.15, + "eval_wer": 36.83443698398872, + "step": 7000 + }, + { + "epoch": 0.28, + "learning_rate": 9.86944944944945e-06, + "loss": 0.4267, + "step": 7025 + }, + { + "epoch": 0.28, + "learning_rate": 9.86894894894895e-06, + "loss": 0.439, + "step": 7050 + }, + { + "epoch": 0.28, + "learning_rate": 9.86844844844845e-06, + "loss": 0.4139, + "step": 7075 + }, + { + "epoch": 0.28, + "learning_rate": 9.867947947947949e-06, + "loss": 0.4248, + "step": 7100 + }, + { + "epoch": 0.28, + "learning_rate": 9.867447447447448e-06, + "loss": 0.4279, + "step": 7125 + }, + { + "epoch": 0.29, + "learning_rate": 9.866946946946947e-06, + "loss": 0.4172, + "step": 7150 + }, + { + "epoch": 0.29, + "learning_rate": 9.866446446446447e-06, + "loss": 0.4382, + "step": 7175 + }, + { + "epoch": 0.29, + "learning_rate": 9.865945945945948e-06, + "loss": 0.4367, + "step": 7200 + }, + { + "epoch": 0.29, + "learning_rate": 9.865445445445447e-06, + "loss": 0.4247, + "step": 7225 + }, + { + "epoch": 0.29, + "learning_rate": 9.864944944944945e-06, + "loss": 0.4223, + "step": 7250 + }, + { + "epoch": 0.29, + "learning_rate": 9.864444444444446e-06, + "loss": 0.4207, + "step": 7275 + }, + { + "epoch": 0.29, + "learning_rate": 9.863943943943945e-06, + "loss": 0.4166, + "step": 7300 + }, + { + "epoch": 0.29, + "learning_rate": 9.863443443443444e-06, + "loss": 0.4155, + "step": 7325 + }, + { + "epoch": 0.29, + "learning_rate": 9.862942942942944e-06, + "loss": 0.4131, + "step": 7350 + }, + { + "epoch": 0.29, + "learning_rate": 9.862442442442443e-06, + "loss": 0.4, + "step": 7375 + }, + { + "epoch": 0.3, + "learning_rate": 9.861941941941942e-06, + "loss": 0.4051, + "step": 7400 + }, + { + "epoch": 0.3, + "learning_rate": 9.861441441441443e-06, + "loss": 0.3976, + "step": 7425 + }, + { + "epoch": 0.3, + "learning_rate": 9.860940940940942e-06, + "loss": 0.4396, + "step": 7450 + }, + { + "epoch": 0.3, + "learning_rate": 9.86044044044044e-06, + "loss": 0.3999, + "step": 7475 + }, + { + "epoch": 0.3, + "learning_rate": 9.859939939939941e-06, + "loss": 0.4167, + "step": 7500 + }, + { + "epoch": 0.3, + "learning_rate": 9.85943943943944e-06, + "loss": 0.4324, + "step": 7525 + }, + { + "epoch": 0.3, + "learning_rate": 9.85893893893894e-06, + "loss": 0.4185, + "step": 7550 + }, + { + "epoch": 0.3, + "learning_rate": 9.858438438438439e-06, + "loss": 0.4205, + "step": 7575 + }, + { + "epoch": 0.3, + "learning_rate": 9.85793793793794e-06, + "loss": 0.4011, + "step": 7600 + }, + { + "epoch": 0.3, + "learning_rate": 9.857437437437437e-06, + "loss": 0.4032, + "step": 7625 + }, + { + "epoch": 0.31, + "learning_rate": 9.856936936936937e-06, + "loss": 0.4223, + "step": 7650 + }, + { + "epoch": 0.31, + "learning_rate": 9.856436436436438e-06, + "loss": 0.4024, + "step": 7675 + }, + { + "epoch": 0.31, + "learning_rate": 9.855935935935937e-06, + "loss": 0.4071, + "step": 7700 + }, + { + "epoch": 0.31, + "learning_rate": 9.855435435435436e-06, + "loss": 0.4024, + "step": 7725 + }, + { + "epoch": 0.31, + "learning_rate": 9.854934934934936e-06, + "loss": 0.3904, + "step": 7750 + }, + { + "epoch": 0.31, + "learning_rate": 9.854434434434435e-06, + "loss": 0.4041, + "step": 7775 + }, + { + "epoch": 0.31, + "learning_rate": 9.853933933933934e-06, + "loss": 0.4201, + "step": 7800 + }, + { + "epoch": 0.31, + "learning_rate": 9.853433433433435e-06, + "loss": 0.393, + "step": 7825 + }, + { + "epoch": 0.31, + "learning_rate": 9.852932932932935e-06, + "loss": 0.4405, + "step": 7850 + }, + { + "epoch": 0.31, + "learning_rate": 9.852432432432432e-06, + "loss": 0.402, + "step": 7875 + }, + { + "epoch": 0.32, + "learning_rate": 9.851931931931933e-06, + "loss": 0.4064, + "step": 7900 + }, + { + "epoch": 0.32, + "learning_rate": 9.851431431431432e-06, + "loss": 0.3908, + "step": 7925 + }, + { + "epoch": 0.32, + "learning_rate": 9.850930930930932e-06, + "loss": 0.4232, + "step": 7950 + }, + { + "epoch": 0.32, + "learning_rate": 9.850430430430431e-06, + "loss": 0.4311, + "step": 7975 + }, + { + "epoch": 0.32, + "learning_rate": 9.84992992992993e-06, + "loss": 0.4266, + "step": 8000 + }, + { + "epoch": 0.32, + "eval_loss": 0.5630306601524353, + "eval_runtime": 2643.0014, + "eval_samples_per_second": 6.134, + "eval_steps_per_second": 0.154, + "eval_wer": 34.73531656401045, + "step": 8000 + }, + { + "epoch": 0.32, + "learning_rate": 9.84942942942943e-06, + "loss": 0.4117, + "step": 8025 + }, + { + "epoch": 0.32, + "learning_rate": 9.84894894894895e-06, + "loss": 0.3983, + "step": 8050 + }, + { + "epoch": 0.32, + "learning_rate": 9.848448448448448e-06, + "loss": 0.4025, + "step": 8075 + }, + { + "epoch": 0.32, + "learning_rate": 9.847947947947949e-06, + "loss": 0.4119, + "step": 8100 + }, + { + "epoch": 0.32, + "learning_rate": 9.847447447447448e-06, + "loss": 0.4135, + "step": 8125 + }, + { + "epoch": 0.33, + "learning_rate": 9.846946946946948e-06, + "loss": 0.4048, + "step": 8150 + }, + { + "epoch": 0.33, + "learning_rate": 9.846446446446447e-06, + "loss": 0.4371, + "step": 8175 + }, + { + "epoch": 0.33, + "learning_rate": 9.845945945945948e-06, + "loss": 0.3954, + "step": 8200 + }, + { + "epoch": 0.33, + "learning_rate": 9.845445445445446e-06, + "loss": 0.3933, + "step": 8225 + }, + { + "epoch": 0.33, + "learning_rate": 9.844944944944945e-06, + "loss": 0.3956, + "step": 8250 + }, + { + "epoch": 0.33, + "learning_rate": 9.844444444444446e-06, + "loss": 0.4109, + "step": 8275 + }, + { + "epoch": 0.33, + "learning_rate": 9.843943943943945e-06, + "loss": 0.4087, + "step": 8300 + }, + { + "epoch": 0.33, + "learning_rate": 9.843443443443444e-06, + "loss": 0.3904, + "step": 8325 + }, + { + "epoch": 0.33, + "learning_rate": 9.842942942942944e-06, + "loss": 0.4309, + "step": 8350 + }, + { + "epoch": 0.33, + "learning_rate": 9.842442442442443e-06, + "loss": 0.411, + "step": 8375 + }, + { + "epoch": 0.33, + "learning_rate": 9.841941941941942e-06, + "loss": 0.384, + "step": 8400 + }, + { + "epoch": 0.34, + "learning_rate": 9.841441441441443e-06, + "loss": 0.3993, + "step": 8425 + }, + { + "epoch": 0.34, + "learning_rate": 9.840940940940943e-06, + "loss": 0.3931, + "step": 8450 + }, + { + "epoch": 0.34, + "learning_rate": 9.84044044044044e-06, + "loss": 0.4044, + "step": 8475 + }, + { + "epoch": 0.34, + "learning_rate": 9.839939939939941e-06, + "loss": 0.3985, + "step": 8500 + }, + { + "epoch": 0.34, + "learning_rate": 9.83943943943944e-06, + "loss": 0.4317, + "step": 8525 + }, + { + "epoch": 0.34, + "learning_rate": 9.83893893893894e-06, + "loss": 0.3932, + "step": 8550 + }, + { + "epoch": 0.34, + "learning_rate": 9.838438438438439e-06, + "loss": 0.3925, + "step": 8575 + }, + { + "epoch": 0.34, + "learning_rate": 9.837937937937938e-06, + "loss": 0.3799, + "step": 8600 + }, + { + "epoch": 0.34, + "learning_rate": 9.837437437437438e-06, + "loss": 0.3975, + "step": 8625 + }, + { + "epoch": 0.34, + "learning_rate": 9.836936936936937e-06, + "loss": 0.4047, + "step": 8650 + }, + { + "epoch": 0.35, + "learning_rate": 9.836436436436438e-06, + "loss": 0.4092, + "step": 8675 + }, + { + "epoch": 0.35, + "learning_rate": 9.835935935935936e-06, + "loss": 0.3945, + "step": 8700 + }, + { + "epoch": 0.35, + "learning_rate": 9.835435435435437e-06, + "loss": 0.4068, + "step": 8725 + }, + { + "epoch": 0.35, + "learning_rate": 9.834934934934936e-06, + "loss": 0.3877, + "step": 8750 + }, + { + "epoch": 0.35, + "learning_rate": 9.834434434434435e-06, + "loss": 0.3949, + "step": 8775 + }, + { + "epoch": 0.35, + "learning_rate": 9.833933933933934e-06, + "loss": 0.3841, + "step": 8800 + }, + { + "epoch": 0.35, + "learning_rate": 9.833433433433435e-06, + "loss": 0.4074, + "step": 8825 + }, + { + "epoch": 0.35, + "learning_rate": 9.832932932932933e-06, + "loss": 0.4171, + "step": 8850 + }, + { + "epoch": 0.35, + "learning_rate": 9.832452452452454e-06, + "loss": 0.3953, + "step": 8875 + }, + { + "epoch": 0.35, + "learning_rate": 9.831951951951953e-06, + "loss": 0.3761, + "step": 8900 + }, + { + "epoch": 0.36, + "learning_rate": 9.831451451451452e-06, + "loss": 0.4115, + "step": 8925 + }, + { + "epoch": 0.36, + "learning_rate": 9.830950950950952e-06, + "loss": 0.3979, + "step": 8950 + }, + { + "epoch": 0.36, + "learning_rate": 9.830450450450451e-06, + "loss": 0.405, + "step": 8975 + }, + { + "epoch": 0.36, + "learning_rate": 9.82994994994995e-06, + "loss": 0.4057, + "step": 9000 + }, + { + "epoch": 0.36, + "eval_loss": 0.5405702590942383, + "eval_runtime": 2698.8083, + "eval_samples_per_second": 6.007, + "eval_steps_per_second": 0.15, + "eval_wer": 34.710648237370975, + "step": 9000 + }, + { + "epoch": 0.36, + "learning_rate": 9.829449449449451e-06, + "loss": 0.3833, + "step": 9025 + }, + { + "epoch": 0.36, + "learning_rate": 9.82894894894895e-06, + "loss": 0.4058, + "step": 9050 + }, + { + "epoch": 0.36, + "learning_rate": 9.828448448448448e-06, + "loss": 0.3861, + "step": 9075 + }, + { + "epoch": 0.36, + "learning_rate": 9.82794794794795e-06, + "loss": 0.4031, + "step": 9100 + }, + { + "epoch": 0.36, + "learning_rate": 9.827447447447449e-06, + "loss": 0.3894, + "step": 9125 + }, + { + "epoch": 0.36, + "learning_rate": 9.826946946946948e-06, + "loss": 0.3892, + "step": 9150 + }, + { + "epoch": 0.37, + "learning_rate": 9.826446446446447e-06, + "loss": 0.3991, + "step": 9175 + }, + { + "epoch": 0.37, + "learning_rate": 9.825945945945946e-06, + "loss": 0.3803, + "step": 9200 + }, + { + "epoch": 0.37, + "learning_rate": 9.825445445445446e-06, + "loss": 0.3927, + "step": 9225 + }, + { + "epoch": 0.37, + "learning_rate": 9.824944944944945e-06, + "loss": 0.4084, + "step": 9250 + }, + { + "epoch": 0.37, + "learning_rate": 9.824444444444446e-06, + "loss": 0.3916, + "step": 9275 + }, + { + "epoch": 0.37, + "learning_rate": 9.823943943943944e-06, + "loss": 0.3674, + "step": 9300 + }, + { + "epoch": 0.37, + "learning_rate": 9.823443443443445e-06, + "loss": 0.3683, + "step": 9325 + }, + { + "epoch": 0.37, + "learning_rate": 9.822942942942944e-06, + "loss": 0.4016, + "step": 9350 + }, + { + "epoch": 0.37, + "learning_rate": 9.822442442442443e-06, + "loss": 0.395, + "step": 9375 + }, + { + "epoch": 0.37, + "learning_rate": 9.821941941941942e-06, + "loss": 0.3906, + "step": 9400 + }, + { + "epoch": 0.38, + "learning_rate": 9.821441441441443e-06, + "loss": 0.3843, + "step": 9425 + }, + { + "epoch": 0.38, + "learning_rate": 9.820940940940941e-06, + "loss": 0.3732, + "step": 9450 + }, + { + "epoch": 0.38, + "learning_rate": 9.82044044044044e-06, + "loss": 0.3927, + "step": 9475 + }, + { + "epoch": 0.38, + "learning_rate": 9.819939939939941e-06, + "loss": 0.4151, + "step": 9500 + }, + { + "epoch": 0.38, + "learning_rate": 9.81943943943944e-06, + "loss": 0.3933, + "step": 9525 + }, + { + "epoch": 0.38, + "learning_rate": 9.81893893893894e-06, + "loss": 0.3856, + "step": 9550 + }, + { + "epoch": 0.38, + "learning_rate": 9.81843843843844e-06, + "loss": 0.3818, + "step": 9575 + }, + { + "epoch": 0.38, + "learning_rate": 9.817937937937939e-06, + "loss": 0.3932, + "step": 9600 + }, + { + "epoch": 0.38, + "learning_rate": 9.817437437437438e-06, + "loss": 0.4085, + "step": 9625 + }, + { + "epoch": 0.38, + "learning_rate": 9.816936936936939e-06, + "loss": 0.4023, + "step": 9650 + }, + { + "epoch": 0.39, + "learning_rate": 9.816436436436436e-06, + "loss": 0.3918, + "step": 9675 + }, + { + "epoch": 0.39, + "learning_rate": 9.815935935935936e-06, + "loss": 0.3965, + "step": 9700 + }, + { + "epoch": 0.39, + "learning_rate": 9.815435435435437e-06, + "loss": 0.3934, + "step": 9725 + }, + { + "epoch": 0.39, + "learning_rate": 9.814934934934936e-06, + "loss": 0.3807, + "step": 9750 + }, + { + "epoch": 0.39, + "learning_rate": 9.814434434434435e-06, + "loss": 0.3809, + "step": 9775 + }, + { + "epoch": 0.39, + "learning_rate": 9.813933933933935e-06, + "loss": 0.3804, + "step": 9800 + }, + { + "epoch": 0.39, + "learning_rate": 9.813433433433434e-06, + "loss": 0.4112, + "step": 9825 + }, + { + "epoch": 0.39, + "learning_rate": 9.812932932932933e-06, + "loss": 0.3853, + "step": 9850 + }, + { + "epoch": 0.39, + "learning_rate": 9.812432432432433e-06, + "loss": 0.3967, + "step": 9875 + }, + { + "epoch": 0.39, + "learning_rate": 9.811931931931934e-06, + "loss": 0.3934, + "step": 9900 + }, + { + "epoch": 0.4, + "learning_rate": 9.811431431431431e-06, + "loss": 0.4013, + "step": 9925 + }, + { + "epoch": 0.4, + "learning_rate": 9.810930930930932e-06, + "loss": 0.4004, + "step": 9950 + }, + { + "epoch": 0.4, + "learning_rate": 9.810430430430431e-06, + "loss": 0.3825, + "step": 9975 + }, + { + "epoch": 0.4, + "learning_rate": 9.80992992992993e-06, + "loss": 0.3798, + "step": 10000 + }, + { + "epoch": 0.4, + "eval_loss": 0.5242385864257812, + "eval_runtime": 2613.1802, + "eval_samples_per_second": 6.204, + "eval_steps_per_second": 0.155, + "eval_wer": 32.9584261607604, + "step": 10000 + }, + { + "epoch": 0.4, + "learning_rate": 9.80942942942943e-06, + "loss": 0.379, + "step": 10025 + }, + { + "epoch": 0.4, + "learning_rate": 9.808928928928931e-06, + "loss": 0.397, + "step": 10050 + }, + { + "epoch": 0.4, + "learning_rate": 9.808428428428429e-06, + "loss": 0.3818, + "step": 10075 + }, + { + "epoch": 0.4, + "learning_rate": 9.807927927927928e-06, + "loss": 0.373, + "step": 10100 + }, + { + "epoch": 0.4, + "learning_rate": 9.807427427427429e-06, + "loss": 0.3592, + "step": 10125 + }, + { + "epoch": 0.4, + "learning_rate": 9.806926926926928e-06, + "loss": 0.3824, + "step": 10150 + }, + { + "epoch": 0.41, + "learning_rate": 9.806426426426427e-06, + "loss": 0.3907, + "step": 10175 + }, + { + "epoch": 0.41, + "learning_rate": 9.805925925925927e-06, + "loss": 0.3787, + "step": 10200 + }, + { + "epoch": 0.41, + "learning_rate": 9.805425425425426e-06, + "loss": 0.3571, + "step": 10225 + }, + { + "epoch": 0.41, + "learning_rate": 9.804924924924925e-06, + "loss": 0.3785, + "step": 10250 + }, + { + "epoch": 0.41, + "learning_rate": 9.804424424424426e-06, + "loss": 0.41, + "step": 10275 + }, + { + "epoch": 0.41, + "learning_rate": 9.803923923923924e-06, + "loss": 0.3703, + "step": 10300 + }, + { + "epoch": 0.41, + "learning_rate": 9.803423423423423e-06, + "loss": 0.38, + "step": 10325 + }, + { + "epoch": 0.41, + "learning_rate": 9.802922922922924e-06, + "loss": 0.3787, + "step": 10350 + }, + { + "epoch": 0.41, + "learning_rate": 9.802422422422424e-06, + "loss": 0.3948, + "step": 10375 + }, + { + "epoch": 0.41, + "learning_rate": 9.801921921921923e-06, + "loss": 0.3775, + "step": 10400 + }, + { + "epoch": 0.42, + "learning_rate": 9.801421421421422e-06, + "loss": 0.3823, + "step": 10425 + }, + { + "epoch": 0.42, + "learning_rate": 9.800920920920921e-06, + "loss": 0.3868, + "step": 10450 + }, + { + "epoch": 0.42, + "learning_rate": 9.80042042042042e-06, + "loss": 0.378, + "step": 10475 + }, + { + "epoch": 0.42, + "learning_rate": 9.79991991991992e-06, + "loss": 0.3911, + "step": 10500 + }, + { + "epoch": 0.42, + "learning_rate": 9.799419419419421e-06, + "loss": 0.3845, + "step": 10525 + }, + { + "epoch": 0.42, + "learning_rate": 9.798918918918919e-06, + "loss": 0.3899, + "step": 10550 + }, + { + "epoch": 0.42, + "learning_rate": 9.79841841841842e-06, + "loss": 0.3919, + "step": 10575 + }, + { + "epoch": 0.42, + "learning_rate": 9.797917917917919e-06, + "loss": 0.4163, + "step": 10600 + }, + { + "epoch": 0.42, + "learning_rate": 9.797417417417418e-06, + "loss": 0.382, + "step": 10625 + }, + { + "epoch": 0.42, + "learning_rate": 9.796916916916918e-06, + "loss": 0.3796, + "step": 10650 + }, + { + "epoch": 0.43, + "learning_rate": 9.796416416416419e-06, + "loss": 0.3751, + "step": 10675 + }, + { + "epoch": 0.43, + "learning_rate": 9.795915915915916e-06, + "loss": 0.3768, + "step": 10700 + }, + { + "epoch": 0.43, + "learning_rate": 9.795415415415415e-06, + "loss": 0.3878, + "step": 10725 + }, + { + "epoch": 0.43, + "learning_rate": 9.794914914914916e-06, + "loss": 0.3821, + "step": 10750 + }, + { + "epoch": 0.43, + "learning_rate": 9.794414414414416e-06, + "loss": 0.3879, + "step": 10775 + }, + { + "epoch": 0.43, + "learning_rate": 9.793913913913915e-06, + "loss": 0.3685, + "step": 10800 + }, + { + "epoch": 0.43, + "learning_rate": 9.793413413413414e-06, + "loss": 0.3673, + "step": 10825 + }, + { + "epoch": 0.43, + "learning_rate": 9.792912912912914e-06, + "loss": 0.3955, + "step": 10850 + }, + { + "epoch": 0.43, + "learning_rate": 9.792412412412413e-06, + "loss": 0.3616, + "step": 10875 + }, + { + "epoch": 0.43, + "learning_rate": 9.791911911911914e-06, + "loss": 0.3692, + "step": 10900 + }, + { + "epoch": 0.44, + "learning_rate": 9.791411411411411e-06, + "loss": 0.3766, + "step": 10925 + }, + { + "epoch": 0.44, + "learning_rate": 9.79091091091091e-06, + "loss": 0.3873, + "step": 10950 + }, + { + "epoch": 0.44, + "learning_rate": 9.790410410410412e-06, + "loss": 0.3792, + "step": 10975 + }, + { + "epoch": 0.44, + "learning_rate": 9.789909909909911e-06, + "loss": 0.3781, + "step": 11000 + }, + { + "epoch": 0.44, + "eval_loss": 0.5272489190101624, + "eval_runtime": 2804.5214, + "eval_samples_per_second": 5.781, + "eval_steps_per_second": 0.145, + "eval_wer": 34.24349180163582, + "step": 11000 + }, + { + "epoch": 0.44, + "learning_rate": 9.78940940940941e-06, + "loss": 0.3926, + "step": 11025 + }, + { + "epoch": 0.44, + "learning_rate": 9.78890890890891e-06, + "loss": 0.3849, + "step": 11050 + }, + { + "epoch": 0.44, + "learning_rate": 9.788408408408409e-06, + "loss": 0.3726, + "step": 11075 + }, + { + "epoch": 0.44, + "learning_rate": 9.787907907907908e-06, + "loss": 0.3798, + "step": 11100 + }, + { + "epoch": 0.44, + "learning_rate": 9.787407407407408e-06, + "loss": 0.3877, + "step": 11125 + }, + { + "epoch": 0.44, + "learning_rate": 9.786906906906909e-06, + "loss": 0.3873, + "step": 11150 + }, + { + "epoch": 0.45, + "learning_rate": 9.786426426426428e-06, + "loss": 0.381, + "step": 11175 + }, + { + "epoch": 0.45, + "learning_rate": 9.785925925925927e-06, + "loss": 0.3769, + "step": 11200 + }, + { + "epoch": 0.45, + "learning_rate": 9.785425425425426e-06, + "loss": 0.3903, + "step": 11225 + }, + { + "epoch": 0.45, + "learning_rate": 9.784924924924926e-06, + "loss": 0.3778, + "step": 11250 + }, + { + "epoch": 0.45, + "learning_rate": 9.784424424424427e-06, + "loss": 0.3966, + "step": 11275 + }, + { + "epoch": 0.45, + "learning_rate": 9.783923923923924e-06, + "loss": 0.3851, + "step": 11300 + }, + { + "epoch": 0.45, + "learning_rate": 9.783423423423423e-06, + "loss": 0.3737, + "step": 11325 + }, + { + "epoch": 0.45, + "learning_rate": 9.782922922922924e-06, + "loss": 0.3602, + "step": 11350 + }, + { + "epoch": 0.45, + "learning_rate": 9.782422422422424e-06, + "loss": 0.3722, + "step": 11375 + }, + { + "epoch": 0.45, + "learning_rate": 9.781921921921923e-06, + "loss": 0.3874, + "step": 11400 + }, + { + "epoch": 0.46, + "learning_rate": 9.781421421421422e-06, + "loss": 0.3895, + "step": 11425 + }, + { + "epoch": 0.46, + "learning_rate": 9.780920920920922e-06, + "loss": 0.375, + "step": 11450 + }, + { + "epoch": 0.46, + "learning_rate": 9.780420420420421e-06, + "loss": 0.3858, + "step": 11475 + }, + { + "epoch": 0.46, + "learning_rate": 9.77991991991992e-06, + "loss": 0.3877, + "step": 11500 + }, + { + "epoch": 0.46, + "learning_rate": 9.77941941941942e-06, + "loss": 0.3932, + "step": 11525 + }, + { + "epoch": 0.46, + "learning_rate": 9.778918918918919e-06, + "loss": 0.3792, + "step": 11550 + }, + { + "epoch": 0.46, + "learning_rate": 9.77841841841842e-06, + "loss": 0.3709, + "step": 11575 + }, + { + "epoch": 0.46, + "learning_rate": 9.777917917917919e-06, + "loss": 0.3815, + "step": 11600 + }, + { + "epoch": 0.46, + "learning_rate": 9.777417417417418e-06, + "loss": 0.3834, + "step": 11625 + }, + { + "epoch": 0.46, + "learning_rate": 9.776916916916918e-06, + "loss": 0.3598, + "step": 11650 + }, + { + "epoch": 0.47, + "learning_rate": 9.776416416416417e-06, + "loss": 0.3648, + "step": 11675 + }, + { + "epoch": 0.47, + "learning_rate": 9.775915915915916e-06, + "loss": 0.3582, + "step": 11700 + }, + { + "epoch": 0.47, + "learning_rate": 9.775415415415416e-06, + "loss": 0.3753, + "step": 11725 + }, + { + "epoch": 0.47, + "learning_rate": 9.774914914914917e-06, + "loss": 0.3689, + "step": 11750 + }, + { + "epoch": 0.47, + "learning_rate": 9.774414414414414e-06, + "loss": 0.3774, + "step": 11775 + }, + { + "epoch": 0.47, + "learning_rate": 9.773913913913915e-06, + "loss": 0.3825, + "step": 11800 + }, + { + "epoch": 0.47, + "learning_rate": 9.773413413413414e-06, + "loss": 0.36, + "step": 11825 + }, + { + "epoch": 0.47, + "learning_rate": 9.772912912912914e-06, + "loss": 0.3672, + "step": 11850 + }, + { + "epoch": 0.47, + "learning_rate": 9.772412412412413e-06, + "loss": 0.3848, + "step": 11875 + }, + { + "epoch": 0.47, + "learning_rate": 9.771911911911914e-06, + "loss": 0.357, + "step": 11900 + }, + { + "epoch": 0.48, + "learning_rate": 9.771411411411412e-06, + "loss": 0.3658, + "step": 11925 + }, + { + "epoch": 0.48, + "learning_rate": 9.770910910910911e-06, + "loss": 0.3733, + "step": 11950 + }, + { + "epoch": 0.48, + "learning_rate": 9.770410410410412e-06, + "loss": 0.3731, + "step": 11975 + }, + { + "epoch": 0.48, + "learning_rate": 9.76990990990991e-06, + "loss": 0.3674, + "step": 12000 + }, + { + "epoch": 0.48, + "eval_loss": 0.5061578750610352, + "eval_runtime": 2740.8866, + "eval_samples_per_second": 5.915, + "eval_steps_per_second": 0.148, + "eval_wer": 33.014700780906715, + "step": 12000 + }, + { + "epoch": 0.48, + "learning_rate": 9.76940940940941e-06, + "loss": 0.3981, + "step": 12025 + }, + { + "epoch": 0.48, + "learning_rate": 9.76890890890891e-06, + "loss": 0.3759, + "step": 12050 + }, + { + "epoch": 0.48, + "learning_rate": 9.76840840840841e-06, + "loss": 0.3647, + "step": 12075 + }, + { + "epoch": 0.48, + "learning_rate": 9.767907907907908e-06, + "loss": 0.3756, + "step": 12100 + }, + { + "epoch": 0.48, + "learning_rate": 9.767407407407408e-06, + "loss": 0.3444, + "step": 12125 + }, + { + "epoch": 0.48, + "learning_rate": 9.766906906906907e-06, + "loss": 0.3536, + "step": 12150 + }, + { + "epoch": 0.49, + "learning_rate": 9.766406406406406e-06, + "loss": 0.3584, + "step": 12175 + }, + { + "epoch": 0.49, + "learning_rate": 9.765905905905907e-06, + "loss": 0.3879, + "step": 12200 + }, + { + "epoch": 0.49, + "learning_rate": 9.765405405405407e-06, + "loss": 0.3403, + "step": 12225 + }, + { + "epoch": 0.49, + "learning_rate": 9.764904904904906e-06, + "loss": 0.3646, + "step": 12250 + }, + { + "epoch": 0.49, + "learning_rate": 9.764404404404405e-06, + "loss": 0.3697, + "step": 12275 + }, + { + "epoch": 0.49, + "learning_rate": 9.763903903903905e-06, + "loss": 0.3607, + "step": 12300 + }, + { + "epoch": 0.49, + "learning_rate": 9.763403403403404e-06, + "loss": 0.3588, + "step": 12325 + }, + { + "epoch": 0.49, + "learning_rate": 9.762902902902903e-06, + "loss": 0.3668, + "step": 12350 + }, + { + "epoch": 0.49, + "learning_rate": 9.762402402402404e-06, + "loss": 0.3933, + "step": 12375 + }, + { + "epoch": 0.49, + "learning_rate": 9.761901901901902e-06, + "loss": 0.3744, + "step": 12400 + }, + { + "epoch": 0.5, + "learning_rate": 9.761401401401403e-06, + "loss": 0.3905, + "step": 12425 + }, + { + "epoch": 0.5, + "learning_rate": 9.760900900900902e-06, + "loss": 0.3641, + "step": 12450 + }, + { + "epoch": 0.5, + "learning_rate": 9.760400400400401e-06, + "loss": 0.3647, + "step": 12475 + }, + { + "epoch": 0.5, + "learning_rate": 9.7598998998999e-06, + "loss": 0.35, + "step": 12500 + }, + { + "epoch": 0.5, + "learning_rate": 9.7593993993994e-06, + "loss": 0.3545, + "step": 12525 + }, + { + "epoch": 0.5, + "learning_rate": 9.7588988988989e-06, + "loss": 0.3645, + "step": 12550 + }, + { + "epoch": 0.5, + "learning_rate": 9.758398398398398e-06, + "loss": 0.3625, + "step": 12575 + }, + { + "epoch": 0.5, + "learning_rate": 9.7578978978979e-06, + "loss": 0.3801, + "step": 12600 + }, + { + "epoch": 0.5, + "learning_rate": 9.757397397397397e-06, + "loss": 0.3562, + "step": 12625 + }, + { + "epoch": 0.5, + "learning_rate": 9.756896896896898e-06, + "loss": 0.3594, + "step": 12650 + }, + { + "epoch": 0.51, + "learning_rate": 9.756396396396397e-06, + "loss": 0.3644, + "step": 12675 + }, + { + "epoch": 0.51, + "learning_rate": 9.755895895895897e-06, + "loss": 0.356, + "step": 12700 + }, + { + "epoch": 0.51, + "learning_rate": 9.755395395395396e-06, + "loss": 0.3676, + "step": 12725 + }, + { + "epoch": 0.51, + "learning_rate": 9.754894894894895e-06, + "loss": 0.3722, + "step": 12750 + }, + { + "epoch": 0.51, + "learning_rate": 9.754394394394395e-06, + "loss": 0.396, + "step": 12775 + }, + { + "epoch": 0.51, + "learning_rate": 9.753893893893894e-06, + "loss": 0.3613, + "step": 12800 + }, + { + "epoch": 0.51, + "learning_rate": 9.753393393393395e-06, + "loss": 0.3626, + "step": 12825 + }, + { + "epoch": 0.51, + "learning_rate": 9.752892892892894e-06, + "loss": 0.3642, + "step": 12850 + }, + { + "epoch": 0.51, + "learning_rate": 9.752392392392393e-06, + "loss": 0.3674, + "step": 12875 + }, + { + "epoch": 0.51, + "learning_rate": 9.751891891891893e-06, + "loss": 0.3526, + "step": 12900 + }, + { + "epoch": 0.52, + "learning_rate": 9.751391391391392e-06, + "loss": 0.3767, + "step": 12925 + }, + { + "epoch": 0.52, + "learning_rate": 9.750890890890891e-06, + "loss": 0.3616, + "step": 12950 + }, + { + "epoch": 0.52, + "learning_rate": 9.75039039039039e-06, + "loss": 0.3475, + "step": 12975 + }, + { + "epoch": 0.52, + "learning_rate": 9.749889889889892e-06, + "loss": 0.3507, + "step": 13000 + }, + { + "epoch": 0.52, + "eval_loss": 0.49944427609443665, + "eval_runtime": 2897.6163, + "eval_samples_per_second": 5.595, + "eval_steps_per_second": 0.14, + "eval_wer": 33.72160251616932, + "step": 13000 + }, + { + "epoch": 0.52, + "learning_rate": 9.74938938938939e-06, + "loss": 0.3743, + "step": 13025 + }, + { + "epoch": 0.52, + "learning_rate": 9.74888888888889e-06, + "loss": 0.3597, + "step": 13050 + }, + { + "epoch": 0.52, + "learning_rate": 9.74838838838839e-06, + "loss": 0.3862, + "step": 13075 + }, + { + "epoch": 0.52, + "learning_rate": 9.747887887887889e-06, + "loss": 0.3606, + "step": 13100 + }, + { + "epoch": 0.52, + "learning_rate": 9.747387387387388e-06, + "loss": 0.4099, + "step": 13125 + }, + { + "epoch": 0.52, + "learning_rate": 9.746886886886887e-06, + "loss": 0.3583, + "step": 13150 + }, + { + "epoch": 0.53, + "learning_rate": 9.746386386386387e-06, + "loss": 0.3673, + "step": 13175 + }, + { + "epoch": 0.53, + "learning_rate": 9.745885885885886e-06, + "loss": 0.3597, + "step": 13200 + }, + { + "epoch": 0.53, + "learning_rate": 9.745385385385387e-06, + "loss": 0.3715, + "step": 13225 + }, + { + "epoch": 0.53, + "learning_rate": 9.744884884884885e-06, + "loss": 0.3681, + "step": 13250 + }, + { + "epoch": 0.53, + "learning_rate": 9.744384384384386e-06, + "loss": 0.3793, + "step": 13275 + }, + { + "epoch": 0.53, + "learning_rate": 9.743883883883885e-06, + "loss": 0.3574, + "step": 13300 + }, + { + "epoch": 0.53, + "learning_rate": 9.743383383383384e-06, + "loss": 0.3602, + "step": 13325 + }, + { + "epoch": 0.53, + "learning_rate": 9.742882882882883e-06, + "loss": 0.3663, + "step": 13350 + }, + { + "epoch": 0.53, + "learning_rate": 9.742382382382383e-06, + "loss": 0.3947, + "step": 13375 + }, + { + "epoch": 0.53, + "learning_rate": 9.741881881881882e-06, + "loss": 0.3709, + "step": 13400 + }, + { + "epoch": 0.54, + "learning_rate": 9.741381381381381e-06, + "loss": 0.3625, + "step": 13425 + }, + { + "epoch": 0.54, + "learning_rate": 9.740880880880882e-06, + "loss": 0.3574, + "step": 13450 + }, + { + "epoch": 0.54, + "learning_rate": 9.740380380380382e-06, + "loss": 0.3642, + "step": 13475 + }, + { + "epoch": 0.54, + "learning_rate": 9.739879879879881e-06, + "loss": 0.3639, + "step": 13500 + }, + { + "epoch": 0.54, + "learning_rate": 9.73937937937938e-06, + "loss": 0.3669, + "step": 13525 + }, + { + "epoch": 0.54, + "learning_rate": 9.73887887887888e-06, + "loss": 0.3762, + "step": 13550 + }, + { + "epoch": 0.54, + "learning_rate": 9.738378378378379e-06, + "loss": 0.3564, + "step": 13575 + }, + { + "epoch": 0.54, + "learning_rate": 9.737877877877878e-06, + "loss": 0.3602, + "step": 13600 + }, + { + "epoch": 0.54, + "learning_rate": 9.737377377377379e-06, + "loss": 0.3464, + "step": 13625 + }, + { + "epoch": 0.54, + "learning_rate": 9.736876876876877e-06, + "loss": 0.3618, + "step": 13650 + }, + { + "epoch": 0.55, + "learning_rate": 9.736376376376378e-06, + "loss": 0.3761, + "step": 13675 + }, + { + "epoch": 0.55, + "learning_rate": 9.735875875875877e-06, + "loss": 0.3604, + "step": 13700 + }, + { + "epoch": 0.55, + "learning_rate": 9.735375375375376e-06, + "loss": 0.3714, + "step": 13725 + }, + { + "epoch": 0.55, + "learning_rate": 9.734874874874876e-06, + "loss": 0.3699, + "step": 13750 + }, + { + "epoch": 0.55, + "learning_rate": 9.734374374374375e-06, + "loss": 0.3728, + "step": 13775 + }, + { + "epoch": 0.55, + "learning_rate": 9.733873873873874e-06, + "loss": 0.3878, + "step": 13800 + }, + { + "epoch": 0.55, + "learning_rate": 9.733373373373374e-06, + "loss": 0.3461, + "step": 13825 + }, + { + "epoch": 0.55, + "learning_rate": 9.732872872872875e-06, + "loss": 0.3415, + "step": 13850 + }, + { + "epoch": 0.55, + "learning_rate": 9.732372372372372e-06, + "loss": 0.3548, + "step": 13875 + }, + { + "epoch": 0.55, + "learning_rate": 9.731871871871873e-06, + "loss": 0.3729, + "step": 13900 + }, + { + "epoch": 0.56, + "learning_rate": 9.731371371371372e-06, + "loss": 0.3705, + "step": 13925 + }, + { + "epoch": 0.56, + "learning_rate": 9.730870870870872e-06, + "loss": 0.3605, + "step": 13950 + }, + { + "epoch": 0.56, + "learning_rate": 9.730370370370371e-06, + "loss": 0.3631, + "step": 13975 + }, + { + "epoch": 0.56, + "learning_rate": 9.72986986986987e-06, + "loss": 0.375, + "step": 14000 + }, + { + "epoch": 0.56, + "eval_loss": 0.5072089433670044, + "eval_runtime": 2512.5863, + "eval_samples_per_second": 6.453, + "eval_steps_per_second": 0.162, + "eval_wer": 30.171676135706633, + "step": 14000 + }, + { + "epoch": 0.56, + "learning_rate": 9.72936936936937e-06, + "loss": 0.3642, + "step": 14025 + }, + { + "epoch": 0.56, + "learning_rate": 9.728868868868869e-06, + "loss": 0.348, + "step": 14050 + }, + { + "epoch": 0.56, + "learning_rate": 9.72836836836837e-06, + "loss": 0.3413, + "step": 14075 + }, + { + "epoch": 0.56, + "learning_rate": 9.72786786786787e-06, + "loss": 0.3528, + "step": 14100 + }, + { + "epoch": 0.56, + "learning_rate": 9.727367367367368e-06, + "loss": 0.3501, + "step": 14125 + }, + { + "epoch": 0.56, + "learning_rate": 9.726866866866868e-06, + "loss": 0.3318, + "step": 14150 + }, + { + "epoch": 0.57, + "learning_rate": 9.726366366366367e-06, + "loss": 0.3655, + "step": 14175 + }, + { + "epoch": 0.57, + "learning_rate": 9.725865865865866e-06, + "loss": 0.3496, + "step": 14200 + }, + { + "epoch": 0.57, + "learning_rate": 9.725365365365366e-06, + "loss": 0.3379, + "step": 14225 + }, + { + "epoch": 0.57, + "learning_rate": 9.724884884884885e-06, + "loss": 0.3893, + "step": 14250 + }, + { + "epoch": 0.57, + "learning_rate": 9.724384384384386e-06, + "loss": 0.3703, + "step": 14275 + }, + { + "epoch": 0.57, + "learning_rate": 9.723883883883885e-06, + "loss": 0.3531, + "step": 14300 + }, + { + "epoch": 0.57, + "learning_rate": 9.723383383383384e-06, + "loss": 0.3604, + "step": 14325 + }, + { + "epoch": 0.57, + "learning_rate": 9.722882882882884e-06, + "loss": 0.3527, + "step": 14350 + }, + { + "epoch": 0.57, + "learning_rate": 9.722382382382383e-06, + "loss": 0.3556, + "step": 14375 + }, + { + "epoch": 0.57, + "learning_rate": 9.721881881881882e-06, + "loss": 0.3664, + "step": 14400 + }, + { + "epoch": 0.58, + "learning_rate": 9.721381381381382e-06, + "loss": 0.3641, + "step": 14425 + }, + { + "epoch": 0.58, + "learning_rate": 9.720880880880883e-06, + "loss": 0.3553, + "step": 14450 + }, + { + "epoch": 0.58, + "learning_rate": 9.72038038038038e-06, + "loss": 0.3605, + "step": 14475 + }, + { + "epoch": 0.58, + "learning_rate": 9.719879879879881e-06, + "loss": 0.3412, + "step": 14500 + }, + { + "epoch": 0.58, + "learning_rate": 9.71937937937938e-06, + "loss": 0.3588, + "step": 14525 + }, + { + "epoch": 0.58, + "learning_rate": 9.71887887887888e-06, + "loss": 0.3334, + "step": 14550 + }, + { + "epoch": 0.58, + "learning_rate": 9.718378378378379e-06, + "loss": 0.3624, + "step": 14575 + }, + { + "epoch": 0.58, + "learning_rate": 9.717877877877878e-06, + "loss": 0.3609, + "step": 14600 + }, + { + "epoch": 0.58, + "learning_rate": 9.717377377377378e-06, + "loss": 0.3339, + "step": 14625 + }, + { + "epoch": 0.58, + "learning_rate": 9.716876876876877e-06, + "loss": 0.353, + "step": 14650 + }, + { + "epoch": 0.59, + "learning_rate": 9.716376376376378e-06, + "loss": 0.3517, + "step": 14675 + }, + { + "epoch": 0.59, + "learning_rate": 9.715875875875877e-06, + "loss": 0.3626, + "step": 14700 + }, + { + "epoch": 0.59, + "learning_rate": 9.715375375375377e-06, + "loss": 0.3268, + "step": 14725 + }, + { + "epoch": 0.59, + "learning_rate": 9.714874874874876e-06, + "loss": 0.3648, + "step": 14750 + }, + { + "epoch": 0.59, + "learning_rate": 9.714374374374375e-06, + "loss": 0.3579, + "step": 14775 + }, + { + "epoch": 0.59, + "learning_rate": 9.713873873873874e-06, + "loss": 0.3403, + "step": 14800 + }, + { + "epoch": 0.59, + "learning_rate": 9.713373373373374e-06, + "loss": 0.3597, + "step": 14825 + }, + { + "epoch": 0.59, + "learning_rate": 9.712872872872873e-06, + "loss": 0.3323, + "step": 14850 + }, + { + "epoch": 0.59, + "learning_rate": 9.712372372372372e-06, + "loss": 0.3412, + "step": 14875 + }, + { + "epoch": 0.59, + "learning_rate": 9.711871871871873e-06, + "loss": 0.3574, + "step": 14900 + }, + { + "epoch": 0.6, + "learning_rate": 9.711371371371373e-06, + "loss": 0.348, + "step": 14925 + }, + { + "epoch": 0.6, + "learning_rate": 9.710870870870872e-06, + "loss": 0.3588, + "step": 14950 + }, + { + "epoch": 0.6, + "learning_rate": 9.710370370370371e-06, + "loss": 0.3445, + "step": 14975 + }, + { + "epoch": 0.6, + "learning_rate": 9.70986986986987e-06, + "loss": 0.3545, + "step": 15000 + }, + { + "epoch": 0.6, + "eval_loss": 0.5023101568222046, + "eval_runtime": 2571.7112, + "eval_samples_per_second": 6.304, + "eval_steps_per_second": 0.158, + "eval_wer": 30.215616592533205, + "step": 15000 + }, + { + "epoch": 0.6, + "learning_rate": 9.70936936936937e-06, + "loss": 0.3526, + "step": 15025 + }, + { + "epoch": 0.6, + "learning_rate": 9.708868868868869e-06, + "loss": 0.361, + "step": 15050 + }, + { + "epoch": 0.6, + "learning_rate": 9.70836836836837e-06, + "loss": 0.3731, + "step": 15075 + }, + { + "epoch": 0.6, + "learning_rate": 9.707867867867868e-06, + "loss": 0.3499, + "step": 15100 + }, + { + "epoch": 0.6, + "learning_rate": 9.707367367367369e-06, + "loss": 0.3608, + "step": 15125 + }, + { + "epoch": 0.6, + "learning_rate": 9.706866866866868e-06, + "loss": 0.3465, + "step": 15150 + }, + { + "epoch": 0.61, + "learning_rate": 9.706366366366367e-06, + "loss": 0.362, + "step": 15175 + }, + { + "epoch": 0.61, + "learning_rate": 9.705865865865867e-06, + "loss": 0.348, + "step": 15200 + }, + { + "epoch": 0.61, + "learning_rate": 9.705365365365366e-06, + "loss": 0.3532, + "step": 15225 + }, + { + "epoch": 0.61, + "learning_rate": 9.704864864864865e-06, + "loss": 0.3352, + "step": 15250 + }, + { + "epoch": 0.61, + "learning_rate": 9.704364364364364e-06, + "loss": 0.3424, + "step": 15275 + }, + { + "epoch": 0.61, + "learning_rate": 9.703863863863865e-06, + "loss": 0.3569, + "step": 15300 + }, + { + "epoch": 0.61, + "learning_rate": 9.703363363363365e-06, + "loss": 0.329, + "step": 15325 + }, + { + "epoch": 0.61, + "learning_rate": 9.702862862862864e-06, + "loss": 0.3551, + "step": 15350 + }, + { + "epoch": 0.61, + "learning_rate": 9.702362362362363e-06, + "loss": 0.3592, + "step": 15375 + }, + { + "epoch": 0.61, + "learning_rate": 9.701861861861863e-06, + "loss": 0.359, + "step": 15400 + }, + { + "epoch": 0.62, + "learning_rate": 9.701361361361362e-06, + "loss": 0.3498, + "step": 15425 + }, + { + "epoch": 0.62, + "learning_rate": 9.700860860860861e-06, + "loss": 0.352, + "step": 15450 + }, + { + "epoch": 0.62, + "learning_rate": 9.70036036036036e-06, + "loss": 0.3451, + "step": 15475 + }, + { + "epoch": 0.62, + "learning_rate": 9.69985985985986e-06, + "loss": 0.3582, + "step": 15500 + }, + { + "epoch": 0.62, + "learning_rate": 9.69935935935936e-06, + "loss": 0.3495, + "step": 15525 + }, + { + "epoch": 0.62, + "learning_rate": 9.69885885885886e-06, + "loss": 0.3603, + "step": 15550 + }, + { + "epoch": 0.62, + "learning_rate": 9.69835835835836e-06, + "loss": 0.3398, + "step": 15575 + }, + { + "epoch": 0.62, + "learning_rate": 9.697857857857859e-06, + "loss": 0.3532, + "step": 15600 + }, + { + "epoch": 0.62, + "learning_rate": 9.697357357357358e-06, + "loss": 0.3848, + "step": 15625 + }, + { + "epoch": 0.62, + "learning_rate": 9.696856856856857e-06, + "loss": 0.3341, + "step": 15650 + }, + { + "epoch": 0.63, + "learning_rate": 9.696356356356357e-06, + "loss": 0.37, + "step": 15675 + }, + { + "epoch": 0.63, + "learning_rate": 9.695855855855858e-06, + "loss": 0.3635, + "step": 15700 + }, + { + "epoch": 0.63, + "learning_rate": 9.695355355355355e-06, + "loss": 0.3614, + "step": 15725 + }, + { + "epoch": 0.63, + "learning_rate": 9.694854854854856e-06, + "loss": 0.3651, + "step": 15750 + }, + { + "epoch": 0.63, + "learning_rate": 9.694354354354355e-06, + "loss": 0.3733, + "step": 15775 + }, + { + "epoch": 0.63, + "learning_rate": 9.693853853853855e-06, + "loss": 0.3455, + "step": 15800 + }, + { + "epoch": 0.63, + "learning_rate": 9.693353353353354e-06, + "loss": 0.3551, + "step": 15825 + }, + { + "epoch": 0.63, + "learning_rate": 9.692852852852853e-06, + "loss": 0.3517, + "step": 15850 + }, + { + "epoch": 0.63, + "learning_rate": 9.692352352352353e-06, + "loss": 0.3595, + "step": 15875 + }, + { + "epoch": 0.63, + "learning_rate": 9.691851851851852e-06, + "loss": 0.3694, + "step": 15900 + }, + { + "epoch": 0.64, + "learning_rate": 9.691351351351353e-06, + "loss": 0.3433, + "step": 15925 + }, + { + "epoch": 0.64, + "learning_rate": 9.69085085085085e-06, + "loss": 0.3443, + "step": 15950 + }, + { + "epoch": 0.64, + "learning_rate": 9.690350350350352e-06, + "loss": 0.3754, + "step": 15975 + }, + { + "epoch": 0.64, + "learning_rate": 9.689849849849851e-06, + "loss": 0.369, + "step": 16000 + }, + { + "epoch": 0.64, + "eval_loss": 0.4858362674713135, + "eval_runtime": 2697.5515, + "eval_samples_per_second": 6.01, + "eval_steps_per_second": 0.151, + "eval_wer": 31.24320657410905, + "step": 16000 + }, + { + "epoch": 0.64, + "learning_rate": 9.68934934934935e-06, + "loss": 0.3536, + "step": 16025 + }, + { + "epoch": 0.64, + "learning_rate": 9.68884884884885e-06, + "loss": 0.339, + "step": 16050 + }, + { + "epoch": 0.64, + "learning_rate": 9.688348348348349e-06, + "loss": 0.3319, + "step": 16075 + }, + { + "epoch": 0.64, + "learning_rate": 9.687847847847848e-06, + "loss": 0.3742, + "step": 16100 + }, + { + "epoch": 0.64, + "learning_rate": 9.687347347347347e-06, + "loss": 0.3299, + "step": 16125 + }, + { + "epoch": 0.64, + "learning_rate": 9.686846846846848e-06, + "loss": 0.3526, + "step": 16150 + }, + { + "epoch": 0.65, + "learning_rate": 9.686346346346348e-06, + "loss": 0.3479, + "step": 16175 + }, + { + "epoch": 0.65, + "learning_rate": 9.685845845845847e-06, + "loss": 0.3631, + "step": 16200 + }, + { + "epoch": 0.65, + "learning_rate": 9.685345345345346e-06, + "loss": 0.3545, + "step": 16225 + }, + { + "epoch": 0.65, + "learning_rate": 9.684844844844846e-06, + "loss": 0.3651, + "step": 16250 + }, + { + "epoch": 0.65, + "learning_rate": 9.684344344344345e-06, + "loss": 0.3438, + "step": 16275 + }, + { + "epoch": 0.65, + "learning_rate": 9.683843843843844e-06, + "loss": 0.3502, + "step": 16300 + }, + { + "epoch": 0.65, + "learning_rate": 9.683343343343345e-06, + "loss": 0.357, + "step": 16325 + }, + { + "epoch": 0.65, + "learning_rate": 9.682842842842843e-06, + "loss": 0.349, + "step": 16350 + }, + { + "epoch": 0.65, + "learning_rate": 9.682342342342344e-06, + "loss": 0.3369, + "step": 16375 + }, + { + "epoch": 0.65, + "learning_rate": 9.681841841841843e-06, + "loss": 0.361, + "step": 16400 + }, + { + "epoch": 0.66, + "learning_rate": 9.681341341341342e-06, + "loss": 0.3435, + "step": 16425 + }, + { + "epoch": 0.66, + "learning_rate": 9.680840840840842e-06, + "loss": 0.3185, + "step": 16450 + }, + { + "epoch": 0.66, + "learning_rate": 9.680340340340341e-06, + "loss": 0.3341, + "step": 16475 + }, + { + "epoch": 0.66, + "learning_rate": 9.67983983983984e-06, + "loss": 0.3349, + "step": 16500 + }, + { + "epoch": 0.66, + "learning_rate": 9.67933933933934e-06, + "loss": 0.3453, + "step": 16525 + }, + { + "epoch": 0.66, + "learning_rate": 9.67883883883884e-06, + "loss": 0.3519, + "step": 16550 + }, + { + "epoch": 0.66, + "learning_rate": 9.678338338338338e-06, + "loss": 0.3529, + "step": 16575 + }, + { + "epoch": 0.66, + "learning_rate": 9.677857857857859e-06, + "loss": 0.3486, + "step": 16600 + }, + { + "epoch": 0.66, + "learning_rate": 9.677357357357358e-06, + "loss": 0.3424, + "step": 16625 + }, + { + "epoch": 0.66, + "learning_rate": 9.676856856856858e-06, + "loss": 0.3455, + "step": 16650 + }, + { + "epoch": 0.66, + "learning_rate": 9.676356356356357e-06, + "loss": 0.3431, + "step": 16675 + }, + { + "epoch": 0.67, + "learning_rate": 9.675855855855856e-06, + "loss": 0.3379, + "step": 16700 + }, + { + "epoch": 0.67, + "learning_rate": 9.675355355355355e-06, + "loss": 0.3539, + "step": 16725 + }, + { + "epoch": 0.67, + "learning_rate": 9.674854854854856e-06, + "loss": 0.327, + "step": 16750 + }, + { + "epoch": 0.67, + "learning_rate": 9.674354354354356e-06, + "loss": 0.3275, + "step": 16775 + }, + { + "epoch": 0.67, + "learning_rate": 9.673853853853855e-06, + "loss": 0.3396, + "step": 16800 + }, + { + "epoch": 0.67, + "learning_rate": 9.673353353353354e-06, + "loss": 0.3476, + "step": 16825 + }, + { + "epoch": 0.67, + "learning_rate": 9.672852852852854e-06, + "loss": 0.3675, + "step": 16850 + }, + { + "epoch": 0.67, + "learning_rate": 9.672352352352353e-06, + "loss": 0.3571, + "step": 16875 + }, + { + "epoch": 0.67, + "learning_rate": 9.671851851851852e-06, + "loss": 0.3463, + "step": 16900 + }, + { + "epoch": 0.67, + "learning_rate": 9.671351351351353e-06, + "loss": 0.3381, + "step": 16925 + }, + { + "epoch": 0.68, + "learning_rate": 9.67085085085085e-06, + "loss": 0.3582, + "step": 16950 + }, + { + "epoch": 0.68, + "learning_rate": 9.670350350350352e-06, + "loss": 0.3633, + "step": 16975 + }, + { + "epoch": 0.68, + "learning_rate": 9.669849849849851e-06, + "loss": 0.3585, + "step": 17000 + }, + { + "epoch": 0.68, + "eval_loss": 0.4826071560382843, + "eval_runtime": 2556.6287, + "eval_samples_per_second": 6.342, + "eval_steps_per_second": 0.159, + "eval_wer": 29.16952536597775, + "step": 17000 + }, + { + "epoch": 0.68, + "learning_rate": 9.66934934934935e-06, + "loss": 0.3504, + "step": 17025 + }, + { + "epoch": 0.68, + "learning_rate": 9.66884884884885e-06, + "loss": 0.3523, + "step": 17050 + }, + { + "epoch": 0.68, + "learning_rate": 9.668348348348349e-06, + "loss": 0.3572, + "step": 17075 + }, + { + "epoch": 0.68, + "learning_rate": 9.667847847847848e-06, + "loss": 0.364, + "step": 17100 + }, + { + "epoch": 0.68, + "learning_rate": 9.667347347347348e-06, + "loss": 0.3251, + "step": 17125 + }, + { + "epoch": 0.68, + "learning_rate": 9.666846846846849e-06, + "loss": 0.3318, + "step": 17150 + }, + { + "epoch": 0.68, + "learning_rate": 9.666346346346346e-06, + "loss": 0.3456, + "step": 17175 + }, + { + "epoch": 0.69, + "learning_rate": 9.665845845845847e-06, + "loss": 0.345, + "step": 17200 + }, + { + "epoch": 0.69, + "learning_rate": 9.665345345345346e-06, + "loss": 0.3224, + "step": 17225 + }, + { + "epoch": 0.69, + "learning_rate": 9.664844844844846e-06, + "loss": 0.3397, + "step": 17250 + }, + { + "epoch": 0.69, + "learning_rate": 9.664344344344345e-06, + "loss": 0.3484, + "step": 17275 + }, + { + "epoch": 0.69, + "learning_rate": 9.663843843843844e-06, + "loss": 0.3267, + "step": 17300 + }, + { + "epoch": 0.69, + "learning_rate": 9.663343343343344e-06, + "loss": 0.3642, + "step": 17325 + }, + { + "epoch": 0.69, + "learning_rate": 9.662842842842843e-06, + "loss": 0.3447, + "step": 17350 + }, + { + "epoch": 0.69, + "learning_rate": 9.662342342342344e-06, + "loss": 0.3429, + "step": 17375 + }, + { + "epoch": 0.69, + "learning_rate": 9.661841841841843e-06, + "loss": 0.3258, + "step": 17400 + }, + { + "epoch": 0.69, + "learning_rate": 9.661341341341343e-06, + "loss": 0.3305, + "step": 17425 + }, + { + "epoch": 0.7, + "learning_rate": 9.660840840840842e-06, + "loss": 0.3376, + "step": 17450 + }, + { + "epoch": 0.7, + "learning_rate": 9.660340340340341e-06, + "loss": 0.3417, + "step": 17475 + }, + { + "epoch": 0.7, + "learning_rate": 9.65983983983984e-06, + "loss": 0.3326, + "step": 17500 + }, + { + "epoch": 0.7, + "learning_rate": 9.65933933933934e-06, + "loss": 0.334, + "step": 17525 + }, + { + "epoch": 0.7, + "learning_rate": 9.65883883883884e-06, + "loss": 0.3461, + "step": 17550 + }, + { + "epoch": 0.7, + "learning_rate": 9.658338338338338e-06, + "loss": 0.3512, + "step": 17575 + }, + { + "epoch": 0.7, + "learning_rate": 9.65783783783784e-06, + "loss": 0.3609, + "step": 17600 + }, + { + "epoch": 0.7, + "learning_rate": 9.657337337337339e-06, + "loss": 0.3502, + "step": 17625 + }, + { + "epoch": 0.7, + "learning_rate": 9.656836836836838e-06, + "loss": 0.3508, + "step": 17650 + }, + { + "epoch": 0.7, + "learning_rate": 9.656336336336337e-06, + "loss": 0.3436, + "step": 17675 + }, + { + "epoch": 0.71, + "learning_rate": 9.655835835835836e-06, + "loss": 0.3525, + "step": 17700 + }, + { + "epoch": 0.71, + "learning_rate": 9.655335335335336e-06, + "loss": 0.339, + "step": 17725 + }, + { + "epoch": 0.71, + "learning_rate": 9.654834834834835e-06, + "loss": 0.3507, + "step": 17750 + }, + { + "epoch": 0.71, + "learning_rate": 9.654334334334336e-06, + "loss": 0.3277, + "step": 17775 + }, + { + "epoch": 0.71, + "learning_rate": 9.653833833833834e-06, + "loss": 0.3486, + "step": 17800 + }, + { + "epoch": 0.71, + "learning_rate": 9.653353353353354e-06, + "loss": 0.3529, + "step": 17825 + }, + { + "epoch": 0.71, + "learning_rate": 9.652852852852854e-06, + "loss": 0.3228, + "step": 17850 + }, + { + "epoch": 0.71, + "learning_rate": 9.652352352352353e-06, + "loss": 0.335, + "step": 17875 + }, + { + "epoch": 0.71, + "learning_rate": 9.651851851851852e-06, + "loss": 0.3641, + "step": 17900 + }, + { + "epoch": 0.71, + "learning_rate": 9.651351351351352e-06, + "loss": 0.3248, + "step": 17925 + }, + { + "epoch": 0.72, + "learning_rate": 9.650850850850851e-06, + "loss": 0.3308, + "step": 17950 + }, + { + "epoch": 0.72, + "learning_rate": 9.650350350350352e-06, + "loss": 0.333, + "step": 17975 + }, + { + "epoch": 0.72, + "learning_rate": 9.649849849849851e-06, + "loss": 0.3302, + "step": 18000 + }, + { + "epoch": 0.72, + "eval_loss": 0.4842660427093506, + "eval_runtime": 2644.843, + "eval_samples_per_second": 6.13, + "eval_steps_per_second": 0.154, + "eval_wer": 29.56498947741692, + "step": 18000 + }, + { + "epoch": 0.72, + "learning_rate": 9.64934934934935e-06, + "loss": 0.3624, + "step": 18025 + }, + { + "epoch": 0.72, + "learning_rate": 9.64884884884885e-06, + "loss": 0.3645, + "step": 18050 + }, + { + "epoch": 0.72, + "learning_rate": 9.648348348348349e-06, + "loss": 0.3563, + "step": 18075 + }, + { + "epoch": 0.72, + "learning_rate": 9.647847847847848e-06, + "loss": 0.3354, + "step": 18100 + }, + { + "epoch": 0.72, + "learning_rate": 9.647347347347348e-06, + "loss": 0.3352, + "step": 18125 + }, + { + "epoch": 0.72, + "learning_rate": 9.646846846846849e-06, + "loss": 0.3426, + "step": 18150 + }, + { + "epoch": 0.72, + "learning_rate": 9.646346346346346e-06, + "loss": 0.3534, + "step": 18175 + }, + { + "epoch": 0.73, + "learning_rate": 9.645845845845847e-06, + "loss": 0.3316, + "step": 18200 + }, + { + "epoch": 0.73, + "learning_rate": 9.645345345345347e-06, + "loss": 0.3387, + "step": 18225 + }, + { + "epoch": 0.73, + "learning_rate": 9.644844844844846e-06, + "loss": 0.3489, + "step": 18250 + }, + { + "epoch": 0.73, + "learning_rate": 9.644344344344345e-06, + "loss": 0.3339, + "step": 18275 + }, + { + "epoch": 0.73, + "learning_rate": 9.643843843843845e-06, + "loss": 0.3416, + "step": 18300 + }, + { + "epoch": 0.73, + "learning_rate": 9.643343343343344e-06, + "loss": 0.3259, + "step": 18325 + }, + { + "epoch": 0.73, + "learning_rate": 9.642842842842843e-06, + "loss": 0.3476, + "step": 18350 + }, + { + "epoch": 0.73, + "learning_rate": 9.642342342342344e-06, + "loss": 0.3499, + "step": 18375 + }, + { + "epoch": 0.73, + "learning_rate": 9.641841841841842e-06, + "loss": 0.3438, + "step": 18400 + }, + { + "epoch": 0.73, + "learning_rate": 9.641341341341343e-06, + "loss": 0.3316, + "step": 18425 + }, + { + "epoch": 0.74, + "learning_rate": 9.640840840840842e-06, + "loss": 0.3397, + "step": 18450 + }, + { + "epoch": 0.74, + "learning_rate": 9.640340340340341e-06, + "loss": 0.3281, + "step": 18475 + }, + { + "epoch": 0.74, + "learning_rate": 9.63983983983984e-06, + "loss": 0.3316, + "step": 18500 + }, + { + "epoch": 0.74, + "learning_rate": 9.63933933933934e-06, + "loss": 0.3487, + "step": 18525 + }, + { + "epoch": 0.74, + "learning_rate": 9.63883883883884e-06, + "loss": 0.3273, + "step": 18550 + }, + { + "epoch": 0.74, + "learning_rate": 9.638338338338338e-06, + "loss": 0.3522, + "step": 18575 + }, + { + "epoch": 0.74, + "learning_rate": 9.63783783783784e-06, + "loss": 0.3261, + "step": 18600 + }, + { + "epoch": 0.74, + "learning_rate": 9.637337337337339e-06, + "loss": 0.3551, + "step": 18625 + }, + { + "epoch": 0.74, + "learning_rate": 9.636836836836838e-06, + "loss": 0.343, + "step": 18650 + }, + { + "epoch": 0.74, + "learning_rate": 9.636336336336337e-06, + "loss": 0.3302, + "step": 18675 + }, + { + "epoch": 0.75, + "learning_rate": 9.635835835835837e-06, + "loss": 0.3287, + "step": 18700 + }, + { + "epoch": 0.75, + "learning_rate": 9.635335335335336e-06, + "loss": 0.3317, + "step": 18725 + }, + { + "epoch": 0.75, + "learning_rate": 9.634834834834835e-06, + "loss": 0.3346, + "step": 18750 + }, + { + "epoch": 0.75, + "learning_rate": 9.634334334334336e-06, + "loss": 0.3531, + "step": 18775 + }, + { + "epoch": 0.75, + "learning_rate": 9.633833833833834e-06, + "loss": 0.35, + "step": 18800 + }, + { + "epoch": 0.75, + "learning_rate": 9.633333333333335e-06, + "loss": 0.3407, + "step": 18825 + }, + { + "epoch": 0.75, + "learning_rate": 9.632832832832834e-06, + "loss": 0.3193, + "step": 18850 + }, + { + "epoch": 0.75, + "learning_rate": 9.632332332332333e-06, + "loss": 0.351, + "step": 18875 + }, + { + "epoch": 0.75, + "learning_rate": 9.631831831831833e-06, + "loss": 0.3554, + "step": 18900 + }, + { + "epoch": 0.75, + "learning_rate": 9.631331331331332e-06, + "loss": 0.3389, + "step": 18925 + }, + { + "epoch": 0.76, + "learning_rate": 9.630830830830831e-06, + "loss": 0.3196, + "step": 18950 + }, + { + "epoch": 0.76, + "learning_rate": 9.63033033033033e-06, + "loss": 0.3271, + "step": 18975 + }, + { + "epoch": 0.76, + "learning_rate": 9.629829829829832e-06, + "loss": 0.3252, + "step": 19000 + }, + { + "epoch": 0.76, + "eval_loss": 0.4709344506263733, + "eval_runtime": 2536.9152, + "eval_samples_per_second": 6.391, + "eval_steps_per_second": 0.16, + "eval_wer": 28.698514504205182, + "step": 19000 + }, + { + "epoch": 0.76, + "learning_rate": 9.62932932932933e-06, + "loss": 0.3142, + "step": 19025 + }, + { + "epoch": 0.76, + "learning_rate": 9.62882882882883e-06, + "loss": 0.3346, + "step": 19050 + }, + { + "epoch": 0.76, + "learning_rate": 9.62832832832833e-06, + "loss": 0.3582, + "step": 19075 + }, + { + "epoch": 0.76, + "learning_rate": 9.627827827827829e-06, + "loss": 0.327, + "step": 19100 + }, + { + "epoch": 0.76, + "learning_rate": 9.627327327327328e-06, + "loss": 0.3347, + "step": 19125 + }, + { + "epoch": 0.76, + "learning_rate": 9.626826826826827e-06, + "loss": 0.3509, + "step": 19150 + }, + { + "epoch": 0.76, + "learning_rate": 9.626326326326327e-06, + "loss": 0.3349, + "step": 19175 + }, + { + "epoch": 0.77, + "learning_rate": 9.625825825825826e-06, + "loss": 0.335, + "step": 19200 + }, + { + "epoch": 0.77, + "learning_rate": 9.625325325325327e-06, + "loss": 0.3371, + "step": 19225 + }, + { + "epoch": 0.77, + "learning_rate": 9.624824824824826e-06, + "loss": 0.3475, + "step": 19250 + }, + { + "epoch": 0.77, + "learning_rate": 9.624324324324326e-06, + "loss": 0.3428, + "step": 19275 + }, + { + "epoch": 0.77, + "learning_rate": 9.623823823823825e-06, + "loss": 0.3375, + "step": 19300 + }, + { + "epoch": 0.77, + "learning_rate": 9.623323323323324e-06, + "loss": 0.335, + "step": 19325 + }, + { + "epoch": 0.77, + "learning_rate": 9.622822822822823e-06, + "loss": 0.3488, + "step": 19350 + }, + { + "epoch": 0.77, + "learning_rate": 9.622322322322323e-06, + "loss": 0.3255, + "step": 19375 + }, + { + "epoch": 0.77, + "learning_rate": 9.621821821821822e-06, + "loss": 0.3419, + "step": 19400 + }, + { + "epoch": 0.77, + "learning_rate": 9.621321321321321e-06, + "loss": 0.3257, + "step": 19425 + }, + { + "epoch": 0.78, + "learning_rate": 9.620820820820822e-06, + "loss": 0.337, + "step": 19450 + }, + { + "epoch": 0.78, + "learning_rate": 9.620320320320322e-06, + "loss": 0.3159, + "step": 19475 + }, + { + "epoch": 0.78, + "learning_rate": 9.619819819819821e-06, + "loss": 0.336, + "step": 19500 + }, + { + "epoch": 0.78, + "learning_rate": 9.61931931931932e-06, + "loss": 0.3218, + "step": 19525 + }, + { + "epoch": 0.78, + "learning_rate": 9.61881881881882e-06, + "loss": 0.3447, + "step": 19550 + }, + { + "epoch": 0.78, + "learning_rate": 9.618318318318319e-06, + "loss": 0.3395, + "step": 19575 + }, + { + "epoch": 0.78, + "learning_rate": 9.617817817817818e-06, + "loss": 0.3237, + "step": 19600 + }, + { + "epoch": 0.78, + "learning_rate": 9.617317317317319e-06, + "loss": 0.331, + "step": 19625 + }, + { + "epoch": 0.78, + "learning_rate": 9.616816816816817e-06, + "loss": 0.3152, + "step": 19650 + }, + { + "epoch": 0.78, + "learning_rate": 9.616316316316318e-06, + "loss": 0.3391, + "step": 19675 + }, + { + "epoch": 0.79, + "learning_rate": 9.615815815815817e-06, + "loss": 0.3293, + "step": 19700 + }, + { + "epoch": 0.79, + "learning_rate": 9.615315315315316e-06, + "loss": 0.3322, + "step": 19725 + }, + { + "epoch": 0.79, + "learning_rate": 9.614814814814816e-06, + "loss": 0.3294, + "step": 19750 + }, + { + "epoch": 0.79, + "learning_rate": 9.614314314314315e-06, + "loss": 0.334, + "step": 19775 + }, + { + "epoch": 0.79, + "learning_rate": 9.613813813813814e-06, + "loss": 0.3418, + "step": 19800 + }, + { + "epoch": 0.79, + "learning_rate": 9.613313313313314e-06, + "loss": 0.3456, + "step": 19825 + }, + { + "epoch": 0.79, + "learning_rate": 9.612812812812815e-06, + "loss": 0.3513, + "step": 19850 + }, + { + "epoch": 0.79, + "learning_rate": 9.612312312312314e-06, + "loss": 0.3395, + "step": 19875 + }, + { + "epoch": 0.79, + "learning_rate": 9.611811811811813e-06, + "loss": 0.3478, + "step": 19900 + }, + { + "epoch": 0.79, + "learning_rate": 9.611311311311312e-06, + "loss": 0.3278, + "step": 19925 + }, + { + "epoch": 0.8, + "learning_rate": 9.610810810810812e-06, + "loss": 0.3012, + "step": 19950 + }, + { + "epoch": 0.8, + "learning_rate": 9.610310310310311e-06, + "loss": 0.3453, + "step": 19975 + }, + { + "epoch": 0.8, + "learning_rate": 9.60980980980981e-06, + "loss": 0.3453, + "step": 20000 + }, + { + "epoch": 0.8, + "eval_loss": 0.471629798412323, + "eval_runtime": 2478.9552, + "eval_samples_per_second": 6.54, + "eval_steps_per_second": 0.164, + "eval_wer": 27.84051926827576, + "step": 20000 + }, + { + "epoch": 0.8, + "learning_rate": 9.60930930930931e-06, + "loss": 0.3442, + "step": 20025 + }, + { + "epoch": 0.8, + "learning_rate": 9.608808808808809e-06, + "loss": 0.3431, + "step": 20050 + }, + { + "epoch": 0.8, + "learning_rate": 9.60830830830831e-06, + "loss": 0.3146, + "step": 20075 + }, + { + "epoch": 0.8, + "learning_rate": 9.60780780780781e-06, + "loss": 0.3474, + "step": 20100 + }, + { + "epoch": 0.8, + "learning_rate": 9.607307307307307e-06, + "loss": 0.3335, + "step": 20125 + }, + { + "epoch": 0.8, + "learning_rate": 9.606806806806808e-06, + "loss": 0.3374, + "step": 20150 + }, + { + "epoch": 0.8, + "learning_rate": 9.606306306306307e-06, + "loss": 0.3235, + "step": 20175 + }, + { + "epoch": 0.81, + "learning_rate": 9.605805805805806e-06, + "loss": 0.339, + "step": 20200 + }, + { + "epoch": 0.81, + "learning_rate": 9.605305305305306e-06, + "loss": 0.3468, + "step": 20225 + }, + { + "epoch": 0.81, + "learning_rate": 9.604804804804807e-06, + "loss": 0.3587, + "step": 20250 + }, + { + "epoch": 0.81, + "learning_rate": 9.604304304304304e-06, + "loss": 0.3113, + "step": 20275 + }, + { + "epoch": 0.81, + "learning_rate": 9.603803803803805e-06, + "loss": 0.3224, + "step": 20300 + }, + { + "epoch": 0.81, + "learning_rate": 9.603303303303305e-06, + "loss": 0.3298, + "step": 20325 + }, + { + "epoch": 0.81, + "learning_rate": 9.602802802802804e-06, + "loss": 0.3489, + "step": 20350 + }, + { + "epoch": 0.81, + "learning_rate": 9.602302302302303e-06, + "loss": 0.2943, + "step": 20375 + }, + { + "epoch": 0.81, + "learning_rate": 9.601801801801802e-06, + "loss": 0.3283, + "step": 20400 + }, + { + "epoch": 0.81, + "learning_rate": 9.601301301301302e-06, + "loss": 0.3167, + "step": 20425 + }, + { + "epoch": 0.82, + "learning_rate": 9.600800800800801e-06, + "loss": 0.3427, + "step": 20450 + }, + { + "epoch": 0.82, + "learning_rate": 9.600300300300302e-06, + "loss": 0.3538, + "step": 20475 + }, + { + "epoch": 0.82, + "learning_rate": 9.599799799799801e-06, + "loss": 0.3353, + "step": 20500 + }, + { + "epoch": 0.82, + "learning_rate": 9.5992992992993e-06, + "loss": 0.3427, + "step": 20525 + }, + { + "epoch": 0.82, + "learning_rate": 9.5987987987988e-06, + "loss": 0.3349, + "step": 20550 + }, + { + "epoch": 0.82, + "learning_rate": 9.5982982982983e-06, + "loss": 0.334, + "step": 20575 + }, + { + "epoch": 0.82, + "learning_rate": 9.597797797797799e-06, + "loss": 0.3281, + "step": 20600 + }, + { + "epoch": 0.82, + "learning_rate": 9.597297297297298e-06, + "loss": 0.3231, + "step": 20625 + }, + { + "epoch": 0.82, + "learning_rate": 9.596796796796797e-06, + "loss": 0.336, + "step": 20650 + }, + { + "epoch": 0.82, + "learning_rate": 9.596296296296296e-06, + "loss": 0.3208, + "step": 20675 + }, + { + "epoch": 0.83, + "learning_rate": 9.595795795795797e-06, + "loss": 0.3261, + "step": 20700 + }, + { + "epoch": 0.83, + "learning_rate": 9.595295295295297e-06, + "loss": 0.3354, + "step": 20725 + }, + { + "epoch": 0.83, + "learning_rate": 9.594794794794794e-06, + "loss": 0.3311, + "step": 20750 + }, + { + "epoch": 0.83, + "learning_rate": 9.594294294294295e-06, + "loss": 0.3372, + "step": 20775 + }, + { + "epoch": 0.83, + "learning_rate": 9.593793793793795e-06, + "loss": 0.3263, + "step": 20800 + }, + { + "epoch": 0.83, + "learning_rate": 9.593293293293294e-06, + "loss": 0.3187, + "step": 20825 + }, + { + "epoch": 0.83, + "learning_rate": 9.592792792792793e-06, + "loss": 0.317, + "step": 20850 + }, + { + "epoch": 0.83, + "learning_rate": 9.592292292292294e-06, + "loss": 0.3428, + "step": 20875 + }, + { + "epoch": 0.83, + "learning_rate": 9.591791791791792e-06, + "loss": 0.3049, + "step": 20900 + }, + { + "epoch": 0.83, + "learning_rate": 9.591291291291293e-06, + "loss": 0.3125, + "step": 20925 + }, + { + "epoch": 0.84, + "learning_rate": 9.590790790790792e-06, + "loss": 0.3206, + "step": 20950 + }, + { + "epoch": 0.84, + "learning_rate": 9.590290290290291e-06, + "loss": 0.3515, + "step": 20975 + }, + { + "epoch": 0.84, + "learning_rate": 9.58978978978979e-06, + "loss": 0.3412, + "step": 21000 + }, + { + "epoch": 0.84, + "eval_loss": 0.4714227020740509, + "eval_runtime": 2637.8451, + "eval_samples_per_second": 6.146, + "eval_steps_per_second": 0.154, + "eval_wer": 29.17954687367504, + "step": 21000 + }, + { + "epoch": 0.84, + "learning_rate": 9.58928928928929e-06, + "loss": 0.3176, + "step": 21025 + }, + { + "epoch": 0.84, + "learning_rate": 9.58878878878879e-06, + "loss": 0.3355, + "step": 21050 + }, + { + "epoch": 0.84, + "learning_rate": 9.588288288288289e-06, + "loss": 0.3306, + "step": 21075 + }, + { + "epoch": 0.84, + "learning_rate": 9.58778778778779e-06, + "loss": 0.3532, + "step": 21100 + }, + { + "epoch": 0.84, + "learning_rate": 9.587287287287287e-06, + "loss": 0.3311, + "step": 21125 + }, + { + "epoch": 0.84, + "learning_rate": 9.586786786786788e-06, + "loss": 0.3377, + "step": 21150 + }, + { + "epoch": 0.84, + "learning_rate": 9.586286286286287e-06, + "loss": 0.3171, + "step": 21175 + }, + { + "epoch": 0.85, + "learning_rate": 9.585785785785787e-06, + "loss": 0.3454, + "step": 21200 + }, + { + "epoch": 0.85, + "learning_rate": 9.585285285285286e-06, + "loss": 0.311, + "step": 21225 + }, + { + "epoch": 0.85, + "learning_rate": 9.584784784784785e-06, + "loss": 0.3303, + "step": 21250 + }, + { + "epoch": 0.85, + "learning_rate": 9.584284284284285e-06, + "loss": 0.3204, + "step": 21275 + }, + { + "epoch": 0.85, + "learning_rate": 9.583783783783784e-06, + "loss": 0.3104, + "step": 21300 + }, + { + "epoch": 0.85, + "learning_rate": 9.583283283283285e-06, + "loss": 0.3244, + "step": 21325 + }, + { + "epoch": 0.85, + "learning_rate": 9.582782782782784e-06, + "loss": 0.3192, + "step": 21350 + }, + { + "epoch": 0.85, + "learning_rate": 9.582282282282282e-06, + "loss": 0.3238, + "step": 21375 + }, + { + "epoch": 0.85, + "learning_rate": 9.581781781781783e-06, + "loss": 0.3298, + "step": 21400 + }, + { + "epoch": 0.85, + "learning_rate": 9.581281281281282e-06, + "loss": 0.3223, + "step": 21425 + }, + { + "epoch": 0.86, + "learning_rate": 9.580780780780781e-06, + "loss": 0.3576, + "step": 21450 + }, + { + "epoch": 0.86, + "learning_rate": 9.58028028028028e-06, + "loss": 0.305, + "step": 21475 + }, + { + "epoch": 0.86, + "learning_rate": 9.579779779779782e-06, + "loss": 0.3287, + "step": 21500 + }, + { + "epoch": 0.86, + "learning_rate": 9.57927927927928e-06, + "loss": 0.3372, + "step": 21525 + }, + { + "epoch": 0.86, + "learning_rate": 9.57877877877878e-06, + "loss": 0.3142, + "step": 21550 + }, + { + "epoch": 0.86, + "learning_rate": 9.57827827827828e-06, + "loss": 0.3222, + "step": 21575 + }, + { + "epoch": 0.86, + "learning_rate": 9.577777777777779e-06, + "loss": 0.3413, + "step": 21600 + }, + { + "epoch": 0.86, + "learning_rate": 9.577277277277278e-06, + "loss": 0.3194, + "step": 21625 + }, + { + "epoch": 0.86, + "learning_rate": 9.576776776776777e-06, + "loss": 0.3226, + "step": 21650 + }, + { + "epoch": 0.86, + "learning_rate": 9.576276276276277e-06, + "loss": 0.3162, + "step": 21675 + }, + { + "epoch": 0.87, + "learning_rate": 9.575775775775776e-06, + "loss": 0.3097, + "step": 21700 + }, + { + "epoch": 0.87, + "learning_rate": 9.575275275275277e-06, + "loss": 0.3366, + "step": 21725 + }, + { + "epoch": 0.87, + "learning_rate": 9.574774774774775e-06, + "loss": 0.322, + "step": 21750 + }, + { + "epoch": 0.87, + "learning_rate": 9.574274274274276e-06, + "loss": 0.3407, + "step": 21775 + }, + { + "epoch": 0.87, + "learning_rate": 9.573773773773775e-06, + "loss": 0.325, + "step": 21800 + }, + { + "epoch": 0.87, + "learning_rate": 9.573273273273274e-06, + "loss": 0.319, + "step": 21825 + }, + { + "epoch": 0.87, + "learning_rate": 9.572772772772774e-06, + "loss": 0.318, + "step": 21850 + }, + { + "epoch": 0.87, + "learning_rate": 9.572272272272273e-06, + "loss": 0.3029, + "step": 21875 + }, + { + "epoch": 0.87, + "learning_rate": 9.571771771771772e-06, + "loss": 0.3398, + "step": 21900 + }, + { + "epoch": 0.87, + "learning_rate": 9.571271271271271e-06, + "loss": 0.345, + "step": 21925 + }, + { + "epoch": 0.88, + "learning_rate": 9.570770770770772e-06, + "loss": 0.3366, + "step": 21950 + }, + { + "epoch": 0.88, + "learning_rate": 9.570270270270272e-06, + "loss": 0.3192, + "step": 21975 + }, + { + "epoch": 0.88, + "learning_rate": 9.56976976976977e-06, + "loss": 0.3221, + "step": 22000 + }, + { + "epoch": 0.88, + "eval_loss": 0.4648185670375824, + "eval_runtime": 2509.1979, + "eval_samples_per_second": 6.461, + "eval_steps_per_second": 0.162, + "eval_wer": 27.938421689626196, + "step": 22000 + }, + { + "epoch": 0.88, + "learning_rate": 9.56926926926927e-06, + "loss": 0.3333, + "step": 22025 + }, + { + "epoch": 0.88, + "learning_rate": 9.56876876876877e-06, + "loss": 0.3309, + "step": 22050 + }, + { + "epoch": 0.88, + "learning_rate": 9.568268268268269e-06, + "loss": 0.3252, + "step": 22075 + }, + { + "epoch": 0.88, + "learning_rate": 9.567767767767768e-06, + "loss": 0.339, + "step": 22100 + }, + { + "epoch": 0.88, + "learning_rate": 9.56726726726727e-06, + "loss": 0.3185, + "step": 22125 + }, + { + "epoch": 0.88, + "learning_rate": 9.566766766766767e-06, + "loss": 0.3312, + "step": 22150 + }, + { + "epoch": 0.88, + "learning_rate": 9.566266266266268e-06, + "loss": 0.3279, + "step": 22175 + }, + { + "epoch": 0.89, + "learning_rate": 9.565765765765767e-06, + "loss": 0.3111, + "step": 22200 + }, + { + "epoch": 0.89, + "learning_rate": 9.565265265265266e-06, + "loss": 0.3294, + "step": 22225 + }, + { + "epoch": 0.89, + "learning_rate": 9.564764764764766e-06, + "loss": 0.3359, + "step": 22250 + }, + { + "epoch": 0.89, + "learning_rate": 9.564264264264265e-06, + "loss": 0.3324, + "step": 22275 + }, + { + "epoch": 0.89, + "learning_rate": 9.563763763763764e-06, + "loss": 0.3331, + "step": 22300 + }, + { + "epoch": 0.89, + "learning_rate": 9.563263263263264e-06, + "loss": 0.3331, + "step": 22325 + }, + { + "epoch": 0.89, + "learning_rate": 9.562762762762765e-06, + "loss": 0.307, + "step": 22350 + }, + { + "epoch": 0.89, + "learning_rate": 9.562262262262262e-06, + "loss": 0.3384, + "step": 22375 + }, + { + "epoch": 0.89, + "learning_rate": 9.561761761761763e-06, + "loss": 0.3291, + "step": 22400 + }, + { + "epoch": 0.89, + "learning_rate": 9.561261261261262e-06, + "loss": 0.3411, + "step": 22425 + }, + { + "epoch": 0.9, + "learning_rate": 9.560760760760762e-06, + "loss": 0.3141, + "step": 22450 + }, + { + "epoch": 0.9, + "learning_rate": 9.560260260260261e-06, + "loss": 0.3289, + "step": 22475 + }, + { + "epoch": 0.9, + "learning_rate": 9.55975975975976e-06, + "loss": 0.3289, + "step": 22500 + }, + { + "epoch": 0.9, + "learning_rate": 9.55925925925926e-06, + "loss": 0.2942, + "step": 22525 + }, + { + "epoch": 0.9, + "learning_rate": 9.558758758758759e-06, + "loss": 0.3307, + "step": 22550 + }, + { + "epoch": 0.9, + "learning_rate": 9.55825825825826e-06, + "loss": 0.3565, + "step": 22575 + }, + { + "epoch": 0.9, + "learning_rate": 9.55775775775776e-06, + "loss": 0.3065, + "step": 22600 + }, + { + "epoch": 0.9, + "learning_rate": 9.557257257257257e-06, + "loss": 0.3128, + "step": 22625 + }, + { + "epoch": 0.9, + "learning_rate": 9.556756756756758e-06, + "loss": 0.3181, + "step": 22650 + }, + { + "epoch": 0.9, + "learning_rate": 9.556256256256257e-06, + "loss": 0.321, + "step": 22675 + }, + { + "epoch": 0.91, + "learning_rate": 9.555755755755756e-06, + "loss": 0.3305, + "step": 22700 + }, + { + "epoch": 0.91, + "learning_rate": 9.555255255255256e-06, + "loss": 0.3454, + "step": 22725 + }, + { + "epoch": 0.91, + "learning_rate": 9.554754754754757e-06, + "loss": 0.3236, + "step": 22750 + }, + { + "epoch": 0.91, + "learning_rate": 9.554254254254254e-06, + "loss": 0.3345, + "step": 22775 + }, + { + "epoch": 0.91, + "learning_rate": 9.553753753753755e-06, + "loss": 0.3221, + "step": 22800 + }, + { + "epoch": 0.91, + "learning_rate": 9.553253253253255e-06, + "loss": 0.3333, + "step": 22825 + }, + { + "epoch": 0.91, + "learning_rate": 9.552752752752752e-06, + "loss": 0.3176, + "step": 22850 + }, + { + "epoch": 0.91, + "learning_rate": 9.552252252252253e-06, + "loss": 0.3286, + "step": 22875 + }, + { + "epoch": 0.91, + "learning_rate": 9.551751751751753e-06, + "loss": 0.3165, + "step": 22900 + }, + { + "epoch": 0.91, + "learning_rate": 9.551251251251252e-06, + "loss": 0.3312, + "step": 22925 + }, + { + "epoch": 0.92, + "learning_rate": 9.550750750750751e-06, + "loss": 0.3334, + "step": 22950 + }, + { + "epoch": 0.92, + "learning_rate": 9.550250250250252e-06, + "loss": 0.3092, + "step": 22975 + }, + { + "epoch": 0.92, + "learning_rate": 9.54974974974975e-06, + "loss": 0.322, + "step": 23000 + }, + { + "epoch": 0.92, + "eval_loss": 0.46254613995552063, + "eval_runtime": 2464.8795, + "eval_samples_per_second": 6.578, + "eval_steps_per_second": 0.165, + "eval_wer": 27.390322307105247, + "step": 23000 + }, + { + "epoch": 0.92, + "learning_rate": 9.54924924924925e-06, + "loss": 0.3245, + "step": 23025 + }, + { + "epoch": 0.92, + "learning_rate": 9.54874874874875e-06, + "loss": 0.3263, + "step": 23050 + }, + { + "epoch": 0.92, + "learning_rate": 9.54824824824825e-06, + "loss": 0.3246, + "step": 23075 + }, + { + "epoch": 0.92, + "learning_rate": 9.547747747747749e-06, + "loss": 0.3407, + "step": 23100 + }, + { + "epoch": 0.92, + "learning_rate": 9.547247247247248e-06, + "loss": 0.3116, + "step": 23125 + }, + { + "epoch": 0.92, + "learning_rate": 9.546746746746747e-06, + "loss": 0.3278, + "step": 23150 + }, + { + "epoch": 0.92, + "learning_rate": 9.546246246246246e-06, + "loss": 0.3369, + "step": 23175 + }, + { + "epoch": 0.93, + "learning_rate": 9.545745745745747e-06, + "loss": 0.3133, + "step": 23200 + }, + { + "epoch": 0.93, + "learning_rate": 9.545245245245247e-06, + "loss": 0.3112, + "step": 23225 + }, + { + "epoch": 0.93, + "learning_rate": 9.544744744744744e-06, + "loss": 0.3316, + "step": 23250 + }, + { + "epoch": 0.93, + "learning_rate": 9.544244244244245e-06, + "loss": 0.3266, + "step": 23275 + }, + { + "epoch": 0.93, + "learning_rate": 9.543743743743745e-06, + "loss": 0.3237, + "step": 23300 + }, + { + "epoch": 0.93, + "learning_rate": 9.543243243243244e-06, + "loss": 0.3073, + "step": 23325 + }, + { + "epoch": 0.93, + "learning_rate": 9.542742742742743e-06, + "loss": 0.3326, + "step": 23350 + }, + { + "epoch": 0.93, + "learning_rate": 9.542242242242243e-06, + "loss": 0.3063, + "step": 23375 + }, + { + "epoch": 0.93, + "learning_rate": 9.541741741741742e-06, + "loss": 0.3145, + "step": 23400 + }, + { + "epoch": 0.93, + "learning_rate": 9.541241241241243e-06, + "loss": 0.3329, + "step": 23425 + }, + { + "epoch": 0.94, + "learning_rate": 9.540740740740742e-06, + "loss": 0.3285, + "step": 23450 + }, + { + "epoch": 0.94, + "learning_rate": 9.54024024024024e-06, + "loss": 0.3312, + "step": 23475 + }, + { + "epoch": 0.94, + "learning_rate": 9.53973973973974e-06, + "loss": 0.3203, + "step": 23500 + }, + { + "epoch": 0.94, + "learning_rate": 9.53923923923924e-06, + "loss": 0.327, + "step": 23525 + }, + { + "epoch": 0.94, + "learning_rate": 9.53873873873874e-06, + "loss": 0.3136, + "step": 23550 + }, + { + "epoch": 0.94, + "learning_rate": 9.538238238238239e-06, + "loss": 0.314, + "step": 23575 + }, + { + "epoch": 0.94, + "learning_rate": 9.53773773773774e-06, + "loss": 0.3294, + "step": 23600 + }, + { + "epoch": 0.94, + "learning_rate": 9.537237237237237e-06, + "loss": 0.3331, + "step": 23625 + }, + { + "epoch": 0.94, + "learning_rate": 9.536736736736738e-06, + "loss": 0.3112, + "step": 23650 + }, + { + "epoch": 0.94, + "learning_rate": 9.536236236236237e-06, + "loss": 0.3047, + "step": 23675 + }, + { + "epoch": 0.95, + "learning_rate": 9.535735735735737e-06, + "loss": 0.3153, + "step": 23700 + }, + { + "epoch": 0.95, + "learning_rate": 9.535235235235236e-06, + "loss": 0.3195, + "step": 23725 + }, + { + "epoch": 0.95, + "learning_rate": 9.534734734734735e-06, + "loss": 0.3187, + "step": 23750 + }, + { + "epoch": 0.95, + "learning_rate": 9.534234234234235e-06, + "loss": 0.3351, + "step": 23775 + }, + { + "epoch": 0.95, + "learning_rate": 9.533733733733734e-06, + "loss": 0.3172, + "step": 23800 + }, + { + "epoch": 0.95, + "learning_rate": 9.533233233233235e-06, + "loss": 0.3206, + "step": 23825 + }, + { + "epoch": 0.95, + "learning_rate": 9.532752752752752e-06, + "loss": 0.3261, + "step": 23850 + }, + { + "epoch": 0.95, + "learning_rate": 9.532252252252253e-06, + "loss": 0.3204, + "step": 23875 + }, + { + "epoch": 0.95, + "learning_rate": 9.531751751751753e-06, + "loss": 0.3154, + "step": 23900 + }, + { + "epoch": 0.95, + "learning_rate": 9.531251251251252e-06, + "loss": 0.3159, + "step": 23925 + }, + { + "epoch": 0.96, + "learning_rate": 9.530750750750751e-06, + "loss": 0.326, + "step": 23950 + }, + { + "epoch": 0.96, + "learning_rate": 9.53025025025025e-06, + "loss": 0.3014, + "step": 23975 + }, + { + "epoch": 0.96, + "learning_rate": 9.52974974974975e-06, + "loss": 0.312, + "step": 24000 + }, + { + "epoch": 0.96, + "eval_loss": 0.46919143199920654, + "eval_runtime": 2551.3752, + "eval_samples_per_second": 6.355, + "eval_steps_per_second": 0.159, + "eval_wer": 28.381680683929357, + "step": 24000 + }, + { + "epoch": 0.96, + "learning_rate": 9.529249249249251e-06, + "loss": 0.317, + "step": 24025 + }, + { + "epoch": 0.96, + "learning_rate": 9.52874874874875e-06, + "loss": 0.3128, + "step": 24050 + }, + { + "epoch": 0.96, + "learning_rate": 9.528248248248248e-06, + "loss": 0.324, + "step": 24075 + }, + { + "epoch": 0.96, + "learning_rate": 9.527747747747749e-06, + "loss": 0.3367, + "step": 24100 + }, + { + "epoch": 0.96, + "learning_rate": 9.527247247247248e-06, + "loss": 0.3159, + "step": 24125 + }, + { + "epoch": 0.96, + "learning_rate": 9.526746746746747e-06, + "loss": 0.3288, + "step": 24150 + }, + { + "epoch": 0.96, + "learning_rate": 9.526246246246247e-06, + "loss": 0.3379, + "step": 24175 + }, + { + "epoch": 0.97, + "learning_rate": 9.525745745745748e-06, + "loss": 0.3359, + "step": 24200 + }, + { + "epoch": 0.97, + "learning_rate": 9.525245245245245e-06, + "loss": 0.3146, + "step": 24225 + }, + { + "epoch": 0.97, + "learning_rate": 9.524744744744745e-06, + "loss": 0.3054, + "step": 24250 + }, + { + "epoch": 0.97, + "learning_rate": 9.524244244244246e-06, + "loss": 0.3329, + "step": 24275 + }, + { + "epoch": 0.97, + "learning_rate": 9.523743743743745e-06, + "loss": 0.3157, + "step": 24300 + }, + { + "epoch": 0.97, + "learning_rate": 9.523243243243244e-06, + "loss": 0.3252, + "step": 24325 + }, + { + "epoch": 0.97, + "learning_rate": 9.522742742742743e-06, + "loss": 0.3199, + "step": 24350 + }, + { + "epoch": 0.97, + "learning_rate": 9.522242242242243e-06, + "loss": 0.2962, + "step": 24375 + }, + { + "epoch": 0.97, + "learning_rate": 9.521741741741742e-06, + "loss": 0.3197, + "step": 24400 + }, + { + "epoch": 0.97, + "learning_rate": 9.521241241241243e-06, + "loss": 0.3105, + "step": 24425 + }, + { + "epoch": 0.98, + "learning_rate": 9.520740740740742e-06, + "loss": 0.3158, + "step": 24450 + }, + { + "epoch": 0.98, + "learning_rate": 9.52024024024024e-06, + "loss": 0.3084, + "step": 24475 + }, + { + "epoch": 0.98, + "learning_rate": 9.519739739739741e-06, + "loss": 0.3258, + "step": 24500 + }, + { + "epoch": 0.98, + "learning_rate": 9.51923923923924e-06, + "loss": 0.3087, + "step": 24525 + }, + { + "epoch": 0.98, + "learning_rate": 9.51873873873874e-06, + "loss": 0.323, + "step": 24550 + }, + { + "epoch": 0.98, + "learning_rate": 9.518238238238239e-06, + "loss": 0.3153, + "step": 24575 + }, + { + "epoch": 0.98, + "learning_rate": 9.517737737737738e-06, + "loss": 0.3256, + "step": 24600 + }, + { + "epoch": 0.98, + "learning_rate": 9.517237237237237e-06, + "loss": 0.3461, + "step": 24625 + }, + { + "epoch": 0.98, + "learning_rate": 9.516736736736738e-06, + "loss": 0.319, + "step": 24650 + }, + { + "epoch": 0.98, + "learning_rate": 9.516236236236238e-06, + "loss": 0.3091, + "step": 24675 + }, + { + "epoch": 0.99, + "learning_rate": 9.515735735735735e-06, + "loss": 0.3109, + "step": 24700 + }, + { + "epoch": 0.99, + "learning_rate": 9.515235235235236e-06, + "loss": 0.3062, + "step": 24725 + }, + { + "epoch": 0.99, + "learning_rate": 9.514734734734736e-06, + "loss": 0.3162, + "step": 24750 + }, + { + "epoch": 0.99, + "learning_rate": 9.514234234234235e-06, + "loss": 0.3184, + "step": 24775 + }, + { + "epoch": 0.99, + "learning_rate": 9.513733733733734e-06, + "loss": 0.3168, + "step": 24800 + }, + { + "epoch": 0.99, + "learning_rate": 9.513233233233235e-06, + "loss": 0.315, + "step": 24825 + }, + { + "epoch": 0.99, + "learning_rate": 9.512732732732733e-06, + "loss": 0.3023, + "step": 24850 + }, + { + "epoch": 0.99, + "learning_rate": 9.512232232232232e-06, + "loss": 0.3242, + "step": 24875 + }, + { + "epoch": 0.99, + "learning_rate": 9.511731731731733e-06, + "loss": 0.3337, + "step": 24900 + }, + { + "epoch": 0.99, + "learning_rate": 9.511231231231232e-06, + "loss": 0.3149, + "step": 24925 + }, + { + "epoch": 0.99, + "learning_rate": 9.510730730730732e-06, + "loss": 0.3085, + "step": 24950 + }, + { + "epoch": 1.0, + "learning_rate": 9.510230230230231e-06, + "loss": 0.3263, + "step": 24975 + }, + { + "epoch": 1.0, + "learning_rate": 9.50972972972973e-06, + "loss": 0.3089, + "step": 25000 + }, + { + "epoch": 1.0, + "eval_loss": 0.457874059677124, + "eval_runtime": 2679.5488, + "eval_samples_per_second": 6.051, + "eval_steps_per_second": 0.152, + "eval_wer": 27.82818510495602, + "step": 25000 + }, + { + "epoch": 1.0, + "learning_rate": 9.50922922922923e-06, + "loss": 0.3246, + "step": 25025 + }, + { + "epoch": 1.0, + "learning_rate": 9.50872872872873e-06, + "loss": 0.3371, + "step": 25050 + }, + { + "epoch": 1.0, + "learning_rate": 9.50822822822823e-06, + "loss": 0.2992, + "step": 25075 + }, + { + "epoch": 1.0, + "learning_rate": 9.507727727727727e-06, + "loss": 0.2763, + "step": 25100 + }, + { + "epoch": 1.0, + "learning_rate": 9.507227227227228e-06, + "loss": 0.277, + "step": 25125 + }, + { + "epoch": 1.0, + "learning_rate": 9.506726726726728e-06, + "loss": 0.2702, + "step": 25150 + }, + { + "epoch": 1.0, + "learning_rate": 9.506226226226227e-06, + "loss": 0.2656, + "step": 25175 + }, + { + "epoch": 1.0, + "learning_rate": 9.505725725725726e-06, + "loss": 0.2767, + "step": 25200 + }, + { + "epoch": 1.01, + "learning_rate": 9.505225225225226e-06, + "loss": 0.2745, + "step": 25225 + }, + { + "epoch": 1.01, + "learning_rate": 9.504724724724725e-06, + "loss": 0.2637, + "step": 25250 + }, + { + "epoch": 1.01, + "learning_rate": 9.504224224224226e-06, + "loss": 0.2704, + "step": 25275 + }, + { + "epoch": 1.01, + "learning_rate": 9.503723723723725e-06, + "loss": 0.2554, + "step": 25300 + }, + { + "epoch": 1.01, + "learning_rate": 9.503223223223223e-06, + "loss": 0.271, + "step": 25325 + }, + { + "epoch": 1.01, + "learning_rate": 9.502722722722724e-06, + "loss": 0.2757, + "step": 25350 + }, + { + "epoch": 1.01, + "learning_rate": 9.502222222222223e-06, + "loss": 0.2606, + "step": 25375 + }, + { + "epoch": 1.01, + "learning_rate": 9.501721721721722e-06, + "loss": 0.2664, + "step": 25400 + }, + { + "epoch": 1.01, + "learning_rate": 9.501221221221222e-06, + "loss": 0.2702, + "step": 25425 + }, + { + "epoch": 1.01, + "learning_rate": 9.500720720720723e-06, + "loss": 0.2633, + "step": 25450 + }, + { + "epoch": 1.02, + "learning_rate": 9.50022022022022e-06, + "loss": 0.2816, + "step": 25475 + }, + { + "epoch": 1.02, + "learning_rate": 9.49971971971972e-06, + "loss": 0.2848, + "step": 25500 + }, + { + "epoch": 1.02, + "learning_rate": 9.49921921921922e-06, + "loss": 0.2655, + "step": 25525 + }, + { + "epoch": 1.02, + "learning_rate": 9.49871871871872e-06, + "loss": 0.2652, + "step": 25550 + }, + { + "epoch": 1.02, + "learning_rate": 9.49821821821822e-06, + "loss": 0.2704, + "step": 25575 + }, + { + "epoch": 1.02, + "learning_rate": 9.497717717717718e-06, + "loss": 0.2605, + "step": 25600 + }, + { + "epoch": 1.02, + "learning_rate": 9.497217217217218e-06, + "loss": 0.2674, + "step": 25625 + }, + { + "epoch": 1.02, + "learning_rate": 9.496716716716717e-06, + "loss": 0.2677, + "step": 25650 + }, + { + "epoch": 1.02, + "learning_rate": 9.496216216216218e-06, + "loss": 0.2761, + "step": 25675 + }, + { + "epoch": 1.02, + "learning_rate": 9.495715715715716e-06, + "loss": 0.2626, + "step": 25700 + }, + { + "epoch": 1.03, + "learning_rate": 9.495215215215215e-06, + "loss": 0.2637, + "step": 25725 + }, + { + "epoch": 1.03, + "learning_rate": 9.494714714714716e-06, + "loss": 0.2704, + "step": 25750 + }, + { + "epoch": 1.03, + "learning_rate": 9.494214214214215e-06, + "loss": 0.2756, + "step": 25775 + }, + { + "epoch": 1.03, + "learning_rate": 9.493713713713715e-06, + "loss": 0.2807, + "step": 25800 + }, + { + "epoch": 1.03, + "learning_rate": 9.493213213213214e-06, + "loss": 0.2798, + "step": 25825 + }, + { + "epoch": 1.03, + "learning_rate": 9.492712712712713e-06, + "loss": 0.2728, + "step": 25850 + }, + { + "epoch": 1.03, + "learning_rate": 9.492212212212212e-06, + "loss": 0.2664, + "step": 25875 + }, + { + "epoch": 1.03, + "learning_rate": 9.491731731731733e-06, + "loss": 0.2811, + "step": 25900 + }, + { + "epoch": 1.03, + "learning_rate": 9.491231231231231e-06, + "loss": 0.2582, + "step": 25925 + }, + { + "epoch": 1.03, + "learning_rate": 9.490730730730732e-06, + "loss": 0.2739, + "step": 25950 + }, + { + "epoch": 1.04, + "learning_rate": 9.490230230230231e-06, + "loss": 0.264, + "step": 25975 + }, + { + "epoch": 1.04, + "learning_rate": 9.48972972972973e-06, + "loss": 0.2625, + "step": 26000 + }, + { + "epoch": 1.04, + "eval_loss": 0.45843926072120667, + "eval_runtime": 2831.694, + "eval_samples_per_second": 5.726, + "eval_steps_per_second": 0.143, + "eval_wer": 27.744929502547777, + "step": 26000 + }, + { + "epoch": 1.04, + "learning_rate": 9.48922922922923e-06, + "loss": 0.2841, + "step": 26025 + }, + { + "epoch": 1.04, + "learning_rate": 9.48872872872873e-06, + "loss": 0.2881, + "step": 26050 + }, + { + "epoch": 1.04, + "learning_rate": 9.488228228228228e-06, + "loss": 0.2915, + "step": 26075 + }, + { + "epoch": 1.04, + "learning_rate": 9.487727727727728e-06, + "loss": 0.2687, + "step": 26100 + }, + { + "epoch": 1.04, + "learning_rate": 9.487227227227229e-06, + "loss": 0.2678, + "step": 26125 + }, + { + "epoch": 1.04, + "learning_rate": 9.486726726726728e-06, + "loss": 0.2724, + "step": 26150 + }, + { + "epoch": 1.04, + "learning_rate": 9.486226226226227e-06, + "loss": 0.2792, + "step": 26175 + }, + { + "epoch": 1.04, + "learning_rate": 9.485725725725727e-06, + "loss": 0.2657, + "step": 26200 + }, + { + "epoch": 1.05, + "learning_rate": 9.485225225225226e-06, + "loss": 0.2722, + "step": 26225 + }, + { + "epoch": 1.05, + "learning_rate": 9.484724724724725e-06, + "loss": 0.2704, + "step": 26250 + }, + { + "epoch": 1.05, + "learning_rate": 9.484224224224226e-06, + "loss": 0.2595, + "step": 26275 + }, + { + "epoch": 1.05, + "learning_rate": 9.483723723723724e-06, + "loss": 0.2699, + "step": 26300 + }, + { + "epoch": 1.05, + "learning_rate": 9.483223223223223e-06, + "loss": 0.2857, + "step": 26325 + }, + { + "epoch": 1.05, + "learning_rate": 9.482722722722724e-06, + "loss": 0.2664, + "step": 26350 + }, + { + "epoch": 1.05, + "learning_rate": 9.482222222222223e-06, + "loss": 0.2606, + "step": 26375 + }, + { + "epoch": 1.05, + "learning_rate": 9.481721721721723e-06, + "loss": 0.2607, + "step": 26400 + }, + { + "epoch": 1.05, + "learning_rate": 9.481221221221222e-06, + "loss": 0.2487, + "step": 26425 + }, + { + "epoch": 1.05, + "learning_rate": 9.480720720720721e-06, + "loss": 0.2603, + "step": 26450 + }, + { + "epoch": 1.06, + "learning_rate": 9.48022022022022e-06, + "loss": 0.2819, + "step": 26475 + }, + { + "epoch": 1.06, + "learning_rate": 9.479719719719721e-06, + "loss": 0.27, + "step": 26500 + }, + { + "epoch": 1.06, + "learning_rate": 9.47921921921922e-06, + "loss": 0.2577, + "step": 26525 + }, + { + "epoch": 1.06, + "learning_rate": 9.478718718718718e-06, + "loss": 0.2743, + "step": 26550 + }, + { + "epoch": 1.06, + "learning_rate": 9.47821821821822e-06, + "loss": 0.2806, + "step": 26575 + }, + { + "epoch": 1.06, + "learning_rate": 9.477717717717719e-06, + "loss": 0.2736, + "step": 26600 + }, + { + "epoch": 1.06, + "learning_rate": 9.477217217217218e-06, + "loss": 0.2699, + "step": 26625 + }, + { + "epoch": 1.06, + "learning_rate": 9.476716716716717e-06, + "loss": 0.2743, + "step": 26650 + }, + { + "epoch": 1.06, + "learning_rate": 9.476216216216218e-06, + "loss": 0.2706, + "step": 26675 + }, + { + "epoch": 1.06, + "learning_rate": 9.475715715715716e-06, + "loss": 0.2658, + "step": 26700 + }, + { + "epoch": 1.07, + "learning_rate": 9.475215215215215e-06, + "loss": 0.263, + "step": 26725 + }, + { + "epoch": 1.07, + "learning_rate": 9.474714714714716e-06, + "loss": 0.2653, + "step": 26750 + }, + { + "epoch": 1.07, + "learning_rate": 9.474214214214215e-06, + "loss": 0.2622, + "step": 26775 + }, + { + "epoch": 1.07, + "learning_rate": 9.473713713713715e-06, + "loss": 0.2743, + "step": 26800 + }, + { + "epoch": 1.07, + "learning_rate": 9.473213213213214e-06, + "loss": 0.2531, + "step": 26825 + }, + { + "epoch": 1.07, + "learning_rate": 9.472712712712713e-06, + "loss": 0.2686, + "step": 26850 + }, + { + "epoch": 1.07, + "learning_rate": 9.472212212212213e-06, + "loss": 0.2847, + "step": 26875 + }, + { + "epoch": 1.07, + "learning_rate": 9.471711711711714e-06, + "loss": 0.2556, + "step": 26900 + }, + { + "epoch": 1.07, + "learning_rate": 9.471211211211211e-06, + "loss": 0.2642, + "step": 26925 + }, + { + "epoch": 1.07, + "learning_rate": 9.47071071071071e-06, + "loss": 0.2719, + "step": 26950 + }, + { + "epoch": 1.08, + "learning_rate": 9.470210210210212e-06, + "loss": 0.2632, + "step": 26975 + }, + { + "epoch": 1.08, + "learning_rate": 9.46970970970971e-06, + "loss": 0.2758, + "step": 27000 + }, + { + "epoch": 1.08, + "eval_loss": 0.45501989126205444, + "eval_runtime": 2547.6663, + "eval_samples_per_second": 6.364, + "eval_steps_per_second": 0.159, + "eval_wer": 26.85301531748907, + "step": 27000 + }, + { + "epoch": 1.08, + "learning_rate": 9.46920920920921e-06, + "loss": 0.2766, + "step": 27025 + }, + { + "epoch": 1.08, + "learning_rate": 9.46870870870871e-06, + "loss": 0.2724, + "step": 27050 + }, + { + "epoch": 1.08, + "learning_rate": 9.468208208208209e-06, + "loss": 0.265, + "step": 27075 + }, + { + "epoch": 1.08, + "learning_rate": 9.467707707707708e-06, + "loss": 0.2627, + "step": 27100 + }, + { + "epoch": 1.08, + "learning_rate": 9.467207207207207e-06, + "loss": 0.2648, + "step": 27125 + }, + { + "epoch": 1.08, + "learning_rate": 9.466706706706708e-06, + "loss": 0.2676, + "step": 27150 + }, + { + "epoch": 1.08, + "learning_rate": 9.466206206206206e-06, + "loss": 0.2634, + "step": 27175 + }, + { + "epoch": 1.08, + "learning_rate": 9.465705705705707e-06, + "loss": 0.2631, + "step": 27200 + }, + { + "epoch": 1.09, + "learning_rate": 9.465205205205206e-06, + "loss": 0.2729, + "step": 27225 + }, + { + "epoch": 1.09, + "learning_rate": 9.464704704704705e-06, + "loss": 0.2772, + "step": 27250 + }, + { + "epoch": 1.09, + "learning_rate": 9.464204204204205e-06, + "loss": 0.2605, + "step": 27275 + }, + { + "epoch": 1.09, + "learning_rate": 9.463703703703706e-06, + "loss": 0.2753, + "step": 27300 + }, + { + "epoch": 1.09, + "learning_rate": 9.463203203203203e-06, + "loss": 0.2719, + "step": 27325 + }, + { + "epoch": 1.09, + "learning_rate": 9.462702702702703e-06, + "loss": 0.2802, + "step": 27350 + }, + { + "epoch": 1.09, + "learning_rate": 9.462202202202204e-06, + "loss": 0.2579, + "step": 27375 + }, + { + "epoch": 1.09, + "learning_rate": 9.461701701701701e-06, + "loss": 0.2781, + "step": 27400 + }, + { + "epoch": 1.09, + "learning_rate": 9.461201201201202e-06, + "loss": 0.292, + "step": 27425 + }, + { + "epoch": 1.09, + "learning_rate": 9.460700700700702e-06, + "loss": 0.25, + "step": 27450 + }, + { + "epoch": 1.1, + "learning_rate": 9.460200200200201e-06, + "loss": 0.2518, + "step": 27475 + }, + { + "epoch": 1.1, + "learning_rate": 9.4596996996997e-06, + "loss": 0.264, + "step": 27500 + }, + { + "epoch": 1.1, + "learning_rate": 9.459199199199201e-06, + "loss": 0.2603, + "step": 27525 + }, + { + "epoch": 1.1, + "learning_rate": 9.458698698698699e-06, + "loss": 0.2601, + "step": 27550 + }, + { + "epoch": 1.1, + "learning_rate": 9.458198198198198e-06, + "loss": 0.275, + "step": 27575 + }, + { + "epoch": 1.1, + "learning_rate": 9.457697697697699e-06, + "loss": 0.2681, + "step": 27600 + }, + { + "epoch": 1.1, + "learning_rate": 9.457197197197198e-06, + "loss": 0.2595, + "step": 27625 + }, + { + "epoch": 1.1, + "learning_rate": 9.456696696696698e-06, + "loss": 0.2797, + "step": 27650 + }, + { + "epoch": 1.1, + "learning_rate": 9.456196196196197e-06, + "loss": 0.2564, + "step": 27675 + }, + { + "epoch": 1.1, + "learning_rate": 9.455695695695696e-06, + "loss": 0.2565, + "step": 27700 + }, + { + "epoch": 1.11, + "learning_rate": 9.455195195195196e-06, + "loss": 0.2833, + "step": 27725 + }, + { + "epoch": 1.11, + "learning_rate": 9.454694694694695e-06, + "loss": 0.2648, + "step": 27750 + }, + { + "epoch": 1.11, + "learning_rate": 9.454194194194196e-06, + "loss": 0.2607, + "step": 27775 + }, + { + "epoch": 1.11, + "learning_rate": 9.453693693693693e-06, + "loss": 0.2697, + "step": 27800 + }, + { + "epoch": 1.11, + "learning_rate": 9.453193193193194e-06, + "loss": 0.2778, + "step": 27825 + }, + { + "epoch": 1.11, + "learning_rate": 9.452692692692694e-06, + "loss": 0.2616, + "step": 27850 + }, + { + "epoch": 1.11, + "learning_rate": 9.452192192192193e-06, + "loss": 0.27, + "step": 27875 + }, + { + "epoch": 1.11, + "learning_rate": 9.451691691691692e-06, + "loss": 0.2726, + "step": 27900 + }, + { + "epoch": 1.11, + "learning_rate": 9.451191191191193e-06, + "loss": 0.2444, + "step": 27925 + }, + { + "epoch": 1.11, + "learning_rate": 9.450690690690691e-06, + "loss": 0.258, + "step": 27950 + }, + { + "epoch": 1.12, + "learning_rate": 9.45019019019019e-06, + "loss": 0.2758, + "step": 27975 + }, + { + "epoch": 1.12, + "learning_rate": 9.449689689689691e-06, + "loss": 0.265, + "step": 28000 + }, + { + "epoch": 1.12, + "eval_loss": 0.45008718967437744, + "eval_runtime": 2652.1712, + "eval_samples_per_second": 6.113, + "eval_steps_per_second": 0.153, + "eval_wer": 28.59213234557242, + "step": 28000 + }, + { + "epoch": 1.12, + "learning_rate": 9.44920920920921e-06, + "loss": 0.2703, + "step": 28025 + }, + { + "epoch": 1.12, + "learning_rate": 9.44870870870871e-06, + "loss": 0.2573, + "step": 28050 + }, + { + "epoch": 1.12, + "learning_rate": 9.448208208208209e-06, + "loss": 0.2824, + "step": 28075 + }, + { + "epoch": 1.12, + "learning_rate": 9.447707707707708e-06, + "loss": 0.2697, + "step": 28100 + }, + { + "epoch": 1.12, + "learning_rate": 9.44720720720721e-06, + "loss": 0.2586, + "step": 28125 + }, + { + "epoch": 1.12, + "learning_rate": 9.446706706706707e-06, + "loss": 0.2882, + "step": 28150 + }, + { + "epoch": 1.12, + "learning_rate": 9.446206206206206e-06, + "loss": 0.2649, + "step": 28175 + }, + { + "epoch": 1.12, + "learning_rate": 9.445705705705707e-06, + "loss": 0.2542, + "step": 28200 + }, + { + "epoch": 1.13, + "learning_rate": 9.445205205205206e-06, + "loss": 0.263, + "step": 28225 + }, + { + "epoch": 1.13, + "learning_rate": 9.444704704704706e-06, + "loss": 0.2729, + "step": 28250 + }, + { + "epoch": 1.13, + "learning_rate": 9.444204204204205e-06, + "loss": 0.2861, + "step": 28275 + }, + { + "epoch": 1.13, + "learning_rate": 9.443703703703704e-06, + "loss": 0.2692, + "step": 28300 + }, + { + "epoch": 1.13, + "learning_rate": 9.443203203203204e-06, + "loss": 0.2826, + "step": 28325 + }, + { + "epoch": 1.13, + "learning_rate": 9.442702702702703e-06, + "loss": 0.2795, + "step": 28350 + }, + { + "epoch": 1.13, + "learning_rate": 9.442202202202204e-06, + "loss": 0.2655, + "step": 28375 + }, + { + "epoch": 1.13, + "learning_rate": 9.441701701701701e-06, + "loss": 0.2605, + "step": 28400 + }, + { + "epoch": 1.13, + "learning_rate": 9.441201201201202e-06, + "loss": 0.2626, + "step": 28425 + }, + { + "epoch": 1.13, + "learning_rate": 9.440700700700702e-06, + "loss": 0.2867, + "step": 28450 + }, + { + "epoch": 1.14, + "learning_rate": 9.440200200200201e-06, + "loss": 0.272, + "step": 28475 + }, + { + "epoch": 1.14, + "learning_rate": 9.4396996996997e-06, + "loss": 0.257, + "step": 28500 + }, + { + "epoch": 1.14, + "learning_rate": 9.4391991991992e-06, + "loss": 0.2783, + "step": 28525 + }, + { + "epoch": 1.14, + "learning_rate": 9.438698698698699e-06, + "loss": 0.2602, + "step": 28550 + }, + { + "epoch": 1.14, + "learning_rate": 9.438198198198198e-06, + "loss": 0.2644, + "step": 28575 + }, + { + "epoch": 1.14, + "learning_rate": 9.4376976976977e-06, + "loss": 0.2554, + "step": 28600 + }, + { + "epoch": 1.14, + "learning_rate": 9.437197197197197e-06, + "loss": 0.2743, + "step": 28625 + }, + { + "epoch": 1.14, + "learning_rate": 9.436696696696698e-06, + "loss": 0.2724, + "step": 28650 + }, + { + "epoch": 1.14, + "learning_rate": 9.436196196196197e-06, + "loss": 0.2607, + "step": 28675 + }, + { + "epoch": 1.14, + "learning_rate": 9.435695695695696e-06, + "loss": 0.2626, + "step": 28700 + }, + { + "epoch": 1.15, + "learning_rate": 9.435195195195196e-06, + "loss": 0.2616, + "step": 28725 + }, + { + "epoch": 1.15, + "learning_rate": 9.434694694694697e-06, + "loss": 0.2602, + "step": 28750 + }, + { + "epoch": 1.15, + "learning_rate": 9.434194194194194e-06, + "loss": 0.2639, + "step": 28775 + }, + { + "epoch": 1.15, + "learning_rate": 9.433693693693694e-06, + "loss": 0.2564, + "step": 28800 + }, + { + "epoch": 1.15, + "learning_rate": 9.433193193193195e-06, + "loss": 0.2544, + "step": 28825 + }, + { + "epoch": 1.15, + "learning_rate": 9.432692692692694e-06, + "loss": 0.2874, + "step": 28850 + }, + { + "epoch": 1.15, + "learning_rate": 9.432192192192193e-06, + "loss": 0.2663, + "step": 28875 + }, + { + "epoch": 1.15, + "learning_rate": 9.431691691691692e-06, + "loss": 0.2658, + "step": 28900 + }, + { + "epoch": 1.15, + "learning_rate": 9.431191191191192e-06, + "loss": 0.286, + "step": 28925 + }, + { + "epoch": 1.15, + "learning_rate": 9.430690690690691e-06, + "loss": 0.2451, + "step": 28950 + }, + { + "epoch": 1.16, + "learning_rate": 9.43019019019019e-06, + "loss": 0.2811, + "step": 28975 + }, + { + "epoch": 1.16, + "learning_rate": 9.429689689689691e-06, + "loss": 0.258, + "step": 29000 + }, + { + "epoch": 1.16, + "eval_loss": 0.44391068816185, + "eval_runtime": 2504.9501, + "eval_samples_per_second": 6.472, + "eval_steps_per_second": 0.162, + "eval_wer": 26.30877036100554, + "step": 29000 + }, + { + "epoch": 1.16, + "learning_rate": 9.429189189189189e-06, + "loss": 0.2654, + "step": 29025 + }, + { + "epoch": 1.16, + "learning_rate": 9.42868868868869e-06, + "loss": 0.2587, + "step": 29050 + }, + { + "epoch": 1.16, + "learning_rate": 9.42818818818819e-06, + "loss": 0.2571, + "step": 29075 + }, + { + "epoch": 1.16, + "learning_rate": 9.427687687687689e-06, + "loss": 0.2734, + "step": 29100 + }, + { + "epoch": 1.16, + "learning_rate": 9.427187187187188e-06, + "loss": 0.2898, + "step": 29125 + }, + { + "epoch": 1.16, + "learning_rate": 9.426686686686687e-06, + "loss": 0.2514, + "step": 29150 + }, + { + "epoch": 1.16, + "learning_rate": 9.426186186186186e-06, + "loss": 0.2804, + "step": 29175 + }, + { + "epoch": 1.16, + "learning_rate": 9.425685685685686e-06, + "loss": 0.2812, + "step": 29200 + }, + { + "epoch": 1.17, + "learning_rate": 9.425185185185187e-06, + "loss": 0.265, + "step": 29225 + }, + { + "epoch": 1.17, + "learning_rate": 9.424684684684684e-06, + "loss": 0.2546, + "step": 29250 + }, + { + "epoch": 1.17, + "learning_rate": 9.424184184184185e-06, + "loss": 0.2818, + "step": 29275 + }, + { + "epoch": 1.17, + "learning_rate": 9.423683683683685e-06, + "loss": 0.2448, + "step": 29300 + }, + { + "epoch": 1.17, + "learning_rate": 9.423183183183184e-06, + "loss": 0.2791, + "step": 29325 + }, + { + "epoch": 1.17, + "learning_rate": 9.422682682682683e-06, + "loss": 0.2583, + "step": 29350 + }, + { + "epoch": 1.17, + "learning_rate": 9.422182182182184e-06, + "loss": 0.2737, + "step": 29375 + }, + { + "epoch": 1.17, + "learning_rate": 9.421701701701702e-06, + "loss": 0.266, + "step": 29400 + }, + { + "epoch": 1.17, + "learning_rate": 9.421201201201203e-06, + "loss": 0.265, + "step": 29425 + }, + { + "epoch": 1.17, + "learning_rate": 9.420700700700702e-06, + "loss": 0.2771, + "step": 29450 + }, + { + "epoch": 1.18, + "learning_rate": 9.420200200200201e-06, + "loss": 0.2569, + "step": 29475 + }, + { + "epoch": 1.18, + "learning_rate": 9.4196996996997e-06, + "loss": 0.2621, + "step": 29500 + }, + { + "epoch": 1.18, + "learning_rate": 9.4191991991992e-06, + "loss": 0.2703, + "step": 29525 + }, + { + "epoch": 1.18, + "learning_rate": 9.418698698698699e-06, + "loss": 0.2786, + "step": 29550 + }, + { + "epoch": 1.18, + "learning_rate": 9.418198198198198e-06, + "loss": 0.2628, + "step": 29575 + }, + { + "epoch": 1.18, + "learning_rate": 9.4176976976977e-06, + "loss": 0.295, + "step": 29600 + }, + { + "epoch": 1.18, + "learning_rate": 9.417197197197197e-06, + "loss": 0.2829, + "step": 29625 + }, + { + "epoch": 1.18, + "learning_rate": 9.416696696696698e-06, + "loss": 0.2721, + "step": 29650 + }, + { + "epoch": 1.18, + "learning_rate": 9.416196196196197e-06, + "loss": 0.2721, + "step": 29675 + }, + { + "epoch": 1.18, + "learning_rate": 9.415695695695697e-06, + "loss": 0.2683, + "step": 29700 + }, + { + "epoch": 1.19, + "learning_rate": 9.415195195195196e-06, + "loss": 0.2655, + "step": 29725 + }, + { + "epoch": 1.19, + "learning_rate": 9.414694694694695e-06, + "loss": 0.2567, + "step": 29750 + }, + { + "epoch": 1.19, + "learning_rate": 9.414194194194194e-06, + "loss": 0.2542, + "step": 29775 + }, + { + "epoch": 1.19, + "learning_rate": 9.413693693693694e-06, + "loss": 0.2722, + "step": 29800 + }, + { + "epoch": 1.19, + "learning_rate": 9.413193193193195e-06, + "loss": 0.2707, + "step": 29825 + }, + { + "epoch": 1.19, + "learning_rate": 9.412692692692692e-06, + "loss": 0.2718, + "step": 29850 + }, + { + "epoch": 1.19, + "learning_rate": 9.412192192192193e-06, + "loss": 0.2634, + "step": 29875 + }, + { + "epoch": 1.19, + "learning_rate": 9.411691691691693e-06, + "loss": 0.2643, + "step": 29900 + }, + { + "epoch": 1.19, + "learning_rate": 9.411191191191192e-06, + "loss": 0.2618, + "step": 29925 + }, + { + "epoch": 1.19, + "learning_rate": 9.410690690690691e-06, + "loss": 0.2684, + "step": 29950 + }, + { + "epoch": 1.2, + "learning_rate": 9.41019019019019e-06, + "loss": 0.282, + "step": 29975 + }, + { + "epoch": 1.2, + "learning_rate": 9.40968968968969e-06, + "loss": 0.2837, + "step": 30000 + }, + { + "epoch": 1.2, + "eval_loss": 0.4546422064304352, + "eval_runtime": 2695.5326, + "eval_samples_per_second": 6.015, + "eval_steps_per_second": 0.151, + "eval_wer": 27.167536482142445, + "step": 30000 + }, + { + "epoch": 1.2, + "learning_rate": 9.40918918918919e-06, + "loss": 0.2669, + "step": 30025 + }, + { + "epoch": 1.2, + "learning_rate": 9.40868868868869e-06, + "loss": 0.2881, + "step": 30050 + }, + { + "epoch": 1.2, + "learning_rate": 9.40818818818819e-06, + "loss": 0.2759, + "step": 30075 + }, + { + "epoch": 1.2, + "learning_rate": 9.407687687687689e-06, + "loss": 0.2568, + "step": 30100 + }, + { + "epoch": 1.2, + "learning_rate": 9.407187187187188e-06, + "loss": 0.2779, + "step": 30125 + }, + { + "epoch": 1.2, + "learning_rate": 9.406686686686687e-06, + "loss": 0.2668, + "step": 30150 + }, + { + "epoch": 1.2, + "learning_rate": 9.406186186186187e-06, + "loss": 0.272, + "step": 30175 + }, + { + "epoch": 1.2, + "learning_rate": 9.405685685685686e-06, + "loss": 0.2638, + "step": 30200 + }, + { + "epoch": 1.21, + "learning_rate": 9.405185185185187e-06, + "loss": 0.27, + "step": 30225 + }, + { + "epoch": 1.21, + "learning_rate": 9.404684684684685e-06, + "loss": 0.2757, + "step": 30250 + }, + { + "epoch": 1.21, + "learning_rate": 9.404184184184186e-06, + "loss": 0.2499, + "step": 30275 + }, + { + "epoch": 1.21, + "learning_rate": 9.403683683683685e-06, + "loss": 0.2886, + "step": 30300 + }, + { + "epoch": 1.21, + "learning_rate": 9.403183183183184e-06, + "loss": 0.2756, + "step": 30325 + }, + { + "epoch": 1.21, + "learning_rate": 9.402682682682683e-06, + "loss": 0.261, + "step": 30350 + }, + { + "epoch": 1.21, + "learning_rate": 9.402182182182183e-06, + "loss": 0.2748, + "step": 30375 + }, + { + "epoch": 1.21, + "learning_rate": 9.401681681681682e-06, + "loss": 0.261, + "step": 30400 + }, + { + "epoch": 1.21, + "learning_rate": 9.401181181181181e-06, + "loss": 0.2839, + "step": 30425 + }, + { + "epoch": 1.21, + "learning_rate": 9.400680680680682e-06, + "loss": 0.2735, + "step": 30450 + }, + { + "epoch": 1.22, + "learning_rate": 9.40018018018018e-06, + "loss": 0.2659, + "step": 30475 + }, + { + "epoch": 1.22, + "learning_rate": 9.3996996996997e-06, + "loss": 0.2621, + "step": 30500 + }, + { + "epoch": 1.22, + "learning_rate": 9.3991991991992e-06, + "loss": 0.2744, + "step": 30525 + }, + { + "epoch": 1.22, + "learning_rate": 9.3986986986987e-06, + "loss": 0.2632, + "step": 30550 + }, + { + "epoch": 1.22, + "learning_rate": 9.398198198198199e-06, + "loss": 0.2589, + "step": 30575 + }, + { + "epoch": 1.22, + "learning_rate": 9.397697697697698e-06, + "loss": 0.2528, + "step": 30600 + }, + { + "epoch": 1.22, + "learning_rate": 9.397197197197197e-06, + "loss": 0.265, + "step": 30625 + }, + { + "epoch": 1.22, + "learning_rate": 9.396696696696698e-06, + "loss": 0.2569, + "step": 30650 + }, + { + "epoch": 1.22, + "learning_rate": 9.396196196196197e-06, + "loss": 0.2646, + "step": 30675 + }, + { + "epoch": 1.22, + "learning_rate": 9.395695695695697e-06, + "loss": 0.2737, + "step": 30700 + }, + { + "epoch": 1.23, + "learning_rate": 9.395195195195196e-06, + "loss": 0.2555, + "step": 30725 + }, + { + "epoch": 1.23, + "learning_rate": 9.394694694694695e-06, + "loss": 0.2671, + "step": 30750 + }, + { + "epoch": 1.23, + "learning_rate": 9.394194194194195e-06, + "loss": 0.2693, + "step": 30775 + }, + { + "epoch": 1.23, + "learning_rate": 9.393693693693694e-06, + "loss": 0.2795, + "step": 30800 + }, + { + "epoch": 1.23, + "learning_rate": 9.393193193193193e-06, + "loss": 0.2641, + "step": 30825 + }, + { + "epoch": 1.23, + "learning_rate": 9.392692692692693e-06, + "loss": 0.2789, + "step": 30850 + }, + { + "epoch": 1.23, + "learning_rate": 9.392192192192194e-06, + "loss": 0.2617, + "step": 30875 + }, + { + "epoch": 1.23, + "learning_rate": 9.391691691691693e-06, + "loss": 0.2536, + "step": 30900 + }, + { + "epoch": 1.23, + "learning_rate": 9.391191191191192e-06, + "loss": 0.2636, + "step": 30925 + }, + { + "epoch": 1.23, + "learning_rate": 9.390690690690691e-06, + "loss": 0.2713, + "step": 30950 + }, + { + "epoch": 1.24, + "learning_rate": 9.39019019019019e-06, + "loss": 0.2741, + "step": 30975 + }, + { + "epoch": 1.24, + "learning_rate": 9.38968968968969e-06, + "loss": 0.2804, + "step": 31000 + }, + { + "epoch": 1.24, + "eval_loss": 0.44737279415130615, + "eval_runtime": 2512.7508, + "eval_samples_per_second": 6.452, + "eval_steps_per_second": 0.162, + "eval_wer": 26.34577285096476, + "step": 31000 + }, + { + "epoch": 1.24, + "learning_rate": 9.38918918918919e-06, + "loss": 0.277, + "step": 31025 + }, + { + "epoch": 1.24, + "learning_rate": 9.38868868868869e-06, + "loss": 0.2563, + "step": 31050 + }, + { + "epoch": 1.24, + "learning_rate": 9.388188188188188e-06, + "loss": 0.2455, + "step": 31075 + }, + { + "epoch": 1.24, + "learning_rate": 9.387687687687689e-06, + "loss": 0.2606, + "step": 31100 + }, + { + "epoch": 1.24, + "learning_rate": 9.387187187187188e-06, + "loss": 0.2602, + "step": 31125 + }, + { + "epoch": 1.24, + "learning_rate": 9.386686686686688e-06, + "loss": 0.2576, + "step": 31150 + }, + { + "epoch": 1.24, + "learning_rate": 9.386186186186187e-06, + "loss": 0.27, + "step": 31175 + }, + { + "epoch": 1.24, + "learning_rate": 9.385685685685686e-06, + "loss": 0.2806, + "step": 31200 + }, + { + "epoch": 1.25, + "learning_rate": 9.385185185185185e-06, + "loss": 0.2673, + "step": 31225 + }, + { + "epoch": 1.25, + "learning_rate": 9.384684684684685e-06, + "loss": 0.2766, + "step": 31250 + }, + { + "epoch": 1.25, + "learning_rate": 9.384184184184186e-06, + "loss": 0.2575, + "step": 31275 + }, + { + "epoch": 1.25, + "learning_rate": 9.383683683683685e-06, + "loss": 0.2526, + "step": 31300 + }, + { + "epoch": 1.25, + "learning_rate": 9.383183183183184e-06, + "loss": 0.2678, + "step": 31325 + }, + { + "epoch": 1.25, + "learning_rate": 9.382682682682684e-06, + "loss": 0.2711, + "step": 31350 + }, + { + "epoch": 1.25, + "learning_rate": 9.382182182182183e-06, + "loss": 0.2889, + "step": 31375 + }, + { + "epoch": 1.25, + "learning_rate": 9.381681681681682e-06, + "loss": 0.2709, + "step": 31400 + }, + { + "epoch": 1.25, + "learning_rate": 9.381181181181182e-06, + "loss": 0.2736, + "step": 31425 + }, + { + "epoch": 1.25, + "learning_rate": 9.38068068068068e-06, + "loss": 0.2699, + "step": 31450 + }, + { + "epoch": 1.26, + "learning_rate": 9.38018018018018e-06, + "loss": 0.2801, + "step": 31475 + }, + { + "epoch": 1.26, + "learning_rate": 9.379679679679681e-06, + "loss": 0.2774, + "step": 31500 + }, + { + "epoch": 1.26, + "learning_rate": 9.37917917917918e-06, + "loss": 0.2658, + "step": 31525 + }, + { + "epoch": 1.26, + "learning_rate": 9.37867867867868e-06, + "loss": 0.2663, + "step": 31550 + }, + { + "epoch": 1.26, + "learning_rate": 9.378178178178179e-06, + "loss": 0.2673, + "step": 31575 + }, + { + "epoch": 1.26, + "learning_rate": 9.377677677677678e-06, + "loss": 0.2722, + "step": 31600 + }, + { + "epoch": 1.26, + "learning_rate": 9.377177177177178e-06, + "loss": 0.2818, + "step": 31625 + }, + { + "epoch": 1.26, + "learning_rate": 9.376676676676677e-06, + "loss": 0.2689, + "step": 31650 + }, + { + "epoch": 1.26, + "learning_rate": 9.376176176176178e-06, + "loss": 0.2755, + "step": 31675 + }, + { + "epoch": 1.26, + "learning_rate": 9.375675675675675e-06, + "loss": 0.2563, + "step": 31700 + }, + { + "epoch": 1.27, + "learning_rate": 9.375175175175176e-06, + "loss": 0.2691, + "step": 31725 + }, + { + "epoch": 1.27, + "learning_rate": 9.374674674674676e-06, + "loss": 0.2775, + "step": 31750 + }, + { + "epoch": 1.27, + "learning_rate": 9.374174174174175e-06, + "loss": 0.2625, + "step": 31775 + }, + { + "epoch": 1.27, + "learning_rate": 9.373673673673674e-06, + "loss": 0.2526, + "step": 31800 + }, + { + "epoch": 1.27, + "learning_rate": 9.373173173173174e-06, + "loss": 0.2624, + "step": 31825 + }, + { + "epoch": 1.27, + "learning_rate": 9.372672672672673e-06, + "loss": 0.2823, + "step": 31850 + }, + { + "epoch": 1.27, + "learning_rate": 9.372172172172172e-06, + "loss": 0.2637, + "step": 31875 + }, + { + "epoch": 1.27, + "learning_rate": 9.371671671671673e-06, + "loss": 0.2747, + "step": 31900 + }, + { + "epoch": 1.27, + "learning_rate": 9.371171171171173e-06, + "loss": 0.2795, + "step": 31925 + }, + { + "epoch": 1.27, + "learning_rate": 9.370670670670672e-06, + "loss": 0.2643, + "step": 31950 + }, + { + "epoch": 1.28, + "learning_rate": 9.370170170170171e-06, + "loss": 0.2799, + "step": 31975 + }, + { + "epoch": 1.28, + "learning_rate": 9.36966966966967e-06, + "loss": 0.2612, + "step": 32000 + }, + { + "epoch": 1.28, + "eval_loss": 0.4532637298107147, + "eval_runtime": 2555.128, + "eval_samples_per_second": 6.345, + "eval_steps_per_second": 0.159, + "eval_wer": 25.984998573862367, + "step": 32000 + }, + { + "epoch": 1.28, + "learning_rate": 9.36916916916917e-06, + "loss": 0.2583, + "step": 32025 + }, + { + "epoch": 1.28, + "learning_rate": 9.368668668668669e-06, + "loss": 0.257, + "step": 32050 + }, + { + "epoch": 1.28, + "learning_rate": 9.368168168168168e-06, + "loss": 0.2726, + "step": 32075 + }, + { + "epoch": 1.28, + "learning_rate": 9.367667667667668e-06, + "loss": 0.2675, + "step": 32100 + }, + { + "epoch": 1.28, + "learning_rate": 9.367167167167169e-06, + "loss": 0.2606, + "step": 32125 + }, + { + "epoch": 1.28, + "learning_rate": 9.366666666666668e-06, + "loss": 0.2672, + "step": 32150 + }, + { + "epoch": 1.28, + "learning_rate": 9.366166166166167e-06, + "loss": 0.2622, + "step": 32175 + }, + { + "epoch": 1.28, + "learning_rate": 9.365665665665666e-06, + "loss": 0.2592, + "step": 32200 + }, + { + "epoch": 1.29, + "learning_rate": 9.365165165165166e-06, + "loss": 0.2618, + "step": 32225 + }, + { + "epoch": 1.29, + "learning_rate": 9.364664664664665e-06, + "loss": 0.2669, + "step": 32250 + }, + { + "epoch": 1.29, + "learning_rate": 9.364164164164164e-06, + "loss": 0.2725, + "step": 32275 + }, + { + "epoch": 1.29, + "learning_rate": 9.363663663663665e-06, + "loss": 0.2695, + "step": 32300 + }, + { + "epoch": 1.29, + "learning_rate": 9.363163163163163e-06, + "loss": 0.2727, + "step": 32325 + }, + { + "epoch": 1.29, + "learning_rate": 9.362662662662664e-06, + "loss": 0.28, + "step": 32350 + }, + { + "epoch": 1.29, + "learning_rate": 9.362162162162163e-06, + "loss": 0.2826, + "step": 32375 + }, + { + "epoch": 1.29, + "learning_rate": 9.361661661661663e-06, + "loss": 0.2728, + "step": 32400 + }, + { + "epoch": 1.29, + "learning_rate": 9.361161161161162e-06, + "loss": 0.2653, + "step": 32425 + }, + { + "epoch": 1.29, + "learning_rate": 9.360660660660661e-06, + "loss": 0.2655, + "step": 32450 + }, + { + "epoch": 1.3, + "learning_rate": 9.36016016016016e-06, + "loss": 0.2787, + "step": 32475 + }, + { + "epoch": 1.3, + "learning_rate": 9.35965965965966e-06, + "loss": 0.2677, + "step": 32500 + }, + { + "epoch": 1.3, + "learning_rate": 9.35915915915916e-06, + "loss": 0.2587, + "step": 32525 + }, + { + "epoch": 1.3, + "learning_rate": 9.358658658658658e-06, + "loss": 0.2685, + "step": 32550 + }, + { + "epoch": 1.3, + "learning_rate": 9.35815815815816e-06, + "loss": 0.2583, + "step": 32575 + }, + { + "epoch": 1.3, + "learning_rate": 9.357657657657659e-06, + "loss": 0.2673, + "step": 32600 + }, + { + "epoch": 1.3, + "learning_rate": 9.357157157157158e-06, + "loss": 0.2828, + "step": 32625 + }, + { + "epoch": 1.3, + "learning_rate": 9.356656656656657e-06, + "loss": 0.2753, + "step": 32650 + }, + { + "epoch": 1.3, + "learning_rate": 9.356156156156157e-06, + "loss": 0.2847, + "step": 32675 + }, + { + "epoch": 1.3, + "learning_rate": 9.355655655655656e-06, + "loss": 0.2671, + "step": 32700 + }, + { + "epoch": 1.31, + "learning_rate": 9.355155155155155e-06, + "loss": 0.2655, + "step": 32725 + }, + { + "epoch": 1.31, + "learning_rate": 9.354654654654656e-06, + "loss": 0.2602, + "step": 32750 + }, + { + "epoch": 1.31, + "learning_rate": 9.354154154154155e-06, + "loss": 0.2707, + "step": 32775 + }, + { + "epoch": 1.31, + "learning_rate": 9.353653653653655e-06, + "loss": 0.2577, + "step": 32800 + }, + { + "epoch": 1.31, + "learning_rate": 9.353153153153154e-06, + "loss": 0.2786, + "step": 32825 + }, + { + "epoch": 1.31, + "learning_rate": 9.352652652652653e-06, + "loss": 0.2529, + "step": 32850 + }, + { + "epoch": 1.31, + "learning_rate": 9.352152152152153e-06, + "loss": 0.2544, + "step": 32875 + }, + { + "epoch": 1.31, + "learning_rate": 9.351651651651652e-06, + "loss": 0.2748, + "step": 32900 + }, + { + "epoch": 1.31, + "learning_rate": 9.351151151151153e-06, + "loss": 0.2696, + "step": 32925 + }, + { + "epoch": 1.31, + "learning_rate": 9.35065065065065e-06, + "loss": 0.2646, + "step": 32950 + }, + { + "epoch": 1.32, + "learning_rate": 9.350150150150151e-06, + "loss": 0.2598, + "step": 32975 + }, + { + "epoch": 1.32, + "learning_rate": 9.34964964964965e-06, + "loss": 0.2551, + "step": 33000 + }, + { + "epoch": 1.32, + "eval_loss": 0.4496789276599884, + "eval_runtime": 2555.1297, + "eval_samples_per_second": 6.345, + "eval_steps_per_second": 0.159, + "eval_wer": 26.183886957393177, + "step": 33000 + }, + { + "epoch": 1.32, + "learning_rate": 9.34914914914915e-06, + "loss": 0.2877, + "step": 33025 + }, + { + "epoch": 1.32, + "learning_rate": 9.34864864864865e-06, + "loss": 0.2536, + "step": 33050 + }, + { + "epoch": 1.32, + "learning_rate": 9.348148148148149e-06, + "loss": 0.2592, + "step": 33075 + }, + { + "epoch": 1.32, + "learning_rate": 9.347647647647648e-06, + "loss": 0.2691, + "step": 33100 + }, + { + "epoch": 1.32, + "learning_rate": 9.347147147147147e-06, + "loss": 0.269, + "step": 33125 + }, + { + "epoch": 1.32, + "learning_rate": 9.346646646646648e-06, + "loss": 0.2585, + "step": 33150 + }, + { + "epoch": 1.32, + "learning_rate": 9.346146146146146e-06, + "loss": 0.2547, + "step": 33175 + }, + { + "epoch": 1.32, + "learning_rate": 9.345645645645647e-06, + "loss": 0.278, + "step": 33200 + }, + { + "epoch": 1.32, + "learning_rate": 9.345145145145146e-06, + "loss": 0.283, + "step": 33225 + }, + { + "epoch": 1.33, + "learning_rate": 9.344644644644645e-06, + "loss": 0.2708, + "step": 33250 + }, + { + "epoch": 1.33, + "learning_rate": 9.344144144144145e-06, + "loss": 0.2549, + "step": 33275 + }, + { + "epoch": 1.33, + "learning_rate": 9.343643643643644e-06, + "loss": 0.2601, + "step": 33300 + }, + { + "epoch": 1.33, + "learning_rate": 9.343143143143143e-06, + "loss": 0.2585, + "step": 33325 + }, + { + "epoch": 1.33, + "learning_rate": 9.342642642642643e-06, + "loss": 0.2794, + "step": 33350 + }, + { + "epoch": 1.33, + "learning_rate": 9.342142142142144e-06, + "loss": 0.2721, + "step": 33375 + }, + { + "epoch": 1.33, + "learning_rate": 9.341641641641643e-06, + "loss": 0.278, + "step": 33400 + }, + { + "epoch": 1.33, + "learning_rate": 9.341141141141142e-06, + "loss": 0.2702, + "step": 33425 + }, + { + "epoch": 1.33, + "learning_rate": 9.340640640640642e-06, + "loss": 0.2577, + "step": 33450 + }, + { + "epoch": 1.33, + "learning_rate": 9.34014014014014e-06, + "loss": 0.2706, + "step": 33475 + }, + { + "epoch": 1.34, + "learning_rate": 9.33963963963964e-06, + "loss": 0.25, + "step": 33500 + }, + { + "epoch": 1.34, + "learning_rate": 9.33913913913914e-06, + "loss": 0.2774, + "step": 33525 + }, + { + "epoch": 1.34, + "learning_rate": 9.33863863863864e-06, + "loss": 0.2676, + "step": 33550 + }, + { + "epoch": 1.34, + "learning_rate": 9.338138138138138e-06, + "loss": 0.2776, + "step": 33575 + }, + { + "epoch": 1.34, + "learning_rate": 9.337637637637639e-06, + "loss": 0.2542, + "step": 33600 + }, + { + "epoch": 1.34, + "learning_rate": 9.337137137137138e-06, + "loss": 0.273, + "step": 33625 + }, + { + "epoch": 1.34, + "learning_rate": 9.336636636636638e-06, + "loss": 0.2498, + "step": 33650 + }, + { + "epoch": 1.34, + "learning_rate": 9.336136136136137e-06, + "loss": 0.2624, + "step": 33675 + }, + { + "epoch": 1.34, + "learning_rate": 9.335635635635636e-06, + "loss": 0.255, + "step": 33700 + }, + { + "epoch": 1.34, + "learning_rate": 9.335135135135135e-06, + "loss": 0.2639, + "step": 33725 + }, + { + "epoch": 1.35, + "learning_rate": 9.334634634634635e-06, + "loss": 0.281, + "step": 33750 + }, + { + "epoch": 1.35, + "learning_rate": 9.334134134134136e-06, + "loss": 0.2733, + "step": 33775 + }, + { + "epoch": 1.35, + "learning_rate": 9.333633633633633e-06, + "loss": 0.2613, + "step": 33800 + }, + { + "epoch": 1.35, + "learning_rate": 9.333133133133134e-06, + "loss": 0.273, + "step": 33825 + }, + { + "epoch": 1.35, + "learning_rate": 9.332632632632634e-06, + "loss": 0.264, + "step": 33850 + }, + { + "epoch": 1.35, + "learning_rate": 9.332132132132133e-06, + "loss": 0.2665, + "step": 33875 + }, + { + "epoch": 1.35, + "learning_rate": 9.331631631631632e-06, + "loss": 0.264, + "step": 33900 + }, + { + "epoch": 1.35, + "learning_rate": 9.331131131131132e-06, + "loss": 0.2686, + "step": 33925 + }, + { + "epoch": 1.35, + "learning_rate": 9.330630630630631e-06, + "loss": 0.2709, + "step": 33950 + }, + { + "epoch": 1.35, + "learning_rate": 9.33013013013013e-06, + "loss": 0.2731, + "step": 33975 + }, + { + "epoch": 1.36, + "learning_rate": 9.329629629629631e-06, + "loss": 0.28, + "step": 34000 + }, + { + "epoch": 1.36, + "eval_loss": 0.44749680161476135, + "eval_runtime": 2532.2254, + "eval_samples_per_second": 6.403, + "eval_steps_per_second": 0.16, + "eval_wer": 26.161531286376142, + "step": 34000 + }, + { + "epoch": 1.36, + "learning_rate": 9.32912912912913e-06, + "loss": 0.2572, + "step": 34025 + }, + { + "epoch": 1.36, + "learning_rate": 9.32862862862863e-06, + "loss": 0.2828, + "step": 34050 + }, + { + "epoch": 1.36, + "learning_rate": 9.328128128128129e-06, + "loss": 0.268, + "step": 34075 + }, + { + "epoch": 1.36, + "learning_rate": 9.327627627627628e-06, + "loss": 0.2602, + "step": 34100 + }, + { + "epoch": 1.36, + "learning_rate": 9.327127127127128e-06, + "loss": 0.2651, + "step": 34125 + }, + { + "epoch": 1.36, + "learning_rate": 9.326626626626627e-06, + "loss": 0.2796, + "step": 34150 + }, + { + "epoch": 1.36, + "learning_rate": 9.326126126126128e-06, + "loss": 0.2649, + "step": 34175 + }, + { + "epoch": 1.36, + "learning_rate": 9.325625625625626e-06, + "loss": 0.2729, + "step": 34200 + }, + { + "epoch": 1.36, + "learning_rate": 9.325125125125127e-06, + "loss": 0.2492, + "step": 34225 + }, + { + "epoch": 1.37, + "learning_rate": 9.324624624624626e-06, + "loss": 0.2389, + "step": 34250 + }, + { + "epoch": 1.37, + "learning_rate": 9.324124124124125e-06, + "loss": 0.2584, + "step": 34275 + }, + { + "epoch": 1.37, + "learning_rate": 9.323623623623624e-06, + "loss": 0.2635, + "step": 34300 + }, + { + "epoch": 1.37, + "learning_rate": 9.323123123123124e-06, + "loss": 0.2556, + "step": 34325 + }, + { + "epoch": 1.37, + "learning_rate": 9.322622622622623e-06, + "loss": 0.2661, + "step": 34350 + }, + { + "epoch": 1.37, + "learning_rate": 9.322122122122122e-06, + "loss": 0.2698, + "step": 34375 + }, + { + "epoch": 1.37, + "learning_rate": 9.321621621621623e-06, + "loss": 0.2622, + "step": 34400 + }, + { + "epoch": 1.37, + "learning_rate": 9.321121121121121e-06, + "loss": 0.2606, + "step": 34425 + }, + { + "epoch": 1.37, + "learning_rate": 9.320620620620622e-06, + "loss": 0.2561, + "step": 34450 + }, + { + "epoch": 1.37, + "learning_rate": 9.320120120120121e-06, + "loss": 0.2681, + "step": 34475 + }, + { + "epoch": 1.38, + "learning_rate": 9.31961961961962e-06, + "loss": 0.2686, + "step": 34500 + }, + { + "epoch": 1.38, + "learning_rate": 9.31911911911912e-06, + "loss": 0.2691, + "step": 34525 + }, + { + "epoch": 1.38, + "learning_rate": 9.318618618618619e-06, + "loss": 0.2481, + "step": 34550 + }, + { + "epoch": 1.38, + "learning_rate": 9.318118118118118e-06, + "loss": 0.2579, + "step": 34575 + }, + { + "epoch": 1.38, + "learning_rate": 9.317617617617618e-06, + "loss": 0.2442, + "step": 34600 + }, + { + "epoch": 1.38, + "learning_rate": 9.317117117117119e-06, + "loss": 0.2605, + "step": 34625 + }, + { + "epoch": 1.38, + "learning_rate": 9.316616616616618e-06, + "loss": 0.2717, + "step": 34650 + }, + { + "epoch": 1.38, + "learning_rate": 9.316116116116117e-06, + "loss": 0.2749, + "step": 34675 + }, + { + "epoch": 1.38, + "learning_rate": 9.315615615615617e-06, + "loss": 0.2525, + "step": 34700 + }, + { + "epoch": 1.38, + "learning_rate": 9.315115115115116e-06, + "loss": 0.2586, + "step": 34725 + }, + { + "epoch": 1.39, + "learning_rate": 9.314614614614615e-06, + "loss": 0.2683, + "step": 34750 + }, + { + "epoch": 1.39, + "learning_rate": 9.314114114114114e-06, + "loss": 0.2538, + "step": 34775 + }, + { + "epoch": 1.39, + "learning_rate": 9.313613613613614e-06, + "loss": 0.2354, + "step": 34800 + }, + { + "epoch": 1.39, + "learning_rate": 9.313113113113113e-06, + "loss": 0.2591, + "step": 34825 + }, + { + "epoch": 1.39, + "learning_rate": 9.312612612612614e-06, + "loss": 0.28, + "step": 34850 + }, + { + "epoch": 1.39, + "learning_rate": 9.312112112112113e-06, + "loss": 0.2789, + "step": 34875 + }, + { + "epoch": 1.39, + "learning_rate": 9.311611611611613e-06, + "loss": 0.2741, + "step": 34900 + }, + { + "epoch": 1.39, + "learning_rate": 9.311111111111112e-06, + "loss": 0.2803, + "step": 34925 + }, + { + "epoch": 1.39, + "learning_rate": 9.310610610610611e-06, + "loss": 0.2699, + "step": 34950 + }, + { + "epoch": 1.39, + "learning_rate": 9.31011011011011e-06, + "loss": 0.2618, + "step": 34975 + }, + { + "epoch": 1.4, + "learning_rate": 9.30960960960961e-06, + "loss": 0.2775, + "step": 35000 + }, + { + "epoch": 1.4, + "eval_loss": 0.44763508439064026, + "eval_runtime": 2480.936, + "eval_samples_per_second": 6.535, + "eval_steps_per_second": 0.164, + "eval_wer": 25.96958086971269, + "step": 35000 + }, + { + "epoch": 1.4, + "learning_rate": 9.30910910910911e-06, + "loss": 0.2801, + "step": 35025 + }, + { + "epoch": 1.4, + "learning_rate": 9.308608608608608e-06, + "loss": 0.2666, + "step": 35050 + }, + { + "epoch": 1.4, + "learning_rate": 9.30810810810811e-06, + "loss": 0.2817, + "step": 35075 + }, + { + "epoch": 1.4, + "learning_rate": 9.307607607607609e-06, + "loss": 0.2618, + "step": 35100 + }, + { + "epoch": 1.4, + "learning_rate": 9.307107107107108e-06, + "loss": 0.2637, + "step": 35125 + }, + { + "epoch": 1.4, + "learning_rate": 9.306606606606607e-06, + "loss": 0.2679, + "step": 35150 + }, + { + "epoch": 1.4, + "learning_rate": 9.306106106106107e-06, + "loss": 0.2729, + "step": 35175 + }, + { + "epoch": 1.4, + "learning_rate": 9.305605605605606e-06, + "loss": 0.2659, + "step": 35200 + }, + { + "epoch": 1.4, + "learning_rate": 9.305105105105105e-06, + "loss": 0.2642, + "step": 35225 + }, + { + "epoch": 1.41, + "learning_rate": 9.304604604604606e-06, + "loss": 0.2607, + "step": 35250 + }, + { + "epoch": 1.41, + "learning_rate": 9.304104104104105e-06, + "loss": 0.2831, + "step": 35275 + }, + { + "epoch": 1.41, + "learning_rate": 9.303603603603605e-06, + "loss": 0.2681, + "step": 35300 + }, + { + "epoch": 1.41, + "learning_rate": 9.303103103103104e-06, + "loss": 0.2611, + "step": 35325 + }, + { + "epoch": 1.41, + "learning_rate": 9.302602602602603e-06, + "loss": 0.2525, + "step": 35350 + }, + { + "epoch": 1.41, + "learning_rate": 9.302102102102103e-06, + "loss": 0.2629, + "step": 35375 + }, + { + "epoch": 1.41, + "learning_rate": 9.301601601601602e-06, + "loss": 0.2576, + "step": 35400 + }, + { + "epoch": 1.41, + "learning_rate": 9.301101101101101e-06, + "loss": 0.2576, + "step": 35425 + }, + { + "epoch": 1.41, + "learning_rate": 9.3006006006006e-06, + "loss": 0.2558, + "step": 35450 + }, + { + "epoch": 1.41, + "learning_rate": 9.300100100100102e-06, + "loss": 0.2591, + "step": 35475 + }, + { + "epoch": 1.42, + "learning_rate": 9.299599599599601e-06, + "loss": 0.2646, + "step": 35500 + }, + { + "epoch": 1.42, + "learning_rate": 9.2990990990991e-06, + "loss": 0.2515, + "step": 35525 + }, + { + "epoch": 1.42, + "learning_rate": 9.2985985985986e-06, + "loss": 0.274, + "step": 35550 + }, + { + "epoch": 1.42, + "learning_rate": 9.298098098098099e-06, + "loss": 0.2696, + "step": 35575 + }, + { + "epoch": 1.42, + "learning_rate": 9.297597597597598e-06, + "loss": 0.2637, + "step": 35600 + }, + { + "epoch": 1.42, + "learning_rate": 9.297097097097097e-06, + "loss": 0.2644, + "step": 35625 + }, + { + "epoch": 1.42, + "learning_rate": 9.296596596596598e-06, + "loss": 0.262, + "step": 35650 + }, + { + "epoch": 1.42, + "learning_rate": 9.296096096096096e-06, + "loss": 0.2709, + "step": 35675 + }, + { + "epoch": 1.42, + "learning_rate": 9.295595595595597e-06, + "loss": 0.263, + "step": 35700 + }, + { + "epoch": 1.42, + "learning_rate": 9.295095095095096e-06, + "loss": 0.2569, + "step": 35725 + }, + { + "epoch": 1.43, + "learning_rate": 9.294594594594596e-06, + "loss": 0.2525, + "step": 35750 + }, + { + "epoch": 1.43, + "learning_rate": 9.294094094094095e-06, + "loss": 0.2584, + "step": 35775 + }, + { + "epoch": 1.43, + "learning_rate": 9.293593593593594e-06, + "loss": 0.2665, + "step": 35800 + }, + { + "epoch": 1.43, + "learning_rate": 9.293093093093093e-06, + "loss": 0.2693, + "step": 35825 + }, + { + "epoch": 1.43, + "learning_rate": 9.292592592592593e-06, + "loss": 0.257, + "step": 35850 + }, + { + "epoch": 1.43, + "learning_rate": 9.292092092092094e-06, + "loss": 0.2616, + "step": 35875 + }, + { + "epoch": 1.43, + "learning_rate": 9.291591591591593e-06, + "loss": 0.2711, + "step": 35900 + }, + { + "epoch": 1.43, + "learning_rate": 9.291091091091092e-06, + "loss": 0.2573, + "step": 35925 + }, + { + "epoch": 1.43, + "learning_rate": 9.290590590590592e-06, + "loss": 0.2708, + "step": 35950 + }, + { + "epoch": 1.43, + "learning_rate": 9.290090090090091e-06, + "loss": 0.2423, + "step": 35975 + }, + { + "epoch": 1.44, + "learning_rate": 9.28958958958959e-06, + "loss": 0.2609, + "step": 36000 + }, + { + "epoch": 1.44, + "eval_loss": 0.4396921396255493, + "eval_runtime": 2445.1333, + "eval_samples_per_second": 6.631, + "eval_steps_per_second": 0.166, + "eval_wer": 25.296598083579376, + "step": 36000 + }, + { + "epoch": 1.44, + "learning_rate": 9.28908908908909e-06, + "loss": 0.2572, + "step": 36025 + }, + { + "epoch": 1.44, + "learning_rate": 9.288588588588589e-06, + "loss": 0.2676, + "step": 36050 + }, + { + "epoch": 1.44, + "learning_rate": 9.288088088088088e-06, + "loss": 0.2508, + "step": 36075 + }, + { + "epoch": 1.44, + "learning_rate": 9.287587587587589e-06, + "loss": 0.2714, + "step": 36100 + }, + { + "epoch": 1.44, + "learning_rate": 9.287087087087088e-06, + "loss": 0.26, + "step": 36125 + }, + { + "epoch": 1.44, + "learning_rate": 9.286586586586588e-06, + "loss": 0.2648, + "step": 36150 + }, + { + "epoch": 1.44, + "learning_rate": 9.286086086086087e-06, + "loss": 0.2748, + "step": 36175 + }, + { + "epoch": 1.44, + "learning_rate": 9.285585585585586e-06, + "loss": 0.2602, + "step": 36200 + }, + { + "epoch": 1.44, + "learning_rate": 9.285085085085086e-06, + "loss": 0.2658, + "step": 36225 + }, + { + "epoch": 1.45, + "learning_rate": 9.284584584584585e-06, + "loss": 0.2623, + "step": 36250 + }, + { + "epoch": 1.45, + "learning_rate": 9.284084084084086e-06, + "loss": 0.2634, + "step": 36275 + }, + { + "epoch": 1.45, + "learning_rate": 9.283583583583583e-06, + "loss": 0.2832, + "step": 36300 + }, + { + "epoch": 1.45, + "learning_rate": 9.283083083083084e-06, + "loss": 0.2656, + "step": 36325 + }, + { + "epoch": 1.45, + "learning_rate": 9.282582582582584e-06, + "loss": 0.2565, + "step": 36350 + }, + { + "epoch": 1.45, + "learning_rate": 9.282082082082083e-06, + "loss": 0.2542, + "step": 36375 + }, + { + "epoch": 1.45, + "learning_rate": 9.281581581581582e-06, + "loss": 0.2594, + "step": 36400 + }, + { + "epoch": 1.45, + "learning_rate": 9.281081081081082e-06, + "loss": 0.2654, + "step": 36425 + }, + { + "epoch": 1.45, + "learning_rate": 9.280580580580581e-06, + "loss": 0.292, + "step": 36450 + }, + { + "epoch": 1.45, + "learning_rate": 9.28008008008008e-06, + "loss": 0.282, + "step": 36475 + }, + { + "epoch": 1.46, + "learning_rate": 9.279579579579581e-06, + "loss": 0.2795, + "step": 36500 + }, + { + "epoch": 1.46, + "learning_rate": 9.27907907907908e-06, + "loss": 0.263, + "step": 36525 + }, + { + "epoch": 1.46, + "learning_rate": 9.27857857857858e-06, + "loss": 0.272, + "step": 36550 + }, + { + "epoch": 1.46, + "learning_rate": 9.278098098098099e-06, + "loss": 0.2498, + "step": 36575 + }, + { + "epoch": 1.46, + "learning_rate": 9.277597597597598e-06, + "loss": 0.2626, + "step": 36600 + }, + { + "epoch": 1.46, + "learning_rate": 9.277097097097098e-06, + "loss": 0.2671, + "step": 36625 + }, + { + "epoch": 1.46, + "learning_rate": 9.276596596596597e-06, + "loss": 0.2622, + "step": 36650 + }, + { + "epoch": 1.46, + "learning_rate": 9.276096096096096e-06, + "loss": 0.2507, + "step": 36675 + }, + { + "epoch": 1.46, + "learning_rate": 9.275595595595597e-06, + "loss": 0.2606, + "step": 36700 + }, + { + "epoch": 1.46, + "learning_rate": 9.275095095095096e-06, + "loss": 0.2716, + "step": 36725 + }, + { + "epoch": 1.47, + "learning_rate": 9.274594594594596e-06, + "loss": 0.2699, + "step": 36750 + }, + { + "epoch": 1.47, + "learning_rate": 9.274094094094095e-06, + "loss": 0.2819, + "step": 36775 + }, + { + "epoch": 1.47, + "learning_rate": 9.273593593593594e-06, + "loss": 0.2681, + "step": 36800 + }, + { + "epoch": 1.47, + "learning_rate": 9.273093093093094e-06, + "loss": 0.2603, + "step": 36825 + }, + { + "epoch": 1.47, + "learning_rate": 9.272592592592593e-06, + "loss": 0.2556, + "step": 36850 + }, + { + "epoch": 1.47, + "learning_rate": 9.272092092092094e-06, + "loss": 0.2798, + "step": 36875 + }, + { + "epoch": 1.47, + "learning_rate": 9.271591591591592e-06, + "loss": 0.2623, + "step": 36900 + }, + { + "epoch": 1.47, + "learning_rate": 9.271091091091092e-06, + "loss": 0.2502, + "step": 36925 + }, + { + "epoch": 1.47, + "learning_rate": 9.270590590590592e-06, + "loss": 0.262, + "step": 36950 + }, + { + "epoch": 1.47, + "learning_rate": 9.270090090090091e-06, + "loss": 0.2504, + "step": 36975 + }, + { + "epoch": 1.48, + "learning_rate": 9.26958958958959e-06, + "loss": 0.2681, + "step": 37000 + }, + { + "epoch": 1.48, + "eval_loss": 0.4397401511669159, + "eval_runtime": 2578.9596, + "eval_samples_per_second": 6.287, + "eval_steps_per_second": 0.157, + "eval_wer": 26.684962342257613, + "step": 37000 + }, + { + "epoch": 1.48, + "learning_rate": 9.26908908908909e-06, + "loss": 0.2618, + "step": 37025 + }, + { + "epoch": 1.48, + "learning_rate": 9.268588588588589e-06, + "loss": 0.2717, + "step": 37050 + }, + { + "epoch": 1.48, + "learning_rate": 9.268088088088088e-06, + "loss": 0.2628, + "step": 37075 + }, + { + "epoch": 1.48, + "learning_rate": 9.26758758758759e-06, + "loss": 0.262, + "step": 37100 + }, + { + "epoch": 1.48, + "learning_rate": 9.267087087087087e-06, + "loss": 0.2531, + "step": 37125 + }, + { + "epoch": 1.48, + "learning_rate": 9.266586586586588e-06, + "loss": 0.2407, + "step": 37150 + }, + { + "epoch": 1.48, + "learning_rate": 9.266086086086087e-06, + "loss": 0.2717, + "step": 37175 + }, + { + "epoch": 1.48, + "learning_rate": 9.265585585585586e-06, + "loss": 0.2696, + "step": 37200 + }, + { + "epoch": 1.48, + "learning_rate": 9.265085085085086e-06, + "loss": 0.2718, + "step": 37225 + }, + { + "epoch": 1.49, + "learning_rate": 9.264584584584585e-06, + "loss": 0.2523, + "step": 37250 + }, + { + "epoch": 1.49, + "learning_rate": 9.264084084084084e-06, + "loss": 0.2637, + "step": 37275 + }, + { + "epoch": 1.49, + "learning_rate": 9.263583583583584e-06, + "loss": 0.2818, + "step": 37300 + }, + { + "epoch": 1.49, + "learning_rate": 9.263083083083085e-06, + "loss": 0.2812, + "step": 37325 + }, + { + "epoch": 1.49, + "learning_rate": 9.262582582582584e-06, + "loss": 0.2623, + "step": 37350 + }, + { + "epoch": 1.49, + "learning_rate": 9.262082082082083e-06, + "loss": 0.2615, + "step": 37375 + }, + { + "epoch": 1.49, + "learning_rate": 9.261581581581583e-06, + "loss": 0.2783, + "step": 37400 + }, + { + "epoch": 1.49, + "learning_rate": 9.261081081081082e-06, + "loss": 0.2577, + "step": 37425 + }, + { + "epoch": 1.49, + "learning_rate": 9.260580580580581e-06, + "loss": 0.2718, + "step": 37450 + }, + { + "epoch": 1.49, + "learning_rate": 9.26008008008008e-06, + "loss": 0.2569, + "step": 37475 + }, + { + "epoch": 1.5, + "learning_rate": 9.259579579579581e-06, + "loss": 0.2604, + "step": 37500 + }, + { + "epoch": 1.5, + "learning_rate": 9.259079079079079e-06, + "loss": 0.265, + "step": 37525 + }, + { + "epoch": 1.5, + "learning_rate": 9.25857857857858e-06, + "loss": 0.2688, + "step": 37550 + }, + { + "epoch": 1.5, + "learning_rate": 9.25807807807808e-06, + "loss": 0.2567, + "step": 37575 + }, + { + "epoch": 1.5, + "learning_rate": 9.257577577577579e-06, + "loss": 0.2747, + "step": 37600 + }, + { + "epoch": 1.5, + "learning_rate": 9.257077077077078e-06, + "loss": 0.27, + "step": 37625 + }, + { + "epoch": 1.5, + "learning_rate": 9.256576576576577e-06, + "loss": 0.2699, + "step": 37650 + }, + { + "epoch": 1.5, + "learning_rate": 9.256076076076076e-06, + "loss": 0.2645, + "step": 37675 + }, + { + "epoch": 1.5, + "learning_rate": 9.255575575575576e-06, + "loss": 0.2723, + "step": 37700 + }, + { + "epoch": 1.5, + "learning_rate": 9.255075075075077e-06, + "loss": 0.2693, + "step": 37725 + }, + { + "epoch": 1.51, + "learning_rate": 9.254574574574574e-06, + "loss": 0.2509, + "step": 37750 + }, + { + "epoch": 1.51, + "learning_rate": 9.254074074074075e-06, + "loss": 0.2698, + "step": 37775 + }, + { + "epoch": 1.51, + "learning_rate": 9.253573573573575e-06, + "loss": 0.2359, + "step": 37800 + }, + { + "epoch": 1.51, + "learning_rate": 9.253073073073074e-06, + "loss": 0.2707, + "step": 37825 + }, + { + "epoch": 1.51, + "learning_rate": 9.252572572572573e-06, + "loss": 0.2534, + "step": 37850 + }, + { + "epoch": 1.51, + "learning_rate": 9.252072072072073e-06, + "loss": 0.2554, + "step": 37875 + }, + { + "epoch": 1.51, + "learning_rate": 9.251571571571572e-06, + "loss": 0.2753, + "step": 37900 + }, + { + "epoch": 1.51, + "learning_rate": 9.251071071071071e-06, + "loss": 0.2551, + "step": 37925 + }, + { + "epoch": 1.51, + "learning_rate": 9.250570570570572e-06, + "loss": 0.2576, + "step": 37950 + }, + { + "epoch": 1.51, + "learning_rate": 9.250070070070071e-06, + "loss": 0.2579, + "step": 37975 + }, + { + "epoch": 1.52, + "learning_rate": 9.24956956956957e-06, + "loss": 0.2661, + "step": 38000 + }, + { + "epoch": 1.52, + "eval_loss": 0.4426652491092682, + "eval_runtime": 2522.4342, + "eval_samples_per_second": 6.428, + "eval_steps_per_second": 0.161, + "eval_wer": 25.423023257606708, + "step": 38000 + }, + { + "epoch": 1.52, + "learning_rate": 9.24906906906907e-06, + "loss": 0.2819, + "step": 38025 + }, + { + "epoch": 1.52, + "learning_rate": 9.24856856856857e-06, + "loss": 0.2773, + "step": 38050 + }, + { + "epoch": 1.52, + "learning_rate": 9.248068068068069e-06, + "loss": 0.2604, + "step": 38075 + }, + { + "epoch": 1.52, + "learning_rate": 9.247567567567568e-06, + "loss": 0.2645, + "step": 38100 + }, + { + "epoch": 1.52, + "learning_rate": 9.247067067067069e-06, + "loss": 0.2504, + "step": 38125 + }, + { + "epoch": 1.52, + "learning_rate": 9.246566566566567e-06, + "loss": 0.2731, + "step": 38150 + }, + { + "epoch": 1.52, + "learning_rate": 9.246066066066068e-06, + "loss": 0.2543, + "step": 38175 + }, + { + "epoch": 1.52, + "learning_rate": 9.245565565565567e-06, + "loss": 0.2552, + "step": 38200 + }, + { + "epoch": 1.52, + "learning_rate": 9.245065065065066e-06, + "loss": 0.2789, + "step": 38225 + }, + { + "epoch": 1.53, + "learning_rate": 9.244564564564565e-06, + "loss": 0.2668, + "step": 38250 + }, + { + "epoch": 1.53, + "learning_rate": 9.244064064064065e-06, + "loss": 0.2635, + "step": 38275 + }, + { + "epoch": 1.53, + "learning_rate": 9.243563563563564e-06, + "loss": 0.248, + "step": 38300 + }, + { + "epoch": 1.53, + "learning_rate": 9.243063063063063e-06, + "loss": 0.2675, + "step": 38325 + }, + { + "epoch": 1.53, + "learning_rate": 9.242562562562564e-06, + "loss": 0.265, + "step": 38350 + }, + { + "epoch": 1.53, + "learning_rate": 9.242062062062062e-06, + "loss": 0.2509, + "step": 38375 + }, + { + "epoch": 1.53, + "learning_rate": 9.241561561561563e-06, + "loss": 0.2535, + "step": 38400 + }, + { + "epoch": 1.53, + "learning_rate": 9.241061061061062e-06, + "loss": 0.2716, + "step": 38425 + }, + { + "epoch": 1.53, + "learning_rate": 9.240560560560561e-06, + "loss": 0.2578, + "step": 38450 + }, + { + "epoch": 1.53, + "learning_rate": 9.24006006006006e-06, + "loss": 0.2743, + "step": 38475 + }, + { + "epoch": 1.54, + "learning_rate": 9.23955955955956e-06, + "loss": 0.2701, + "step": 38500 + }, + { + "epoch": 1.54, + "learning_rate": 9.23905905905906e-06, + "loss": 0.2716, + "step": 38525 + }, + { + "epoch": 1.54, + "learning_rate": 9.238558558558559e-06, + "loss": 0.2696, + "step": 38550 + }, + { + "epoch": 1.54, + "learning_rate": 9.23805805805806e-06, + "loss": 0.2701, + "step": 38575 + }, + { + "epoch": 1.54, + "learning_rate": 9.237577577577577e-06, + "loss": 0.2573, + "step": 38600 + }, + { + "epoch": 1.54, + "learning_rate": 9.237077077077078e-06, + "loss": 0.2641, + "step": 38625 + }, + { + "epoch": 1.54, + "learning_rate": 9.236576576576577e-06, + "loss": 0.277, + "step": 38650 + }, + { + "epoch": 1.54, + "learning_rate": 9.236076076076077e-06, + "loss": 0.2562, + "step": 38675 + }, + { + "epoch": 1.54, + "learning_rate": 9.235575575575576e-06, + "loss": 0.2584, + "step": 38700 + }, + { + "epoch": 1.54, + "learning_rate": 9.235075075075077e-06, + "loss": 0.2571, + "step": 38725 + }, + { + "epoch": 1.55, + "learning_rate": 9.234574574574575e-06, + "loss": 0.2652, + "step": 38750 + }, + { + "epoch": 1.55, + "learning_rate": 9.234074074074076e-06, + "loss": 0.26, + "step": 38775 + }, + { + "epoch": 1.55, + "learning_rate": 9.233573573573575e-06, + "loss": 0.2475, + "step": 38800 + }, + { + "epoch": 1.55, + "learning_rate": 9.233073073073074e-06, + "loss": 0.2728, + "step": 38825 + }, + { + "epoch": 1.55, + "learning_rate": 9.232572572572573e-06, + "loss": 0.2678, + "step": 38850 + }, + { + "epoch": 1.55, + "learning_rate": 9.232072072072073e-06, + "loss": 0.2597, + "step": 38875 + }, + { + "epoch": 1.55, + "learning_rate": 9.231571571571572e-06, + "loss": 0.2532, + "step": 38900 + }, + { + "epoch": 1.55, + "learning_rate": 9.231071071071071e-06, + "loss": 0.2552, + "step": 38925 + }, + { + "epoch": 1.55, + "learning_rate": 9.230570570570572e-06, + "loss": 0.2528, + "step": 38950 + }, + { + "epoch": 1.55, + "learning_rate": 9.23007007007007e-06, + "loss": 0.2356, + "step": 38975 + }, + { + "epoch": 1.56, + "learning_rate": 9.229569569569571e-06, + "loss": 0.2512, + "step": 39000 + }, + { + "epoch": 1.56, + "eval_loss": 0.4447844326496124, + "eval_runtime": 2535.3087, + "eval_samples_per_second": 6.395, + "eval_steps_per_second": 0.16, + "eval_wer": 26.18311607218569, + "step": 39000 + }, + { + "epoch": 1.56, + "learning_rate": 9.22906906906907e-06, + "loss": 0.28, + "step": 39025 + }, + { + "epoch": 1.56, + "learning_rate": 9.22856856856857e-06, + "loss": 0.2598, + "step": 39050 + }, + { + "epoch": 1.56, + "learning_rate": 9.228068068068069e-06, + "loss": 0.2805, + "step": 39075 + }, + { + "epoch": 1.56, + "learning_rate": 9.227567567567568e-06, + "loss": 0.2677, + "step": 39100 + }, + { + "epoch": 1.56, + "learning_rate": 9.227067067067067e-06, + "loss": 0.2749, + "step": 39125 + }, + { + "epoch": 1.56, + "learning_rate": 9.226566566566567e-06, + "loss": 0.2652, + "step": 39150 + }, + { + "epoch": 1.56, + "learning_rate": 9.226066066066068e-06, + "loss": 0.2609, + "step": 39175 + }, + { + "epoch": 1.56, + "learning_rate": 9.225565565565567e-06, + "loss": 0.2656, + "step": 39200 + }, + { + "epoch": 1.56, + "learning_rate": 9.225065065065065e-06, + "loss": 0.2648, + "step": 39225 + }, + { + "epoch": 1.57, + "learning_rate": 9.224564564564566e-06, + "loss": 0.2567, + "step": 39250 + }, + { + "epoch": 1.57, + "learning_rate": 9.224064064064065e-06, + "loss": 0.2433, + "step": 39275 + }, + { + "epoch": 1.57, + "learning_rate": 9.223563563563564e-06, + "loss": 0.276, + "step": 39300 + }, + { + "epoch": 1.57, + "learning_rate": 9.223063063063064e-06, + "loss": 0.2651, + "step": 39325 + }, + { + "epoch": 1.57, + "learning_rate": 9.222562562562564e-06, + "loss": 0.2591, + "step": 39350 + }, + { + "epoch": 1.57, + "learning_rate": 9.222062062062062e-06, + "loss": 0.2616, + "step": 39375 + }, + { + "epoch": 1.57, + "learning_rate": 9.221561561561563e-06, + "loss": 0.2563, + "step": 39400 + }, + { + "epoch": 1.57, + "learning_rate": 9.221061061061062e-06, + "loss": 0.2595, + "step": 39425 + }, + { + "epoch": 1.57, + "learning_rate": 9.22056056056056e-06, + "loss": 0.2646, + "step": 39450 + }, + { + "epoch": 1.57, + "learning_rate": 9.220060060060061e-06, + "loss": 0.2676, + "step": 39475 + }, + { + "epoch": 1.58, + "learning_rate": 9.21955955955956e-06, + "loss": 0.2585, + "step": 39500 + }, + { + "epoch": 1.58, + "learning_rate": 9.21905905905906e-06, + "loss": 0.2599, + "step": 39525 + }, + { + "epoch": 1.58, + "learning_rate": 9.218558558558559e-06, + "loss": 0.2477, + "step": 39550 + }, + { + "epoch": 1.58, + "learning_rate": 9.21805805805806e-06, + "loss": 0.2376, + "step": 39575 + }, + { + "epoch": 1.58, + "learning_rate": 9.217557557557557e-06, + "loss": 0.2491, + "step": 39600 + }, + { + "epoch": 1.58, + "learning_rate": 9.217057057057058e-06, + "loss": 0.2533, + "step": 39625 + }, + { + "epoch": 1.58, + "learning_rate": 9.216556556556558e-06, + "loss": 0.2646, + "step": 39650 + }, + { + "epoch": 1.58, + "learning_rate": 9.216056056056057e-06, + "loss": 0.2824, + "step": 39675 + }, + { + "epoch": 1.58, + "learning_rate": 9.215555555555556e-06, + "loss": 0.2854, + "step": 39700 + }, + { + "epoch": 1.58, + "learning_rate": 9.215055055055056e-06, + "loss": 0.2553, + "step": 39725 + }, + { + "epoch": 1.59, + "learning_rate": 9.214554554554555e-06, + "loss": 0.2484, + "step": 39750 + }, + { + "epoch": 1.59, + "learning_rate": 9.214054054054054e-06, + "loss": 0.2362, + "step": 39775 + }, + { + "epoch": 1.59, + "learning_rate": 9.213553553553555e-06, + "loss": 0.2634, + "step": 39800 + }, + { + "epoch": 1.59, + "learning_rate": 9.213053053053055e-06, + "loss": 0.2554, + "step": 39825 + }, + { + "epoch": 1.59, + "learning_rate": 9.212552552552552e-06, + "loss": 0.2502, + "step": 39850 + }, + { + "epoch": 1.59, + "learning_rate": 9.212052052052053e-06, + "loss": 0.2546, + "step": 39875 + }, + { + "epoch": 1.59, + "learning_rate": 9.211551551551552e-06, + "loss": 0.2723, + "step": 39900 + }, + { + "epoch": 1.59, + "learning_rate": 9.211051051051052e-06, + "loss": 0.2674, + "step": 39925 + }, + { + "epoch": 1.59, + "learning_rate": 9.210550550550551e-06, + "loss": 0.2688, + "step": 39950 + }, + { + "epoch": 1.59, + "learning_rate": 9.21005005005005e-06, + "loss": 0.2512, + "step": 39975 + }, + { + "epoch": 1.6, + "learning_rate": 9.20954954954955e-06, + "loss": 0.2541, + "step": 40000 + }, + { + "epoch": 1.6, + "eval_loss": 0.4458891749382019, + "eval_runtime": 2617.6449, + "eval_samples_per_second": 6.194, + "eval_steps_per_second": 0.155, + "eval_wer": 26.314937442665414, + "step": 40000 + }, + { + "epoch": 1.6, + "learning_rate": 9.20904904904905e-06, + "loss": 0.2547, + "step": 40025 + }, + { + "epoch": 1.6, + "learning_rate": 9.20854854854855e-06, + "loss": 0.2557, + "step": 40050 + }, + { + "epoch": 1.6, + "learning_rate": 9.208048048048048e-06, + "loss": 0.2526, + "step": 40075 + }, + { + "epoch": 1.6, + "learning_rate": 9.207547547547549e-06, + "loss": 0.2709, + "step": 40100 + }, + { + "epoch": 1.6, + "learning_rate": 9.207047047047048e-06, + "loss": 0.2643, + "step": 40125 + }, + { + "epoch": 1.6, + "learning_rate": 9.206546546546547e-06, + "loss": 0.2716, + "step": 40150 + }, + { + "epoch": 1.6, + "learning_rate": 9.206046046046046e-06, + "loss": 0.2725, + "step": 40175 + }, + { + "epoch": 1.6, + "learning_rate": 9.205545545545547e-06, + "loss": 0.2532, + "step": 40200 + }, + { + "epoch": 1.6, + "learning_rate": 9.205045045045045e-06, + "loss": 0.2595, + "step": 40225 + }, + { + "epoch": 1.61, + "learning_rate": 9.204544544544546e-06, + "loss": 0.2619, + "step": 40250 + }, + { + "epoch": 1.61, + "learning_rate": 9.204044044044045e-06, + "loss": 0.2627, + "step": 40275 + }, + { + "epoch": 1.61, + "learning_rate": 9.203543543543545e-06, + "loss": 0.2581, + "step": 40300 + }, + { + "epoch": 1.61, + "learning_rate": 9.203043043043044e-06, + "loss": 0.2634, + "step": 40325 + }, + { + "epoch": 1.61, + "learning_rate": 9.202542542542543e-06, + "loss": 0.2392, + "step": 40350 + }, + { + "epoch": 1.61, + "learning_rate": 9.202042042042042e-06, + "loss": 0.2694, + "step": 40375 + }, + { + "epoch": 1.61, + "learning_rate": 9.201541541541542e-06, + "loss": 0.2596, + "step": 40400 + }, + { + "epoch": 1.61, + "learning_rate": 9.201041041041043e-06, + "loss": 0.2844, + "step": 40425 + }, + { + "epoch": 1.61, + "learning_rate": 9.200540540540542e-06, + "loss": 0.2679, + "step": 40450 + }, + { + "epoch": 1.61, + "learning_rate": 9.20004004004004e-06, + "loss": 0.2592, + "step": 40475 + }, + { + "epoch": 1.62, + "learning_rate": 9.19953953953954e-06, + "loss": 0.2523, + "step": 40500 + }, + { + "epoch": 1.62, + "learning_rate": 9.19903903903904e-06, + "loss": 0.27, + "step": 40525 + }, + { + "epoch": 1.62, + "learning_rate": 9.19853853853854e-06, + "loss": 0.272, + "step": 40550 + }, + { + "epoch": 1.62, + "learning_rate": 9.198038038038039e-06, + "loss": 0.2621, + "step": 40575 + }, + { + "epoch": 1.62, + "learning_rate": 9.197537537537538e-06, + "loss": 0.262, + "step": 40600 + }, + { + "epoch": 1.62, + "learning_rate": 9.197057057057059e-06, + "loss": 0.2642, + "step": 40625 + }, + { + "epoch": 1.62, + "learning_rate": 9.196556556556558e-06, + "loss": 0.278, + "step": 40650 + }, + { + "epoch": 1.62, + "learning_rate": 9.196056056056056e-06, + "loss": 0.2711, + "step": 40675 + }, + { + "epoch": 1.62, + "learning_rate": 9.195555555555557e-06, + "loss": 0.2728, + "step": 40700 + }, + { + "epoch": 1.62, + "learning_rate": 9.195055055055056e-06, + "loss": 0.2844, + "step": 40725 + }, + { + "epoch": 1.63, + "learning_rate": 9.194554554554555e-06, + "loss": 0.2657, + "step": 40750 + }, + { + "epoch": 1.63, + "learning_rate": 9.194054054054054e-06, + "loss": 0.2559, + "step": 40775 + }, + { + "epoch": 1.63, + "learning_rate": 9.193553553553555e-06, + "loss": 0.2671, + "step": 40800 + }, + { + "epoch": 1.63, + "learning_rate": 9.193053053053053e-06, + "loss": 0.2559, + "step": 40825 + }, + { + "epoch": 1.63, + "learning_rate": 9.192552552552554e-06, + "loss": 0.2546, + "step": 40850 + }, + { + "epoch": 1.63, + "learning_rate": 9.192052052052053e-06, + "loss": 0.2607, + "step": 40875 + }, + { + "epoch": 1.63, + "learning_rate": 9.191551551551553e-06, + "loss": 0.2718, + "step": 40900 + }, + { + "epoch": 1.63, + "learning_rate": 9.191051051051052e-06, + "loss": 0.2672, + "step": 40925 + }, + { + "epoch": 1.63, + "learning_rate": 9.190550550550551e-06, + "loss": 0.2682, + "step": 40950 + }, + { + "epoch": 1.63, + "learning_rate": 9.19005005005005e-06, + "loss": 0.2646, + "step": 40975 + }, + { + "epoch": 1.64, + "learning_rate": 9.18954954954955e-06, + "loss": 0.2535, + "step": 41000 + }, + { + "epoch": 1.64, + "eval_loss": 0.44114458560943604, + "eval_runtime": 2473.7687, + "eval_samples_per_second": 6.554, + "eval_steps_per_second": 0.164, + "eval_wer": 25.31355755814402, + "step": 41000 + }, + { + "epoch": 1.64, + "learning_rate": 9.18904904904905e-06, + "loss": 0.2634, + "step": 41025 + }, + { + "epoch": 1.64, + "learning_rate": 9.18854854854855e-06, + "loss": 0.2616, + "step": 41050 + }, + { + "epoch": 1.64, + "learning_rate": 9.188048048048048e-06, + "loss": 0.266, + "step": 41075 + }, + { + "epoch": 1.64, + "learning_rate": 9.187547547547549e-06, + "loss": 0.264, + "step": 41100 + }, + { + "epoch": 1.64, + "learning_rate": 9.187047047047048e-06, + "loss": 0.2604, + "step": 41125 + }, + { + "epoch": 1.64, + "learning_rate": 9.186546546546547e-06, + "loss": 0.2552, + "step": 41150 + }, + { + "epoch": 1.64, + "learning_rate": 9.186046046046047e-06, + "loss": 0.2539, + "step": 41175 + }, + { + "epoch": 1.64, + "learning_rate": 9.185545545545546e-06, + "loss": 0.2854, + "step": 41200 + }, + { + "epoch": 1.64, + "learning_rate": 9.185045045045045e-06, + "loss": 0.2629, + "step": 41225 + }, + { + "epoch": 1.64, + "learning_rate": 9.184544544544546e-06, + "loss": 0.2613, + "step": 41250 + }, + { + "epoch": 1.65, + "learning_rate": 9.184044044044045e-06, + "loss": 0.2561, + "step": 41275 + }, + { + "epoch": 1.65, + "learning_rate": 9.183543543543543e-06, + "loss": 0.2617, + "step": 41300 + }, + { + "epoch": 1.65, + "learning_rate": 9.183043043043044e-06, + "loss": 0.2573, + "step": 41325 + }, + { + "epoch": 1.65, + "learning_rate": 9.182542542542543e-06, + "loss": 0.2622, + "step": 41350 + }, + { + "epoch": 1.65, + "learning_rate": 9.182042042042043e-06, + "loss": 0.2472, + "step": 41375 + }, + { + "epoch": 1.65, + "learning_rate": 9.181541541541542e-06, + "loss": 0.262, + "step": 41400 + }, + { + "epoch": 1.65, + "learning_rate": 9.181041041041043e-06, + "loss": 0.2558, + "step": 41425 + }, + { + "epoch": 1.65, + "learning_rate": 9.18054054054054e-06, + "loss": 0.2572, + "step": 41450 + }, + { + "epoch": 1.65, + "learning_rate": 9.180040040040042e-06, + "loss": 0.2618, + "step": 41475 + }, + { + "epoch": 1.65, + "learning_rate": 9.17953953953954e-06, + "loss": 0.2532, + "step": 41500 + }, + { + "epoch": 1.66, + "learning_rate": 9.17903903903904e-06, + "loss": 0.2522, + "step": 41525 + }, + { + "epoch": 1.66, + "learning_rate": 9.17853853853854e-06, + "loss": 0.275, + "step": 41550 + }, + { + "epoch": 1.66, + "learning_rate": 9.178038038038039e-06, + "loss": 0.2754, + "step": 41575 + }, + { + "epoch": 1.66, + "learning_rate": 9.177537537537538e-06, + "loss": 0.2599, + "step": 41600 + }, + { + "epoch": 1.66, + "learning_rate": 9.177037037037037e-06, + "loss": 0.2509, + "step": 41625 + }, + { + "epoch": 1.66, + "learning_rate": 9.176536536536538e-06, + "loss": 0.2554, + "step": 41650 + }, + { + "epoch": 1.66, + "learning_rate": 9.176036036036036e-06, + "loss": 0.2426, + "step": 41675 + }, + { + "epoch": 1.66, + "learning_rate": 9.175535535535535e-06, + "loss": 0.2675, + "step": 41700 + }, + { + "epoch": 1.66, + "learning_rate": 9.175035035035036e-06, + "loss": 0.2559, + "step": 41725 + }, + { + "epoch": 1.66, + "learning_rate": 9.174534534534536e-06, + "loss": 0.2716, + "step": 41750 + }, + { + "epoch": 1.67, + "learning_rate": 9.174034034034035e-06, + "loss": 0.2686, + "step": 41775 + }, + { + "epoch": 1.67, + "learning_rate": 9.173533533533534e-06, + "loss": 0.259, + "step": 41800 + }, + { + "epoch": 1.67, + "learning_rate": 9.173033033033033e-06, + "loss": 0.2747, + "step": 41825 + }, + { + "epoch": 1.67, + "learning_rate": 9.172532532532533e-06, + "loss": 0.2507, + "step": 41850 + }, + { + "epoch": 1.67, + "learning_rate": 9.172032032032034e-06, + "loss": 0.2573, + "step": 41875 + }, + { + "epoch": 1.67, + "learning_rate": 9.171531531531533e-06, + "loss": 0.2542, + "step": 41900 + }, + { + "epoch": 1.67, + "learning_rate": 9.17103103103103e-06, + "loss": 0.2584, + "step": 41925 + }, + { + "epoch": 1.67, + "learning_rate": 9.170530530530532e-06, + "loss": 0.2459, + "step": 41950 + }, + { + "epoch": 1.67, + "learning_rate": 9.170030030030031e-06, + "loss": 0.2533, + "step": 41975 + }, + { + "epoch": 1.67, + "learning_rate": 9.16952952952953e-06, + "loss": 0.2518, + "step": 42000 + }, + { + "epoch": 1.67, + "eval_loss": 0.42200759053230286, + "eval_runtime": 2416.12, + "eval_samples_per_second": 6.71, + "eval_steps_per_second": 0.168, + "eval_wer": 24.71689240755159, + "step": 42000 + }, + { + "epoch": 1.68, + "learning_rate": 9.16902902902903e-06, + "loss": 0.2759, + "step": 42025 + }, + { + "epoch": 1.68, + "learning_rate": 9.16852852852853e-06, + "loss": 0.258, + "step": 42050 + }, + { + "epoch": 1.68, + "learning_rate": 9.168028028028028e-06, + "loss": 0.2424, + "step": 42075 + }, + { + "epoch": 1.68, + "learning_rate": 9.167527527527527e-06, + "loss": 0.258, + "step": 42100 + }, + { + "epoch": 1.68, + "learning_rate": 9.167027027027028e-06, + "loss": 0.274, + "step": 42125 + }, + { + "epoch": 1.68, + "learning_rate": 9.166526526526528e-06, + "loss": 0.2479, + "step": 42150 + }, + { + "epoch": 1.68, + "learning_rate": 9.166026026026027e-06, + "loss": 0.2697, + "step": 42175 + }, + { + "epoch": 1.68, + "learning_rate": 9.165525525525526e-06, + "loss": 0.2621, + "step": 42200 + }, + { + "epoch": 1.68, + "learning_rate": 9.165025025025026e-06, + "loss": 0.2645, + "step": 42225 + }, + { + "epoch": 1.68, + "learning_rate": 9.164524524524525e-06, + "loss": 0.2624, + "step": 42250 + }, + { + "epoch": 1.69, + "learning_rate": 9.164024024024026e-06, + "loss": 0.2592, + "step": 42275 + }, + { + "epoch": 1.69, + "learning_rate": 9.163523523523523e-06, + "loss": 0.255, + "step": 42300 + }, + { + "epoch": 1.69, + "learning_rate": 9.163023023023023e-06, + "loss": 0.262, + "step": 42325 + }, + { + "epoch": 1.69, + "learning_rate": 9.162522522522524e-06, + "loss": 0.2687, + "step": 42350 + }, + { + "epoch": 1.69, + "learning_rate": 9.162022022022023e-06, + "loss": 0.2566, + "step": 42375 + }, + { + "epoch": 1.69, + "learning_rate": 9.161521521521522e-06, + "loss": 0.2563, + "step": 42400 + }, + { + "epoch": 1.69, + "learning_rate": 9.161021021021022e-06, + "loss": 0.2559, + "step": 42425 + }, + { + "epoch": 1.69, + "learning_rate": 9.160520520520521e-06, + "loss": 0.2641, + "step": 42450 + }, + { + "epoch": 1.69, + "learning_rate": 9.16002002002002e-06, + "loss": 0.2729, + "step": 42475 + }, + { + "epoch": 1.69, + "learning_rate": 9.159519519519521e-06, + "loss": 0.2531, + "step": 42500 + }, + { + "epoch": 1.7, + "learning_rate": 9.15901901901902e-06, + "loss": 0.2819, + "step": 42525 + }, + { + "epoch": 1.7, + "learning_rate": 9.158518518518518e-06, + "loss": 0.2594, + "step": 42550 + }, + { + "epoch": 1.7, + "learning_rate": 9.158018018018019e-06, + "loss": 0.2649, + "step": 42575 + }, + { + "epoch": 1.7, + "learning_rate": 9.157517517517518e-06, + "loss": 0.2593, + "step": 42600 + }, + { + "epoch": 1.7, + "learning_rate": 9.157017017017018e-06, + "loss": 0.2636, + "step": 42625 + }, + { + "epoch": 1.7, + "learning_rate": 9.156536536536539e-06, + "loss": 0.2698, + "step": 42650 + }, + { + "epoch": 1.7, + "learning_rate": 9.156036036036036e-06, + "loss": 0.254, + "step": 42675 + }, + { + "epoch": 1.7, + "learning_rate": 9.155535535535535e-06, + "loss": 0.2356, + "step": 42700 + }, + { + "epoch": 1.7, + "learning_rate": 9.155035035035036e-06, + "loss": 0.2506, + "step": 42725 + }, + { + "epoch": 1.7, + "learning_rate": 9.154534534534536e-06, + "loss": 0.2669, + "step": 42750 + }, + { + "epoch": 1.71, + "learning_rate": 9.154034034034035e-06, + "loss": 0.2576, + "step": 42775 + }, + { + "epoch": 1.71, + "learning_rate": 9.153533533533534e-06, + "loss": 0.2536, + "step": 42800 + }, + { + "epoch": 1.71, + "learning_rate": 9.153033033033034e-06, + "loss": 0.2686, + "step": 42825 + }, + { + "epoch": 1.71, + "learning_rate": 9.152532532532533e-06, + "loss": 0.2511, + "step": 42850 + }, + { + "epoch": 1.71, + "learning_rate": 9.152032032032034e-06, + "loss": 0.2667, + "step": 42875 + }, + { + "epoch": 1.71, + "learning_rate": 9.151531531531531e-06, + "loss": 0.2593, + "step": 42900 + }, + { + "epoch": 1.71, + "learning_rate": 9.15103103103103e-06, + "loss": 0.2656, + "step": 42925 + }, + { + "epoch": 1.71, + "learning_rate": 9.150530530530532e-06, + "loss": 0.2574, + "step": 42950 + }, + { + "epoch": 1.71, + "learning_rate": 9.150030030030031e-06, + "loss": 0.2557, + "step": 42975 + }, + { + "epoch": 1.71, + "learning_rate": 9.14952952952953e-06, + "loss": 0.255, + "step": 43000 + }, + { + "epoch": 1.71, + "eval_loss": 0.43135425448417664, + "eval_runtime": 2587.1846, + "eval_samples_per_second": 6.267, + "eval_steps_per_second": 0.157, + "eval_wer": 25.259595593620155, + "step": 43000 + }, + { + "epoch": 1.72, + "learning_rate": 9.14902902902903e-06, + "loss": 0.2639, + "step": 43025 + }, + { + "epoch": 1.72, + "learning_rate": 9.148528528528529e-06, + "loss": 0.256, + "step": 43050 + }, + { + "epoch": 1.72, + "learning_rate": 9.148028028028028e-06, + "loss": 0.2588, + "step": 43075 + }, + { + "epoch": 1.72, + "learning_rate": 9.14752752752753e-06, + "loss": 0.2768, + "step": 43100 + }, + { + "epoch": 1.72, + "learning_rate": 9.147027027027029e-06, + "loss": 0.2557, + "step": 43125 + }, + { + "epoch": 1.72, + "learning_rate": 9.146526526526526e-06, + "loss": 0.2506, + "step": 43150 + }, + { + "epoch": 1.72, + "learning_rate": 9.146026026026027e-06, + "loss": 0.2495, + "step": 43175 + }, + { + "epoch": 1.72, + "learning_rate": 9.145525525525526e-06, + "loss": 0.2652, + "step": 43200 + }, + { + "epoch": 1.72, + "learning_rate": 9.145025025025026e-06, + "loss": 0.2525, + "step": 43225 + }, + { + "epoch": 1.72, + "learning_rate": 9.144524524524525e-06, + "loss": 0.2694, + "step": 43250 + }, + { + "epoch": 1.73, + "learning_rate": 9.144024024024026e-06, + "loss": 0.2489, + "step": 43275 + }, + { + "epoch": 1.73, + "learning_rate": 9.143523523523524e-06, + "loss": 0.2531, + "step": 43300 + }, + { + "epoch": 1.73, + "learning_rate": 9.143023023023023e-06, + "loss": 0.2549, + "step": 43325 + }, + { + "epoch": 1.73, + "learning_rate": 9.142522522522524e-06, + "loss": 0.2526, + "step": 43350 + }, + { + "epoch": 1.73, + "learning_rate": 9.142022022022023e-06, + "loss": 0.2604, + "step": 43375 + }, + { + "epoch": 1.73, + "learning_rate": 9.141521521521523e-06, + "loss": 0.2683, + "step": 43400 + }, + { + "epoch": 1.73, + "learning_rate": 9.141021021021022e-06, + "loss": 0.2659, + "step": 43425 + }, + { + "epoch": 1.73, + "learning_rate": 9.140520520520521e-06, + "loss": 0.2569, + "step": 43450 + }, + { + "epoch": 1.73, + "learning_rate": 9.14002002002002e-06, + "loss": 0.2556, + "step": 43475 + }, + { + "epoch": 1.73, + "learning_rate": 9.139519519519521e-06, + "loss": 0.2752, + "step": 43500 + }, + { + "epoch": 1.74, + "learning_rate": 9.139019019019019e-06, + "loss": 0.2562, + "step": 43525 + }, + { + "epoch": 1.74, + "learning_rate": 9.138518518518518e-06, + "loss": 0.2848, + "step": 43550 + }, + { + "epoch": 1.74, + "learning_rate": 9.13801801801802e-06, + "loss": 0.2598, + "step": 43575 + }, + { + "epoch": 1.74, + "learning_rate": 9.137517517517519e-06, + "loss": 0.2663, + "step": 43600 + }, + { + "epoch": 1.74, + "learning_rate": 9.137017017017018e-06, + "loss": 0.2582, + "step": 43625 + }, + { + "epoch": 1.74, + "learning_rate": 9.136516516516517e-06, + "loss": 0.2646, + "step": 43650 + }, + { + "epoch": 1.74, + "learning_rate": 9.136016016016016e-06, + "loss": 0.2623, + "step": 43675 + }, + { + "epoch": 1.74, + "learning_rate": 9.135515515515516e-06, + "loss": 0.2569, + "step": 43700 + }, + { + "epoch": 1.74, + "learning_rate": 9.135015015015017e-06, + "loss": 0.2504, + "step": 43725 + }, + { + "epoch": 1.74, + "learning_rate": 9.134514514514516e-06, + "loss": 0.2726, + "step": 43750 + }, + { + "epoch": 1.75, + "learning_rate": 9.134014014014014e-06, + "loss": 0.2593, + "step": 43775 + }, + { + "epoch": 1.75, + "learning_rate": 9.133513513513515e-06, + "loss": 0.2478, + "step": 43800 + }, + { + "epoch": 1.75, + "learning_rate": 9.133013013013014e-06, + "loss": 0.2582, + "step": 43825 + }, + { + "epoch": 1.75, + "learning_rate": 9.132512512512513e-06, + "loss": 0.2646, + "step": 43850 + }, + { + "epoch": 1.75, + "learning_rate": 9.132012012012013e-06, + "loss": 0.2822, + "step": 43875 + }, + { + "epoch": 1.75, + "learning_rate": 9.131511511511514e-06, + "loss": 0.2379, + "step": 43900 + }, + { + "epoch": 1.75, + "learning_rate": 9.131011011011011e-06, + "loss": 0.2728, + "step": 43925 + }, + { + "epoch": 1.75, + "learning_rate": 9.13051051051051e-06, + "loss": 0.274, + "step": 43950 + }, + { + "epoch": 1.75, + "learning_rate": 9.130010010010011e-06, + "loss": 0.2838, + "step": 43975 + }, + { + "epoch": 1.75, + "learning_rate": 9.129509509509509e-06, + "loss": 0.2639, + "step": 44000 + }, + { + "epoch": 1.75, + "eval_loss": 0.43265146017074585, + "eval_runtime": 2614.8693, + "eval_samples_per_second": 6.2, + "eval_steps_per_second": 0.155, + "eval_wer": 25.521696564164632, + "step": 44000 + }, + { + "epoch": 1.76, + "learning_rate": 9.12900900900901e-06, + "loss": 0.2588, + "step": 44025 + }, + { + "epoch": 1.76, + "learning_rate": 9.12850850850851e-06, + "loss": 0.2764, + "step": 44050 + }, + { + "epoch": 1.76, + "learning_rate": 9.128008008008009e-06, + "loss": 0.263, + "step": 44075 + }, + { + "epoch": 1.76, + "learning_rate": 9.127507507507508e-06, + "loss": 0.2644, + "step": 44100 + }, + { + "epoch": 1.76, + "learning_rate": 9.127007007007009e-06, + "loss": 0.2476, + "step": 44125 + }, + { + "epoch": 1.76, + "learning_rate": 9.126506506506507e-06, + "loss": 0.2604, + "step": 44150 + }, + { + "epoch": 1.76, + "learning_rate": 9.126006006006006e-06, + "loss": 0.2747, + "step": 44175 + }, + { + "epoch": 1.76, + "learning_rate": 9.125505505505507e-06, + "loss": 0.265, + "step": 44200 + }, + { + "epoch": 1.76, + "learning_rate": 9.125005005005006e-06, + "loss": 0.2568, + "step": 44225 + }, + { + "epoch": 1.76, + "learning_rate": 9.124504504504505e-06, + "loss": 0.2485, + "step": 44250 + }, + { + "epoch": 1.77, + "learning_rate": 9.124004004004005e-06, + "loss": 0.2742, + "step": 44275 + }, + { + "epoch": 1.77, + "learning_rate": 9.123503503503504e-06, + "loss": 0.2634, + "step": 44300 + }, + { + "epoch": 1.77, + "learning_rate": 9.123003003003003e-06, + "loss": 0.2805, + "step": 44325 + }, + { + "epoch": 1.77, + "learning_rate": 9.122502502502504e-06, + "loss": 0.2543, + "step": 44350 + }, + { + "epoch": 1.77, + "learning_rate": 9.122002002002004e-06, + "loss": 0.2753, + "step": 44375 + }, + { + "epoch": 1.77, + "learning_rate": 9.121501501501501e-06, + "loss": 0.2607, + "step": 44400 + }, + { + "epoch": 1.77, + "learning_rate": 9.121001001001002e-06, + "loss": 0.242, + "step": 44425 + }, + { + "epoch": 1.77, + "learning_rate": 9.120500500500501e-06, + "loss": 0.2633, + "step": 44450 + }, + { + "epoch": 1.77, + "learning_rate": 9.12e-06, + "loss": 0.2686, + "step": 44475 + }, + { + "epoch": 1.77, + "learning_rate": 9.1194994994995e-06, + "loss": 0.2608, + "step": 44500 + }, + { + "epoch": 1.78, + "learning_rate": 9.118998998999e-06, + "loss": 0.2779, + "step": 44525 + }, + { + "epoch": 1.78, + "learning_rate": 9.118498498498499e-06, + "loss": 0.2648, + "step": 44550 + }, + { + "epoch": 1.78, + "learning_rate": 9.117997997997998e-06, + "loss": 0.2701, + "step": 44575 + }, + { + "epoch": 1.78, + "learning_rate": 9.117497497497499e-06, + "loss": 0.245, + "step": 44600 + }, + { + "epoch": 1.78, + "learning_rate": 9.116996996996997e-06, + "loss": 0.2607, + "step": 44625 + }, + { + "epoch": 1.78, + "learning_rate": 9.116516516516517e-06, + "loss": 0.2622, + "step": 44650 + }, + { + "epoch": 1.78, + "learning_rate": 9.116016016016017e-06, + "loss": 0.2466, + "step": 44675 + }, + { + "epoch": 1.78, + "learning_rate": 9.115515515515516e-06, + "loss": 0.2627, + "step": 44700 + }, + { + "epoch": 1.78, + "learning_rate": 9.115015015015017e-06, + "loss": 0.26, + "step": 44725 + }, + { + "epoch": 1.78, + "learning_rate": 9.114514514514515e-06, + "loss": 0.2837, + "step": 44750 + }, + { + "epoch": 1.79, + "learning_rate": 9.114014014014014e-06, + "loss": 0.2417, + "step": 44775 + }, + { + "epoch": 1.79, + "learning_rate": 9.113513513513515e-06, + "loss": 0.2663, + "step": 44800 + }, + { + "epoch": 1.79, + "learning_rate": 9.113013013013014e-06, + "loss": 0.2606, + "step": 44825 + }, + { + "epoch": 1.79, + "learning_rate": 9.112512512512513e-06, + "loss": 0.2416, + "step": 44850 + }, + { + "epoch": 1.79, + "learning_rate": 9.112012012012013e-06, + "loss": 0.2537, + "step": 44875 + }, + { + "epoch": 1.79, + "learning_rate": 9.111511511511512e-06, + "loss": 0.2587, + "step": 44900 + }, + { + "epoch": 1.79, + "learning_rate": 9.111011011011011e-06, + "loss": 0.2658, + "step": 44925 + }, + { + "epoch": 1.79, + "learning_rate": 9.11051051051051e-06, + "loss": 0.2653, + "step": 44950 + }, + { + "epoch": 1.79, + "learning_rate": 9.110010010010012e-06, + "loss": 0.2643, + "step": 44975 + }, + { + "epoch": 1.79, + "learning_rate": 9.10950950950951e-06, + "loss": 0.2638, + "step": 45000 + }, + { + "epoch": 1.79, + "eval_loss": 0.432108074426651, + "eval_runtime": 2486.7031, + "eval_samples_per_second": 6.52, + "eval_steps_per_second": 0.163, + "eval_wer": 24.733851882116234, + "step": 45000 + }, + { + "epoch": 1.8, + "learning_rate": 9.10900900900901e-06, + "loss": 0.268, + "step": 45025 + }, + { + "epoch": 1.8, + "learning_rate": 9.10850850850851e-06, + "loss": 0.2566, + "step": 45050 + }, + { + "epoch": 1.8, + "learning_rate": 9.108008008008009e-06, + "loss": 0.2603, + "step": 45075 + }, + { + "epoch": 1.8, + "learning_rate": 9.107507507507508e-06, + "loss": 0.2463, + "step": 45100 + }, + { + "epoch": 1.8, + "learning_rate": 9.107007007007007e-06, + "loss": 0.2597, + "step": 45125 + }, + { + "epoch": 1.8, + "learning_rate": 9.106506506506507e-06, + "loss": 0.2531, + "step": 45150 + }, + { + "epoch": 1.8, + "learning_rate": 9.106006006006006e-06, + "loss": 0.2675, + "step": 45175 + }, + { + "epoch": 1.8, + "learning_rate": 9.105505505505507e-06, + "loss": 0.2445, + "step": 45200 + }, + { + "epoch": 1.8, + "learning_rate": 9.105005005005005e-06, + "loss": 0.2576, + "step": 45225 + }, + { + "epoch": 1.8, + "learning_rate": 9.104504504504506e-06, + "loss": 0.2473, + "step": 45250 + }, + { + "epoch": 1.81, + "learning_rate": 9.104004004004005e-06, + "loss": 0.2551, + "step": 45275 + }, + { + "epoch": 1.81, + "learning_rate": 9.103503503503504e-06, + "loss": 0.2658, + "step": 45300 + }, + { + "epoch": 1.81, + "learning_rate": 9.103003003003003e-06, + "loss": 0.2603, + "step": 45325 + }, + { + "epoch": 1.81, + "learning_rate": 9.102502502502504e-06, + "loss": 0.2618, + "step": 45350 + }, + { + "epoch": 1.81, + "learning_rate": 9.102002002002002e-06, + "loss": 0.2405, + "step": 45375 + }, + { + "epoch": 1.81, + "learning_rate": 9.101501501501501e-06, + "loss": 0.263, + "step": 45400 + }, + { + "epoch": 1.81, + "learning_rate": 9.101001001001002e-06, + "loss": 0.2673, + "step": 45425 + }, + { + "epoch": 1.81, + "learning_rate": 9.100500500500502e-06, + "loss": 0.2638, + "step": 45450 + }, + { + "epoch": 1.81, + "learning_rate": 9.100000000000001e-06, + "loss": 0.2583, + "step": 45475 + }, + { + "epoch": 1.81, + "learning_rate": 9.0994994994995e-06, + "loss": 0.2695, + "step": 45500 + }, + { + "epoch": 1.82, + "learning_rate": 9.098998998999e-06, + "loss": 0.2544, + "step": 45525 + }, + { + "epoch": 1.82, + "learning_rate": 9.098498498498499e-06, + "loss": 0.2634, + "step": 45550 + }, + { + "epoch": 1.82, + "learning_rate": 9.097997997997998e-06, + "loss": 0.2532, + "step": 45575 + }, + { + "epoch": 1.82, + "learning_rate": 9.097497497497499e-06, + "loss": 0.2559, + "step": 45600 + }, + { + "epoch": 1.82, + "learning_rate": 9.096996996996997e-06, + "loss": 0.2459, + "step": 45625 + }, + { + "epoch": 1.82, + "learning_rate": 9.096496496496498e-06, + "loss": 0.2781, + "step": 45650 + }, + { + "epoch": 1.82, + "learning_rate": 9.095995995995997e-06, + "loss": 0.2712, + "step": 45675 + }, + { + "epoch": 1.82, + "learning_rate": 9.095495495495496e-06, + "loss": 0.2597, + "step": 45700 + }, + { + "epoch": 1.82, + "learning_rate": 9.094994994994996e-06, + "loss": 0.275, + "step": 45725 + }, + { + "epoch": 1.82, + "learning_rate": 9.094494494494495e-06, + "loss": 0.2458, + "step": 45750 + }, + { + "epoch": 1.83, + "learning_rate": 9.093993993993994e-06, + "loss": 0.2752, + "step": 45775 + }, + { + "epoch": 1.83, + "learning_rate": 9.093493493493494e-06, + "loss": 0.261, + "step": 45800 + }, + { + "epoch": 1.83, + "learning_rate": 9.092992992992995e-06, + "loss": 0.2532, + "step": 45825 + }, + { + "epoch": 1.83, + "learning_rate": 9.092492492492492e-06, + "loss": 0.2847, + "step": 45850 + }, + { + "epoch": 1.83, + "learning_rate": 9.091991991991993e-06, + "loss": 0.2607, + "step": 45875 + }, + { + "epoch": 1.83, + "learning_rate": 9.091491491491492e-06, + "loss": 0.2678, + "step": 45900 + }, + { + "epoch": 1.83, + "learning_rate": 9.090990990990992e-06, + "loss": 0.2488, + "step": 45925 + }, + { + "epoch": 1.83, + "learning_rate": 9.090490490490491e-06, + "loss": 0.2628, + "step": 45950 + }, + { + "epoch": 1.83, + "learning_rate": 9.089989989989992e-06, + "loss": 0.2625, + "step": 45975 + }, + { + "epoch": 1.83, + "learning_rate": 9.08948948948949e-06, + "loss": 0.2647, + "step": 46000 + }, + { + "epoch": 1.83, + "eval_loss": 0.44105586409568787, + "eval_runtime": 2496.4644, + "eval_samples_per_second": 6.494, + "eval_steps_per_second": 0.163, + "eval_wer": 24.86027705614357, + "step": 46000 + } + ], + "max_steps": 500000, + "num_train_epochs": 20, + "total_flos": 5.309913924895223e+20, + "trial_name": null, + "trial_params": null +}