diff --git "a/trainer_state.json" "b/trainer_state.json" --- "a/trainer_state.json" +++ "b/trainer_state.json" @@ -1,3271 +1,856 @@ { "best_metric": null, "best_model_checkpoint": null, - "epoch": 35.986119743111665, - "global_step": 43400, + "epoch": 72.72103004291846, + "global_step": 5600, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { - "epoch": 0.17, - "learning_rate": 9.95e-05, - "loss": 0.6982, - "step": 200 - }, - { - "epoch": 0.17, - "eval_loss": 0.25508013367652893, - "eval_runtime": 247.2382, - "eval_samples_per_second": 20.907, - "eval_steps_per_second": 2.617, - "eval_wer": 0.24512755506258913, - "step": 200 - }, - { - "epoch": 0.33, - "learning_rate": 9.972560975609757e-05, - "loss": 0.5209, - "step": 400 - }, - { - "epoch": 0.33, - "eval_loss": 0.21009531617164612, - "eval_runtime": 249.2779, - "eval_samples_per_second": 20.736, - "eval_steps_per_second": 2.595, - "eval_wer": 0.21507420905297628, - "step": 400 - }, - { - "epoch": 0.5, - "learning_rate": 9.944844789356985e-05, - "loss": 0.4885, - "step": 600 - }, - { - "epoch": 0.5, - "eval_loss": 0.20174096524715424, - "eval_runtime": 247.285, - "eval_samples_per_second": 20.903, - "eval_steps_per_second": 2.616, - "eval_wer": 0.20297892568531137, - "step": 600 - }, - { - "epoch": 0.66, - "learning_rate": 9.917128603104213e-05, - "loss": 0.474, - "step": 800 - }, - { - "epoch": 0.66, - "eval_loss": 0.18579010665416718, - "eval_runtime": 250.2088, - "eval_samples_per_second": 20.659, - "eval_steps_per_second": 2.586, - "eval_wer": 0.1948977974964348, - "step": 800 - }, - { - "epoch": 0.83, - "learning_rate": 9.889412416851441e-05, - "loss": 0.4683, - "step": 1000 - }, - { - "epoch": 0.83, - "eval_loss": 0.17479585111141205, - "eval_runtime": 251.8549, - "eval_samples_per_second": 20.524, - "eval_steps_per_second": 2.569, - "eval_wer": 0.17192204088100144, - "step": 1000 - }, - { - "epoch": 0.99, - "learning_rate": 9.86169623059867e-05, - "loss": 0.4497, - "step": 1200 - }, - { - "epoch": 0.99, - "eval_loss": 0.15883031487464905, - "eval_runtime": 251.9945, - "eval_samples_per_second": 20.512, - "eval_steps_per_second": 2.568, - "eval_wer": 0.17171076955580203, - "step": 1200 - }, - { - "epoch": 1.16, - "learning_rate": 9.833980044345899e-05, - "loss": 0.4037, - "step": 1400 - }, - { - "epoch": 1.16, - "eval_loss": 0.15540002286434174, - "eval_runtime": 253.8837, - "eval_samples_per_second": 20.36, - "eval_steps_per_second": 2.548, - "eval_wer": 0.15987957534463634, - "step": 1400 - }, - { - "epoch": 1.33, - "learning_rate": 9.806263858093127e-05, - "loss": 0.3999, - "step": 1600 - }, - { - "epoch": 1.33, - "eval_loss": 0.1569492369890213, - "eval_runtime": 253.8314, - "eval_samples_per_second": 20.364, - "eval_steps_per_second": 2.549, - "eval_wer": 0.1581365869117414, - "step": 1600 - }, - { - "epoch": 1.49, - "learning_rate": 9.778547671840356e-05, - "loss": 0.4014, - "step": 1800 - }, - { - "epoch": 1.49, - "eval_loss": 0.14257089793682098, - "eval_runtime": 253.5715, - "eval_samples_per_second": 20.385, - "eval_steps_per_second": 2.552, - "eval_wer": 0.1482068346273702, - "step": 1800 - }, - { - "epoch": 1.66, - "learning_rate": 9.750831485587584e-05, - "loss": 0.3887, - "step": 2000 - }, - { - "epoch": 1.66, - "eval_loss": 0.14761227369308472, - "eval_runtime": 262.7757, - "eval_samples_per_second": 19.671, - "eval_steps_per_second": 2.462, - "eval_wer": 0.14361168330428353, - "step": 2000 - }, - { - "epoch": 1.82, - "learning_rate": 9.723115299334812e-05, - "loss": 0.3861, - "step": 2200 - }, - { - "epoch": 1.82, - "eval_loss": 0.14095284044742584, - "eval_runtime": 253.9647, - "eval_samples_per_second": 20.353, - "eval_steps_per_second": 2.548, - "eval_wer": 0.14815401679607035, - "step": 2200 - }, - { - "epoch": 1.99, - "learning_rate": 9.695399113082039e-05, - "loss": 0.3881, - "step": 2400 - }, - { - "epoch": 1.99, - "eval_loss": 0.13986040651798248, - "eval_runtime": 253.8881, - "eval_samples_per_second": 20.359, - "eval_steps_per_second": 2.548, - "eval_wer": 0.14012570643849365, - "step": 2400 - }, - { - "epoch": 2.16, - "learning_rate": 9.667682926829269e-05, - "loss": 0.3397, - "step": 2600 - }, - { - "epoch": 2.16, - "eval_loss": 0.1451854407787323, - "eval_runtime": 255.702, - "eval_samples_per_second": 20.215, - "eval_steps_per_second": 2.53, - "eval_wer": 0.13178048909311785, - "step": 2600 - }, - { - "epoch": 2.32, - "learning_rate": 9.639966740576497e-05, - "loss": 0.3383, - "step": 2800 - }, - { - "epoch": 2.32, - "eval_loss": 0.13278624415397644, - "eval_runtime": 254.5924, - "eval_samples_per_second": 20.303, - "eval_steps_per_second": 2.541, - "eval_wer": 0.13019595415412244, - "step": 2800 - }, - { - "epoch": 2.49, - "learning_rate": 9.612250554323725e-05, - "loss": 0.3366, - "step": 3000 - }, - { - "epoch": 2.49, - "eval_loss": 0.1430414617061615, - "eval_runtime": 253.9896, - "eval_samples_per_second": 20.351, - "eval_steps_per_second": 2.547, - "eval_wer": 0.13251993873131568, - "step": 3000 - }, - { - "epoch": 2.65, - "learning_rate": 9.584534368070954e-05, - "loss": 0.3481, - "step": 3200 - }, - { - "epoch": 2.65, - "eval_loss": 0.1356772631406784, - "eval_runtime": 253.702, - "eval_samples_per_second": 20.374, - "eval_steps_per_second": 2.55, - "eval_wer": 0.12829451222732793, - "step": 3200 - }, - { - "epoch": 2.82, - "learning_rate": 9.556956762749447e-05, - "loss": 0.337, - "step": 3400 - }, - { - "epoch": 2.82, - "eval_loss": 0.1254938244819641, - "eval_runtime": 254.1064, - "eval_samples_per_second": 20.342, - "eval_steps_per_second": 2.546, - "eval_wer": 0.1273437912639307, - "step": 3400 - }, - { - "epoch": 2.98, - "learning_rate": 9.529240576496675e-05, - "loss": 0.3346, - "step": 3600 - }, - { - "epoch": 2.98, - "eval_loss": 0.13027481734752655, - "eval_runtime": 254.6218, - "eval_samples_per_second": 20.301, - "eval_steps_per_second": 2.541, - "eval_wer": 0.1280304230708287, - "step": 3600 - }, - { - "epoch": 3.15, - "learning_rate": 9.501524390243903e-05, - "loss": 0.3192, - "step": 3800 - }, - { - "epoch": 3.15, - "eval_loss": 0.13303972780704498, - "eval_runtime": 254.7219, - "eval_samples_per_second": 20.293, - "eval_steps_per_second": 2.54, - "eval_wer": 0.12280145777214388, - "step": 3800 - }, - { - "epoch": 3.32, - "learning_rate": 9.473808203991131e-05, - "loss": 0.3093, - "step": 4000 - }, - { - "epoch": 3.32, - "eval_loss": 0.13668616116046906, - "eval_runtime": 254.6369, - "eval_samples_per_second": 20.299, - "eval_steps_per_second": 2.541, - "eval_wer": 0.12206200813394602, - "step": 4000 - }, - { - "epoch": 3.48, - "learning_rate": 9.446092017738359e-05, - "loss": 0.3119, - "step": 4200 - }, - { - "epoch": 3.48, - "eval_loss": 0.1260731816291809, - "eval_runtime": 255.6853, - "eval_samples_per_second": 20.216, - "eval_steps_per_second": 2.53, - "eval_wer": 0.1149316009084667, - "step": 4200 - }, - { - "epoch": 3.65, - "learning_rate": 9.418375831485588e-05, - "loss": 0.3115, - "step": 4400 - }, - { - "epoch": 3.65, - "eval_loss": 0.11900634318590164, - "eval_runtime": 255.3718, - "eval_samples_per_second": 20.241, - "eval_steps_per_second": 2.534, - "eval_wer": 0.11514287223366608, - "step": 4400 - }, - { - "epoch": 3.81, - "learning_rate": 9.390659645232817e-05, - "loss": 0.3104, - "step": 4600 - }, - { - "epoch": 3.81, - "eval_loss": 0.11844547092914581, - "eval_runtime": 253.3424, - "eval_samples_per_second": 20.403, - "eval_steps_per_second": 2.554, - "eval_wer": 0.11994929488195215, - "step": 4600 - }, - { - "epoch": 3.98, - "learning_rate": 9.362943458980045e-05, - "loss": 0.3084, - "step": 4800 - }, - { - "epoch": 3.98, - "eval_loss": 0.12033428996801376, - "eval_runtime": 253.1313, - "eval_samples_per_second": 20.42, - "eval_steps_per_second": 2.556, - "eval_wer": 0.114139333438969, - "step": 4800 - }, - { - "epoch": 4.15, - "learning_rate": 9.335227272727273e-05, - "loss": 0.2879, - "step": 5000 - }, - { - "epoch": 4.15, - "eval_loss": 0.1269288957118988, - "eval_runtime": 252.0701, - "eval_samples_per_second": 20.506, - "eval_steps_per_second": 2.567, - "eval_wer": 0.11239634500607405, - "step": 5000 - }, - { - "epoch": 4.31, - "learning_rate": 9.307511086474502e-05, - "loss": 0.2865, - "step": 5200 - }, - { - "epoch": 4.31, - "eval_loss": 0.13235774636268616, - "eval_runtime": 253.6428, - "eval_samples_per_second": 20.379, - "eval_steps_per_second": 2.551, - "eval_wer": 0.11118153488617757, - "step": 5200 - }, - { - "epoch": 4.48, - "learning_rate": 9.27979490022173e-05, - "loss": 0.2845, - "step": 5400 - }, - { - "epoch": 4.48, - "eval_loss": 0.12866514921188354, - "eval_runtime": 257.2798, - "eval_samples_per_second": 20.091, - "eval_steps_per_second": 2.515, - "eval_wer": 0.11424496910156869, - "step": 5400 - }, - { - "epoch": 4.64, - "learning_rate": 9.252078713968959e-05, - "loss": 0.2856, - "step": 5600 - }, - { - "epoch": 4.64, - "eval_loss": 0.12589029967784882, - "eval_runtime": 254.2212, - "eval_samples_per_second": 20.333, - "eval_steps_per_second": 2.545, - "eval_wer": 0.11012517826018063, - "step": 5600 - }, - { - "epoch": 4.81, - "learning_rate": 9.224362527716187e-05, - "loss": 0.2801, - "step": 5800 - }, - { - "epoch": 4.81, - "eval_loss": 0.12850765883922577, - "eval_runtime": 252.9838, - "eval_samples_per_second": 20.432, - "eval_steps_per_second": 2.557, - "eval_wer": 0.11023081392278034, - "step": 5800 - }, - { - "epoch": 4.97, - "learning_rate": 9.196646341463415e-05, - "loss": 0.2882, - "step": 6000 - }, - { - "epoch": 4.97, - "eval_loss": 0.13433855772018433, - "eval_runtime": 253.6459, - "eval_samples_per_second": 20.379, - "eval_steps_per_second": 2.551, - "eval_wer": 0.10880473247768446, - "step": 6000 - }, - { - "epoch": 5.14, - "learning_rate": 9.168930155210643e-05, - "loss": 0.2701, - "step": 6200 - }, - { - "epoch": 5.14, - "eval_loss": 0.14238382875919342, - "eval_runtime": 253.374, - "eval_samples_per_second": 20.401, - "eval_steps_per_second": 2.554, - "eval_wer": 0.10531875561189458, - "step": 6200 - }, - { - "epoch": 5.31, - "learning_rate": 9.141213968957871e-05, - "loss": 0.2688, - "step": 6400 - }, - { - "epoch": 5.31, - "eval_loss": 0.1337863802909851, - "eval_runtime": 253.8454, - "eval_samples_per_second": 20.363, - "eval_steps_per_second": 2.549, - "eval_wer": 0.10288913537210162, - "step": 6400 - }, - { - "epoch": 5.47, - "learning_rate": 9.1134977827051e-05, - "loss": 0.2683, - "step": 6600 - }, - { - "epoch": 5.47, - "eval_loss": 0.14259789884090424, - "eval_runtime": 252.7728, - "eval_samples_per_second": 20.449, - "eval_steps_per_second": 2.56, - "eval_wer": 0.10732583320128876, - "step": 6600 - }, - { - "epoch": 5.64, - "learning_rate": 9.085781596452329e-05, - "loss": 0.2609, - "step": 6800 - }, - { - "epoch": 5.64, - "eval_loss": 0.13099780678749084, - "eval_runtime": 252.7442, - "eval_samples_per_second": 20.452, - "eval_steps_per_second": 2.56, - "eval_wer": 0.10257222838430254, - "step": 6800 - }, - { - "epoch": 5.8, - "learning_rate": 9.058065410199557e-05, - "loss": 0.267, - "step": 7000 - }, - { - "epoch": 5.8, - "eval_loss": 0.14180444180965424, - "eval_runtime": 254.0779, - "eval_samples_per_second": 20.344, - "eval_steps_per_second": 2.546, - "eval_wer": 0.10119896477050652, - "step": 7000 - }, - { - "epoch": 5.97, - "learning_rate": 9.030487804878049e-05, - "loss": 0.2638, - "step": 7200 - }, - { - "epoch": 5.97, - "eval_loss": 0.13856083154678345, - "eval_runtime": 253.6851, - "eval_samples_per_second": 20.376, - "eval_steps_per_second": 2.55, - "eval_wer": 0.1007236042888079, - "step": 7200 - }, - { - "epoch": 6.14, - "learning_rate": 9.002771618625277e-05, - "loss": 0.2604, - "step": 7400 - }, - { - "epoch": 6.14, - "eval_loss": 0.14975795149803162, - "eval_runtime": 255.6414, - "eval_samples_per_second": 20.22, - "eval_steps_per_second": 2.531, - "eval_wer": 0.10389267416679872, - "step": 7400 - }, - { - "epoch": 6.3, - "learning_rate": 8.975055432372505e-05, - "loss": 0.2484, - "step": 7600 - }, - { - "epoch": 6.3, - "eval_loss": 0.1300615817308426, - "eval_runtime": 256.8835, - "eval_samples_per_second": 20.122, - "eval_steps_per_second": 2.519, - "eval_wer": 0.10230813922780331, - "step": 7600 - }, - { - "epoch": 6.47, - "learning_rate": 8.947339246119735e-05, - "loss": 0.2515, - "step": 7800 - }, - { - "epoch": 6.47, - "eval_loss": 0.13480910658836365, - "eval_runtime": 254.0211, - "eval_samples_per_second": 20.349, - "eval_steps_per_second": 2.547, - "eval_wer": 0.10310040669730101, - "step": 7800 - }, - { - "epoch": 6.63, - "learning_rate": 8.919623059866963e-05, - "loss": 0.2529, - "step": 8000 - }, - { - "epoch": 6.63, - "eval_loss": 0.12069129198789597, - "eval_runtime": 254.8765, - "eval_samples_per_second": 20.28, - "eval_steps_per_second": 2.538, - "eval_wer": 0.10146305392700576, - "step": 8000 - }, - { - "epoch": 6.8, - "learning_rate": 8.891906873614191e-05, - "loss": 0.2498, - "step": 8200 - }, - { - "epoch": 6.8, - "eval_loss": 0.14146772027015686, - "eval_runtime": 254.7381, - "eval_samples_per_second": 20.291, - "eval_steps_per_second": 2.54, - "eval_wer": 0.1016215074209053, - "step": 8200 - }, - { - "epoch": 6.96, - "learning_rate": 8.86419068736142e-05, - "loss": 0.2502, - "step": 8400 - }, - { - "epoch": 6.96, - "eval_loss": 0.12623198330402374, - "eval_runtime": 254.5919, - "eval_samples_per_second": 20.303, - "eval_steps_per_second": 2.541, - "eval_wer": 0.09760735224211693, - "step": 8400 - }, - { - "epoch": 7.13, - "learning_rate": 8.836474501108648e-05, - "loss": 0.2404, - "step": 8600 - }, - { - "epoch": 7.13, - "eval_loss": 0.13511496782302856, - "eval_runtime": 254.4607, - "eval_samples_per_second": 20.314, - "eval_steps_per_second": 2.543, - "eval_wer": 0.09929752284371204, - "step": 8600 - }, - { - "epoch": 7.3, - "learning_rate": 8.808758314855876e-05, - "loss": 0.2337, - "step": 8800 - }, - { - "epoch": 7.3, - "eval_loss": 0.13152754306793213, - "eval_runtime": 254.1423, - "eval_samples_per_second": 20.339, - "eval_steps_per_second": 2.546, - "eval_wer": 0.09876934453071357, - "step": 8800 - }, - { - "epoch": 7.46, - "learning_rate": 8.781042128603105e-05, - "loss": 0.2396, - "step": 9000 - }, - { - "epoch": 7.46, - "eval_loss": 0.135118767619133, - "eval_runtime": 255.0124, - "eval_samples_per_second": 20.27, - "eval_steps_per_second": 2.537, - "eval_wer": 0.09834680188031479, - "step": 9000 - }, - { - "epoch": 7.63, - "learning_rate": 8.753325942350333e-05, - "loss": 0.2431, - "step": 9200 - }, - { - "epoch": 7.63, - "eval_loss": 0.13074836134910583, - "eval_runtime": 255.0093, - "eval_samples_per_second": 20.27, - "eval_steps_per_second": 2.537, - "eval_wer": 0.09707917392911847, - "step": 9200 - }, - { - "epoch": 7.79, - "learning_rate": 8.725609756097561e-05, - "loss": 0.2379, - "step": 9400 - }, - { - "epoch": 7.79, - "eval_loss": 0.13186238706111908, - "eval_runtime": 255.2219, - "eval_samples_per_second": 20.253, - "eval_steps_per_second": 2.535, - "eval_wer": 0.09950879416891142, - "step": 9400 - }, - { - "epoch": 7.96, - "learning_rate": 8.697893569844789e-05, - "loss": 0.2421, - "step": 9600 - }, - { - "epoch": 7.96, - "eval_loss": 0.1254909485578537, - "eval_runtime": 255.0666, - "eval_samples_per_second": 20.265, - "eval_steps_per_second": 2.537, - "eval_wer": 0.09882216236201341, - "step": 9600 - }, - { - "epoch": 8.13, - "learning_rate": 8.670177383592018e-05, - "loss": 0.2324, - "step": 9800 - }, - { - "epoch": 8.13, - "eval_loss": 0.13816988468170166, - "eval_runtime": 257.5755, - "eval_samples_per_second": 20.068, - "eval_steps_per_second": 2.512, - "eval_wer": 0.09628690645962076, - "step": 9800 - }, - { - "epoch": 8.29, - "learning_rate": 8.642461197339246e-05, - "loss": 0.2258, - "step": 10000 - }, - { - "epoch": 8.29, - "eval_loss": 0.15982431173324585, - "eval_runtime": 257.1975, - "eval_samples_per_second": 20.097, - "eval_steps_per_second": 2.516, - "eval_wer": 0.09750171657951724, - "step": 10000 - }, - { - "epoch": 8.46, - "learning_rate": 8.614745011086475e-05, - "loss": 0.2253, - "step": 10200 - }, - { - "epoch": 8.46, - "eval_loss": 0.15032005310058594, - "eval_runtime": 256.9993, - "eval_samples_per_second": 20.113, - "eval_steps_per_second": 2.518, - "eval_wer": 0.09422701103892674, - "step": 10200 - }, - { - "epoch": 8.62, - "learning_rate": 8.587028824833703e-05, - "loss": 0.2228, - "step": 10400 - }, - { - "epoch": 8.62, - "eval_loss": 0.12655803561210632, - "eval_runtime": 258.0019, - "eval_samples_per_second": 20.035, - "eval_steps_per_second": 2.508, - "eval_wer": 0.09581154597792214, - "step": 10400 - }, - { - "epoch": 8.79, - "learning_rate": 8.559312638580932e-05, - "loss": 0.2255, - "step": 10600 - }, - { - "epoch": 8.79, - "eval_loss": 0.14087137579917908, - "eval_runtime": 252.7692, - "eval_samples_per_second": 20.449, - "eval_steps_per_second": 2.56, - "eval_wer": 0.09623408862832092, - "step": 10600 - }, - { - "epoch": 8.95, - "learning_rate": 8.53159645232816e-05, - "loss": 0.2307, - "step": 10800 - }, - { - "epoch": 8.95, - "eval_loss": 0.13605473935604095, - "eval_runtime": 255.7465, - "eval_samples_per_second": 20.211, - "eval_steps_per_second": 2.53, - "eval_wer": 0.0974488987482174, - "step": 10800 - }, - { - "epoch": 9.12, - "learning_rate": 8.503880266075388e-05, - "loss": 0.2149, - "step": 11000 - }, - { - "epoch": 9.12, - "eval_loss": 0.13241790235042572, - "eval_runtime": 254.7831, - "eval_samples_per_second": 20.288, - "eval_steps_per_second": 2.539, - "eval_wer": 0.09338192573812919, - "step": 11000 - }, - { - "epoch": 9.29, - "learning_rate": 8.476164079822618e-05, - "loss": 0.2168, - "step": 11200 - }, - { - "epoch": 9.29, - "eval_loss": 0.1478220671415329, - "eval_runtime": 255.9893, - "eval_samples_per_second": 20.192, - "eval_steps_per_second": 2.527, - "eval_wer": 0.09792425922991602, - "step": 11200 - }, - { - "epoch": 9.45, - "learning_rate": 8.448447893569845e-05, - "loss": 0.2152, - "step": 11400 - }, - { - "epoch": 9.45, - "eval_loss": 0.13686269521713257, - "eval_runtime": 254.4314, - "eval_samples_per_second": 20.316, - "eval_steps_per_second": 2.543, - "eval_wer": 0.09306501875033012, - "step": 11400 - }, - { - "epoch": 9.62, - "learning_rate": 8.420731707317073e-05, - "loss": 0.2155, - "step": 11600 - }, - { - "epoch": 9.62, - "eval_loss": 0.13407327234745026, - "eval_runtime": 254.6769, - "eval_samples_per_second": 20.296, - "eval_steps_per_second": 2.54, - "eval_wer": 0.09449110019542598, - "step": 11600 - }, - { - "epoch": 9.78, - "learning_rate": 8.393154101995566e-05, - "loss": 0.2108, - "step": 11800 - }, - { - "epoch": 9.78, - "eval_loss": 0.13564249873161316, - "eval_runtime": 254.2947, - "eval_samples_per_second": 20.327, - "eval_steps_per_second": 2.544, - "eval_wer": 0.0948608250145249, - "step": 11800 - }, - { - "epoch": 9.95, - "learning_rate": 8.365437915742794e-05, - "loss": 0.2179, - "step": 12000 - }, - { - "epoch": 9.95, - "eval_loss": 0.15698903799057007, - "eval_runtime": 254.2869, - "eval_samples_per_second": 20.327, - "eval_steps_per_second": 2.544, - "eval_wer": 0.08994876670363915, - "step": 12000 - }, - { - "epoch": 10.12, - "learning_rate": 8.337721729490022e-05, - "loss": 0.1988, - "step": 12200 - }, - { - "epoch": 10.12, - "eval_loss": 0.14923857152462006, - "eval_runtime": 254.962, - "eval_samples_per_second": 20.274, - "eval_steps_per_second": 2.538, - "eval_wer": 0.09132203031743516, - "step": 12200 - }, - { - "epoch": 10.28, - "learning_rate": 8.310005543237252e-05, - "loss": 0.2051, - "step": 12400 - }, - { - "epoch": 10.28, - "eval_loss": 0.1382753700017929, - "eval_runtime": 254.97, - "eval_samples_per_second": 20.273, - "eval_steps_per_second": 2.538, - "eval_wer": 0.08973749537843977, - "step": 12400 - }, - { - "epoch": 10.45, - "learning_rate": 8.28228935698448e-05, - "loss": 0.2079, - "step": 12600 - }, - { - "epoch": 10.45, - "eval_loss": 0.14029560983181, - "eval_runtime": 255.2219, - "eval_samples_per_second": 20.253, - "eval_steps_per_second": 2.535, - "eval_wer": 0.09132203031743516, - "step": 12600 - }, - { - "epoch": 10.61, - "learning_rate": 8.254573170731708e-05, - "loss": 0.2056, - "step": 12800 - }, - { - "epoch": 10.61, - "eval_loss": 0.13067609071731567, - "eval_runtime": 255.0916, - "eval_samples_per_second": 20.263, - "eval_steps_per_second": 2.536, - "eval_wer": 0.08994876670363915, - "step": 12800 - }, - { - "epoch": 10.78, - "learning_rate": 8.226856984478936e-05, - "loss": 0.2053, - "step": 13000 - }, - { - "epoch": 10.78, - "eval_loss": 0.13401809334754944, - "eval_runtime": 255.8654, - "eval_samples_per_second": 20.202, - "eval_steps_per_second": 2.529, - "eval_wer": 0.09031849152273808, - "step": 13000 - }, - { - "epoch": 10.94, - "learning_rate": 8.199140798226164e-05, - "loss": 0.2015, - "step": 13200 - }, - { - "epoch": 10.94, - "eval_loss": 0.12882278859615326, - "eval_runtime": 263.8909, - "eval_samples_per_second": 19.588, - "eval_steps_per_second": 2.452, - "eval_wer": 0.0923783869434321, - "step": 13200 - }, - { - "epoch": 11.11, - "learning_rate": 8.171424611973392e-05, - "loss": 0.2, - "step": 13400 - }, - { - "epoch": 11.11, - "eval_loss": 0.12576742470264435, - "eval_runtime": 255.4818, - "eval_samples_per_second": 20.232, - "eval_steps_per_second": 2.532, - "eval_wer": 0.08683251465694819, - "step": 13400 - }, - { - "epoch": 11.28, - "learning_rate": 8.14370842572062e-05, - "loss": 0.2029, - "step": 13600 - }, - { - "epoch": 11.28, - "eval_loss": 0.13859006762504578, - "eval_runtime": 254.423, - "eval_samples_per_second": 20.317, - "eval_steps_per_second": 2.543, - "eval_wer": 0.09000158453493899, - "step": 13600 - }, - { - "epoch": 11.44, - "learning_rate": 8.11599223946785e-05, - "loss": 0.2044, - "step": 13800 - }, - { - "epoch": 11.44, - "eval_loss": 0.138057678937912, - "eval_runtime": 255.1183, - "eval_samples_per_second": 20.261, - "eval_steps_per_second": 2.536, - "eval_wer": 0.09185020863043364, - "step": 13800 - }, - { - "epoch": 11.61, - "learning_rate": 8.088414634146342e-05, - "loss": 0.1943, - "step": 14000 - }, - { - "epoch": 11.61, - "eval_loss": 0.1461963802576065, - "eval_runtime": 255.5721, - "eval_samples_per_second": 20.225, - "eval_steps_per_second": 2.532, - "eval_wer": 0.09206147995563302, - "step": 14000 - }, - { - "epoch": 11.77, - "learning_rate": 8.06069844789357e-05, - "loss": 0.2072, - "step": 14200 - }, - { - "epoch": 11.77, - "eval_loss": 0.14551697671413422, - "eval_runtime": 256.1094, - "eval_samples_per_second": 20.183, - "eval_steps_per_second": 2.526, - "eval_wer": 0.08846986742724344, - "step": 14200 - }, - { - "epoch": 11.94, - "learning_rate": 8.032982261640798e-05, - "loss": 0.1998, - "step": 14400 - }, - { - "epoch": 11.94, - "eval_loss": 0.13519984483718872, - "eval_runtime": 255.2141, - "eval_samples_per_second": 20.254, - "eval_steps_per_second": 2.535, - "eval_wer": 0.09190302646173348, - "step": 14400 - }, - { - "epoch": 12.11, - "learning_rate": 8.00540465631929e-05, - "loss": 0.1952, - "step": 14600 - }, - { - "epoch": 12.11, - "eval_loss": 0.1399640440940857, - "eval_runtime": 254.8364, - "eval_samples_per_second": 20.284, - "eval_steps_per_second": 2.539, - "eval_wer": 0.090688216341837, - "step": 14600 - }, - { - "epoch": 12.27, - "learning_rate": 7.977688470066519e-05, - "loss": 0.1932, - "step": 14800 - }, - { - "epoch": 12.27, - "eval_loss": 0.13122260570526123, - "eval_runtime": 255.4641, - "eval_samples_per_second": 20.234, - "eval_steps_per_second": 2.533, - "eval_wer": 0.09084666983573654, - "step": 14800 - }, - { - "epoch": 12.44, - "learning_rate": 7.949972283813748e-05, - "loss": 0.1885, - "step": 15000 - }, - { - "epoch": 12.44, - "eval_loss": 0.14805012941360474, - "eval_runtime": 255.9292, - "eval_samples_per_second": 20.197, - "eval_steps_per_second": 2.528, - "eval_wer": 0.08883959224634237, - "step": 15000 - }, - { - "epoch": 12.6, - "learning_rate": 7.922256097560976e-05, - "loss": 0.1904, - "step": 15200 - }, - { - "epoch": 12.6, - "eval_loss": 0.13773396611213684, - "eval_runtime": 254.593, - "eval_samples_per_second": 20.303, - "eval_steps_per_second": 2.541, - "eval_wer": 0.08825859610204405, - "step": 15200 - }, - { - "epoch": 12.77, - "learning_rate": 7.894539911308204e-05, - "loss": 0.1924, - "step": 15400 - }, - { - "epoch": 12.77, - "eval_loss": 0.14221470057964325, - "eval_runtime": 254.58, - "eval_samples_per_second": 20.304, - "eval_steps_per_second": 2.541, - "eval_wer": 0.09026567369143823, - "step": 15400 - }, - { - "epoch": 12.93, - "learning_rate": 7.866823725055434e-05, - "loss": 0.188, - "step": 15600 - }, - { - "epoch": 12.93, - "eval_loss": 0.14350585639476776, - "eval_runtime": 258.9085, - "eval_samples_per_second": 19.965, - "eval_steps_per_second": 2.499, - "eval_wer": 0.08540643321185232, - "step": 15600 - }, - { - "epoch": 13.1, - "learning_rate": 7.839107538802661e-05, - "loss": 0.1877, - "step": 15800 - }, - { - "epoch": 13.1, - "eval_loss": 0.1520785242319107, - "eval_runtime": 255.8963, - "eval_samples_per_second": 20.2, - "eval_steps_per_second": 2.528, - "eval_wer": 0.08899804574024191, - "step": 15800 - }, - { - "epoch": 13.27, - "learning_rate": 7.811391352549889e-05, - "loss": 0.1825, - "step": 16000 - }, - { - "epoch": 13.27, - "eval_loss": 0.13483111560344696, - "eval_runtime": 256.5689, - "eval_samples_per_second": 20.147, - "eval_steps_per_second": 2.522, - "eval_wer": 0.08905086357154175, - "step": 16000 - }, - { - "epoch": 13.43, - "learning_rate": 7.783675166297117e-05, - "loss": 0.185, - "step": 16200 - }, - { - "epoch": 13.43, - "eval_loss": 0.13759800791740417, - "eval_runtime": 258.0191, - "eval_samples_per_second": 20.033, - "eval_steps_per_second": 2.508, - "eval_wer": 0.08672687899434849, - "step": 16200 - }, - { - "epoch": 13.6, - "learning_rate": 7.755958980044346e-05, - "loss": 0.1805, - "step": 16400 - }, - { - "epoch": 13.6, - "eval_loss": 0.14212605357170105, - "eval_runtime": 258.5566, - "eval_samples_per_second": 19.992, - "eval_steps_per_second": 2.502, - "eval_wer": 0.0883114139333439, - "step": 16400 - }, - { - "epoch": 13.76, - "learning_rate": 7.728242793791574e-05, - "loss": 0.186, - "step": 16600 - }, - { - "epoch": 13.76, - "eval_loss": 0.1396447867155075, - "eval_runtime": 257.807, - "eval_samples_per_second": 20.05, - "eval_steps_per_second": 2.51, - "eval_wer": 0.08514234405535309, - "step": 16600 - }, - { - "epoch": 13.93, - "learning_rate": 7.700526607538803e-05, - "loss": 0.1869, - "step": 16800 - }, - { - "epoch": 13.93, - "eval_loss": 0.14811939001083374, - "eval_runtime": 257.7698, - "eval_samples_per_second": 20.053, - "eval_steps_per_second": 2.51, - "eval_wer": 0.08456134791105477, - "step": 16800 - }, - { - "epoch": 14.1, - "learning_rate": 7.672949002217296e-05, - "loss": 0.1808, - "step": 17000 - }, - { - "epoch": 14.1, - "eval_loss": 0.15346239507198334, - "eval_runtime": 259.8127, - "eval_samples_per_second": 19.895, - "eval_steps_per_second": 2.49, - "eval_wer": 0.08503670839275339, - "step": 17000 - }, - { - "epoch": 14.26, - "learning_rate": 7.645232815964524e-05, - "loss": 0.1775, - "step": 17200 - }, - { - "epoch": 14.26, - "eval_loss": 0.14250528812408447, - "eval_runtime": 257.4388, - "eval_samples_per_second": 20.079, - "eval_steps_per_second": 2.513, - "eval_wer": 0.0876247821264459, - "step": 17200 - }, - { - "epoch": 14.43, - "learning_rate": 7.617516629711752e-05, - "loss": 0.1773, - "step": 17400 - }, - { - "epoch": 14.43, - "eval_loss": 0.14766837656497955, - "eval_runtime": 258.0221, - "eval_samples_per_second": 20.033, - "eval_steps_per_second": 2.508, - "eval_wer": 0.08471980140495432, - "step": 17400 - }, - { - "epoch": 14.59, - "learning_rate": 7.58980044345898e-05, - "loss": 0.1851, - "step": 17600 - }, - { - "epoch": 14.59, - "eval_loss": 0.15123723447322845, - "eval_runtime": 262.1208, - "eval_samples_per_second": 19.72, - "eval_steps_per_second": 2.468, - "eval_wer": 0.08667406116304864, - "step": 17600 - }, - { - "epoch": 14.76, - "learning_rate": 7.562084257206209e-05, - "loss": 0.1775, - "step": 17800 - }, - { - "epoch": 14.76, - "eval_loss": 0.14902031421661377, - "eval_runtime": 257.8432, - "eval_samples_per_second": 20.047, - "eval_steps_per_second": 2.509, - "eval_wer": 0.08329371995985844, - "step": 17800 - }, - { - "epoch": 14.92, - "learning_rate": 7.534368070953437e-05, - "loss": 0.1802, - "step": 18000 - }, - { - "epoch": 14.92, - "eval_loss": 0.15108011662960052, - "eval_runtime": 257.3237, - "eval_samples_per_second": 20.088, - "eval_steps_per_second": 2.514, - "eval_wer": 0.08709660381344742, - "step": 18000 - }, - { - "epoch": 15.09, - "learning_rate": 7.50679046563193e-05, - "loss": 0.1829, - "step": 18200 - }, - { - "epoch": 15.09, - "eval_loss": 0.14215655624866486, - "eval_runtime": 258.1845, - "eval_samples_per_second": 20.021, - "eval_steps_per_second": 2.506, - "eval_wer": 0.0859346115248508, - "step": 18200 - }, - { - "epoch": 15.26, - "learning_rate": 7.479074279379158e-05, - "loss": 0.1704, - "step": 18400 - }, - { - "epoch": 15.26, - "eval_loss": 0.1536380648612976, - "eval_runtime": 258.2175, - "eval_samples_per_second": 20.018, - "eval_steps_per_second": 2.506, - "eval_wer": 0.08535361538055247, - "step": 18400 - }, - { - "epoch": 15.42, - "learning_rate": 7.451358093126386e-05, - "loss": 0.1707, - "step": 18600 - }, - { - "epoch": 15.42, - "eval_loss": 0.15412335097789764, - "eval_runtime": 259.6526, - "eval_samples_per_second": 19.907, - "eval_steps_per_second": 2.492, - "eval_wer": 0.08366344477895737, - "step": 18600 - }, - { - "epoch": 15.59, - "learning_rate": 7.423641906873615e-05, - "loss": 0.1716, - "step": 18800 - }, - { - "epoch": 15.59, - "eval_loss": 0.15734080970287323, - "eval_runtime": 256.5213, - "eval_samples_per_second": 20.15, - "eval_steps_per_second": 2.522, - "eval_wer": 0.08419162309195584, - "step": 18800 - }, - { - "epoch": 15.75, - "learning_rate": 7.395925720620843e-05, - "loss": 0.1755, - "step": 19000 - }, - { - "epoch": 15.75, - "eval_loss": 0.1497374176979065, - "eval_runtime": 255.8623, - "eval_samples_per_second": 20.202, - "eval_steps_per_second": 2.529, - "eval_wer": 0.08408598742935615, - "step": 19000 - }, - { - "epoch": 15.92, - "learning_rate": 7.368209534368071e-05, - "loss": 0.1695, - "step": 19200 - }, - { - "epoch": 15.92, - "eval_loss": 0.14581099152565002, - "eval_runtime": 256.4224, - "eval_samples_per_second": 20.158, - "eval_steps_per_second": 2.523, - "eval_wer": 0.08371626261025722, - "step": 19200 - }, - { - "epoch": 16.09, - "learning_rate": 7.340493348115299e-05, - "loss": 0.1761, - "step": 19400 - }, - { - "epoch": 16.09, - "eval_loss": 0.14683474600315094, - "eval_runtime": 271.7581, - "eval_samples_per_second": 19.021, - "eval_steps_per_second": 2.381, - "eval_wer": 0.08545925104315216, - "step": 19400 - }, - { - "epoch": 16.25, - "learning_rate": 7.312777161862528e-05, - "loss": 0.1667, - "step": 19600 - }, - { - "epoch": 16.25, - "eval_loss": 0.1606747955083847, - "eval_runtime": 271.8508, - "eval_samples_per_second": 19.014, - "eval_steps_per_second": 2.38, - "eval_wer": 0.08751914646384619, - "step": 19600 - }, - { - "epoch": 16.42, - "learning_rate": 7.285060975609756e-05, - "loss": 0.1667, - "step": 19800 - }, - { - "epoch": 16.42, - "eval_loss": 0.14115694165229797, - "eval_runtime": 271.6689, - "eval_samples_per_second": 19.027, - "eval_steps_per_second": 2.382, - "eval_wer": 0.08524797971795278, - "step": 19800 - }, - { - "epoch": 16.58, - "learning_rate": 7.257344789356985e-05, - "loss": 0.1653, - "step": 20000 - }, - { - "epoch": 16.58, - "eval_loss": 0.13544563949108124, - "eval_runtime": 271.5302, - "eval_samples_per_second": 19.037, - "eval_steps_per_second": 2.383, - "eval_wer": 0.08477261923625416, - "step": 20000 - }, - { - "epoch": 16.75, - "learning_rate": 7.229628603104214e-05, - "loss": 0.1695, - "step": 20200 - }, - { - "epoch": 16.75, - "eval_loss": 0.1354389786720276, - "eval_runtime": 271.5697, - "eval_samples_per_second": 19.034, - "eval_steps_per_second": 2.382, - "eval_wer": 0.08350499128505784, - "step": 20200 - }, - { - "epoch": 16.91, - "learning_rate": 7.201912416851442e-05, - "loss": 0.171, - "step": 20400 - }, - { - "epoch": 16.91, - "eval_loss": 0.14289897680282593, - "eval_runtime": 258.0663, - "eval_samples_per_second": 20.03, - "eval_steps_per_second": 2.507, - "eval_wer": 0.08435007658585539, - "step": 20400 - }, - { - "epoch": 17.08, - "learning_rate": 7.17419623059867e-05, - "loss": 0.167, - "step": 20600 - }, - { - "epoch": 17.08, - "eval_loss": 0.13994231820106506, - "eval_runtime": 256.5044, - "eval_samples_per_second": 20.152, - "eval_steps_per_second": 2.522, - "eval_wer": 0.08207890983996197, - "step": 20600 - }, - { - "epoch": 17.25, - "learning_rate": 7.146480044345898e-05, - "loss": 0.1595, - "step": 20800 - }, - { - "epoch": 17.25, - "eval_loss": 0.16428013145923615, - "eval_runtime": 256.5622, - "eval_samples_per_second": 20.147, - "eval_steps_per_second": 2.522, - "eval_wer": 0.08192045634606243, - "step": 20800 - }, - { - "epoch": 17.41, - "learning_rate": 7.118763858093127e-05, - "loss": 0.1565, - "step": 21000 - }, - { - "epoch": 17.41, - "eval_loss": 0.1530633270740509, - "eval_runtime": 258.23, - "eval_samples_per_second": 20.017, - "eval_steps_per_second": 2.506, - "eval_wer": 0.08456134791105477, - "step": 21000 - }, - { - "epoch": 17.58, - "learning_rate": 7.091047671840355e-05, - "loss": 0.1589, - "step": 21200 - }, - { - "epoch": 17.58, - "eval_loss": 0.1481485366821289, - "eval_runtime": 257.1667, - "eval_samples_per_second": 20.1, - "eval_steps_per_second": 2.516, - "eval_wer": 0.08102255321396504, - "step": 21200 - }, - { - "epoch": 17.74, - "learning_rate": 7.063331485587583e-05, - "loss": 0.1602, - "step": 21400 - }, - { - "epoch": 17.74, - "eval_loss": 0.16114427149295807, - "eval_runtime": 257.6644, - "eval_samples_per_second": 20.061, - "eval_steps_per_second": 2.511, - "eval_wer": 0.07838166164897269, - "step": 21400 - }, - { - "epoch": 17.91, - "learning_rate": 7.035615299334812e-05, - "loss": 0.1622, - "step": 21600 - }, - { - "epoch": 17.91, - "eval_loss": 0.14328357577323914, - "eval_runtime": 258.6193, - "eval_samples_per_second": 19.987, - "eval_steps_per_second": 2.502, - "eval_wer": 0.0832409021285586, - "step": 21600 - }, - { - "epoch": 18.08, - "learning_rate": 7.00789911308204e-05, - "loss": 0.1629, - "step": 21800 - }, - { - "epoch": 18.08, - "eval_loss": 0.14952301979064941, - "eval_runtime": 253.7518, - "eval_samples_per_second": 20.37, - "eval_steps_per_second": 2.55, - "eval_wer": 0.08202609200866212, - "step": 21800 - }, - { - "epoch": 18.24, - "learning_rate": 6.980182926829268e-05, - "loss": 0.1542, - "step": 22000 - }, - { - "epoch": 18.24, - "eval_loss": 0.1603306531906128, - "eval_runtime": 252.9767, - "eval_samples_per_second": 20.433, - "eval_steps_per_second": 2.558, - "eval_wer": 0.07864575080547193, - "step": 22000 - }, - { - "epoch": 18.41, - "learning_rate": 6.952466740576497e-05, - "loss": 0.1577, - "step": 22200 - }, - { - "epoch": 18.41, - "eval_loss": 0.15311960875988007, - "eval_runtime": 253.1091, - "eval_samples_per_second": 20.422, - "eval_steps_per_second": 2.556, - "eval_wer": 0.08123382453916442, - "step": 22200 - }, - { - "epoch": 18.57, - "learning_rate": 6.924750554323726e-05, - "loss": 0.1592, - "step": 22400 - }, - { - "epoch": 18.57, - "eval_loss": 0.15086284279823303, - "eval_runtime": 257.495, - "eval_samples_per_second": 20.074, - "eval_steps_per_second": 2.513, - "eval_wer": 0.08170918502086304, - "step": 22400 - }, - { - "epoch": 18.74, - "learning_rate": 6.897172949002217e-05, - "loss": 0.1608, - "step": 22600 - }, - { - "epoch": 18.74, - "eval_loss": 0.14557667076587677, - "eval_runtime": 255.6435, - "eval_samples_per_second": 20.22, - "eval_steps_per_second": 2.531, - "eval_wer": 0.0799661965879681, - "step": 22600 - }, - { - "epoch": 18.9, - "learning_rate": 6.869456762749445e-05, - "loss": 0.1573, - "step": 22800 - }, - { - "epoch": 18.9, - "eval_loss": 0.15521085262298584, - "eval_runtime": 254.7778, - "eval_samples_per_second": 20.288, - "eval_steps_per_second": 2.539, - "eval_wer": 0.08081128188876564, - "step": 22800 - }, - { - "epoch": 19.07, - "learning_rate": 6.841740576496674e-05, - "loss": 0.1559, - "step": 23000 - }, - { - "epoch": 19.07, - "eval_loss": 0.1598125696182251, - "eval_runtime": 255.4991, - "eval_samples_per_second": 20.231, - "eval_steps_per_second": 2.532, - "eval_wer": 0.08123382453916442, - "step": 23000 - }, - { - "epoch": 19.24, - "learning_rate": 6.814024390243903e-05, - "loss": 0.1518, - "step": 23200 - }, - { - "epoch": 19.24, - "eval_loss": 0.15756739675998688, - "eval_runtime": 255.2152, - "eval_samples_per_second": 20.253, - "eval_steps_per_second": 2.535, - "eval_wer": 0.08229018116516136, - "step": 23200 - }, - { - "epoch": 19.4, - "learning_rate": 6.78630820399113e-05, - "loss": 0.1583, - "step": 23400 - }, - { - "epoch": 19.4, - "eval_loss": 0.1478932946920395, - "eval_runtime": 254.8478, - "eval_samples_per_second": 20.283, - "eval_steps_per_second": 2.539, - "eval_wer": 0.0790682934558707, - "step": 23400 - }, - { - "epoch": 19.57, - "learning_rate": 6.75859201773836e-05, - "loss": 0.1521, - "step": 23600 - }, - { - "epoch": 19.57, - "eval_loss": 0.15390987694263458, - "eval_runtime": 255.3412, - "eval_samples_per_second": 20.244, - "eval_steps_per_second": 2.534, - "eval_wer": 0.08144509586436381, - "step": 23600 - }, - { - "epoch": 19.73, - "learning_rate": 6.730875831485588e-05, - "loss": 0.1504, - "step": 23800 - }, - { - "epoch": 19.73, - "eval_loss": 0.15799568593502045, - "eval_runtime": 255.2877, - "eval_samples_per_second": 20.248, - "eval_steps_per_second": 2.534, - "eval_wer": 0.07980774309406856, - "step": 23800 - }, - { - "epoch": 19.9, - "learning_rate": 6.703159645232816e-05, - "loss": 0.1591, - "step": 24000 - }, - { - "epoch": 19.9, - "eval_loss": 0.14647792279720306, - "eval_runtime": 255.0201, - "eval_samples_per_second": 20.269, - "eval_steps_per_second": 2.537, - "eval_wer": 0.07700839803517667, - "step": 24000 - }, - { - "epoch": 20.07, - "learning_rate": 6.675443458980046e-05, - "loss": 0.1535, - "step": 24200 - }, - { - "epoch": 20.07, - "eval_loss": 0.1589883714914322, - "eval_runtime": 255.7034, - "eval_samples_per_second": 20.215, - "eval_steps_per_second": 2.53, - "eval_wer": 0.07669149104737759, - "step": 24200 - }, - { - "epoch": 20.23, - "learning_rate": 6.647727272727274e-05, - "loss": 0.146, - "step": 24400 - }, - { - "epoch": 20.23, - "eval_loss": 0.14599309861660004, - "eval_runtime": 254.7694, - "eval_samples_per_second": 20.289, - "eval_steps_per_second": 2.54, - "eval_wer": 0.07875138646807162, - "step": 24400 - }, - { - "epoch": 20.4, - "learning_rate": 6.6200110864745e-05, - "loss": 0.1492, - "step": 24600 - }, - { - "epoch": 20.4, - "eval_loss": 0.14993605017662048, - "eval_runtime": 254.9593, - "eval_samples_per_second": 20.274, - "eval_steps_per_second": 2.538, - "eval_wer": 0.07706121586647652, - "step": 24600 - }, - { - "epoch": 20.56, - "learning_rate": 6.592294900221729e-05, - "loss": 0.1508, - "step": 24800 - }, - { - "epoch": 20.56, - "eval_loss": 0.1447875052690506, - "eval_runtime": 255.7358, - "eval_samples_per_second": 20.212, - "eval_steps_per_second": 2.53, - "eval_wer": 0.07975492526276871, - "step": 24800 - }, - { - "epoch": 20.73, - "learning_rate": 6.564578713968958e-05, - "loss": 0.1525, - "step": 25000 - }, - { - "epoch": 20.73, - "eval_loss": 0.14607439935207367, - "eval_runtime": 255.9294, - "eval_samples_per_second": 20.197, - "eval_steps_per_second": 2.528, - "eval_wer": 0.07838166164897269, - "step": 25000 - }, - { - "epoch": 20.89, - "learning_rate": 6.53700110864745e-05, - "loss": 0.1503, - "step": 25200 - }, - { - "epoch": 20.89, - "eval_loss": 0.1411682814359665, - "eval_runtime": 255.8366, - "eval_samples_per_second": 20.204, - "eval_steps_per_second": 2.529, - "eval_wer": 0.07970210743146887, - "step": 25200 - }, - { - "epoch": 21.06, - "learning_rate": 6.509284922394679e-05, - "loss": 0.1497, - "step": 25400 - }, - { - "epoch": 21.06, - "eval_loss": 0.14832888543605804, - "eval_runtime": 255.5517, - "eval_samples_per_second": 20.227, - "eval_steps_per_second": 2.532, - "eval_wer": 0.07943801827496963, - "step": 25400 - }, - { - "epoch": 21.23, - "learning_rate": 6.481568736141908e-05, - "loss": 0.1444, - "step": 25600 - }, - { - "epoch": 21.23, - "eval_loss": 0.16129909455776215, - "eval_runtime": 255.967, - "eval_samples_per_second": 20.194, - "eval_steps_per_second": 2.528, - "eval_wer": 0.07864575080547193, - "step": 25600 - }, - { - "epoch": 21.39, - "learning_rate": 6.453852549889136e-05, - "loss": 0.1438, - "step": 25800 - }, - { - "epoch": 21.39, - "eval_loss": 0.1477702409029007, - "eval_runtime": 255.4815, - "eval_samples_per_second": 20.232, - "eval_steps_per_second": 2.532, - "eval_wer": 0.07890983996197116, - "step": 25800 - }, - { - "epoch": 21.56, - "learning_rate": 6.426136363636364e-05, - "loss": 0.1439, - "step": 26000 - }, - { - "epoch": 21.56, - "eval_loss": 0.15728013217449188, - "eval_runtime": 255.4616, - "eval_samples_per_second": 20.234, - "eval_steps_per_second": 2.533, - "eval_wer": 0.07774784767337453, - "step": 26000 - }, - { - "epoch": 21.72, - "learning_rate": 6.398420177383592e-05, - "loss": 0.1455, - "step": 26200 + "epoch": 1.3, + "learning_rate": 0.0001, + "loss": 0.0529, + "step": 100 }, { - "epoch": 21.72, - "eval_loss": 0.14868445694446564, - "eval_runtime": 255.9049, - "eval_samples_per_second": 20.199, - "eval_steps_per_second": 2.528, - "eval_wer": 0.0790682934558707, - "step": 26200 + "epoch": 1.3, + "eval_loss": 0.3332812786102295, + "eval_runtime": 188.2511, + "eval_samples_per_second": 16.558, + "eval_steps_per_second": 2.072, + "eval_wer": 0.2371088585279859, + "step": 100 }, { - "epoch": 21.89, - "learning_rate": 6.37070399113082e-05, - "loss": 0.1395, - "step": 26400 + "epoch": 2.59, + "learning_rate": 9.98699609882965e-05, + "loss": 0.0471, + "step": 200 }, { - "epoch": 21.89, - "eval_loss": 0.16429665684700012, - "eval_runtime": 262.3659, - "eval_samples_per_second": 19.701, - "eval_steps_per_second": 2.466, - "eval_wer": 0.07600485924047959, - "step": 26400 + "epoch": 2.59, + "eval_loss": 0.35051167011260986, + "eval_runtime": 136.2299, + "eval_samples_per_second": 22.88, + "eval_steps_per_second": 2.863, + "eval_wer": 0.23723477932380532, + "step": 200 }, { - "epoch": 22.06, - "learning_rate": 6.342987804878049e-05, - "loss": 0.1428, - "step": 26600 + "epoch": 3.89, + "learning_rate": 9.973992197659299e-05, + "loss": 0.0463, + "step": 300 }, { - "epoch": 22.06, - "eval_loss": 0.1581258475780487, - "eval_runtime": 255.8292, - "eval_samples_per_second": 20.205, - "eval_steps_per_second": 2.529, - "eval_wer": 0.0781703903237733, - "step": 26600 + "epoch": 3.89, + "eval_loss": 0.3505023121833801, + "eval_runtime": 142.4796, + "eval_samples_per_second": 21.877, + "eval_steps_per_second": 2.737, + "eval_wer": 0.23931247245482593, + "step": 300 }, { - "epoch": 22.22, - "learning_rate": 6.315271618625277e-05, - "loss": 0.1342, - "step": 26800 + "epoch": 5.19, + "learning_rate": 9.960988296488946e-05, + "loss": 0.0461, + "step": 400 }, { - "epoch": 22.22, - "eval_loss": 0.16277597844600677, - "eval_runtime": 259.5604, - "eval_samples_per_second": 19.914, - "eval_steps_per_second": 2.493, - "eval_wer": 0.0773781228542756, - "step": 26800 + "epoch": 5.19, + "eval_loss": 0.4004528224468231, + "eval_runtime": 143.9556, + "eval_samples_per_second": 21.653, + "eval_steps_per_second": 2.709, + "eval_wer": 0.2405716804130202, + "step": 400 }, { - "epoch": 22.39, - "learning_rate": 6.28769401330377e-05, - "loss": 0.1401, - "step": 27000 + "epoch": 6.49, + "learning_rate": 9.947984395318596e-05, + "loss": 0.0442, + "step": 500 }, { - "epoch": 22.39, - "eval_loss": 0.1531515270471573, - "eval_runtime": 260.5139, - "eval_samples_per_second": 19.842, - "eval_steps_per_second": 2.484, - "eval_wer": 0.07859293297417208, - "step": 27000 + "epoch": 6.49, + "eval_loss": 0.4172374904155731, + "eval_runtime": 151.5028, + "eval_samples_per_second": 20.574, + "eval_steps_per_second": 2.574, + "eval_wer": 0.24863061134546371, + "step": 500 }, { - "epoch": 22.55, - "learning_rate": 6.259977827050998e-05, - "loss": 0.1401, - "step": 27200 + "epoch": 7.79, + "learning_rate": 9.934980494148245e-05, + "loss": 0.0431, + "step": 600 }, { - "epoch": 22.55, - "eval_loss": 0.15395356714725494, - "eval_runtime": 257.8197, + "epoch": 7.79, + "eval_loss": 0.3723874092102051, + "eval_runtime": 155.4666, "eval_samples_per_second": 20.049, - "eval_steps_per_second": 2.51, - "eval_wer": 0.07727248719167591, - "step": 27200 - }, - { - "epoch": 22.72, - "learning_rate": 6.232261640798226e-05, - "loss": 0.1397, - "step": 27400 - }, - { - "epoch": 22.72, - "eval_loss": 0.1657487452030182, - "eval_runtime": 258.5849, - "eval_samples_per_second": 19.99, - "eval_steps_per_second": 2.502, - "eval_wer": 0.07774784767337453, - "step": 27400 - }, - { - "epoch": 22.89, - "learning_rate": 6.204545454545455e-05, - "loss": 0.1396, - "step": 27600 - }, - { - "epoch": 22.89, - "eval_loss": 0.1595001220703125, - "eval_runtime": 258.8028, - "eval_samples_per_second": 19.973, - "eval_steps_per_second": 2.5, - "eval_wer": 0.07695558020387683, - "step": 27600 - }, - { - "epoch": 23.05, - "learning_rate": 6.176829268292683e-05, - "loss": 0.1425, - "step": 27800 - }, - { - "epoch": 23.05, - "eval_loss": 0.14454737305641174, - "eval_runtime": 257.5774, - "eval_samples_per_second": 20.068, - "eval_steps_per_second": 2.512, - "eval_wer": 0.07695558020387683, - "step": 27800 - }, - { - "epoch": 23.22, - "learning_rate": 6.149113082039911e-05, - "loss": 0.1343, - "step": 28000 - }, - { - "epoch": 23.22, - "eval_loss": 0.15258438885211945, - "eval_runtime": 257.4198, - "eval_samples_per_second": 20.08, - "eval_steps_per_second": 2.513, - "eval_wer": 0.07700839803517667, - "step": 28000 - }, - { - "epoch": 23.38, - "learning_rate": 6.12139689578714e-05, - "loss": 0.1388, - "step": 28200 - }, - { - "epoch": 23.38, - "eval_loss": 0.15189868211746216, - "eval_runtime": 261.1531, - "eval_samples_per_second": 19.793, - "eval_steps_per_second": 2.477, - "eval_wer": 0.07447314213278403, - "step": 28200 - }, - { - "epoch": 23.55, - "learning_rate": 6.0936807095343684e-05, - "loss": 0.1364, - "step": 28400 - }, - { - "epoch": 23.55, - "eval_loss": 0.15030239522457123, - "eval_runtime": 259.6413, - "eval_samples_per_second": 19.908, - "eval_steps_per_second": 2.492, - "eval_wer": 0.07415623514498494, - "step": 28400 - }, - { - "epoch": 23.71, - "learning_rate": 6.0659645232815965e-05, - "loss": 0.1444, - "step": 28600 - }, - { - "epoch": 23.71, - "eval_loss": 0.16646933555603027, - "eval_runtime": 260.1679, - "eval_samples_per_second": 19.868, - "eval_steps_per_second": 2.487, - "eval_wer": 0.07875138646807162, - "step": 28600 - }, - { - "epoch": 23.88, - "learning_rate": 6.038248337028826e-05, - "loss": 0.1361, - "step": 28800 - }, - { - "epoch": 23.88, - "eval_loss": 0.15915772318840027, - "eval_runtime": 259.5414, - "eval_samples_per_second": 19.916, - "eval_steps_per_second": 2.493, - "eval_wer": 0.0757935879152802, - "step": 28800 - }, - { - "epoch": 24.05, - "learning_rate": 6.0105321507760534e-05, - "loss": 0.1398, - "step": 29000 - }, - { - "epoch": 24.05, - "eval_loss": 0.1606004387140274, - "eval_runtime": 259.8476, - "eval_samples_per_second": 19.892, - "eval_steps_per_second": 2.49, - "eval_wer": 0.07632176622827867, - "step": 29000 - }, - { - "epoch": 24.21, - "learning_rate": 5.9828159645232815e-05, - "loss": 0.1322, - "step": 29200 - }, - { - "epoch": 24.21, - "eval_loss": 0.1486821323633194, - "eval_runtime": 259.5122, - "eval_samples_per_second": 19.918, - "eval_steps_per_second": 2.493, - "eval_wer": 0.07848729731157239, - "step": 29200 - }, - { - "epoch": 24.38, - "learning_rate": 5.9550997782705096e-05, - "loss": 0.1309, - "step": 29400 - }, - { - "epoch": 24.38, - "eval_loss": 0.16220000386238098, - "eval_runtime": 259.2803, - "eval_samples_per_second": 19.936, - "eval_steps_per_second": 2.495, - "eval_wer": 0.07626894839697881, - "step": 29400 - }, - { - "epoch": 24.54, - "learning_rate": 5.927383592017739e-05, - "loss": 0.1351, - "step": 29600 - }, - { - "epoch": 24.54, - "eval_loss": 0.17341530323028564, - "eval_runtime": 262.8143, - "eval_samples_per_second": 19.668, - "eval_steps_per_second": 2.462, - "eval_wer": 0.07795911899857391, - "step": 29600 - }, - { - "epoch": 24.71, - "learning_rate": 5.899667405764967e-05, - "loss": 0.1298, - "step": 29800 - }, - { - "epoch": 24.71, - "eval_loss": 0.1510027050971985, - "eval_runtime": 263.1767, - "eval_samples_per_second": 19.641, - "eval_steps_per_second": 2.458, - "eval_wer": 0.07563513442138066, - "step": 29800 - }, - { - "epoch": 24.88, - "learning_rate": 5.871951219512195e-05, - "loss": 0.1369, - "step": 30000 - }, - { - "epoch": 24.88, - "eval_loss": 0.13624520599842072, - "eval_runtime": 263.8718, - "eval_samples_per_second": 19.589, - "eval_steps_per_second": 2.452, - "eval_wer": 0.07626894839697881, - "step": 30000 - }, - { - "epoch": 25.04, - "learning_rate": 5.844235033259424e-05, - "loss": 0.1341, - "step": 30200 - }, - { - "epoch": 25.04, - "eval_loss": 0.15082810819149017, - "eval_runtime": 261.0919, - "eval_samples_per_second": 19.798, - "eval_steps_per_second": 2.478, - "eval_wer": 0.07854011514287224, - "step": 30200 + "eval_steps_per_second": 2.509, + "eval_wer": 0.24006799722974248, + "step": 600 }, { - "epoch": 25.21, - "learning_rate": 5.816518847006652e-05, - "loss": 0.1249, - "step": 30400 + "epoch": 9.09, + "learning_rate": 9.921976592977894e-05, + "loss": 0.0413, + "step": 700 }, { - "epoch": 25.21, - "eval_loss": 0.16026806831359863, - "eval_runtime": 260.2227, - "eval_samples_per_second": 19.864, - "eval_steps_per_second": 2.486, - "eval_wer": 0.07558231659008081, - "step": 30400 + "epoch": 9.09, + "eval_loss": 0.38365304470062256, + "eval_runtime": 157.1121, + "eval_samples_per_second": 19.839, + "eval_steps_per_second": 2.482, + "eval_wer": 0.24466410627715168, + "step": 700 }, { - "epoch": 25.37, - "learning_rate": 5.78880266075388e-05, - "loss": 0.129, - "step": 30600 + "epoch": 10.39, + "learning_rate": 9.908972691807543e-05, + "loss": 0.0417, + "step": 800 }, { - "epoch": 25.37, - "eval_loss": 0.16147717833518982, - "eval_runtime": 258.8644, - "eval_samples_per_second": 19.968, - "eval_steps_per_second": 2.499, - "eval_wer": 0.07457877779538372, - "step": 30600 + "epoch": 10.39, + "eval_loss": 0.37991076707839966, + "eval_runtime": 160.431, + "eval_samples_per_second": 19.429, + "eval_steps_per_second": 2.431, + "eval_wer": 0.23786438330290247, + "step": 800 }, { - "epoch": 25.54, - "learning_rate": 5.7610864745011084e-05, - "loss": 0.1336, - "step": 30800 + "epoch": 11.68, + "learning_rate": 9.89596879063719e-05, + "loss": 0.0423, + "step": 900 }, { - "epoch": 25.54, - "eval_loss": 0.15992993116378784, - "eval_runtime": 258.9913, - "eval_samples_per_second": 19.958, - "eval_steps_per_second": 2.498, - "eval_wer": 0.07505413827708235, - "step": 30800 + "epoch": 11.68, + "eval_loss": 0.41009148955345154, + "eval_runtime": 161.1546, + "eval_samples_per_second": 19.342, + "eval_steps_per_second": 2.42, + "eval_wer": 0.24485298747088083, + "step": 900 }, { - "epoch": 25.7, - "learning_rate": 5.733370288248338e-05, - "loss": 0.127, - "step": 31000 + "epoch": 12.98, + "learning_rate": 9.88296488946684e-05, + "loss": 0.0425, + "step": 1000 }, { - "epoch": 25.7, - "eval_loss": 0.17056865990161896, - "eval_runtime": 259.4613, - "eval_samples_per_second": 19.922, - "eval_steps_per_second": 2.494, - "eval_wer": 0.07484286695188296, - "step": 31000 + "epoch": 12.98, + "eval_loss": 0.38417309522628784, + "eval_runtime": 162.4688, + "eval_samples_per_second": 19.185, + "eval_steps_per_second": 2.4, + "eval_wer": 0.23931247245482593, + "step": 1000 }, { - "epoch": 25.87, - "learning_rate": 5.705654101995565e-05, - "loss": 0.126, - "step": 31200 + "epoch": 14.28, + "learning_rate": 9.869960988296489e-05, + "loss": 0.0413, + "step": 1100 }, { - "epoch": 25.87, - "eval_loss": 0.1541663110256195, - "eval_runtime": 258.8605, - "eval_samples_per_second": 19.968, - "eval_steps_per_second": 2.499, - "eval_wer": 0.07442032430148418, - "step": 31200 + "epoch": 14.28, + "eval_loss": 0.37902718782424927, + "eval_runtime": 164.4062, + "eval_samples_per_second": 18.959, + "eval_steps_per_second": 2.372, + "eval_wer": 0.24491594786879053, + "step": 1100 }, { - "epoch": 26.04, - "learning_rate": 5.6780764966740575e-05, - "loss": 0.124, - "step": 31400 + "epoch": 15.58, + "learning_rate": 9.856957087126138e-05, + "loss": 0.0416, + "step": 1200 }, { - "epoch": 26.04, - "eval_loss": 0.16358500719070435, - "eval_runtime": 258.6242, - "eval_samples_per_second": 19.987, - "eval_steps_per_second": 2.502, - "eval_wer": 0.07531822743358157, - "step": 31400 + "epoch": 15.58, + "eval_loss": 0.38784804940223694, + "eval_runtime": 163.9531, + "eval_samples_per_second": 19.012, + "eval_steps_per_second": 2.379, + "eval_wer": 0.23931247245482593, + "step": 1200 }, { - "epoch": 26.2, - "learning_rate": 5.650360310421286e-05, - "loss": 0.1268, - "step": 31600 + "epoch": 16.88, + "learning_rate": 9.844083224967491e-05, + "loss": 0.0436, + "step": 1300 }, { - "epoch": 26.2, - "eval_loss": 0.16622310876846313, - "eval_runtime": 258.7306, - "eval_samples_per_second": 19.978, - "eval_steps_per_second": 2.501, - "eval_wer": 0.07220197538689062, - "step": 31600 + "epoch": 16.88, + "eval_loss": 0.36406952142715454, + "eval_runtime": 162.4063, + "eval_samples_per_second": 19.193, + "eval_steps_per_second": 2.401, + "eval_wer": 0.23817918529245105, + "step": 1300 }, { - "epoch": 26.37, - "learning_rate": 5.6227827050997785e-05, - "loss": 0.1286, - "step": 31800 + "epoch": 18.18, + "learning_rate": 9.83107932379714e-05, + "loss": 0.0424, + "step": 1400 }, { - "epoch": 26.37, - "eval_loss": 0.16970515251159668, - "eval_runtime": 258.9239, - "eval_samples_per_second": 19.963, - "eval_steps_per_second": 2.499, - "eval_wer": 0.07257170020598955, - "step": 31800 + "epoch": 18.18, + "eval_loss": 0.3773825764656067, + "eval_runtime": 161.8281, + "eval_samples_per_second": 19.261, + "eval_steps_per_second": 2.41, + "eval_wer": 0.2359126109677013, + "step": 1400 }, { - "epoch": 26.53, - "learning_rate": 5.5950665188470066e-05, - "loss": 0.1299, - "step": 32000 + "epoch": 19.48, + "learning_rate": 9.818075422626789e-05, + "loss": 0.0379, + "step": 1500 }, { - "epoch": 26.53, - "eval_loss": 0.17085173726081848, - "eval_runtime": 259.6854, - "eval_samples_per_second": 19.905, - "eval_steps_per_second": 2.491, - "eval_wer": 0.07167379707389214, - "step": 32000 + "epoch": 19.48, + "eval_loss": 0.39104992151260376, + "eval_runtime": 153.8281, + "eval_samples_per_second": 20.263, + "eval_steps_per_second": 2.535, + "eval_wer": 0.23396083863250017, + "step": 1500 }, { - "epoch": 26.7, - "learning_rate": 5.5673503325942354e-05, - "loss": 0.1303, - "step": 32200 + "epoch": 20.77, + "learning_rate": 9.805071521456437e-05, + "loss": 0.0401, + "step": 1600 }, { - "epoch": 26.7, - "eval_loss": 0.16575023531913757, - "eval_runtime": 259.4515, - "eval_samples_per_second": 19.923, - "eval_steps_per_second": 2.494, - "eval_wer": 0.07352242116938679, - "step": 32200 + "epoch": 20.77, + "eval_loss": 0.4012731611728668, + "eval_runtime": 166.1564, + "eval_samples_per_second": 18.759, + "eval_steps_per_second": 2.347, + "eval_wer": 0.23786438330290247, + "step": 1600 }, { - "epoch": 26.87, - "learning_rate": 5.5396341463414635e-05, - "loss": 0.1246, - "step": 32400 + "epoch": 22.08, + "learning_rate": 9.792067620286086e-05, + "loss": 0.0397, + "step": 1700 }, { - "epoch": 26.87, - "eval_loss": 0.16010864078998566, - "eval_runtime": 259.7317, - "eval_samples_per_second": 19.901, - "eval_steps_per_second": 2.491, - "eval_wer": 0.07204352189299107, - "step": 32400 + "epoch": 22.08, + "eval_loss": 0.3917081952095032, + "eval_runtime": 151.5157, + "eval_samples_per_second": 20.572, + "eval_steps_per_second": 2.574, + "eval_wer": 0.23981615563810363, + "step": 1700 }, { - "epoch": 27.03, - "learning_rate": 5.5119179600886916e-05, - "loss": 0.1234, - "step": 32600 + "epoch": 23.37, + "learning_rate": 9.779063719115735e-05, + "loss": 0.0399, + "step": 1800 }, { - "epoch": 27.03, - "eval_loss": 0.1471298187971115, - "eval_runtime": 259.2276, - "eval_samples_per_second": 19.94, - "eval_steps_per_second": 2.496, - "eval_wer": 0.07214915755559077, - "step": 32600 + "epoch": 23.37, + "eval_loss": 0.41352856159210205, + "eval_runtime": 169.9898, + "eval_samples_per_second": 18.336, + "eval_steps_per_second": 2.294, + "eval_wer": 0.24151608638166594, + "step": 1800 }, { - "epoch": 27.2, - "learning_rate": 5.484201773835921e-05, - "loss": 0.1179, - "step": 32800 + "epoch": 24.67, + "learning_rate": 9.766059817945384e-05, + "loss": 0.0407, + "step": 1900 }, { - "epoch": 27.2, - "eval_loss": 0.16308201849460602, - "eval_runtime": 259.2656, - "eval_samples_per_second": 19.937, - "eval_steps_per_second": 2.496, - "eval_wer": 0.07114561876089368, - "step": 32800 + "epoch": 24.67, + "eval_loss": 0.3818851113319397, + "eval_runtime": 176.1576, + "eval_samples_per_second": 17.694, + "eval_steps_per_second": 2.214, + "eval_wer": 0.23717181892589562, + "step": 1900 }, { - "epoch": 27.36, - "learning_rate": 5.456485587583149e-05, - "loss": 0.1218, - "step": 33000 + "epoch": 25.97, + "learning_rate": 9.753055916775033e-05, + "loss": 0.0392, + "step": 2000 }, { - "epoch": 27.36, - "eval_loss": 0.1502005010843277, - "eval_runtime": 259.8271, - "eval_samples_per_second": 19.894, - "eval_steps_per_second": 2.49, - "eval_wer": 0.07199070406169122, - "step": 33000 + "epoch": 25.97, + "eval_loss": 0.3882431983947754, + "eval_runtime": 167.0577, + "eval_samples_per_second": 18.658, + "eval_steps_per_second": 2.335, + "eval_wer": 0.23786438330290247, + "step": 2000 }, { - "epoch": 27.53, - "learning_rate": 5.4287694013303766e-05, - "loss": 0.1249, - "step": 33200 + "epoch": 27.27, + "learning_rate": 9.740052015604681e-05, + "loss": 0.0381, + "step": 2100 }, { - "epoch": 27.53, - "eval_loss": 0.15461181104183197, - "eval_runtime": 271.8472, - "eval_samples_per_second": 19.014, - "eval_steps_per_second": 2.38, - "eval_wer": 0.07214915755559077, - "step": 33200 + "epoch": 27.27, + "eval_loss": 0.3893887996673584, + "eval_runtime": 171.6954, + "eval_samples_per_second": 18.154, + "eval_steps_per_second": 2.271, + "eval_wer": 0.23943839325064534, + "step": 2100 }, { - "epoch": 27.69, - "learning_rate": 5.401053215077606e-05, - "loss": 0.1199, - "step": 33400 + "epoch": 28.57, + "learning_rate": 9.72704811443433e-05, + "loss": 0.0401, + "step": 2200 }, { - "epoch": 27.69, - "eval_loss": 0.14347407221794128, - "eval_runtime": 271.4782, - "eval_samples_per_second": 19.04, - "eval_steps_per_second": 2.383, - "eval_wer": 0.07304706068768817, - "step": 33400 + "epoch": 28.57, + "eval_loss": 0.3673301041126251, + "eval_runtime": 174.7303, + "eval_samples_per_second": 17.839, + "eval_steps_per_second": 2.232, + "eval_wer": 0.2357866901718819, + "step": 2200 }, { - "epoch": 27.86, - "learning_rate": 5.373337028824834e-05, - "loss": 0.1199, - "step": 33600 + "epoch": 29.86, + "learning_rate": 9.71404421326398e-05, + "loss": 0.0391, + "step": 2300 }, { - "epoch": 27.86, - "eval_loss": 0.16159255802631378, - "eval_runtime": 272.7821, - "eval_samples_per_second": 18.949, - "eval_steps_per_second": 2.372, - "eval_wer": 0.07262451803728939, - "step": 33600 + "epoch": 29.86, + "eval_loss": 0.3780101239681244, + "eval_runtime": 157.4375, + "eval_samples_per_second": 19.798, + "eval_steps_per_second": 2.477, + "eval_wer": 0.2354089277844236, + "step": 2300 }, { - "epoch": 28.03, - "learning_rate": 5.345620842572062e-05, - "loss": 0.1213, - "step": 33800 + "epoch": 31.17, + "learning_rate": 9.701040312093628e-05, + "loss": 0.0377, + "step": 2400 }, { - "epoch": 28.03, - "eval_loss": 0.1633623242378235, - "eval_runtime": 267.8584, - "eval_samples_per_second": 19.298, - "eval_steps_per_second": 2.415, - "eval_wer": 0.07188506839909153, - "step": 33800 + "epoch": 31.17, + "eval_loss": 0.3910522758960724, + "eval_runtime": 159.5625, + "eval_samples_per_second": 19.535, + "eval_steps_per_second": 2.444, + "eval_wer": 0.23654221494679847, + "step": 2400 }, { - "epoch": 28.19, - "learning_rate": 5.3179046563192904e-05, - "loss": 0.1166, - "step": 34000 + "epoch": 32.46, + "learning_rate": 9.688036410923278e-05, + "loss": 0.0378, + "step": 2500 }, { - "epoch": 28.19, - "eval_loss": 0.15763157606124878, - "eval_runtime": 258.2022, - "eval_samples_per_second": 20.019, - "eval_steps_per_second": 2.506, - "eval_wer": 0.07278297153118893, - "step": 34000 + "epoch": 32.46, + "eval_loss": 0.3806402087211609, + "eval_runtime": 170.7978, + "eval_samples_per_second": 18.25, + "eval_steps_per_second": 2.283, + "eval_wer": 0.23918655165900649, + "step": 2500 }, { - "epoch": 28.36, - "learning_rate": 5.290188470066519e-05, - "loss": 0.1123, - "step": 34200 + "epoch": 33.76, + "learning_rate": 9.675032509752925e-05, + "loss": 0.0347, + "step": 2600 }, { - "epoch": 28.36, - "eval_loss": 0.16512486338615417, - "eval_runtime": 256.1777, - "eval_samples_per_second": 20.177, - "eval_steps_per_second": 2.526, - "eval_wer": 0.07500132044578249, - "step": 34200 + "epoch": 33.76, + "eval_loss": 0.3844529390335083, + "eval_runtime": 160.3906, + "eval_samples_per_second": 19.434, + "eval_steps_per_second": 2.432, + "eval_wer": 0.23515708619278475, + "step": 2600 }, { - "epoch": 28.52, - "learning_rate": 5.262472283813747e-05, - "loss": 0.121, - "step": 34400 + "epoch": 35.06, + "learning_rate": 9.662028608582574e-05, + "loss": 0.0369, + "step": 2700 }, { - "epoch": 28.52, - "eval_loss": 0.15457598865032196, - "eval_runtime": 278.1382, - "eval_samples_per_second": 18.584, + "epoch": 35.06, + "eval_loss": 0.39440667629241943, + "eval_runtime": 167.7032, + "eval_samples_per_second": 18.586, "eval_steps_per_second": 2.326, - "eval_wer": 0.07452595996408387, - "step": 34400 - }, - { - "epoch": 28.69, - "learning_rate": 5.2347560975609754e-05, - "loss": 0.1197, - "step": 34600 - }, - { - "epoch": 28.69, - "eval_loss": 0.1601417064666748, - "eval_runtime": 278.0073, - "eval_samples_per_second": 18.593, - "eval_steps_per_second": 2.327, - "eval_wer": 0.07315269635028786, - "step": 34600 + "eval_wer": 0.23931247245482593, + "step": 2700 }, { - "epoch": 28.86, - "learning_rate": 5.207039911308205e-05, - "loss": 0.1168, - "step": 34800 + "epoch": 36.36, + "learning_rate": 9.649024707412224e-05, + "loss": 0.0375, + "step": 2800 }, { - "epoch": 28.86, - "eval_loss": 0.16127680242061615, - "eval_runtime": 278.2559, - "eval_samples_per_second": 18.576, - "eval_steps_per_second": 2.325, - "eval_wer": 0.07468441345798342, - "step": 34800 + "epoch": 36.36, + "eval_loss": 0.37219446897506714, + "eval_runtime": 165.2969, + "eval_samples_per_second": 18.857, + "eval_steps_per_second": 2.359, + "eval_wer": 0.23012025436000755, + "step": 2800 }, { - "epoch": 29.02, - "learning_rate": 5.179323725055433e-05, - "loss": 0.1205, - "step": 35000 + "epoch": 37.66, + "learning_rate": 9.636020806241873e-05, + "loss": 0.0363, + "step": 2900 }, { - "epoch": 29.02, - "eval_loss": 0.15306903421878815, - "eval_runtime": 276.9929, - "eval_samples_per_second": 18.661, - "eval_steps_per_second": 2.336, - "eval_wer": 0.07346960333808694, - "step": 35000 + "epoch": 37.66, + "eval_loss": 0.3664211332798004, + "eval_runtime": 167.8076, + "eval_samples_per_second": 18.575, + "eval_steps_per_second": 2.324, + "eval_wer": 0.23112762072656298, + "step": 2900 }, { - "epoch": 29.19, - "learning_rate": 5.151607538802661e-05, - "loss": 0.1165, - "step": 35200 + "epoch": 38.95, + "learning_rate": 9.623016905071522e-05, + "loss": 0.034, + "step": 3000 }, { - "epoch": 29.19, - "eval_loss": 0.15544754266738892, - "eval_runtime": 276.1997, - "eval_samples_per_second": 18.715, - "eval_steps_per_second": 2.343, - "eval_wer": 0.07431468863888449, - "step": 35200 + "epoch": 38.95, + "eval_loss": 0.392531156539917, + "eval_runtime": 173.8435, + "eval_samples_per_second": 17.93, + "eval_steps_per_second": 2.243, + "eval_wer": 0.23081281873701442, + "step": 3000 }, { - "epoch": 29.35, - "learning_rate": 5.1238913525498885e-05, - "loss": 0.1198, - "step": 35400 + "epoch": 40.26, + "learning_rate": 9.610013003901171e-05, + "loss": 0.0331, + "step": 3100 }, { - "epoch": 29.35, - "eval_loss": 0.15731526911258698, - "eval_runtime": 276.5622, - "eval_samples_per_second": 18.69, - "eval_steps_per_second": 2.339, - "eval_wer": 0.07288860719378862, - "step": 35400 + "epoch": 40.26, + "eval_loss": 0.3893636465072632, + "eval_runtime": 167.8125, + "eval_samples_per_second": 18.574, + "eval_steps_per_second": 2.324, + "eval_wer": 0.2323868286847573, + "step": 3100 }, { - "epoch": 29.52, - "learning_rate": 5.0963137472283814e-05, - "loss": 0.1192, - "step": 35600 + "epoch": 41.55, + "learning_rate": 9.59700910273082e-05, + "loss": 0.0339, + "step": 3200 }, { - "epoch": 29.52, - "eval_loss": 0.1620793640613556, - "eval_runtime": 278.1544, - "eval_samples_per_second": 18.583, - "eval_steps_per_second": 2.326, - "eval_wer": 0.07209633972429091, - "step": 35600 + "epoch": 41.55, + "eval_loss": 0.39426469802856445, + "eval_runtime": 168.7188, + "eval_samples_per_second": 18.475, + "eval_steps_per_second": 2.312, + "eval_wer": 0.233331234653403, + "step": 3200 }, { - "epoch": 29.68, - "learning_rate": 5.0685975609756095e-05, - "loss": 0.1184, - "step": 35800 + "epoch": 42.85, + "learning_rate": 9.584005201560469e-05, + "loss": 0.033, + "step": 3300 }, { - "epoch": 29.68, - "eval_loss": 0.15125353634357452, - "eval_runtime": 279.7716, - "eval_samples_per_second": 18.476, - "eval_steps_per_second": 2.313, - "eval_wer": 0.07177943273649184, - "step": 35800 + "epoch": 42.85, + "eval_loss": 0.3865768313407898, + "eval_runtime": 161.5781, + "eval_samples_per_second": 19.291, + "eval_steps_per_second": 2.414, + "eval_wer": 0.2350311653969653, + "step": 3300 }, { - "epoch": 29.85, - "learning_rate": 5.0408813747228376e-05, - "loss": 0.1141, - "step": 36000 + "epoch": 44.15, + "learning_rate": 9.571001300390118e-05, + "loss": 0.0334, + "step": 3400 }, { - "epoch": 29.85, - "eval_loss": 0.15804697573184967, - "eval_runtime": 279.7652, - "eval_samples_per_second": 18.476, - "eval_steps_per_second": 2.313, - "eval_wer": 0.07109280092959383, - "step": 36000 + "epoch": 44.15, + "eval_loss": 0.38849422335624695, + "eval_runtime": 166.5778, + "eval_samples_per_second": 18.712, + "eval_steps_per_second": 2.341, + "eval_wer": 0.2320720266952087, + "step": 3400 }, { - "epoch": 30.02, - "learning_rate": 5.013165188470067e-05, - "loss": 0.1147, - "step": 36200 + "epoch": 45.45, + "learning_rate": 9.557997399219767e-05, + "loss": 0.0331, + "step": 3500 }, { - "epoch": 30.02, - "eval_loss": 0.15915371477603912, - "eval_runtime": 260.2704, - "eval_samples_per_second": 19.86, - "eval_steps_per_second": 2.486, - "eval_wer": 0.0700364443035969, - "step": 36200 + "epoch": 45.45, + "eval_loss": 0.41077303886413574, + "eval_runtime": 165.0937, + "eval_samples_per_second": 18.88, + "eval_steps_per_second": 2.362, + "eval_wer": 0.232009066297299, + "step": 3500 }, { - "epoch": 30.18, - "learning_rate": 4.985449002217295e-05, - "loss": 0.1124, - "step": 36400 + "epoch": 46.75, + "learning_rate": 9.544993498049415e-05, + "loss": 0.0326, + "step": 3600 }, { - "epoch": 30.18, - "eval_loss": 0.17016097903251648, - "eval_runtime": 265.3722, - "eval_samples_per_second": 19.478, + "epoch": 46.75, + "eval_loss": 0.3925323784351349, + "eval_runtime": 159.9375, + "eval_samples_per_second": 19.489, "eval_steps_per_second": 2.438, - "eval_wer": 0.07214915755559077, - "step": 36400 - }, - { - "epoch": 30.35, - "learning_rate": 4.957732815964524e-05, - "loss": 0.1128, - "step": 36600 - }, - { - "epoch": 30.35, - "eval_loss": 0.16143444180488586, - "eval_runtime": 255.9611, - "eval_samples_per_second": 20.194, - "eval_steps_per_second": 2.528, - "eval_wer": 0.07193788623039138, - "step": 36600 - }, - { - "epoch": 30.51, - "learning_rate": 4.9300166297117514e-05, - "loss": 0.1082, - "step": 36800 - }, - { - "epoch": 30.51, - "eval_loss": 0.16003426909446716, - "eval_runtime": 255.199, - "eval_samples_per_second": 20.255, - "eval_steps_per_second": 2.535, - "eval_wer": 0.07220197538689062, - "step": 36800 - }, - { - "epoch": 30.68, - "learning_rate": 4.90230044345898e-05, - "loss": 0.1159, - "step": 37000 - }, - { - "epoch": 30.68, - "eval_loss": 0.15168212354183197, - "eval_runtime": 255.5835, - "eval_samples_per_second": 20.224, - "eval_steps_per_second": 2.531, - "eval_wer": 0.0748956847831828, - "step": 37000 - }, - { - "epoch": 30.85, - "learning_rate": 4.874584257206209e-05, - "loss": 0.1124, - "step": 37200 - }, - { - "epoch": 30.85, - "eval_loss": 0.1633358746767044, - "eval_runtime": 254.9468, - "eval_samples_per_second": 20.275, - "eval_steps_per_second": 2.538, - "eval_wer": 0.07135689008609307, - "step": 37200 - }, - { - "epoch": 31.01, - "learning_rate": 4.846868070953437e-05, - "loss": 0.1153, - "step": 37400 - }, - { - "epoch": 31.01, - "eval_loss": 0.14990398287773132, - "eval_runtime": 255.5087, - "eval_samples_per_second": 20.23, - "eval_steps_per_second": 2.532, - "eval_wer": 0.07294142502508846, - "step": 37400 - }, - { - "epoch": 31.18, - "learning_rate": 4.819151884700666e-05, - "loss": 0.1083, - "step": 37600 - }, - { - "epoch": 31.18, - "eval_loss": 0.15318718552589417, - "eval_runtime": 255.4906, - "eval_samples_per_second": 20.232, - "eval_steps_per_second": 2.532, - "eval_wer": 0.07146252574869276, - "step": 37600 - }, - { - "epoch": 31.34, - "learning_rate": 4.791435698447893e-05, - "loss": 0.1082, - "step": 37800 - }, - { - "epoch": 31.34, - "eval_loss": 0.15611271560192108, - "eval_runtime": 255.2065, - "eval_samples_per_second": 20.254, - "eval_steps_per_second": 2.535, - "eval_wer": 0.07183225056779169, - "step": 37800 - }, - { - "epoch": 31.51, - "learning_rate": 4.763719512195122e-05, - "loss": 0.1114, - "step": 38000 - }, - { - "epoch": 31.51, - "eval_loss": 0.15616507828235626, - "eval_runtime": 255.2918, - "eval_samples_per_second": 20.247, - "eval_steps_per_second": 2.534, - "eval_wer": 0.07204352189299107, - "step": 38000 - }, - { - "epoch": 31.67, - "learning_rate": 4.73600332594235e-05, - "loss": 0.1103, - "step": 38200 - }, - { - "epoch": 31.67, - "eval_loss": 0.1566246598958969, - "eval_runtime": 255.37, - "eval_samples_per_second": 20.241, - "eval_steps_per_second": 2.534, - "eval_wer": 0.07146252574869276, - "step": 38200 - }, - { - "epoch": 31.84, - "learning_rate": 4.708287139689579e-05, - "loss": 0.1091, - "step": 38400 - }, - { - "epoch": 31.84, - "eval_loss": 0.1507750004529953, - "eval_runtime": 255.5097, - "eval_samples_per_second": 20.23, - "eval_steps_per_second": 2.532, - "eval_wer": 0.07030053346009613, - "step": 38400 - }, - { - "epoch": 32.01, - "learning_rate": 4.680570953436808e-05, - "loss": 0.1111, - "step": 38600 - }, - { - "epoch": 32.01, - "eval_loss": 0.145137757062912, - "eval_runtime": 254.9212, - "eval_samples_per_second": 20.277, - "eval_steps_per_second": 2.538, - "eval_wer": 0.07336396767548724, - "step": 38600 - }, - { - "epoch": 32.17, - "learning_rate": 4.652854767184035e-05, - "loss": 0.1113, - "step": 38800 - }, - { - "epoch": 32.17, - "eval_loss": 0.15428981184959412, - "eval_runtime": 255.1259, - "eval_samples_per_second": 20.261, - "eval_steps_per_second": 2.536, - "eval_wer": 0.07415623514498494, - "step": 38800 - }, - { - "epoch": 32.34, - "learning_rate": 4.625138580931264e-05, - "loss": 0.1072, - "step": 39000 - }, - { - "epoch": 32.34, - "eval_loss": 0.14538711309432983, - "eval_runtime": 255.0771, - "eval_samples_per_second": 20.264, - "eval_steps_per_second": 2.536, - "eval_wer": 0.07299424285638832, - "step": 39000 - }, - { - "epoch": 32.5, - "learning_rate": 4.597422394678492e-05, - "loss": 0.1033, - "step": 39200 - }, - { - "epoch": 32.5, - "eval_loss": 0.16375206410884857, - "eval_runtime": 255.084, - "eval_samples_per_second": 20.264, - "eval_steps_per_second": 2.536, - "eval_wer": 0.07135689008609307, - "step": 39200 - }, - { - "epoch": 32.67, - "learning_rate": 4.569706208425721e-05, - "loss": 0.1019, - "step": 39400 - }, - { - "epoch": 32.67, - "eval_loss": 0.16679570078849792, - "eval_runtime": 254.9797, - "eval_samples_per_second": 20.272, - "eval_steps_per_second": 2.537, - "eval_wer": 0.07183225056779169, - "step": 39400 + "eval_wer": 0.2414531259837562, + "step": 3600 }, { - "epoch": 32.84, - "learning_rate": 4.54199002217295e-05, - "loss": 0.1053, - "step": 39600 + "epoch": 48.05, + "learning_rate": 9.531989596879064e-05, + "loss": 0.036, + "step": 3700 }, { - "epoch": 32.84, - "eval_loss": 0.16691266000270844, - "eval_runtime": 257.5588, - "eval_samples_per_second": 20.069, - "eval_steps_per_second": 2.512, - "eval_wer": 0.07082871177309459, - "step": 39600 + "epoch": 48.05, + "eval_loss": 0.3832598030567169, + "eval_runtime": 171.125, + "eval_samples_per_second": 18.215, + "eval_steps_per_second": 2.279, + "eval_wer": 0.2387458288736385, + "step": 3700 }, { - "epoch": 33.0, - "learning_rate": 4.514273835920178e-05, - "loss": 0.1097, - "step": 39800 + "epoch": 49.35, + "learning_rate": 9.518985695708713e-05, + "loss": 0.0346, + "step": 3800 }, { - "epoch": 33.0, - "eval_loss": 0.17189669609069824, - "eval_runtime": 258.3507, - "eval_samples_per_second": 20.008, - "eval_steps_per_second": 2.504, - "eval_wer": 0.07288860719378862, - "step": 39800 + "epoch": 49.35, + "eval_loss": 0.3931749761104584, + "eval_runtime": 166.4063, + "eval_samples_per_second": 18.731, + "eval_steps_per_second": 2.344, + "eval_wer": 0.23263867027639615, + "step": 3800 }, { - "epoch": 33.17, - "learning_rate": 4.486557649667406e-05, - "loss": 0.1021, - "step": 40000 + "epoch": 50.64, + "learning_rate": 9.505981794538362e-05, + "loss": 0.0349, + "step": 3900 }, { - "epoch": 33.17, - "eval_loss": 0.16738824546337128, - "eval_runtime": 257.6603, - "eval_samples_per_second": 20.061, - "eval_steps_per_second": 2.511, - "eval_wer": 0.07177943273649184, - "step": 40000 + "epoch": 50.64, + "eval_loss": 0.3744593858718872, + "eval_runtime": 157.9687, + "eval_samples_per_second": 19.732, + "eval_steps_per_second": 2.469, + "eval_wer": 0.2354089277844236, + "step": 3900 }, { - "epoch": 33.33, - "learning_rate": 4.458980044345898e-05, - "loss": 0.1056, - "step": 40200 + "epoch": 51.94, + "learning_rate": 9.492977893368012e-05, + "loss": 0.034, + "step": 4000 }, { - "epoch": 33.33, - "eval_loss": 0.15968775749206543, - "eval_runtime": 257.6821, - "eval_samples_per_second": 20.06, - "eval_steps_per_second": 2.511, - "eval_wer": 0.07098716526699414, - "step": 40200 + "epoch": 51.94, + "eval_loss": 0.39862367510795593, + "eval_runtime": 155.8749, + "eval_samples_per_second": 19.997, + "eval_steps_per_second": 2.502, + "eval_wer": 0.2328275514701253, + "step": 4000 }, { - "epoch": 33.5, - "learning_rate": 4.431263858093126e-05, - "loss": 0.1043, - "step": 40400 + "epoch": 53.24, + "learning_rate": 9.479973992197659e-05, + "loss": 0.0334, + "step": 4100 }, { - "epoch": 33.5, - "eval_loss": 0.16819486021995544, - "eval_runtime": 258.1617, - "eval_samples_per_second": 20.022, - "eval_steps_per_second": 2.506, - "eval_wer": 0.07294142502508846, - "step": 40400 + "epoch": 53.24, + "eval_loss": 0.39466869831085205, + "eval_runtime": 162.0467, + "eval_samples_per_second": 19.235, + "eval_steps_per_second": 2.407, + "eval_wer": 0.23352011584713214, + "step": 4100 }, { - "epoch": 33.66, - "learning_rate": 4.403547671840355e-05, - "loss": 0.1015, - "step": 40600 + "epoch": 54.54, + "learning_rate": 9.466970091027308e-05, + "loss": 0.0325, + "step": 4200 }, { - "epoch": 33.66, - "eval_loss": 0.17912797629833221, - "eval_runtime": 257.4928, - "eval_samples_per_second": 20.074, - "eval_steps_per_second": 2.513, - "eval_wer": 0.07389214598848572, - "step": 40600 + "epoch": 54.54, + "eval_loss": 0.39441126585006714, + "eval_runtime": 162.4844, + "eval_samples_per_second": 19.183, + "eval_steps_per_second": 2.4, + "eval_wer": 0.23616445255934018, + "step": 4200 }, { - "epoch": 33.83, - "learning_rate": 4.375831485587583e-05, - "loss": 0.1038, - "step": 40800 + "epoch": 55.84, + "learning_rate": 9.453966189856957e-05, + "loss": 0.0308, + "step": 4300 }, { - "epoch": 33.83, - "eval_loss": 0.16278141736984253, - "eval_runtime": 258.2425, - "eval_samples_per_second": 20.016, - "eval_steps_per_second": 2.505, - "eval_wer": 0.07299424285638832, - "step": 40800 + "epoch": 55.84, + "eval_loss": 0.39918699860572815, + "eval_runtime": 155.5625, + "eval_samples_per_second": 20.037, + "eval_steps_per_second": 2.507, + "eval_wer": 0.23477932380532646, + "step": 4300 }, { - "epoch": 34.0, - "learning_rate": 4.348115299334812e-05, - "loss": 0.1018, - "step": 41000 + "epoch": 57.14, + "learning_rate": 9.440962288686607e-05, + "loss": 0.0316, + "step": 4400 }, { - "epoch": 34.0, - "eval_loss": 0.17246678471565247, - "eval_runtime": 257.824, - "eval_samples_per_second": 20.049, - "eval_steps_per_second": 2.509, - "eval_wer": 0.07431468863888449, - "step": 41000 + "epoch": 57.14, + "eval_loss": 0.39010030031204224, + "eval_runtime": 163.0782, + "eval_samples_per_second": 19.114, + "eval_steps_per_second": 2.391, + "eval_wer": 0.229805452370459, + "step": 4400 }, { - "epoch": 34.16, - "learning_rate": 4.32039911308204e-05, - "loss": 0.1002, - "step": 41200 + "epoch": 58.44, + "learning_rate": 9.427958387516256e-05, + "loss": 0.0308, + "step": 4500 }, { - "epoch": 34.16, - "eval_loss": 0.17683491110801697, - "eval_runtime": 259.2472, - "eval_samples_per_second": 19.938, - "eval_steps_per_second": 2.496, - "eval_wer": 0.06998362647229704, - "step": 41200 + "epoch": 58.44, + "eval_loss": 0.404751718044281, + "eval_runtime": 161.3906, + "eval_samples_per_second": 19.313, + "eval_steps_per_second": 2.416, + "eval_wer": 0.23194610589938927, + "step": 4500 }, { - "epoch": 34.33, - "learning_rate": 4.292682926829268e-05, - "loss": 0.1004, - "step": 41400 + "epoch": 59.73, + "learning_rate": 9.414954486345903e-05, + "loss": 0.028, + "step": 4600 }, { - "epoch": 34.33, - "eval_loss": 0.1728859543800354, - "eval_runtime": 258.3657, - "eval_samples_per_second": 20.007, - "eval_steps_per_second": 2.504, - "eval_wer": 0.0709343474356943, - "step": 41400 + "epoch": 59.73, + "eval_loss": 0.41103655099868774, + "eval_runtime": 154.3905, + "eval_samples_per_second": 20.189, + "eval_steps_per_second": 2.526, + "eval_wer": 0.2277277592394384, + "step": 4600 }, { - "epoch": 34.49, - "learning_rate": 4.264966740576497e-05, - "loss": 0.1023, - "step": 41600 + "epoch": 61.04, + "learning_rate": 9.401950585175553e-05, + "loss": 0.0299, + "step": 4700 }, { - "epoch": 34.49, - "eval_loss": 0.1567125767469406, - "eval_runtime": 258.2421, - "eval_samples_per_second": 20.016, - "eval_steps_per_second": 2.505, - "eval_wer": 0.07378651032588601, - "step": 41600 + "epoch": 61.04, + "eval_loss": 0.40084338188171387, + "eval_runtime": 168.5468, + "eval_samples_per_second": 18.493, + "eval_steps_per_second": 2.314, + "eval_wer": 0.23295347226594473, + "step": 4700 }, { - "epoch": 34.66, - "learning_rate": 4.237250554323725e-05, - "loss": 0.1003, - "step": 41800 + "epoch": 62.33, + "learning_rate": 9.388946684005202e-05, + "loss": 0.033, + "step": 4800 }, { - "epoch": 34.66, - "eval_loss": 0.16443106532096863, - "eval_runtime": 258.2982, - "eval_samples_per_second": 20.012, - "eval_steps_per_second": 2.505, - "eval_wer": 0.07251888237468969, - "step": 41800 + "epoch": 62.33, + "eval_loss": 0.3985605835914612, + "eval_runtime": 168.5159, + "eval_samples_per_second": 18.497, + "eval_steps_per_second": 2.314, + "eval_wer": 0.23490524460114587, + "step": 4800 }, { - "epoch": 34.83, - "learning_rate": 4.209534368070954e-05, - "loss": 0.103, - "step": 42000 + "epoch": 63.63, + "learning_rate": 9.375942782834851e-05, + "loss": 0.0345, + "step": 4900 }, { - "epoch": 34.83, - "eval_loss": 0.17008621990680695, - "eval_runtime": 257.8252, - "eval_samples_per_second": 20.048, - "eval_steps_per_second": 2.509, - "eval_wer": 0.0716209792425923, - "step": 42000 + "epoch": 63.63, + "eval_loss": 0.3911936581134796, + "eval_runtime": 158.9531, + "eval_samples_per_second": 19.61, + "eval_steps_per_second": 2.454, + "eval_wer": 0.23559780897815275, + "step": 4900 }, { - "epoch": 34.99, - "learning_rate": 4.181818181818182e-05, - "loss": 0.1056, - "step": 42200 + "epoch": 64.93, + "learning_rate": 9.3629388816645e-05, + "loss": 0.0322, + "step": 5000 }, { - "epoch": 34.99, - "eval_loss": 0.16209852695465088, - "eval_runtime": 258.245, - "eval_samples_per_second": 20.016, - "eval_steps_per_second": 2.505, - "eval_wer": 0.06956108382189827, - "step": 42200 + "epoch": 64.93, + "eval_loss": 0.3985706567764282, + "eval_runtime": 175.1875, + "eval_samples_per_second": 17.792, + "eval_steps_per_second": 2.226, + "eval_wer": 0.231568343511931, + "step": 5000 }, { - "epoch": 35.16, - "learning_rate": 4.15410199556541e-05, - "loss": 0.102, - "step": 42400 + "epoch": 66.23, + "learning_rate": 9.349934980494148e-05, + "loss": 0.0313, + "step": 5100 }, { - "epoch": 35.16, - "eval_loss": 0.1503116935491562, - "eval_runtime": 258.2089, - "eval_samples_per_second": 20.019, - "eval_steps_per_second": 2.506, - "eval_wer": 0.07024771562879628, - "step": 42400 + "epoch": 66.23, + "eval_loss": 0.4163081645965576, + "eval_runtime": 179.4796, + "eval_samples_per_second": 17.367, + "eval_steps_per_second": 2.173, + "eval_wer": 0.23049801674746584, + "step": 5100 }, { - "epoch": 35.32, - "learning_rate": 4.126385809312639e-05, - "loss": 0.0979, - "step": 42600 + "epoch": 67.53, + "learning_rate": 9.336931079323797e-05, + "loss": 0.0315, + "step": 5200 }, { - "epoch": 35.32, - "eval_loss": 0.15129025280475616, - "eval_runtime": 258.9706, - "eval_samples_per_second": 19.96, - "eval_steps_per_second": 2.498, - "eval_wer": 0.06977235514709766, - "step": 42600 + "epoch": 67.53, + "eval_loss": 0.3985958993434906, + "eval_runtime": 170.0289, + "eval_samples_per_second": 18.332, + "eval_steps_per_second": 2.294, + "eval_wer": 0.23528300698860416, + "step": 5200 }, { - "epoch": 35.49, - "learning_rate": 4.098808203991131e-05, - "loss": 0.0969, - "step": 42800 + "epoch": 68.82, + "learning_rate": 9.323927178153446e-05, + "loss": 0.0294, + "step": 5300 }, { - "epoch": 35.49, - "eval_loss": 0.16101005673408508, - "eval_runtime": 258.464, - "eval_samples_per_second": 19.999, - "eval_steps_per_second": 2.503, - "eval_wer": 0.07082871177309459, - "step": 42800 + "epoch": 68.82, + "eval_loss": 0.40526434779167175, + "eval_runtime": 177.9803, + "eval_samples_per_second": 17.513, + "eval_steps_per_second": 2.191, + "eval_wer": 0.2295536107788201, + "step": 5300 }, { - "epoch": 35.65, - "learning_rate": 4.071092017738359e-05, - "loss": 0.1016, - "step": 43000 + "epoch": 70.13, + "learning_rate": 9.310923276983095e-05, + "loss": 0.0302, + "step": 5400 }, { - "epoch": 35.65, - "eval_loss": 0.17464140057563782, - "eval_runtime": 258.5693, - "eval_samples_per_second": 19.991, - "eval_steps_per_second": 2.502, - "eval_wer": 0.07140970791739291, - "step": 43000 + "epoch": 70.13, + "eval_loss": 0.3818342089653015, + "eval_runtime": 177.545, + "eval_samples_per_second": 17.556, + "eval_steps_per_second": 2.197, + "eval_wer": 0.23131650192029213, + "step": 5400 }, { - "epoch": 35.82, - "learning_rate": 4.043375831485588e-05, - "loss": 0.0994, - "step": 43200 + "epoch": 71.42, + "learning_rate": 9.297919375812744e-05, + "loss": 0.0318, + "step": 5500 }, { - "epoch": 35.82, - "eval_loss": 0.16432413458824158, - "eval_runtime": 259.177, - "eval_samples_per_second": 19.944, - "eval_steps_per_second": 2.496, - "eval_wer": 0.07045898695399568, - "step": 43200 + "epoch": 71.42, + "eval_loss": 0.3933159410953522, + "eval_runtime": 168.7969, + "eval_samples_per_second": 18.466, + "eval_steps_per_second": 2.31, + "eval_wer": 0.23301643266385444, + "step": 5500 }, { - "epoch": 35.99, - "learning_rate": 4.015659645232816e-05, - "loss": 0.0966, - "step": 43400 + "epoch": 72.72, + "learning_rate": 9.284915474642393e-05, + "loss": 0.0289, + "step": 5600 }, { - "epoch": 35.99, - "eval_loss": 0.1695939600467682, - "eval_runtime": 258.2906, - "eval_samples_per_second": 20.012, - "eval_steps_per_second": 2.505, - "eval_wer": 0.0707230761104949, - "step": 43400 + "epoch": 72.72, + "eval_loss": 0.38790163397789, + "eval_runtime": 167.7031, + "eval_samples_per_second": 18.586, + "eval_steps_per_second": 2.326, + "eval_wer": 0.23396083863250017, + "step": 5600 } ], - "max_steps": 72360, - "num_train_epochs": 60, - "total_flos": 1.9733994835008543e+20, + "max_steps": 77000, + "num_train_epochs": 1000, + "total_flos": 1.80069386799743e+20, "trial_name": null, "trial_params": null }