{ "best_metric": 45.965834862992175, "best_model_checkpoint": "/media/makhataei/Backups/Whisper-Small-Common-Voice/checkpoint-6200", "epoch": 38.22393822393823, "eval_steps": 100, "global_step": 9900, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.1, "learning_rate": 4.600000000000001e-06, "loss": 3.1025, "step": 25 }, { "epoch": 0.19, "learning_rate": 9.600000000000001e-06, "loss": 1.3525, "step": 50 }, { "epoch": 0.29, "learning_rate": 9.976884422110554e-06, "loss": 0.9564, "step": 75 }, { "epoch": 0.39, "learning_rate": 9.95175879396985e-06, "loss": 0.7495, "step": 100 }, { "epoch": 0.39, "eval_loss": 0.860159158706665, "eval_runtime": 1426.2695, "eval_samples_per_second": 6.062, "eval_steps_per_second": 0.606, "eval_wer": 58.07742554282218, "step": 100 }, { "epoch": 0.48, "learning_rate": 9.926633165829147e-06, "loss": 0.5073, "step": 125 }, { "epoch": 0.58, "learning_rate": 9.901507537688444e-06, "loss": 0.3749, "step": 150 }, { "epoch": 0.68, "learning_rate": 9.87638190954774e-06, "loss": 0.3247, "step": 175 }, { "epoch": 0.77, "learning_rate": 9.851256281407035e-06, "loss": 0.3059, "step": 200 }, { "epoch": 0.77, "eval_loss": 0.5538379549980164, "eval_runtime": 1589.2333, "eval_samples_per_second": 5.44, "eval_steps_per_second": 0.544, "eval_wer": 55.22481850804518, "step": 200 }, { "epoch": 0.87, "learning_rate": 9.826130653266333e-06, "loss": 0.2963, "step": 225 }, { "epoch": 0.97, "learning_rate": 9.80100502512563e-06, "loss": 0.2882, "step": 250 }, { "epoch": 1.06, "learning_rate": 9.775879396984925e-06, "loss": 0.2327, "step": 275 }, { "epoch": 1.16, "learning_rate": 9.750753768844222e-06, "loss": 0.2002, "step": 300 }, { "epoch": 1.16, "eval_loss": 0.5136818885803223, "eval_runtime": 1646.1357, "eval_samples_per_second": 5.252, "eval_steps_per_second": 0.525, "eval_wer": 52.46151047609599, "step": 300 }, { "epoch": 1.25, "learning_rate": 9.725628140703518e-06, "loss": 0.1893, "step": 325 }, { "epoch": 1.35, "learning_rate": 9.700502512562815e-06, "loss": 0.185, "step": 350 }, { "epoch": 1.45, "learning_rate": 9.675376884422111e-06, "loss": 0.1847, "step": 375 }, { "epoch": 1.54, "learning_rate": 9.650251256281408e-06, "loss": 0.1798, "step": 400 }, { "epoch": 1.54, "eval_loss": 0.5102902054786682, "eval_runtime": 1650.3734, "eval_samples_per_second": 5.239, "eval_steps_per_second": 0.524, "eval_wer": 51.65781945064576, "step": 400 }, { "epoch": 1.64, "learning_rate": 9.625125628140705e-06, "loss": 0.1804, "step": 425 }, { "epoch": 1.74, "learning_rate": 9.600000000000001e-06, "loss": 0.1807, "step": 450 }, { "epoch": 1.83, "learning_rate": 9.574874371859298e-06, "loss": 0.1714, "step": 475 }, { "epoch": 1.93, "learning_rate": 9.549748743718595e-06, "loss": 0.1678, "step": 500 }, { "epoch": 1.93, "eval_loss": 0.48063144087791443, "eval_runtime": 1482.5018, "eval_samples_per_second": 5.832, "eval_steps_per_second": 0.583, "eval_wer": 46.55123943708554, "step": 500 }, { "epoch": 2.03, "learning_rate": 9.52462311557789e-06, "loss": 0.1542, "step": 525 }, { "epoch": 2.12, "learning_rate": 9.499497487437188e-06, "loss": 0.0929, "step": 550 }, { "epoch": 2.22, "learning_rate": 9.474371859296483e-06, "loss": 0.0936, "step": 575 }, { "epoch": 2.32, "learning_rate": 9.44924623115578e-06, "loss": 0.0932, "step": 600 }, { "epoch": 2.32, "eval_loss": 0.49363330006599426, "eval_runtime": 1993.4903, "eval_samples_per_second": 4.337, "eval_steps_per_second": 0.434, "eval_wer": 47.49549370772767, "step": 600 }, { "epoch": 2.41, "learning_rate": 9.424120603015076e-06, "loss": 0.0936, "step": 625 }, { "epoch": 2.51, "learning_rate": 9.398994974874373e-06, "loss": 0.0955, "step": 650 }, { "epoch": 2.61, "learning_rate": 9.373869346733669e-06, "loss": 0.0871, "step": 675 }, { "epoch": 2.7, "learning_rate": 9.348743718592966e-06, "loss": 0.0944, "step": 700 }, { "epoch": 2.7, "eval_loss": 0.5119881629943848, "eval_runtime": 1791.3192, "eval_samples_per_second": 4.827, "eval_steps_per_second": 0.483, "eval_wer": 48.91600932678474, "step": 700 }, { "epoch": 2.8, "learning_rate": 9.323618090452262e-06, "loss": 0.0927, "step": 725 }, { "epoch": 2.9, "learning_rate": 9.298492462311557e-06, "loss": 0.0964, "step": 750 }, { "epoch": 2.99, "learning_rate": 9.273366834170856e-06, "loss": 0.1038, "step": 775 }, { "epoch": 3.09, "learning_rate": 9.248241206030152e-06, "loss": 0.0493, "step": 800 }, { "epoch": 3.09, "eval_loss": 0.5198288559913635, "eval_runtime": 1878.4077, "eval_samples_per_second": 4.603, "eval_steps_per_second": 0.46, "eval_wer": 48.26114997271419, "step": 800 }, { "epoch": 3.19, "learning_rate": 9.223115577889447e-06, "loss": 0.0501, "step": 825 }, { "epoch": 3.28, "learning_rate": 9.197989949748744e-06, "loss": 0.0458, "step": 850 }, { "epoch": 3.38, "learning_rate": 9.17286432160804e-06, "loss": 0.0492, "step": 875 }, { "epoch": 3.47, "learning_rate": 9.147738693467337e-06, "loss": 0.0506, "step": 900 }, { "epoch": 3.47, "eval_loss": 0.5227376222610474, "eval_runtime": 1759.968, "eval_samples_per_second": 4.913, "eval_steps_per_second": 0.491, "eval_wer": 47.41280944585008, "step": 900 }, { "epoch": 3.57, "learning_rate": 9.122613065326634e-06, "loss": 0.0494, "step": 925 }, { "epoch": 3.67, "learning_rate": 9.09748743718593e-06, "loss": 0.051, "step": 950 }, { "epoch": 3.76, "learning_rate": 9.072361809045227e-06, "loss": 0.0466, "step": 975 }, { "epoch": 3.86, "learning_rate": 9.047236180904524e-06, "loss": 0.0482, "step": 1000 }, { "epoch": 3.86, "eval_loss": 0.5255833268165588, "eval_runtime": 1701.3645, "eval_samples_per_second": 5.082, "eval_steps_per_second": 0.508, "eval_wer": 46.94977757933555, "step": 1000 }, { "epoch": 3.96, "learning_rate": 9.02211055276382e-06, "loss": 0.046, "step": 1025 }, { "epoch": 4.05, "learning_rate": 8.996984924623117e-06, "loss": 0.0368, "step": 1050 }, { "epoch": 4.15, "learning_rate": 8.971859296482412e-06, "loss": 0.0233, "step": 1075 }, { "epoch": 4.25, "learning_rate": 8.94673366834171e-06, "loss": 0.0244, "step": 1100 }, { "epoch": 4.25, "eval_loss": 0.5491495132446289, "eval_runtime": 1619.0836, "eval_samples_per_second": 5.34, "eval_steps_per_second": 0.534, "eval_wer": 46.084900200095916, "step": 1100 }, { "epoch": 4.34, "learning_rate": 8.921608040201005e-06, "loss": 0.0258, "step": 1125 }, { "epoch": 4.44, "learning_rate": 8.896482412060302e-06, "loss": 0.0248, "step": 1150 }, { "epoch": 4.54, "learning_rate": 8.8713567839196e-06, "loss": 0.0241, "step": 1175 }, { "epoch": 4.63, "learning_rate": 8.846231155778895e-06, "loss": 0.0272, "step": 1200 }, { "epoch": 4.63, "eval_loss": 0.5620735883712769, "eval_runtime": 1837.7585, "eval_samples_per_second": 4.705, "eval_steps_per_second": 0.471, "eval_wer": 46.916703874584506, "step": 1200 }, { "epoch": 4.73, "learning_rate": 8.821105527638191e-06, "loss": 0.0258, "step": 1225 }, { "epoch": 4.83, "learning_rate": 8.795979899497488e-06, "loss": 0.0237, "step": 1250 }, { "epoch": 4.92, "learning_rate": 8.770854271356785e-06, "loss": 0.0266, "step": 1275 }, { "epoch": 5.02, "learning_rate": 8.745728643216081e-06, "loss": 0.0246, "step": 1300 }, { "epoch": 5.02, "eval_loss": 0.5855526328086853, "eval_runtime": 1908.9589, "eval_samples_per_second": 4.529, "eval_steps_per_second": 0.453, "eval_wer": 48.80355873063122, "step": 1300 }, { "epoch": 5.12, "learning_rate": 8.720603015075378e-06, "loss": 0.0142, "step": 1325 }, { "epoch": 5.21, "learning_rate": 8.695477386934675e-06, "loss": 0.014, "step": 1350 }, { "epoch": 5.31, "learning_rate": 8.67035175879397e-06, "loss": 0.0126, "step": 1375 }, { "epoch": 5.41, "learning_rate": 8.645226130653268e-06, "loss": 0.0159, "step": 1400 }, { "epoch": 5.41, "eval_loss": 0.6145116090774536, "eval_runtime": 1843.4778, "eval_samples_per_second": 4.69, "eval_steps_per_second": 0.469, "eval_wer": 48.30414578889054, "step": 1400 }, { "epoch": 5.5, "learning_rate": 8.620100502512564e-06, "loss": 0.0144, "step": 1425 }, { "epoch": 5.6, "learning_rate": 8.59497487437186e-06, "loss": 0.0133, "step": 1450 }, { "epoch": 5.69, "learning_rate": 8.569849246231156e-06, "loss": 0.0151, "step": 1475 }, { "epoch": 5.79, "learning_rate": 8.544723618090453e-06, "loss": 0.0152, "step": 1500 }, { "epoch": 5.79, "eval_loss": 0.6177700757980347, "eval_runtime": 1839.895, "eval_samples_per_second": 4.699, "eval_steps_per_second": 0.47, "eval_wer": 47.756775975260865, "step": 1500 }, { "epoch": 5.89, "learning_rate": 8.51959798994975e-06, "loss": 0.014, "step": 1525 }, { "epoch": 5.98, "learning_rate": 8.494472361809046e-06, "loss": 0.016, "step": 1550 }, { "epoch": 6.08, "learning_rate": 8.469346733668342e-06, "loss": 0.0092, "step": 1575 }, { "epoch": 6.18, "learning_rate": 8.444221105527639e-06, "loss": 0.008, "step": 1600 }, { "epoch": 6.18, "eval_loss": 0.6190542578697205, "eval_runtime": 1730.2546, "eval_samples_per_second": 4.997, "eval_steps_per_second": 0.5, "eval_wer": 48.06105405897041, "step": 1600 }, { "epoch": 6.27, "learning_rate": 8.419095477386936e-06, "loss": 0.0079, "step": 1625 }, { "epoch": 6.37, "learning_rate": 8.393969849246232e-06, "loss": 0.0087, "step": 1650 }, { "epoch": 6.47, "learning_rate": 8.368844221105529e-06, "loss": 0.0082, "step": 1675 }, { "epoch": 6.56, "learning_rate": 8.343718592964824e-06, "loss": 0.0077, "step": 1700 }, { "epoch": 6.56, "eval_loss": 0.6308984160423279, "eval_runtime": 1686.6544, "eval_samples_per_second": 5.126, "eval_steps_per_second": 0.513, "eval_wer": 46.35941194952953, "step": 1700 }, { "epoch": 6.66, "learning_rate": 8.318592964824122e-06, "loss": 0.0076, "step": 1725 }, { "epoch": 6.76, "learning_rate": 8.293467336683417e-06, "loss": 0.0095, "step": 1750 }, { "epoch": 6.85, "learning_rate": 8.268341708542714e-06, "loss": 0.0087, "step": 1775 }, { "epoch": 6.95, "learning_rate": 8.24321608040201e-06, "loss": 0.0097, "step": 1800 }, { "epoch": 6.95, "eval_loss": 0.6272400617599487, "eval_runtime": 1856.6423, "eval_samples_per_second": 4.657, "eval_steps_per_second": 0.466, "eval_wer": 47.9138760728283, "step": 1800 }, { "epoch": 7.05, "learning_rate": 8.218090452261307e-06, "loss": 0.009, "step": 1825 }, { "epoch": 7.14, "learning_rate": 8.192964824120604e-06, "loss": 0.0053, "step": 1850 }, { "epoch": 7.24, "learning_rate": 8.1678391959799e-06, "loss": 0.0051, "step": 1875 }, { "epoch": 7.34, "learning_rate": 8.142713567839197e-06, "loss": 0.0056, "step": 1900 }, { "epoch": 7.34, "eval_loss": 0.6594315767288208, "eval_runtime": 1711.6251, "eval_samples_per_second": 5.051, "eval_steps_per_second": 0.505, "eval_wer": 46.5562004927982, "step": 1900 }, { "epoch": 7.43, "learning_rate": 8.117587939698493e-06, "loss": 0.0056, "step": 1925 }, { "epoch": 7.53, "learning_rate": 8.09246231155779e-06, "loss": 0.0058, "step": 1950 }, { "epoch": 7.63, "learning_rate": 8.067336683417087e-06, "loss": 0.007, "step": 1975 }, { "epoch": 7.72, "learning_rate": 8.042211055276382e-06, "loss": 0.0049, "step": 2000 }, { "epoch": 7.72, "eval_loss": 0.6581406593322754, "eval_runtime": 1917.4042, "eval_samples_per_second": 4.509, "eval_steps_per_second": 0.451, "eval_wer": 47.58313902531792, "step": 2000 }, { "epoch": 7.82, "learning_rate": 8.01708542713568e-06, "loss": 0.0064, "step": 2025 }, { "epoch": 7.92, "learning_rate": 7.991959798994977e-06, "loss": 0.0055, "step": 2050 }, { "epoch": 8.01, "learning_rate": 7.966834170854271e-06, "loss": 0.0055, "step": 2075 }, { "epoch": 8.11, "learning_rate": 7.941708542713568e-06, "loss": 0.0042, "step": 2100 }, { "epoch": 8.11, "eval_loss": 0.695335865020752, "eval_runtime": 1836.7482, "eval_samples_per_second": 4.707, "eval_steps_per_second": 0.471, "eval_wer": 48.092474078483896, "step": 2100 }, { "epoch": 8.2, "learning_rate": 7.916582914572865e-06, "loss": 0.004, "step": 2125 }, { "epoch": 8.3, "learning_rate": 7.891457286432161e-06, "loss": 0.0046, "step": 2150 }, { "epoch": 8.4, "learning_rate": 7.866331658291458e-06, "loss": 0.004, "step": 2175 }, { "epoch": 8.49, "learning_rate": 7.841206030150755e-06, "loss": 0.0038, "step": 2200 }, { "epoch": 8.49, "eval_loss": 0.6856936812400818, "eval_runtime": 1910.3433, "eval_samples_per_second": 4.526, "eval_steps_per_second": 0.453, "eval_wer": 48.371946883630166, "step": 2200 }, { "epoch": 8.59, "learning_rate": 7.816080402010051e-06, "loss": 0.0036, "step": 2225 }, { "epoch": 8.69, "learning_rate": 7.790954773869348e-06, "loss": 0.0038, "step": 2250 }, { "epoch": 8.78, "learning_rate": 7.765829145728644e-06, "loss": 0.0033, "step": 2275 }, { "epoch": 8.88, "learning_rate": 7.740703517587941e-06, "loss": 0.0033, "step": 2300 }, { "epoch": 8.88, "eval_loss": 0.6982905268669128, "eval_runtime": 1950.8321, "eval_samples_per_second": 4.432, "eval_steps_per_second": 0.443, "eval_wer": 49.69654875890923, "step": 2300 }, { "epoch": 8.98, "learning_rate": 7.715577889447236e-06, "loss": 0.0036, "step": 2325 }, { "epoch": 9.07, "learning_rate": 7.690452261306534e-06, "loss": 0.0029, "step": 2350 }, { "epoch": 9.17, "learning_rate": 7.66532663316583e-06, "loss": 0.0027, "step": 2375 }, { "epoch": 9.27, "learning_rate": 7.640201005025126e-06, "loss": 0.003, "step": 2400 }, { "epoch": 9.27, "eval_loss": 0.7109295129776001, "eval_runtime": 1863.5651, "eval_samples_per_second": 4.639, "eval_steps_per_second": 0.464, "eval_wer": 48.11727935704718, "step": 2400 }, { "epoch": 9.36, "learning_rate": 7.615075376884423e-06, "loss": 0.003, "step": 2425 }, { "epoch": 9.46, "learning_rate": 7.589949748743719e-06, "loss": 0.0025, "step": 2450 }, { "epoch": 9.56, "learning_rate": 7.564824120603016e-06, "loss": 0.0027, "step": 2475 }, { "epoch": 9.65, "learning_rate": 7.5396984924623115e-06, "loss": 0.0033, "step": 2500 }, { "epoch": 9.65, "eval_loss": 0.6899213194847107, "eval_runtime": 1934.8822, "eval_samples_per_second": 4.468, "eval_steps_per_second": 0.447, "eval_wer": 48.236344694150915, "step": 2500 }, { "epoch": 9.75, "learning_rate": 7.514572864321609e-06, "loss": 0.0025, "step": 2525 }, { "epoch": 9.85, "learning_rate": 7.4894472361809056e-06, "loss": 0.002, "step": 2550 }, { "epoch": 9.94, "learning_rate": 7.464321608040201e-06, "loss": 0.0031, "step": 2575 }, { "epoch": 10.04, "learning_rate": 7.439195979899499e-06, "loss": 0.0027, "step": 2600 }, { "epoch": 10.04, "eval_loss": 0.7074257135391235, "eval_runtime": 1945.5025, "eval_samples_per_second": 4.444, "eval_steps_per_second": 0.445, "eval_wer": 48.34052686411668, "step": 2600 }, { "epoch": 10.14, "learning_rate": 7.4140703517587946e-06, "loss": 0.0027, "step": 2625 }, { "epoch": 10.23, "learning_rate": 7.388944723618091e-06, "loss": 0.0029, "step": 2650 }, { "epoch": 10.33, "learning_rate": 7.363819095477388e-06, "loss": 0.0032, "step": 2675 }, { "epoch": 10.42, "learning_rate": 7.338693467336684e-06, "loss": 0.0035, "step": 2700 }, { "epoch": 10.42, "eval_loss": 0.7017741799354553, "eval_runtime": 1835.0488, "eval_samples_per_second": 4.712, "eval_steps_per_second": 0.471, "eval_wer": 47.10026293595277, "step": 2700 }, { "epoch": 10.52, "learning_rate": 7.313567839195981e-06, "loss": 0.0024, "step": 2725 }, { "epoch": 10.62, "learning_rate": 7.288442211055277e-06, "loss": 0.0024, "step": 2750 }, { "epoch": 10.71, "learning_rate": 7.2633165829145734e-06, "loss": 0.0031, "step": 2775 }, { "epoch": 10.81, "learning_rate": 7.23819095477387e-06, "loss": 0.0026, "step": 2800 }, { "epoch": 10.81, "eval_loss": 0.7197884917259216, "eval_runtime": 1907.1753, "eval_samples_per_second": 4.533, "eval_steps_per_second": 0.454, "eval_wer": 47.12506821451605, "step": 2800 }, { "epoch": 10.91, "learning_rate": 7.213065326633167e-06, "loss": 0.0022, "step": 2825 }, { "epoch": 11.0, "learning_rate": 7.187939698492463e-06, "loss": 0.0027, "step": 2850 }, { "epoch": 11.1, "learning_rate": 7.162814070351759e-06, "loss": 0.0022, "step": 2875 }, { "epoch": 11.2, "learning_rate": 7.137688442211056e-06, "loss": 0.0027, "step": 2900 }, { "epoch": 11.2, "eval_loss": 0.7459501624107361, "eval_runtime": 2001.7998, "eval_samples_per_second": 4.319, "eval_steps_per_second": 0.432, "eval_wer": 48.27603313985216, "step": 2900 }, { "epoch": 11.29, "learning_rate": 7.112562814070353e-06, "loss": 0.0024, "step": 2925 }, { "epoch": 11.39, "learning_rate": 7.087437185929649e-06, "loss": 0.0028, "step": 2950 }, { "epoch": 11.49, "learning_rate": 7.0623115577889456e-06, "loss": 0.0022, "step": 2975 }, { "epoch": 11.58, "learning_rate": 7.037185929648241e-06, "loss": 0.0023, "step": 3000 }, { "epoch": 11.58, "eval_loss": 0.7347891926765442, "eval_runtime": 1876.4701, "eval_samples_per_second": 4.608, "eval_steps_per_second": 0.461, "eval_wer": 47.71543384432207, "step": 3000 }, { "epoch": 11.68, "learning_rate": 7.012060301507538e-06, "loss": 0.0022, "step": 3025 }, { "epoch": 11.78, "learning_rate": 6.9869346733668354e-06, "loss": 0.0028, "step": 3050 }, { "epoch": 11.87, "learning_rate": 6.961809045226131e-06, "loss": 0.0027, "step": 3075 }, { "epoch": 11.97, "learning_rate": 6.936683417085428e-06, "loss": 0.0023, "step": 3100 }, { "epoch": 11.97, "eval_loss": 0.7387125492095947, "eval_runtime": 2084.696, "eval_samples_per_second": 4.147, "eval_steps_per_second": 0.415, "eval_wer": 48.00813613136876, "step": 3100 }, { "epoch": 12.07, "learning_rate": 6.911557788944724e-06, "loss": 0.002, "step": 3125 }, { "epoch": 12.16, "learning_rate": 6.886432160804021e-06, "loss": 0.0019, "step": 3150 }, { "epoch": 12.26, "learning_rate": 6.861306532663318e-06, "loss": 0.0028, "step": 3175 }, { "epoch": 12.36, "learning_rate": 6.8361809045226135e-06, "loss": 0.0024, "step": 3200 }, { "epoch": 12.36, "eval_loss": 0.7199321985244751, "eval_runtime": 1992.5899, "eval_samples_per_second": 4.339, "eval_steps_per_second": 0.434, "eval_wer": 46.86874700269551, "step": 3200 }, { "epoch": 12.45, "learning_rate": 6.81105527638191e-06, "loss": 0.0024, "step": 3225 }, { "epoch": 12.55, "learning_rate": 6.785929648241206e-06, "loss": 0.0019, "step": 3250 }, { "epoch": 12.64, "learning_rate": 6.760804020100503e-06, "loss": 0.0024, "step": 3275 }, { "epoch": 12.74, "learning_rate": 6.735678391959799e-06, "loss": 0.0033, "step": 3300 }, { "epoch": 12.74, "eval_loss": 0.7249542474746704, "eval_runtime": 2175.7785, "eval_samples_per_second": 3.974, "eval_steps_per_second": 0.398, "eval_wer": 48.68945444924013, "step": 3300 }, { "epoch": 12.84, "learning_rate": 6.710552763819096e-06, "loss": 0.0021, "step": 3325 }, { "epoch": 12.93, "learning_rate": 6.685427135678393e-06, "loss": 0.0014, "step": 3350 }, { "epoch": 13.03, "learning_rate": 6.660301507537689e-06, "loss": 0.0011, "step": 3375 }, { "epoch": 13.13, "learning_rate": 6.6351758793969856e-06, "loss": 0.0017, "step": 3400 }, { "epoch": 13.13, "eval_loss": 0.7241615653038025, "eval_runtime": 2420.7565, "eval_samples_per_second": 3.572, "eval_steps_per_second": 0.357, "eval_wer": 49.044996775313784, "step": 3400 }, { "epoch": 13.22, "learning_rate": 6.610050251256281e-06, "loss": 0.0019, "step": 3425 }, { "epoch": 13.32, "learning_rate": 6.584924623115578e-06, "loss": 0.0014, "step": 3450 }, { "epoch": 13.42, "learning_rate": 6.5597989949748754e-06, "loss": 0.0011, "step": 3475 }, { "epoch": 13.51, "learning_rate": 6.534673366834171e-06, "loss": 0.0016, "step": 3500 }, { "epoch": 13.51, "eval_loss": 0.7358579039573669, "eval_runtime": 2057.6253, "eval_samples_per_second": 4.202, "eval_steps_per_second": 0.42, "eval_wer": 48.70103024590299, "step": 3500 }, { "epoch": 13.61, "learning_rate": 6.509547738693468e-06, "loss": 0.002, "step": 3525 }, { "epoch": 13.71, "learning_rate": 6.484422110552764e-06, "loss": 0.0015, "step": 3550 }, { "epoch": 13.8, "learning_rate": 6.459296482412061e-06, "loss": 0.0024, "step": 3575 }, { "epoch": 13.9, "learning_rate": 6.434170854271358e-06, "loss": 0.0022, "step": 3600 }, { "epoch": 13.9, "eval_loss": 0.7220202088356018, "eval_runtime": 2243.6869, "eval_samples_per_second": 3.853, "eval_steps_per_second": 0.386, "eval_wer": 48.1371235798978, "step": 3600 }, { "epoch": 14.0, "learning_rate": 6.4090452261306535e-06, "loss": 0.0021, "step": 3625 }, { "epoch": 14.09, "learning_rate": 6.38391959798995e-06, "loss": 0.0013, "step": 3650 }, { "epoch": 14.19, "learning_rate": 6.358793969849246e-06, "loss": 0.0014, "step": 3675 }, { "epoch": 14.29, "learning_rate": 6.333668341708543e-06, "loss": 0.0016, "step": 3700 }, { "epoch": 14.29, "eval_loss": 0.7430799007415771, "eval_runtime": 1822.7961, "eval_samples_per_second": 4.743, "eval_steps_per_second": 0.475, "eval_wer": 46.75629640654198, "step": 3700 }, { "epoch": 14.38, "learning_rate": 6.30854271356784e-06, "loss": 0.0008, "step": 3725 }, { "epoch": 14.48, "learning_rate": 6.283417085427136e-06, "loss": 0.0014, "step": 3750 }, { "epoch": 14.58, "learning_rate": 6.258291457286433e-06, "loss": 0.001, "step": 3775 }, { "epoch": 14.67, "learning_rate": 6.233165829145729e-06, "loss": 0.0012, "step": 3800 }, { "epoch": 14.67, "eval_loss": 0.7563586235046387, "eval_runtime": 2100.7282, "eval_samples_per_second": 4.116, "eval_steps_per_second": 0.412, "eval_wer": 47.014271303600076, "step": 3800 }, { "epoch": 14.77, "learning_rate": 6.208040201005026e-06, "loss": 0.0017, "step": 3825 }, { "epoch": 14.86, "learning_rate": 6.182914572864322e-06, "loss": 0.0015, "step": 3850 }, { "epoch": 14.96, "learning_rate": 6.157788944723618e-06, "loss": 0.0012, "step": 3875 }, { "epoch": 15.06, "learning_rate": 6.1326633165829155e-06, "loss": 0.0014, "step": 3900 }, { "epoch": 15.06, "eval_loss": 0.7769792079925537, "eval_runtime": 2049.0992, "eval_samples_per_second": 4.219, "eval_steps_per_second": 0.422, "eval_wer": 47.02419341502539, "step": 3900 }, { "epoch": 15.15, "learning_rate": 6.107537688442211e-06, "loss": 0.0011, "step": 3925 }, { "epoch": 15.25, "learning_rate": 6.082412060301508e-06, "loss": 0.001, "step": 3950 }, { "epoch": 15.35, "learning_rate": 6.057286432160805e-06, "loss": 0.0015, "step": 3975 }, { "epoch": 15.44, "learning_rate": 6.032160804020101e-06, "loss": 0.0008, "step": 4000 }, { "epoch": 15.44, "eval_loss": 0.8116338849067688, "eval_runtime": 2088.1418, "eval_samples_per_second": 4.141, "eval_steps_per_second": 0.414, "eval_wer": 48.46951431264573, "step": 4000 }, { "epoch": 15.54, "learning_rate": 6.007035175879398e-06, "loss": 0.0015, "step": 4025 }, { "epoch": 15.64, "learning_rate": 5.9819095477386935e-06, "loss": 0.0008, "step": 4050 }, { "epoch": 15.73, "learning_rate": 5.95678391959799e-06, "loss": 0.0016, "step": 4075 }, { "epoch": 15.83, "learning_rate": 5.9316582914572876e-06, "loss": 0.0015, "step": 4100 }, { "epoch": 15.83, "eval_loss": 0.7622503638267517, "eval_runtime": 2010.7151, "eval_samples_per_second": 4.3, "eval_steps_per_second": 0.43, "eval_wer": 48.092474078483896, "step": 4100 }, { "epoch": 15.93, "learning_rate": 5.906532663316583e-06, "loss": 0.0016, "step": 4125 }, { "epoch": 16.02, "learning_rate": 5.88140703517588e-06, "loss": 0.002, "step": 4150 }, { "epoch": 16.12, "learning_rate": 5.856281407035176e-06, "loss": 0.0015, "step": 4175 }, { "epoch": 16.22, "learning_rate": 5.831155778894473e-06, "loss": 0.002, "step": 4200 }, { "epoch": 16.22, "eval_loss": 0.7698885202407837, "eval_runtime": 1914.0687, "eval_samples_per_second": 4.517, "eval_steps_per_second": 0.452, "eval_wer": 47.72535595574738, "step": 4200 }, { "epoch": 16.31, "learning_rate": 5.80603015075377e-06, "loss": 0.0013, "step": 4225 }, { "epoch": 16.41, "learning_rate": 5.780904522613066e-06, "loss": 0.0017, "step": 4250 }, { "epoch": 16.51, "learning_rate": 5.755778894472362e-06, "loss": 0.0023, "step": 4275 }, { "epoch": 16.6, "learning_rate": 5.730653266331658e-06, "loss": 0.001, "step": 4300 }, { "epoch": 16.6, "eval_loss": 0.7630722522735596, "eval_runtime": 1923.0045, "eval_samples_per_second": 4.496, "eval_steps_per_second": 0.45, "eval_wer": 46.87536174364572, "step": 4300 }, { "epoch": 16.7, "learning_rate": 5.7055276381909555e-06, "loss": 0.0022, "step": 4325 }, { "epoch": 16.8, "learning_rate": 5.680402010050252e-06, "loss": 0.0012, "step": 4350 }, { "epoch": 16.89, "learning_rate": 5.655276381909548e-06, "loss": 0.0018, "step": 4375 }, { "epoch": 16.99, "learning_rate": 5.6301507537688445e-06, "loss": 0.0009, "step": 4400 }, { "epoch": 16.99, "eval_loss": 0.7591461539268494, "eval_runtime": 1922.4876, "eval_samples_per_second": 4.497, "eval_steps_per_second": 0.45, "eval_wer": 48.416596385044066, "step": 4400 }, { "epoch": 17.08, "learning_rate": 5.605025125628141e-06, "loss": 0.0012, "step": 4425 }, { "epoch": 17.18, "learning_rate": 5.579899497487438e-06, "loss": 0.0009, "step": 4450 }, { "epoch": 17.28, "learning_rate": 5.554773869346734e-06, "loss": 0.0006, "step": 4475 }, { "epoch": 17.37, "learning_rate": 5.52964824120603e-06, "loss": 0.0008, "step": 4500 }, { "epoch": 17.37, "eval_loss": 0.779658317565918, "eval_runtime": 1935.42, "eval_samples_per_second": 4.467, "eval_steps_per_second": 0.447, "eval_wer": 47.17798614211771, "step": 4500 }, { "epoch": 17.47, "learning_rate": 5.504522613065328e-06, "loss": 0.0022, "step": 4525 }, { "epoch": 17.57, "learning_rate": 5.479396984924623e-06, "loss": 0.0008, "step": 4550 }, { "epoch": 17.66, "learning_rate": 5.45427135678392e-06, "loss": 0.0016, "step": 4575 }, { "epoch": 17.76, "learning_rate": 5.429145728643217e-06, "loss": 0.0008, "step": 4600 }, { "epoch": 17.76, "eval_loss": 0.7850877046585083, "eval_runtime": 1838.7142, "eval_samples_per_second": 4.702, "eval_steps_per_second": 0.47, "eval_wer": 46.76621851796729, "step": 4600 }, { "epoch": 17.86, "learning_rate": 5.404020100502513e-06, "loss": 0.0011, "step": 4625 }, { "epoch": 17.95, "learning_rate": 5.37889447236181e-06, "loss": 0.0007, "step": 4650 }, { "epoch": 18.05, "learning_rate": 5.353768844221106e-06, "loss": 0.0015, "step": 4675 }, { "epoch": 18.15, "learning_rate": 5.328643216080402e-06, "loss": 0.0007, "step": 4700 }, { "epoch": 18.15, "eval_loss": 0.7897337079048157, "eval_runtime": 1943.7204, "eval_samples_per_second": 4.448, "eval_steps_per_second": 0.445, "eval_wer": 48.315721585553405, "step": 4700 }, { "epoch": 18.24, "learning_rate": 5.3035175879397e-06, "loss": 0.0007, "step": 4725 }, { "epoch": 18.34, "learning_rate": 5.2783919597989955e-06, "loss": 0.0006, "step": 4750 }, { "epoch": 18.44, "learning_rate": 5.253266331658292e-06, "loss": 0.0007, "step": 4775 }, { "epoch": 18.53, "learning_rate": 5.228140703517588e-06, "loss": 0.0006, "step": 4800 }, { "epoch": 18.53, "eval_loss": 0.7760252952575684, "eval_runtime": 1927.3698, "eval_samples_per_second": 4.486, "eval_steps_per_second": 0.449, "eval_wer": 48.806866101106316, "step": 4800 }, { "epoch": 18.63, "learning_rate": 5.2030150753768845e-06, "loss": 0.001, "step": 4825 }, { "epoch": 18.73, "learning_rate": 5.177889447236182e-06, "loss": 0.0008, "step": 4850 }, { "epoch": 18.82, "learning_rate": 5.152763819095478e-06, "loss": 0.0017, "step": 4875 }, { "epoch": 18.92, "learning_rate": 5.127638190954774e-06, "loss": 0.0016, "step": 4900 }, { "epoch": 18.92, "eval_loss": 0.7762993574142456, "eval_runtime": 2000.3946, "eval_samples_per_second": 4.322, "eval_steps_per_second": 0.432, "eval_wer": 47.97175505614261, "step": 4900 }, { "epoch": 19.02, "learning_rate": 5.10251256281407e-06, "loss": 0.0011, "step": 4925 }, { "epoch": 19.11, "learning_rate": 5.077386934673368e-06, "loss": 0.0006, "step": 4950 }, { "epoch": 19.21, "learning_rate": 5.052261306532664e-06, "loss": 0.0006, "step": 4975 }, { "epoch": 19.31, "learning_rate": 5.02713567839196e-06, "loss": 0.0009, "step": 5000 }, { "epoch": 19.31, "eval_loss": 0.8151038289070129, "eval_runtime": 1941.3748, "eval_samples_per_second": 4.454, "eval_steps_per_second": 0.446, "eval_wer": 48.158621487985975, "step": 5000 }, { "epoch": 19.4, "learning_rate": 5.002010050251257e-06, "loss": 0.0008, "step": 5025 }, { "epoch": 19.5, "learning_rate": 4.976884422110553e-06, "loss": 0.0012, "step": 5050 }, { "epoch": 19.59, "learning_rate": 4.95175879396985e-06, "loss": 0.001, "step": 5075 }, { "epoch": 19.69, "learning_rate": 4.9266331658291465e-06, "loss": 0.0004, "step": 5100 }, { "epoch": 19.69, "eval_loss": 0.7967365384101868, "eval_runtime": 1771.7869, "eval_samples_per_second": 4.88, "eval_steps_per_second": 0.488, "eval_wer": 47.55668006151709, "step": 5100 }, { "epoch": 19.79, "learning_rate": 4.901507537688442e-06, "loss": 0.0007, "step": 5125 }, { "epoch": 19.88, "learning_rate": 4.876381909547739e-06, "loss": 0.0007, "step": 5150 }, { "epoch": 19.98, "learning_rate": 4.8512562814070355e-06, "loss": 0.0009, "step": 5175 }, { "epoch": 20.08, "learning_rate": 4.826130653266332e-06, "loss": 0.0007, "step": 5200 }, { "epoch": 20.08, "eval_loss": 0.8094375729560852, "eval_runtime": 1764.7964, "eval_samples_per_second": 4.899, "eval_steps_per_second": 0.49, "eval_wer": 46.78606274081791, "step": 5200 }, { "epoch": 20.17, "learning_rate": 4.801005025125629e-06, "loss": 0.0007, "step": 5225 }, { "epoch": 20.27, "learning_rate": 4.7758793969849245e-06, "loss": 0.0012, "step": 5250 }, { "epoch": 20.37, "learning_rate": 4.750753768844221e-06, "loss": 0.0008, "step": 5275 }, { "epoch": 20.46, "learning_rate": 4.725628140703518e-06, "loss": 0.001, "step": 5300 }, { "epoch": 20.46, "eval_loss": 0.8205662369728088, "eval_runtime": 1833.049, "eval_samples_per_second": 4.717, "eval_steps_per_second": 0.472, "eval_wer": 47.15648823402954, "step": 5300 }, { "epoch": 20.56, "learning_rate": 4.700502512562814e-06, "loss": 0.0013, "step": 5325 }, { "epoch": 20.66, "learning_rate": 4.675376884422111e-06, "loss": 0.0007, "step": 5350 }, { "epoch": 20.75, "learning_rate": 4.650251256281408e-06, "loss": 0.0007, "step": 5375 }, { "epoch": 20.85, "learning_rate": 4.625125628140703e-06, "loss": 0.0008, "step": 5400 }, { "epoch": 20.85, "eval_loss": 0.8015366792678833, "eval_runtime": 1825.3401, "eval_samples_per_second": 4.737, "eval_steps_per_second": 0.474, "eval_wer": 47.621173785781615, "step": 5400 }, { "epoch": 20.95, "learning_rate": 4.600000000000001e-06, "loss": 0.0007, "step": 5425 }, { "epoch": 21.04, "learning_rate": 4.574874371859297e-06, "loss": 0.0006, "step": 5450 }, { "epoch": 21.14, "learning_rate": 4.549748743718593e-06, "loss": 0.0005, "step": 5475 }, { "epoch": 21.24, "learning_rate": 4.52462311557789e-06, "loss": 0.0004, "step": 5500 }, { "epoch": 21.24, "eval_loss": 0.8104465007781982, "eval_runtime": 1735.3093, "eval_samples_per_second": 4.982, "eval_steps_per_second": 0.498, "eval_wer": 47.220981958294054, "step": 5500 }, { "epoch": 21.33, "learning_rate": 4.499497487437186e-06, "loss": 0.0004, "step": 5525 }, { "epoch": 21.43, "learning_rate": 4.474371859296483e-06, "loss": 0.0005, "step": 5550 }, { "epoch": 21.53, "learning_rate": 4.44924623115578e-06, "loss": 0.001, "step": 5575 }, { "epoch": 21.62, "learning_rate": 4.4241206030150755e-06, "loss": 0.0003, "step": 5600 }, { "epoch": 21.62, "eval_loss": 0.8020026683807373, "eval_runtime": 1798.7419, "eval_samples_per_second": 4.807, "eval_steps_per_second": 0.481, "eval_wer": 48.145392006085565, "step": 5600 }, { "epoch": 21.72, "learning_rate": 4.398994974874372e-06, "loss": 0.0008, "step": 5625 }, { "epoch": 21.81, "learning_rate": 4.373869346733669e-06, "loss": 0.0004, "step": 5650 }, { "epoch": 21.91, "learning_rate": 4.348743718592965e-06, "loss": 0.0006, "step": 5675 }, { "epoch": 22.01, "learning_rate": 4.323618090452262e-06, "loss": 0.0004, "step": 5700 }, { "epoch": 22.01, "eval_loss": 0.8294846415519714, "eval_runtime": 1827.1151, "eval_samples_per_second": 4.732, "eval_steps_per_second": 0.473, "eval_wer": 46.94150915314779, "step": 5700 }, { "epoch": 22.1, "learning_rate": 4.298492462311558e-06, "loss": 0.0002, "step": 5725 }, { "epoch": 22.2, "learning_rate": 4.273366834170854e-06, "loss": 0.0003, "step": 5750 }, { "epoch": 22.3, "learning_rate": 4.248241206030151e-06, "loss": 0.0002, "step": 5775 }, { "epoch": 22.39, "learning_rate": 4.223115577889448e-06, "loss": 0.0004, "step": 5800 }, { "epoch": 22.39, "eval_loss": 0.822780191898346, "eval_runtime": 1778.1094, "eval_samples_per_second": 4.862, "eval_steps_per_second": 0.486, "eval_wer": 46.61077210563741, "step": 5800 }, { "epoch": 22.49, "learning_rate": 4.197989949748744e-06, "loss": 0.0003, "step": 5825 }, { "epoch": 22.59, "learning_rate": 4.172864321608041e-06, "loss": 0.0003, "step": 5850 }, { "epoch": 22.68, "learning_rate": 4.147738693467337e-06, "loss": 0.0004, "step": 5875 }, { "epoch": 22.78, "learning_rate": 4.122613065326633e-06, "loss": 0.0005, "step": 5900 }, { "epoch": 22.78, "eval_loss": 0.8386306166648865, "eval_runtime": 1804.5855, "eval_samples_per_second": 4.791, "eval_steps_per_second": 0.479, "eval_wer": 48.09743513419656, "step": 5900 }, { "epoch": 22.88, "learning_rate": 4.09748743718593e-06, "loss": 0.0007, "step": 5925 }, { "epoch": 22.97, "learning_rate": 4.0723618090452265e-06, "loss": 0.0013, "step": 5950 }, { "epoch": 23.07, "learning_rate": 4.047236180904523e-06, "loss": 0.0008, "step": 5975 }, { "epoch": 23.17, "learning_rate": 4.02211055276382e-06, "loss": 0.0007, "step": 6000 }, { "epoch": 23.17, "eval_loss": 0.8414955735206604, "eval_runtime": 1746.5835, "eval_samples_per_second": 4.95, "eval_steps_per_second": 0.495, "eval_wer": 46.61407947611252, "step": 6000 }, { "epoch": 23.26, "learning_rate": 3.997989949748744e-06, "loss": 0.0004, "step": 6025 }, { "epoch": 23.36, "learning_rate": 3.97286432160804e-06, "loss": 0.0004, "step": 6050 }, { "epoch": 23.46, "learning_rate": 3.947738693467337e-06, "loss": 0.0006, "step": 6075 }, { "epoch": 23.55, "learning_rate": 3.9226130653266335e-06, "loss": 0.0003, "step": 6100 }, { "epoch": 23.55, "eval_loss": 0.8283448815345764, "eval_runtime": 1775.2653, "eval_samples_per_second": 4.87, "eval_steps_per_second": 0.487, "eval_wer": 46.32633824477848, "step": 6100 }, { "epoch": 23.65, "learning_rate": 3.89748743718593e-06, "loss": 0.0003, "step": 6125 }, { "epoch": 23.75, "learning_rate": 3.872361809045227e-06, "loss": 0.0011, "step": 6150 }, { "epoch": 23.84, "learning_rate": 3.8472361809045225e-06, "loss": 0.0003, "step": 6175 }, { "epoch": 23.94, "learning_rate": 3.822110552763819e-06, "loss": 0.0005, "step": 6200 }, { "epoch": 23.94, "eval_loss": 0.8341825604438782, "eval_runtime": 1685.2846, "eval_samples_per_second": 5.13, "eval_steps_per_second": 0.513, "eval_wer": 45.965834862992175, "step": 6200 }, { "epoch": 24.03, "learning_rate": 3.796984924623116e-06, "loss": 0.0003, "step": 6225 }, { "epoch": 24.13, "learning_rate": 3.7718592964824124e-06, "loss": 0.0008, "step": 6250 }, { "epoch": 24.23, "learning_rate": 3.746733668341709e-06, "loss": 0.0003, "step": 6275 }, { "epoch": 24.32, "learning_rate": 3.721608040201005e-06, "loss": 0.0002, "step": 6300 }, { "epoch": 24.32, "eval_loss": 0.8378849029541016, "eval_runtime": 1806.9028, "eval_samples_per_second": 4.785, "eval_steps_per_second": 0.479, "eval_wer": 46.624001587537826, "step": 6300 }, { "epoch": 24.42, "learning_rate": 3.6964824120603014e-06, "loss": 0.0002, "step": 6325 }, { "epoch": 24.52, "learning_rate": 3.6713567839195984e-06, "loss": 0.0002, "step": 6350 }, { "epoch": 24.61, "learning_rate": 3.646231155778895e-06, "loss": 0.0004, "step": 6375 }, { "epoch": 24.71, "learning_rate": 3.6211055276381912e-06, "loss": 0.0005, "step": 6400 }, { "epoch": 24.71, "eval_loss": 0.8371052742004395, "eval_runtime": 1889.3529, "eval_samples_per_second": 4.576, "eval_steps_per_second": 0.458, "eval_wer": 48.080898281821035, "step": 6400 }, { "epoch": 24.81, "learning_rate": 3.5959798994974874e-06, "loss": 0.0005, "step": 6425 }, { "epoch": 24.9, "learning_rate": 3.570854271356784e-06, "loss": 0.0005, "step": 6450 }, { "epoch": 25.0, "learning_rate": 3.545728643216081e-06, "loss": 0.0002, "step": 6475 }, { "epoch": 25.1, "learning_rate": 3.5206030150753773e-06, "loss": 0.0002, "step": 6500 }, { "epoch": 25.1, "eval_loss": 0.8257761597633362, "eval_runtime": 1907.5906, "eval_samples_per_second": 4.532, "eval_steps_per_second": 0.453, "eval_wer": 47.586446395793025, "step": 6500 }, { "epoch": 25.19, "learning_rate": 3.4954773869346735e-06, "loss": 0.0003, "step": 6525 }, { "epoch": 25.29, "learning_rate": 3.47035175879397e-06, "loss": 0.0002, "step": 6550 }, { "epoch": 25.39, "learning_rate": 3.4452261306532663e-06, "loss": 0.0001, "step": 6575 }, { "epoch": 25.48, "learning_rate": 3.4201005025125634e-06, "loss": 0.0001, "step": 6600 }, { "epoch": 25.48, "eval_loss": 0.8396378755569458, "eval_runtime": 1829.8555, "eval_samples_per_second": 4.725, "eval_steps_per_second": 0.473, "eval_wer": 47.260670403995306, "step": 6600 }, { "epoch": 25.58, "learning_rate": 3.3949748743718596e-06, "loss": 0.0001, "step": 6625 }, { "epoch": 25.68, "learning_rate": 3.369849246231156e-06, "loss": 0.0003, "step": 6650 }, { "epoch": 25.77, "learning_rate": 3.3447236180904524e-06, "loss": 0.0001, "step": 6675 }, { "epoch": 25.87, "learning_rate": 3.319597989949749e-06, "loss": 0.0002, "step": 6700 }, { "epoch": 25.87, "eval_loss": 0.8490523099899292, "eval_runtime": 1855.9322, "eval_samples_per_second": 4.659, "eval_steps_per_second": 0.466, "eval_wer": 47.543450579616675, "step": 6700 }, { "epoch": 25.97, "learning_rate": 3.2944723618090456e-06, "loss": 0.0002, "step": 6725 }, { "epoch": 26.06, "learning_rate": 3.2693467336683422e-06, "loss": 0.0001, "step": 6750 }, { "epoch": 26.16, "learning_rate": 3.2442211055276384e-06, "loss": 0.0001, "step": 6775 }, { "epoch": 26.25, "learning_rate": 3.219095477386935e-06, "loss": 0.0005, "step": 6800 }, { "epoch": 26.25, "eval_loss": 0.8443611860275269, "eval_runtime": 1852.0247, "eval_samples_per_second": 4.668, "eval_steps_per_second": 0.467, "eval_wer": 48.99373253294968, "step": 6800 }, { "epoch": 26.35, "learning_rate": 3.1939698492462312e-06, "loss": 0.0001, "step": 6825 }, { "epoch": 26.45, "learning_rate": 3.1688442211055283e-06, "loss": 0.0001, "step": 6850 }, { "epoch": 26.54, "learning_rate": 3.1437185929648245e-06, "loss": 0.0001, "step": 6875 }, { "epoch": 26.64, "learning_rate": 3.1185929648241207e-06, "loss": 0.0001, "step": 6900 }, { "epoch": 26.64, "eval_loss": 0.8540186882019043, "eval_runtime": 1842.737, "eval_samples_per_second": 4.692, "eval_steps_per_second": 0.469, "eval_wer": 48.05443931802021, "step": 6900 }, { "epoch": 26.74, "learning_rate": 3.0934673366834173e-06, "loss": 0.0001, "step": 6925 }, { "epoch": 26.83, "learning_rate": 3.0683417085427135e-06, "loss": 0.0001, "step": 6950 }, { "epoch": 26.93, "learning_rate": 3.0432160804020105e-06, "loss": 0.0002, "step": 6975 }, { "epoch": 27.03, "learning_rate": 3.0180904522613067e-06, "loss": 0.0001, "step": 7000 }, { "epoch": 27.03, "eval_loss": 0.8605034947395325, "eval_runtime": 1849.0664, "eval_samples_per_second": 4.676, "eval_steps_per_second": 0.468, "eval_wer": 48.53896909262291, "step": 7000 }, { "epoch": 27.12, "learning_rate": 2.9929648241206034e-06, "loss": 0.0002, "step": 7025 }, { "epoch": 27.22, "learning_rate": 2.9678391959798996e-06, "loss": 0.0001, "step": 7050 }, { "epoch": 27.32, "learning_rate": 2.942713567839196e-06, "loss": 0.0001, "step": 7075 }, { "epoch": 27.41, "learning_rate": 2.917587939698493e-06, "loss": 0.0001, "step": 7100 }, { "epoch": 27.41, "eval_loss": 0.8613005876541138, "eval_runtime": 1885.8486, "eval_samples_per_second": 4.585, "eval_steps_per_second": 0.459, "eval_wer": 48.92262406773495, "step": 7100 }, { "epoch": 27.51, "learning_rate": 2.8924623115577894e-06, "loss": 0.0001, "step": 7125 }, { "epoch": 27.61, "learning_rate": 2.8673366834170856e-06, "loss": 0.0001, "step": 7150 }, { "epoch": 27.7, "learning_rate": 2.8422110552763822e-06, "loss": 0.0003, "step": 7175 }, { "epoch": 27.8, "learning_rate": 2.8170854271356784e-06, "loss": 0.0001, "step": 7200 }, { "epoch": 27.8, "eval_loss": 0.8672710061073303, "eval_runtime": 1858.2034, "eval_samples_per_second": 4.653, "eval_steps_per_second": 0.466, "eval_wer": 48.94908303153578, "step": 7200 }, { "epoch": 27.9, "learning_rate": 2.7919597989949755e-06, "loss": 0.0001, "step": 7225 }, { "epoch": 27.99, "learning_rate": 2.7668341708542717e-06, "loss": 0.0001, "step": 7250 }, { "epoch": 28.09, "learning_rate": 2.7417085427135683e-06, "loss": 0.0001, "step": 7275 }, { "epoch": 28.19, "learning_rate": 2.7165829145728645e-06, "loss": 0.0001, "step": 7300 }, { "epoch": 28.19, "eval_loss": 0.8688055872917175, "eval_runtime": 1883.3395, "eval_samples_per_second": 4.591, "eval_steps_per_second": 0.459, "eval_wer": 48.7936366192059, "step": 7300 }, { "epoch": 28.28, "learning_rate": 2.6914572864321607e-06, "loss": 0.0002, "step": 7325 }, { "epoch": 28.38, "learning_rate": 2.6663316582914573e-06, "loss": 0.0001, "step": 7350 }, { "epoch": 28.47, "learning_rate": 2.6412060301507544e-06, "loss": 0.0001, "step": 7375 }, { "epoch": 28.57, "learning_rate": 2.6160804020100506e-06, "loss": 0.0001, "step": 7400 }, { "epoch": 28.57, "eval_loss": 0.8710694313049316, "eval_runtime": 1878.6911, "eval_samples_per_second": 4.602, "eval_steps_per_second": 0.46, "eval_wer": 48.8349787501447, "step": 7400 }, { "epoch": 28.67, "learning_rate": 2.5909547738693468e-06, "loss": 0.0001, "step": 7425 }, { "epoch": 28.76, "learning_rate": 2.5658291457286434e-06, "loss": 0.0001, "step": 7450 }, { "epoch": 28.86, "learning_rate": 2.5407035175879396e-06, "loss": 0.0001, "step": 7475 }, { "epoch": 28.96, "learning_rate": 2.5155778894472366e-06, "loss": 0.0001, "step": 7500 }, { "epoch": 28.96, "eval_loss": 0.872825026512146, "eval_runtime": 1901.4507, "eval_samples_per_second": 4.547, "eval_steps_per_second": 0.455, "eval_wer": 48.85813034347042, "step": 7500 }, { "epoch": 29.05, "learning_rate": 2.490452261306533e-06, "loss": 0.0001, "step": 7525 }, { "epoch": 29.15, "learning_rate": 2.4653266331658294e-06, "loss": 0.0002, "step": 7550 }, { "epoch": 29.25, "learning_rate": 2.4402010050251256e-06, "loss": 0.0001, "step": 7575 }, { "epoch": 29.34, "learning_rate": 2.4150753768844223e-06, "loss": 0.0001, "step": 7600 }, { "epoch": 29.34, "eval_loss": 0.8735654354095459, "eval_runtime": 1920.4668, "eval_samples_per_second": 4.502, "eval_steps_per_second": 0.45, "eval_wer": 49.8453804302889, "step": 7600 }, { "epoch": 29.44, "learning_rate": 2.389949748743719e-06, "loss": 0.0001, "step": 7625 }, { "epoch": 29.54, "learning_rate": 2.3648241206030155e-06, "loss": 0.0001, "step": 7650 }, { "epoch": 29.63, "learning_rate": 2.3396984924623117e-06, "loss": 0.0001, "step": 7675 }, { "epoch": 29.73, "learning_rate": 2.314572864321608e-06, "loss": 0.0001, "step": 7700 }, { "epoch": 29.73, "eval_loss": 0.8759255409240723, "eval_runtime": 1934.3216, "eval_samples_per_second": 4.47, "eval_steps_per_second": 0.447, "eval_wer": 49.92475732169139, "step": 7700 }, { "epoch": 29.83, "learning_rate": 2.289447236180905e-06, "loss": 0.0001, "step": 7725 }, { "epoch": 29.92, "learning_rate": 2.264321608040201e-06, "loss": 0.0001, "step": 7750 }, { "epoch": 30.02, "learning_rate": 2.2391959798994978e-06, "loss": 0.0001, "step": 7775 }, { "epoch": 30.12, "learning_rate": 2.214070351758794e-06, "loss": 0.0001, "step": 7800 }, { "epoch": 30.12, "eval_loss": 0.8785723447799683, "eval_runtime": 1950.1663, "eval_samples_per_second": 4.433, "eval_steps_per_second": 0.444, "eval_wer": 49.693241388434124, "step": 7800 }, { "epoch": 30.21, "learning_rate": 2.1889447236180906e-06, "loss": 0.0001, "step": 7825 }, { "epoch": 30.31, "learning_rate": 2.163819095477387e-06, "loss": 0.0001, "step": 7850 }, { "epoch": 30.41, "learning_rate": 2.1386934673366834e-06, "loss": 0.0001, "step": 7875 }, { "epoch": 30.5, "learning_rate": 2.11356783919598e-06, "loss": 0.0001, "step": 7900 }, { "epoch": 30.5, "eval_loss": 0.8809360265731812, "eval_runtime": 1948.9202, "eval_samples_per_second": 4.436, "eval_steps_per_second": 0.444, "eval_wer": 49.74285194556069, "step": 7900 }, { "epoch": 30.6, "learning_rate": 2.0884422110552766e-06, "loss": 0.0001, "step": 7925 }, { "epoch": 30.69, "learning_rate": 2.063316582914573e-06, "loss": 0.0001, "step": 7950 }, { "epoch": 30.79, "learning_rate": 2.0381909547738695e-06, "loss": 0.0001, "step": 7975 }, { "epoch": 30.89, "learning_rate": 2.013065326633166e-06, "loss": 0.0001, "step": 8000 }, { "epoch": 30.89, "eval_loss": 0.8825691342353821, "eval_runtime": 1955.4266, "eval_samples_per_second": 4.422, "eval_steps_per_second": 0.442, "eval_wer": 49.91318152502853, "step": 8000 }, { "epoch": 30.98, "learning_rate": 1.9879396984924627e-06, "loss": 0.0001, "step": 8025 }, { "epoch": 31.08, "learning_rate": 1.962814070351759e-06, "loss": 0.0002, "step": 8050 }, { "epoch": 31.18, "learning_rate": 1.9376884422110555e-06, "loss": 0.0001, "step": 8075 }, { "epoch": 31.27, "learning_rate": 1.912562814070352e-06, "loss": 0.0001, "step": 8100 }, { "epoch": 31.27, "eval_loss": 0.8839845657348633, "eval_runtime": 1965.0139, "eval_samples_per_second": 4.4, "eval_steps_per_second": 0.44, "eval_wer": 50.45062922723289, "step": 8100 }, { "epoch": 31.37, "learning_rate": 1.8874371859296483e-06, "loss": 0.0001, "step": 8125 }, { "epoch": 31.47, "learning_rate": 1.862311557788945e-06, "loss": 0.0001, "step": 8150 }, { "epoch": 31.56, "learning_rate": 1.8371859296482414e-06, "loss": 0.0001, "step": 8175 }, { "epoch": 31.66, "learning_rate": 1.8120603015075378e-06, "loss": 0.0001, "step": 8200 }, { "epoch": 31.66, "eval_loss": 0.8858728408813477, "eval_runtime": 1964.1317, "eval_samples_per_second": 4.402, "eval_steps_per_second": 0.44, "eval_wer": 50.2918754444279, "step": 8200 }, { "epoch": 31.76, "learning_rate": 1.7869346733668344e-06, "loss": 0.0001, "step": 8225 }, { "epoch": 31.85, "learning_rate": 1.7618090452261308e-06, "loss": 0.0001, "step": 8250 }, { "epoch": 31.95, "learning_rate": 1.7366834170854272e-06, "loss": 0.0001, "step": 8275 }, { "epoch": 32.05, "learning_rate": 1.7115577889447238e-06, "loss": 0.0001, "step": 8300 }, { "epoch": 32.05, "eval_loss": 0.8887734413146973, "eval_runtime": 1974.3769, "eval_samples_per_second": 4.379, "eval_steps_per_second": 0.438, "eval_wer": 50.553157711961106, "step": 8300 }, { "epoch": 32.14, "learning_rate": 1.6864321608040202e-06, "loss": 0.0001, "step": 8325 }, { "epoch": 32.24, "learning_rate": 1.6613065326633169e-06, "loss": 0.0001, "step": 8350 }, { "epoch": 32.34, "learning_rate": 1.6361809045226133e-06, "loss": 0.0001, "step": 8375 }, { "epoch": 32.43, "learning_rate": 1.6110552763819095e-06, "loss": 0.0001, "step": 8400 }, { "epoch": 32.43, "eval_loss": 0.8924394845962524, "eval_runtime": 1954.9726, "eval_samples_per_second": 4.423, "eval_steps_per_second": 0.442, "eval_wer": 50.64907145573911, "step": 8400 }, { "epoch": 32.53, "learning_rate": 1.5859296482412063e-06, "loss": 0.0001, "step": 8425 }, { "epoch": 32.63, "learning_rate": 1.5608040201005025e-06, "loss": 0.0001, "step": 8450 }, { "epoch": 32.72, "learning_rate": 1.5356783919597993e-06, "loss": 0.0001, "step": 8475 }, { "epoch": 32.82, "learning_rate": 1.5105527638190955e-06, "loss": 0.0001, "step": 8500 }, { "epoch": 32.82, "eval_loss": 0.8927690982818604, "eval_runtime": 1969.9296, "eval_samples_per_second": 4.389, "eval_steps_per_second": 0.439, "eval_wer": 50.99965272610011, "step": 8500 }, { "epoch": 32.92, "learning_rate": 1.485427135678392e-06, "loss": 0.0001, "step": 8525 }, { "epoch": 33.01, "learning_rate": 1.4603015075376886e-06, "loss": 0.0001, "step": 8550 }, { "epoch": 33.11, "learning_rate": 1.435175879396985e-06, "loss": 0.0001, "step": 8575 }, { "epoch": 33.2, "learning_rate": 1.4100502512562816e-06, "loss": 0.0001, "step": 8600 }, { "epoch": 33.2, "eval_loss": 0.8920454382896423, "eval_runtime": 1993.7139, "eval_samples_per_second": 4.337, "eval_steps_per_second": 0.434, "eval_wer": 51.31881397694763, "step": 8600 }, { "epoch": 33.3, "learning_rate": 1.384924623115578e-06, "loss": 0.0001, "step": 8625 }, { "epoch": 33.4, "learning_rate": 1.3597989949748744e-06, "loss": 0.0001, "step": 8650 }, { "epoch": 33.49, "learning_rate": 1.334673366834171e-06, "loss": 0.0001, "step": 8675 }, { "epoch": 33.59, "learning_rate": 1.3095477386934674e-06, "loss": 0.0001, "step": 8700 }, { "epoch": 33.59, "eval_loss": 0.8945680856704712, "eval_runtime": 1991.4509, "eval_samples_per_second": 4.342, "eval_steps_per_second": 0.434, "eval_wer": 51.14186965652958, "step": 8700 }, { "epoch": 33.69, "learning_rate": 1.284422110552764e-06, "loss": 0.0001, "step": 8725 }, { "epoch": 33.78, "learning_rate": 1.2592964824120605e-06, "loss": 0.0001, "step": 8750 }, { "epoch": 33.88, "learning_rate": 1.2341708542713569e-06, "loss": 0.0001, "step": 8775 }, { "epoch": 33.98, "learning_rate": 1.2090452261306533e-06, "loss": 0.0001, "step": 8800 }, { "epoch": 33.98, "eval_loss": 0.8956067562103271, "eval_runtime": 1992.4579, "eval_samples_per_second": 4.339, "eval_steps_per_second": 0.434, "eval_wer": 51.155099138429996, "step": 8800 }, { "epoch": 34.07, "learning_rate": 1.18391959798995e-06, "loss": 0.0001, "step": 8825 }, { "epoch": 34.17, "learning_rate": 1.1587939698492463e-06, "loss": 0.0001, "step": 8850 }, { "epoch": 34.27, "learning_rate": 1.133668341708543e-06, "loss": 0.0001, "step": 8875 }, { "epoch": 34.36, "learning_rate": 1.1085427135678393e-06, "loss": 0.0001, "step": 8900 }, { "epoch": 34.36, "eval_loss": 0.8987666368484497, "eval_runtime": 1982.6531, "eval_samples_per_second": 4.361, "eval_steps_per_second": 0.436, "eval_wer": 50.74829256999222, "step": 8900 }, { "epoch": 34.46, "learning_rate": 1.0834170854271357e-06, "loss": 0.0001, "step": 8925 }, { "epoch": 34.56, "learning_rate": 1.0582914572864322e-06, "loss": 0.0001, "step": 8950 }, { "epoch": 34.65, "learning_rate": 1.0331658291457288e-06, "loss": 0.0001, "step": 8975 }, { "epoch": 34.75, "learning_rate": 1.0080402010050252e-06, "loss": 0.0001, "step": 9000 }, { "epoch": 34.75, "eval_loss": 0.9003340601921082, "eval_runtime": 1982.3624, "eval_samples_per_second": 4.361, "eval_steps_per_second": 0.436, "eval_wer": 50.888855815184144, "step": 9000 }, { "epoch": 34.85, "learning_rate": 9.829145728643216e-07, "loss": 0.0001, "step": 9025 }, { "epoch": 34.94, "learning_rate": 9.577889447236182e-07, "loss": 0.0001, "step": 9050 }, { "epoch": 35.04, "learning_rate": 9.326633165829146e-07, "loss": 0.0001, "step": 9075 }, { "epoch": 35.14, "learning_rate": 9.075376884422111e-07, "loss": 0.0001, "step": 9100 }, { "epoch": 35.14, "eval_loss": 0.9010794162750244, "eval_runtime": 1996.3748, "eval_samples_per_second": 4.331, "eval_steps_per_second": 0.433, "eval_wer": 50.93019794612294, "step": 9100 }, { "epoch": 35.23, "learning_rate": 8.824120603015077e-07, "loss": 0.0001, "step": 9125 }, { "epoch": 35.33, "learning_rate": 8.572864321608041e-07, "loss": 0.0001, "step": 9150 }, { "epoch": 35.42, "learning_rate": 8.321608040201006e-07, "loss": 0.0001, "step": 9175 }, { "epoch": 35.52, "learning_rate": 8.070351758793971e-07, "loss": 0.0001, "step": 9200 }, { "epoch": 35.52, "eval_loss": 0.9019636511802673, "eval_runtime": 1992.9594, "eval_samples_per_second": 4.338, "eval_steps_per_second": 0.434, "eval_wer": 50.953349539448666, "step": 9200 }, { "epoch": 35.62, "learning_rate": 7.819095477386936e-07, "loss": 0.0001, "step": 9225 }, { "epoch": 35.71, "learning_rate": 7.567839195979901e-07, "loss": 0.0001, "step": 9250 }, { "epoch": 35.81, "learning_rate": 7.316582914572864e-07, "loss": 0.0001, "step": 9275 }, { "epoch": 35.91, "learning_rate": 7.065326633165829e-07, "loss": 0.0001, "step": 9300 }, { "epoch": 35.91, "eval_loss": 0.901878297328949, "eval_runtime": 1999.423, "eval_samples_per_second": 4.324, "eval_steps_per_second": 0.433, "eval_wer": 51.560252021630205, "step": 9300 }, { "epoch": 36.0, "learning_rate": 6.814070351758795e-07, "loss": 0.0001, "step": 9325 }, { "epoch": 36.1, "learning_rate": 6.56281407035176e-07, "loss": 0.0001, "step": 9350 }, { "epoch": 36.2, "learning_rate": 6.311557788944724e-07, "loss": 0.0001, "step": 9375 }, { "epoch": 36.29, "learning_rate": 6.060301507537689e-07, "loss": 0.0001, "step": 9400 }, { "epoch": 36.29, "eval_loss": 0.9032866358757019, "eval_runtime": 2014.4202, "eval_samples_per_second": 4.292, "eval_steps_per_second": 0.429, "eval_wer": 51.64789733922045, "step": 9400 }, { "epoch": 36.39, "learning_rate": 5.809045226130654e-07, "loss": 0.0001, "step": 9425 }, { "epoch": 36.49, "learning_rate": 5.557788944723619e-07, "loss": 0.0001, "step": 9450 }, { "epoch": 36.58, "learning_rate": 5.306532663316583e-07, "loss": 0.0001, "step": 9475 }, { "epoch": 36.68, "learning_rate": 5.055276381909549e-07, "loss": 0.0001, "step": 9500 }, { "epoch": 36.68, "eval_loss": 0.9039894938468933, "eval_runtime": 2029.2995, "eval_samples_per_second": 4.261, "eval_steps_per_second": 0.426, "eval_wer": 51.68097104397149, "step": 9500 }, { "epoch": 36.78, "learning_rate": 4.804020100502513e-07, "loss": 0.0001, "step": 9525 }, { "epoch": 36.87, "learning_rate": 4.552763819095478e-07, "loss": 0.0001, "step": 9550 }, { "epoch": 36.97, "learning_rate": 4.3015075376884424e-07, "loss": 0.0001, "step": 9575 }, { "epoch": 37.07, "learning_rate": 4.0502512562814075e-07, "loss": 0.0001, "step": 9600 }, { "epoch": 37.07, "eval_loss": 0.9048639535903931, "eval_runtime": 2059.954, "eval_samples_per_second": 4.197, "eval_steps_per_second": 0.42, "eval_wer": 51.674356303021284, "step": 9600 }, { "epoch": 37.16, "learning_rate": 3.7989949748743727e-07, "loss": 0.0001, "step": 9625 }, { "epoch": 37.26, "learning_rate": 3.547738693467337e-07, "loss": 0.0001, "step": 9650 }, { "epoch": 37.36, "learning_rate": 3.296482412060302e-07, "loss": 0.0001, "step": 9675 }, { "epoch": 37.45, "learning_rate": 3.0452261306532665e-07, "loss": 0.0001, "step": 9700 }, { "epoch": 37.45, "eval_loss": 0.905308187007904, "eval_runtime": 1999.2162, "eval_samples_per_second": 4.325, "eval_steps_per_second": 0.433, "eval_wer": 51.6429362835078, "step": 9700 }, { "epoch": 37.55, "learning_rate": 2.7939698492462317e-07, "loss": 0.0001, "step": 9725 }, { "epoch": 37.64, "learning_rate": 2.5427135678391963e-07, "loss": 0.0001, "step": 9750 }, { "epoch": 37.74, "learning_rate": 2.291457286432161e-07, "loss": 0.0001, "step": 9775 }, { "epoch": 37.84, "learning_rate": 2.0402010050251258e-07, "loss": 0.0001, "step": 9800 }, { "epoch": 37.84, "eval_loss": 0.9057276248931885, "eval_runtime": 2081.4562, "eval_samples_per_second": 4.154, "eval_steps_per_second": 0.416, "eval_wer": 51.59663309685635, "step": 9800 }, { "epoch": 37.93, "learning_rate": 1.7889447236180904e-07, "loss": 0.0, "step": 9825 }, { "epoch": 38.03, "learning_rate": 1.5376884422110556e-07, "loss": 0.0001, "step": 9850 }, { "epoch": 38.13, "learning_rate": 1.2864321608040202e-07, "loss": 0.0001, "step": 9875 }, { "epoch": 38.22, "learning_rate": 1.035175879396985e-07, "loss": 0.0001, "step": 9900 }, { "epoch": 38.22, "eval_loss": 0.9060160517692566, "eval_runtime": 2006.0349, "eval_samples_per_second": 4.31, "eval_steps_per_second": 0.431, "eval_wer": 51.73719634204825, "step": 9900 } ], "logging_steps": 25, "max_steps": 10000, "num_train_epochs": 39, "save_steps": 100, "total_flos": 1.599369147113472e+20, "trial_name": null, "trial_params": null }