{ "best_metric": 0.5550447702407837, "best_model_checkpoint": "ai-light-dance_drums_ft_pretrain_wav2vec2-base-new-v3/checkpoint-1665", "epoch": 100.0, "global_step": 4500, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.22, "learning_rate": 1e-05, "loss": 0.2149, "step": 10 }, { "epoch": 0.44, "learning_rate": 2e-05, "loss": 0.2628, "step": 20 }, { "epoch": 0.67, "learning_rate": 3e-05, "loss": 0.2398, "step": 30 }, { "epoch": 0.89, "learning_rate": 4e-05, "loss": 0.1747, "step": 40 }, { "epoch": 1.0, "eval_loss": 0.5638056397438049, "eval_runtime": 2.4228, "eval_samples_per_second": 7.017, "eval_steps_per_second": 3.715, "eval_wer": 0.33373063170441003, "step": 45 }, { "epoch": 1.11, "learning_rate": 5e-05, "loss": 0.2076, "step": 50 }, { "epoch": 1.33, "learning_rate": 6e-05, "loss": 0.2309, "step": 60 }, { "epoch": 1.56, "learning_rate": 7e-05, "loss": 0.24, "step": 70 }, { "epoch": 1.78, "learning_rate": 8e-05, "loss": 0.2666, "step": 80 }, { "epoch": 2.0, "learning_rate": 9e-05, "loss": 0.2339, "step": 90 }, { "epoch": 2.0, "eval_loss": 0.5784714818000793, "eval_runtime": 2.5397, "eval_samples_per_second": 6.694, "eval_steps_per_second": 3.544, "eval_wer": 0.3253873659117998, "step": 90 }, { "epoch": 2.22, "learning_rate": 9.900000000000001e-05, "loss": 0.2321, "step": 100 }, { "epoch": 2.44, "learning_rate": 9.979545454545454e-05, "loss": 0.2695, "step": 110 }, { "epoch": 2.67, "learning_rate": 9.956818181818183e-05, "loss": 0.2069, "step": 120 }, { "epoch": 2.89, "learning_rate": 9.93409090909091e-05, "loss": 0.2849, "step": 130 }, { "epoch": 3.0, "eval_loss": 0.5586056709289551, "eval_runtime": 2.5587, "eval_samples_per_second": 6.644, "eval_steps_per_second": 3.517, "eval_wer": 0.3396901072705602, "step": 135 }, { "epoch": 3.11, "learning_rate": 9.911363636363636e-05, "loss": 0.2394, "step": 140 }, { "epoch": 3.33, "learning_rate": 9.888636363636364e-05, "loss": 0.2421, "step": 150 }, { "epoch": 3.56, "learning_rate": 9.865909090909092e-05, "loss": 0.3409, "step": 160 }, { "epoch": 3.78, "learning_rate": 9.843181818181819e-05, "loss": 0.2621, "step": 170 }, { "epoch": 4.0, "learning_rate": 9.820454545454546e-05, "loss": 0.2396, "step": 180 }, { "epoch": 4.0, "eval_loss": 0.5868120789527893, "eval_runtime": 2.5527, "eval_samples_per_second": 6.66, "eval_steps_per_second": 3.526, "eval_wer": 0.3265792610250298, "step": 180 }, { "epoch": 4.22, "learning_rate": 9.797727272727273e-05, "loss": 0.2449, "step": 190 }, { "epoch": 4.44, "learning_rate": 9.775e-05, "loss": 0.271, "step": 200 }, { "epoch": 4.67, "learning_rate": 9.752272727272728e-05, "loss": 0.2343, "step": 210 }, { "epoch": 4.89, "learning_rate": 9.729545454545455e-05, "loss": 0.2272, "step": 220 }, { "epoch": 5.0, "eval_loss": 0.6052439212799072, "eval_runtime": 2.5975, "eval_samples_per_second": 6.545, "eval_steps_per_second": 3.465, "eval_wer": 0.3230035756853397, "step": 225 }, { "epoch": 5.11, "learning_rate": 9.70909090909091e-05, "loss": 0.2344, "step": 230 }, { "epoch": 5.33, "learning_rate": 9.686363636363637e-05, "loss": 0.2515, "step": 240 }, { "epoch": 5.56, "learning_rate": 9.663636363636363e-05, "loss": 0.2331, "step": 250 }, { "epoch": 5.78, "learning_rate": 9.640909090909092e-05, "loss": 0.2434, "step": 260 }, { "epoch": 6.0, "learning_rate": 9.618181818181819e-05, "loss": 0.2497, "step": 270 }, { "epoch": 6.0, "eval_loss": 0.5912988781929016, "eval_runtime": 2.5744, "eval_samples_per_second": 6.604, "eval_steps_per_second": 3.496, "eval_wer": 0.32777115613825986, "step": 270 }, { "epoch": 6.22, "learning_rate": 9.595454545454546e-05, "loss": 0.2195, "step": 280 }, { "epoch": 6.44, "learning_rate": 9.572727272727273e-05, "loss": 0.2656, "step": 290 }, { "epoch": 6.67, "learning_rate": 9.55e-05, "loss": 0.2641, "step": 300 }, { "epoch": 6.89, "learning_rate": 9.527272727272728e-05, "loss": 0.2218, "step": 310 }, { "epoch": 7.0, "eval_loss": 0.5925901532173157, "eval_runtime": 2.5865, "eval_samples_per_second": 6.572, "eval_steps_per_second": 3.48, "eval_wer": 0.33492252681764006, "step": 315 }, { "epoch": 7.11, "learning_rate": 9.504545454545455e-05, "loss": 0.2357, "step": 320 }, { "epoch": 7.33, "learning_rate": 9.481818181818183e-05, "loss": 0.2061, "step": 330 }, { "epoch": 7.56, "learning_rate": 9.459090909090909e-05, "loss": 0.279, "step": 340 }, { "epoch": 7.78, "learning_rate": 9.436363636363636e-05, "loss": 0.2628, "step": 350 }, { "epoch": 8.0, "learning_rate": 9.413636363636365e-05, "loss": 0.2584, "step": 360 }, { "epoch": 8.0, "eval_loss": 0.5617051720619202, "eval_runtime": 2.5692, "eval_samples_per_second": 6.617, "eval_steps_per_second": 3.503, "eval_wer": 0.3218116805721097, "step": 360 }, { "epoch": 8.22, "learning_rate": 9.390909090909091e-05, "loss": 0.2428, "step": 370 }, { "epoch": 8.44, "learning_rate": 9.368181818181818e-05, "loss": 0.2143, "step": 380 }, { "epoch": 8.67, "learning_rate": 9.345454545454547e-05, "loss": 0.249, "step": 390 }, { "epoch": 8.89, "learning_rate": 9.322727272727273e-05, "loss": 0.2741, "step": 400 }, { "epoch": 9.0, "eval_loss": 0.5901447534561157, "eval_runtime": 2.647, "eval_samples_per_second": 6.422, "eval_steps_per_second": 3.4, "eval_wer": 0.3230035756853397, "step": 405 }, { "epoch": 9.11, "learning_rate": 9.300000000000001e-05, "loss": 0.2379, "step": 410 }, { "epoch": 9.33, "learning_rate": 9.277272727272728e-05, "loss": 0.2382, "step": 420 }, { "epoch": 9.56, "learning_rate": 9.254545454545454e-05, "loss": 0.2526, "step": 430 }, { "epoch": 9.78, "learning_rate": 9.231818181818183e-05, "loss": 0.3068, "step": 440 }, { "epoch": 10.0, "learning_rate": 9.20909090909091e-05, "loss": 0.2481, "step": 450 }, { "epoch": 10.0, "eval_loss": 0.5860414505004883, "eval_runtime": 2.4994, "eval_samples_per_second": 6.802, "eval_steps_per_second": 3.601, "eval_wer": 0.32777115613825986, "step": 450 }, { "epoch": 10.22, "learning_rate": 9.186363636363636e-05, "loss": 0.2483, "step": 460 }, { "epoch": 10.44, "learning_rate": 9.163636363636364e-05, "loss": 0.2183, "step": 470 }, { "epoch": 10.67, "learning_rate": 9.140909090909092e-05, "loss": 0.2119, "step": 480 }, { "epoch": 10.89, "learning_rate": 9.118181818181819e-05, "loss": 0.2504, "step": 490 }, { "epoch": 11.0, "eval_loss": 0.5991201996803284, "eval_runtime": 2.4924, "eval_samples_per_second": 6.821, "eval_steps_per_second": 3.611, "eval_wer": 0.31227651966626935, "step": 495 }, { "epoch": 11.11, "learning_rate": 9.095454545454546e-05, "loss": 0.1884, "step": 500 }, { "epoch": 11.33, "learning_rate": 9.072727272727273e-05, "loss": 0.2462, "step": 510 }, { "epoch": 11.56, "learning_rate": 9.05e-05, "loss": 0.2704, "step": 520 }, { "epoch": 11.78, "learning_rate": 9.027272727272728e-05, "loss": 0.2557, "step": 530 }, { "epoch": 12.0, "learning_rate": 9.004545454545455e-05, "loss": 0.2125, "step": 540 }, { "epoch": 12.0, "eval_loss": 0.5991844534873962, "eval_runtime": 2.5722, "eval_samples_per_second": 6.609, "eval_steps_per_second": 3.499, "eval_wer": 0.3218116805721097, "step": 540 }, { "epoch": 12.22, "learning_rate": 8.981818181818182e-05, "loss": 0.2385, "step": 550 }, { "epoch": 12.44, "learning_rate": 8.959090909090909e-05, "loss": 0.2087, "step": 560 }, { "epoch": 12.67, "learning_rate": 8.936363636363636e-05, "loss": 0.1979, "step": 570 }, { "epoch": 12.89, "learning_rate": 8.913636363636364e-05, "loss": 0.2482, "step": 580 }, { "epoch": 13.0, "eval_loss": 0.5756039023399353, "eval_runtime": 2.4594, "eval_samples_per_second": 6.912, "eval_steps_per_second": 3.659, "eval_wer": 0.31942789034564956, "step": 585 }, { "epoch": 13.11, "learning_rate": 8.890909090909091e-05, "loss": 0.2199, "step": 590 }, { "epoch": 13.33, "learning_rate": 8.86818181818182e-05, "loss": 0.2978, "step": 600 }, { "epoch": 13.56, "learning_rate": 8.845454545454545e-05, "loss": 0.2514, "step": 610 }, { "epoch": 13.78, "learning_rate": 8.822727272727274e-05, "loss": 0.2367, "step": 620 }, { "epoch": 14.0, "learning_rate": 8.800000000000001e-05, "loss": 0.2135, "step": 630 }, { "epoch": 14.0, "eval_loss": 0.5836071372032166, "eval_runtime": 2.5386, "eval_samples_per_second": 6.697, "eval_steps_per_second": 3.545, "eval_wer": 0.3301549463647199, "step": 630 }, { "epoch": 14.22, "learning_rate": 8.777272727272727e-05, "loss": 0.2302, "step": 640 }, { "epoch": 14.44, "learning_rate": 8.754545454545456e-05, "loss": 0.2274, "step": 650 }, { "epoch": 14.67, "learning_rate": 8.731818181818183e-05, "loss": 0.1999, "step": 660 }, { "epoch": 14.89, "learning_rate": 8.709090909090909e-05, "loss": 0.2345, "step": 670 }, { "epoch": 15.0, "eval_loss": 0.6346899271011353, "eval_runtime": 2.512, "eval_samples_per_second": 6.768, "eval_steps_per_second": 3.583, "eval_wer": 0.3253873659117998, "step": 675 }, { "epoch": 15.11, "learning_rate": 8.686363636363637e-05, "loss": 0.249, "step": 680 }, { "epoch": 15.33, "learning_rate": 8.663636363636364e-05, "loss": 0.2475, "step": 690 }, { "epoch": 15.56, "learning_rate": 8.640909090909092e-05, "loss": 0.2608, "step": 700 }, { "epoch": 15.78, "learning_rate": 8.618181818181819e-05, "loss": 0.2417, "step": 710 }, { "epoch": 16.0, "learning_rate": 8.595454545454546e-05, "loss": 0.1912, "step": 720 }, { "epoch": 16.0, "eval_loss": 0.6159502863883972, "eval_runtime": 2.5046, "eval_samples_per_second": 6.788, "eval_steps_per_second": 3.593, "eval_wer": 0.3206197854588796, "step": 720 }, { "epoch": 16.22, "learning_rate": 8.572727272727273e-05, "loss": 0.2042, "step": 730 }, { "epoch": 16.44, "learning_rate": 8.55e-05, "loss": 0.2584, "step": 740 }, { "epoch": 16.67, "learning_rate": 8.527272727272728e-05, "loss": 1.0367, "step": 750 }, { "epoch": 16.89, "learning_rate": 8.504545454545455e-05, "loss": 0.2117, "step": 760 }, { "epoch": 17.0, "eval_loss": 0.626762866973877, "eval_runtime": 2.5302, "eval_samples_per_second": 6.719, "eval_steps_per_second": 3.557, "eval_wer": 0.3098927294398093, "step": 765 }, { "epoch": 17.11, "learning_rate": 8.481818181818182e-05, "loss": 0.1709, "step": 770 }, { "epoch": 17.33, "learning_rate": 8.45909090909091e-05, "loss": 0.2427, "step": 780 }, { "epoch": 17.56, "learning_rate": 8.436363636363637e-05, "loss": 0.2564, "step": 790 }, { "epoch": 17.78, "learning_rate": 8.413636363636364e-05, "loss": 0.2481, "step": 800 }, { "epoch": 18.0, "learning_rate": 8.390909090909091e-05, "loss": 0.2217, "step": 810 }, { "epoch": 18.0, "eval_loss": 0.6872562766075134, "eval_runtime": 2.5217, "eval_samples_per_second": 6.741, "eval_steps_per_second": 3.569, "eval_wer": 0.3182359952324195, "step": 810 }, { "epoch": 18.22, "learning_rate": 8.368181818181818e-05, "loss": 0.3087, "step": 820 }, { "epoch": 18.44, "learning_rate": 8.345454545454547e-05, "loss": 0.1941, "step": 830 }, { "epoch": 18.67, "learning_rate": 8.322727272727273e-05, "loss": 0.2528, "step": 840 }, { "epoch": 18.89, "learning_rate": 8.3e-05, "loss": 0.2165, "step": 850 }, { "epoch": 19.0, "eval_loss": 0.6720542311668396, "eval_runtime": 2.4846, "eval_samples_per_second": 6.842, "eval_steps_per_second": 3.622, "eval_wer": 0.31585220500595945, "step": 855 }, { "epoch": 19.11, "learning_rate": 8.277272727272728e-05, "loss": 0.25, "step": 860 }, { "epoch": 19.33, "learning_rate": 8.254545454545454e-05, "loss": 0.2204, "step": 870 }, { "epoch": 19.56, "learning_rate": 8.231818181818183e-05, "loss": 0.2249, "step": 880 }, { "epoch": 19.78, "learning_rate": 8.20909090909091e-05, "loss": 0.246, "step": 890 }, { "epoch": 20.0, "learning_rate": 8.186363636363636e-05, "loss": 0.207, "step": 900 }, { "epoch": 20.0, "eval_loss": 0.6311757564544678, "eval_runtime": 2.538, "eval_samples_per_second": 6.698, "eval_steps_per_second": 3.546, "eval_wer": 0.3206197854588796, "step": 900 }, { "epoch": 20.22, "learning_rate": 8.163636363636364e-05, "loss": 0.2194, "step": 910 }, { "epoch": 20.44, "learning_rate": 8.140909090909092e-05, "loss": 0.2629, "step": 920 }, { "epoch": 20.67, "learning_rate": 8.118181818181818e-05, "loss": 0.2146, "step": 930 }, { "epoch": 20.89, "learning_rate": 8.095454545454546e-05, "loss": 0.2263, "step": 940 }, { "epoch": 21.0, "eval_loss": 0.6223281621932983, "eval_runtime": 2.4885, "eval_samples_per_second": 6.831, "eval_steps_per_second": 3.617, "eval_wer": 0.3289630512514899, "step": 945 }, { "epoch": 21.11, "learning_rate": 8.072727272727273e-05, "loss": 0.1938, "step": 950 }, { "epoch": 21.33, "learning_rate": 8.05e-05, "loss": 0.2453, "step": 960 }, { "epoch": 21.56, "learning_rate": 8.027272727272728e-05, "loss": 0.2313, "step": 970 }, { "epoch": 21.78, "learning_rate": 8.004545454545455e-05, "loss": 0.244, "step": 980 }, { "epoch": 22.0, "learning_rate": 7.981818181818182e-05, "loss": 0.2015, "step": 990 }, { "epoch": 22.0, "eval_loss": 0.6319324374198914, "eval_runtime": 2.5118, "eval_samples_per_second": 6.768, "eval_steps_per_second": 3.583, "eval_wer": 0.3182359952324195, "step": 990 }, { "epoch": 22.22, "learning_rate": 7.95909090909091e-05, "loss": 0.2187, "step": 1000 }, { "epoch": 22.44, "learning_rate": 7.936363636363637e-05, "loss": 0.23, "step": 1010 }, { "epoch": 22.67, "learning_rate": 7.913636363636364e-05, "loss": 0.2501, "step": 1020 }, { "epoch": 22.89, "learning_rate": 7.890909090909091e-05, "loss": 0.1997, "step": 1030 }, { "epoch": 23.0, "eval_loss": 0.6527409553527832, "eval_runtime": 2.4821, "eval_samples_per_second": 6.849, "eval_steps_per_second": 3.626, "eval_wer": 0.3134684147794994, "step": 1035 }, { "epoch": 23.11, "learning_rate": 7.86818181818182e-05, "loss": 0.2148, "step": 1040 }, { "epoch": 23.33, "learning_rate": 7.845454545454545e-05, "loss": 0.2292, "step": 1050 }, { "epoch": 23.56, "learning_rate": 7.822727272727273e-05, "loss": 0.1685, "step": 1060 }, { "epoch": 23.78, "learning_rate": 7.800000000000001e-05, "loss": 0.2818, "step": 1070 }, { "epoch": 24.0, "learning_rate": 7.777272727272727e-05, "loss": 0.2318, "step": 1080 }, { "epoch": 24.0, "eval_loss": 0.5986764430999756, "eval_runtime": 2.5, "eval_samples_per_second": 6.8, "eval_steps_per_second": 3.6, "eval_wer": 0.32777115613825986, "step": 1080 }, { "epoch": 24.22, "learning_rate": 7.754545454545456e-05, "loss": 0.2375, "step": 1090 }, { "epoch": 24.44, "learning_rate": 7.731818181818183e-05, "loss": 0.254, "step": 1100 }, { "epoch": 24.67, "learning_rate": 7.709090909090909e-05, "loss": 0.2489, "step": 1110 }, { "epoch": 24.89, "learning_rate": 7.686363636363637e-05, "loss": 0.2196, "step": 1120 }, { "epoch": 25.0, "eval_loss": 0.6269426941871643, "eval_runtime": 2.4962, "eval_samples_per_second": 6.81, "eval_steps_per_second": 3.606, "eval_wer": 0.32419547079856975, "step": 1125 }, { "epoch": 25.11, "learning_rate": 7.663636363636364e-05, "loss": 0.1759, "step": 1130 }, { "epoch": 25.33, "learning_rate": 7.64090909090909e-05, "loss": 0.2394, "step": 1140 }, { "epoch": 25.56, "learning_rate": 7.618181818181819e-05, "loss": 0.2462, "step": 1150 }, { "epoch": 25.78, "learning_rate": 7.595454545454546e-05, "loss": 0.2166, "step": 1160 }, { "epoch": 26.0, "learning_rate": 7.572727272727273e-05, "loss": 0.2298, "step": 1170 }, { "epoch": 26.0, "eval_loss": 0.5773761868476868, "eval_runtime": 2.5516, "eval_samples_per_second": 6.663, "eval_steps_per_second": 3.527, "eval_wer": 0.3253873659117998, "step": 1170 }, { "epoch": 26.22, "learning_rate": 7.55e-05, "loss": 0.215, "step": 1180 }, { "epoch": 26.44, "learning_rate": 7.527272727272728e-05, "loss": 0.2124, "step": 1190 }, { "epoch": 26.67, "learning_rate": 7.504545454545455e-05, "loss": 0.2298, "step": 1200 }, { "epoch": 26.89, "learning_rate": 7.481818181818182e-05, "loss": 0.2117, "step": 1210 }, { "epoch": 27.0, "eval_loss": 0.5937696099281311, "eval_runtime": 2.5092, "eval_samples_per_second": 6.775, "eval_steps_per_second": 3.587, "eval_wer": 0.30274135876042907, "step": 1215 }, { "epoch": 27.11, "learning_rate": 7.45909090909091e-05, "loss": 0.2185, "step": 1220 }, { "epoch": 27.33, "learning_rate": 7.436363636363637e-05, "loss": 0.2526, "step": 1230 }, { "epoch": 27.56, "learning_rate": 7.413636363636364e-05, "loss": 0.2263, "step": 1240 }, { "epoch": 27.78, "learning_rate": 7.390909090909091e-05, "loss": 0.2285, "step": 1250 }, { "epoch": 28.0, "learning_rate": 7.368181818181818e-05, "loss": 0.2553, "step": 1260 }, { "epoch": 28.0, "eval_loss": 0.5831002593040466, "eval_runtime": 2.5597, "eval_samples_per_second": 6.641, "eval_steps_per_second": 3.516, "eval_wer": 0.31227651966626935, "step": 1260 }, { "epoch": 28.22, "learning_rate": 7.345454545454545e-05, "loss": 0.2105, "step": 1270 }, { "epoch": 28.44, "learning_rate": 7.322727272727273e-05, "loss": 0.2412, "step": 1280 }, { "epoch": 28.67, "learning_rate": 7.3e-05, "loss": 0.215, "step": 1290 }, { "epoch": 28.89, "learning_rate": 7.277272727272728e-05, "loss": 0.226, "step": 1300 }, { "epoch": 29.0, "eval_loss": 0.6151101589202881, "eval_runtime": 2.4897, "eval_samples_per_second": 6.828, "eval_steps_per_second": 3.615, "eval_wer": 0.3098927294398093, "step": 1305 }, { "epoch": 29.11, "learning_rate": 7.254545454545454e-05, "loss": 0.2142, "step": 1310 }, { "epoch": 29.33, "learning_rate": 7.231818181818182e-05, "loss": 0.2337, "step": 1320 }, { "epoch": 29.56, "learning_rate": 7.20909090909091e-05, "loss": 0.2312, "step": 1330 }, { "epoch": 29.78, "learning_rate": 7.186363636363636e-05, "loss": 0.2473, "step": 1340 }, { "epoch": 30.0, "learning_rate": 7.163636363636363e-05, "loss": 0.1635, "step": 1350 }, { "epoch": 30.0, "eval_loss": 0.5622395873069763, "eval_runtime": 2.4788, "eval_samples_per_second": 6.858, "eval_steps_per_second": 3.631, "eval_wer": 0.3230035756853397, "step": 1350 }, { "epoch": 30.22, "learning_rate": 7.140909090909092e-05, "loss": 0.2489, "step": 1360 }, { "epoch": 30.44, "learning_rate": 7.118181818181818e-05, "loss": 0.2278, "step": 1370 }, { "epoch": 30.67, "learning_rate": 7.095454545454546e-05, "loss": 0.2083, "step": 1380 }, { "epoch": 30.89, "learning_rate": 7.075e-05, "loss": 0.5734, "step": 1390 }, { "epoch": 31.0, "eval_loss": 0.6198131442070007, "eval_runtime": 2.5498, "eval_samples_per_second": 6.667, "eval_steps_per_second": 3.53, "eval_wer": 0.29201430274135876, "step": 1395 }, { "epoch": 31.11, "learning_rate": 7.052272727272727e-05, "loss": 0.2116, "step": 1400 }, { "epoch": 31.33, "learning_rate": 7.029545454545456e-05, "loss": 0.1918, "step": 1410 }, { "epoch": 31.56, "learning_rate": 7.006818181818181e-05, "loss": 0.2533, "step": 1420 }, { "epoch": 31.78, "learning_rate": 6.984090909090909e-05, "loss": 0.2381, "step": 1430 }, { "epoch": 32.0, "learning_rate": 6.961363636363637e-05, "loss": 0.2196, "step": 1440 }, { "epoch": 32.0, "eval_loss": 0.5778882503509521, "eval_runtime": 2.5141, "eval_samples_per_second": 6.762, "eval_steps_per_second": 3.58, "eval_wer": 0.3039332538736591, "step": 1440 }, { "epoch": 32.22, "learning_rate": 6.938636363636364e-05, "loss": 0.1784, "step": 1450 }, { "epoch": 32.44, "learning_rate": 6.915909090909092e-05, "loss": 0.2171, "step": 1460 }, { "epoch": 32.67, "learning_rate": 6.893181818181819e-05, "loss": 0.2028, "step": 1470 }, { "epoch": 32.89, "learning_rate": 6.870454545454546e-05, "loss": 0.2019, "step": 1480 }, { "epoch": 33.0, "eval_loss": 0.5865838527679443, "eval_runtime": 2.5084, "eval_samples_per_second": 6.777, "eval_steps_per_second": 3.588, "eval_wer": 0.3110846245530393, "step": 1485 }, { "epoch": 33.11, "learning_rate": 6.847727272727273e-05, "loss": 0.2082, "step": 1490 }, { "epoch": 33.33, "learning_rate": 6.825e-05, "loss": 0.2251, "step": 1500 }, { "epoch": 33.56, "learning_rate": 6.802272727272728e-05, "loss": 0.3452, "step": 1510 }, { "epoch": 33.78, "learning_rate": 6.779545454545455e-05, "loss": 0.2135, "step": 1520 }, { "epoch": 34.0, "learning_rate": 6.756818181818182e-05, "loss": 0.2222, "step": 1530 }, { "epoch": 34.0, "eval_loss": 0.5556985139846802, "eval_runtime": 2.5608, "eval_samples_per_second": 6.638, "eval_steps_per_second": 3.514, "eval_wer": 0.3063170441001192, "step": 1530 }, { "epoch": 34.22, "learning_rate": 6.73409090909091e-05, "loss": 0.1691, "step": 1540 }, { "epoch": 34.44, "learning_rate": 6.711363636363637e-05, "loss": 0.1986, "step": 1550 }, { "epoch": 34.67, "learning_rate": 6.688636363636364e-05, "loss": 0.2246, "step": 1560 }, { "epoch": 34.89, "learning_rate": 6.665909090909091e-05, "loss": 0.2167, "step": 1570 }, { "epoch": 35.0, "eval_loss": 0.5739646553993225, "eval_runtime": 2.4762, "eval_samples_per_second": 6.865, "eval_steps_per_second": 3.635, "eval_wer": 0.3206197854588796, "step": 1575 }, { "epoch": 35.11, "learning_rate": 6.643181818181818e-05, "loss": 0.2261, "step": 1580 }, { "epoch": 35.33, "learning_rate": 6.620454545454545e-05, "loss": 0.1823, "step": 1590 }, { "epoch": 35.56, "learning_rate": 6.597727272727273e-05, "loss": 0.1962, "step": 1600 }, { "epoch": 35.78, "learning_rate": 6.575e-05, "loss": 0.2168, "step": 1610 }, { "epoch": 36.0, "learning_rate": 6.552272727272728e-05, "loss": 0.2011, "step": 1620 }, { "epoch": 36.0, "eval_loss": 0.5597788095474243, "eval_runtime": 2.5199, "eval_samples_per_second": 6.746, "eval_steps_per_second": 3.572, "eval_wer": 0.300357568533969, "step": 1620 }, { "epoch": 36.22, "learning_rate": 6.529545454545454e-05, "loss": 0.1985, "step": 1630 }, { "epoch": 36.44, "learning_rate": 6.506818181818182e-05, "loss": 0.2325, "step": 1640 }, { "epoch": 36.67, "learning_rate": 6.48409090909091e-05, "loss": 0.221, "step": 1650 }, { "epoch": 36.89, "learning_rate": 6.461363636363636e-05, "loss": 0.2032, "step": 1660 }, { "epoch": 37.0, "eval_loss": 0.5550447702407837, "eval_runtime": 2.4895, "eval_samples_per_second": 6.829, "eval_steps_per_second": 3.615, "eval_wer": 0.3146603098927294, "step": 1665 }, { "epoch": 37.11, "learning_rate": 6.438636363636365e-05, "loss": 0.1469, "step": 1670 }, { "epoch": 37.33, "learning_rate": 6.415909090909092e-05, "loss": 0.1909, "step": 1680 }, { "epoch": 37.56, "learning_rate": 6.393181818181818e-05, "loss": 0.2543, "step": 1690 }, { "epoch": 37.78, "learning_rate": 6.370454545454546e-05, "loss": 0.1942, "step": 1700 }, { "epoch": 38.0, "learning_rate": 6.347727272727273e-05, "loss": 0.225, "step": 1710 }, { "epoch": 38.0, "eval_loss": 0.5793956518173218, "eval_runtime": 2.5099, "eval_samples_per_second": 6.773, "eval_steps_per_second": 3.586, "eval_wer": 0.3098927294398093, "step": 1710 }, { "epoch": 38.22, "learning_rate": 6.324999999999999e-05, "loss": 0.1756, "step": 1720 }, { "epoch": 38.44, "learning_rate": 6.302272727272728e-05, "loss": 0.2029, "step": 1730 }, { "epoch": 38.67, "learning_rate": 6.279545454545455e-05, "loss": 0.2247, "step": 1740 }, { "epoch": 38.89, "learning_rate": 6.256818181818182e-05, "loss": 0.2068, "step": 1750 }, { "epoch": 39.0, "eval_loss": 0.6223248243331909, "eval_runtime": 2.4984, "eval_samples_per_second": 6.804, "eval_steps_per_second": 3.602, "eval_wer": 0.3063170441001192, "step": 1755 }, { "epoch": 39.11, "learning_rate": 6.23409090909091e-05, "loss": 0.2323, "step": 1760 }, { "epoch": 39.33, "learning_rate": 6.211363636363637e-05, "loss": 0.196, "step": 1770 }, { "epoch": 39.56, "learning_rate": 6.188636363636364e-05, "loss": 0.208, "step": 1780 }, { "epoch": 39.78, "learning_rate": 6.165909090909091e-05, "loss": 0.1877, "step": 1790 }, { "epoch": 40.0, "learning_rate": 6.143181818181818e-05, "loss": 0.2105, "step": 1800 }, { "epoch": 40.0, "eval_loss": 0.5797024965286255, "eval_runtime": 2.5499, "eval_samples_per_second": 6.667, "eval_steps_per_second": 3.53, "eval_wer": 0.3039332538736591, "step": 1800 }, { "epoch": 40.22, "learning_rate": 6.120454545454546e-05, "loss": 0.2365, "step": 1810 }, { "epoch": 40.44, "learning_rate": 6.097727272727273e-05, "loss": 0.2289, "step": 1820 }, { "epoch": 40.67, "learning_rate": 6.0750000000000006e-05, "loss": 0.2039, "step": 1830 }, { "epoch": 40.89, "learning_rate": 6.052272727272728e-05, "loss": 0.1968, "step": 1840 }, { "epoch": 41.0, "eval_loss": 0.5681240558624268, "eval_runtime": 2.5164, "eval_samples_per_second": 6.756, "eval_steps_per_second": 3.577, "eval_wer": 0.2967818831942789, "step": 1845 }, { "epoch": 41.11, "learning_rate": 6.0295454545454544e-05, "loss": 0.1896, "step": 1850 }, { "epoch": 41.33, "learning_rate": 6.006818181818182e-05, "loss": 0.2074, "step": 1860 }, { "epoch": 41.56, "learning_rate": 5.9840909090909095e-05, "loss": 0.2141, "step": 1870 }, { "epoch": 41.78, "learning_rate": 5.9613636363636374e-05, "loss": 0.2159, "step": 1880 }, { "epoch": 42.0, "learning_rate": 5.938636363636364e-05, "loss": 0.224, "step": 1890 }, { "epoch": 42.0, "eval_loss": 0.5742160677909851, "eval_runtime": 2.5274, "eval_samples_per_second": 6.726, "eval_steps_per_second": 3.561, "eval_wer": 0.3170441001191895, "step": 1890 }, { "epoch": 42.22, "learning_rate": 5.915909090909091e-05, "loss": 0.1763, "step": 1900 }, { "epoch": 42.44, "learning_rate": 5.895454545454546e-05, "loss": 0.3628, "step": 1910 }, { "epoch": 42.67, "learning_rate": 5.8727272727272734e-05, "loss": 0.1913, "step": 1920 }, { "epoch": 42.89, "learning_rate": 5.85e-05, "loss": 0.2351, "step": 1930 }, { "epoch": 43.0, "eval_loss": 0.5566673278808594, "eval_runtime": 2.4939, "eval_samples_per_second": 6.817, "eval_steps_per_second": 3.609, "eval_wer": 0.3110846245530393, "step": 1935 }, { "epoch": 43.11, "learning_rate": 5.827272727272728e-05, "loss": 0.1828, "step": 1940 }, { "epoch": 43.33, "learning_rate": 5.804545454545455e-05, "loss": 0.1875, "step": 1950 }, { "epoch": 43.56, "learning_rate": 5.7818181818181815e-05, "loss": 0.1983, "step": 1960 }, { "epoch": 43.78, "learning_rate": 5.7590909090909094e-05, "loss": 0.2419, "step": 1970 }, { "epoch": 44.0, "learning_rate": 5.7363636363636366e-05, "loss": 0.2121, "step": 1980 }, { "epoch": 44.0, "eval_loss": 0.589346170425415, "eval_runtime": 2.5108, "eval_samples_per_second": 6.771, "eval_steps_per_second": 3.585, "eval_wer": 0.3039332538736591, "step": 1980 }, { "epoch": 44.22, "learning_rate": 5.7136363636363645e-05, "loss": 0.2079, "step": 1990 }, { "epoch": 44.44, "learning_rate": 5.690909090909091e-05, "loss": 0.2133, "step": 2000 }, { "epoch": 44.67, "learning_rate": 5.668181818181818e-05, "loss": 0.196, "step": 2010 }, { "epoch": 44.89, "learning_rate": 5.645454545454546e-05, "loss": 0.1913, "step": 2020 }, { "epoch": 45.0, "eval_loss": 0.6030301451683044, "eval_runtime": 2.519, "eval_samples_per_second": 6.749, "eval_steps_per_second": 3.573, "eval_wer": 0.30274135876042907, "step": 2025 }, { "epoch": 45.11, "learning_rate": 5.622727272727273e-05, "loss": 0.1812, "step": 2030 }, { "epoch": 45.33, "learning_rate": 5.6000000000000006e-05, "loss": 0.2113, "step": 2040 }, { "epoch": 45.56, "learning_rate": 5.577272727272728e-05, "loss": 0.1956, "step": 2050 }, { "epoch": 45.78, "learning_rate": 5.5545454545454543e-05, "loss": 0.1811, "step": 2060 }, { "epoch": 46.0, "learning_rate": 5.531818181818182e-05, "loss": 0.1636, "step": 2070 }, { "epoch": 46.0, "eval_loss": 0.5812211036682129, "eval_runtime": 2.5308, "eval_samples_per_second": 6.717, "eval_steps_per_second": 3.556, "eval_wer": 0.300357568533969, "step": 2070 }, { "epoch": 46.22, "learning_rate": 5.5090909090909094e-05, "loss": 0.2279, "step": 2080 }, { "epoch": 46.44, "learning_rate": 5.486363636363636e-05, "loss": 0.1911, "step": 2090 }, { "epoch": 46.67, "learning_rate": 5.463636363636364e-05, "loss": 0.1824, "step": 2100 }, { "epoch": 46.89, "learning_rate": 5.440909090909091e-05, "loss": 0.2062, "step": 2110 }, { "epoch": 47.0, "eval_loss": 0.6080830097198486, "eval_runtime": 2.5078, "eval_samples_per_second": 6.779, "eval_steps_per_second": 3.589, "eval_wer": 0.300357568533969, "step": 2115 }, { "epoch": 47.11, "learning_rate": 5.418181818181819e-05, "loss": 0.1714, "step": 2120 }, { "epoch": 47.33, "learning_rate": 5.3954545454545455e-05, "loss": 0.211, "step": 2130 }, { "epoch": 47.56, "learning_rate": 5.372727272727273e-05, "loss": 0.2038, "step": 2140 }, { "epoch": 47.78, "learning_rate": 5.3500000000000006e-05, "loss": 0.1628, "step": 2150 }, { "epoch": 48.0, "learning_rate": 5.327272727272727e-05, "loss": 0.2031, "step": 2160 }, { "epoch": 48.0, "eval_loss": 0.5609662532806396, "eval_runtime": 2.542, "eval_samples_per_second": 6.688, "eval_steps_per_second": 3.541, "eval_wer": 0.31585220500595945, "step": 2160 }, { "epoch": 48.22, "learning_rate": 5.3045454545454544e-05, "loss": 0.2204, "step": 2170 }, { "epoch": 48.44, "learning_rate": 5.281818181818182e-05, "loss": 0.1909, "step": 2180 }, { "epoch": 48.67, "learning_rate": 5.259090909090909e-05, "loss": 0.1908, "step": 2190 }, { "epoch": 48.89, "learning_rate": 5.2363636363636374e-05, "loss": 0.1892, "step": 2200 }, { "epoch": 49.0, "eval_loss": 0.5863101482391357, "eval_runtime": 2.5418, "eval_samples_per_second": 6.688, "eval_steps_per_second": 3.541, "eval_wer": 0.3146603098927294, "step": 2205 }, { "epoch": 49.11, "learning_rate": 5.213636363636364e-05, "loss": 0.1453, "step": 2210 }, { "epoch": 49.33, "learning_rate": 5.1909090909090904e-05, "loss": 0.1623, "step": 2220 }, { "epoch": 49.56, "learning_rate": 5.168181818181819e-05, "loss": 0.2108, "step": 2230 }, { "epoch": 49.78, "learning_rate": 5.1454545454545455e-05, "loss": 0.2012, "step": 2240 }, { "epoch": 50.0, "learning_rate": 5.1227272727272734e-05, "loss": 0.1712, "step": 2250 }, { "epoch": 50.0, "eval_loss": 0.5942688584327698, "eval_runtime": 2.571, "eval_samples_per_second": 6.612, "eval_steps_per_second": 3.501, "eval_wer": 0.31585220500595945, "step": 2250 }, { "epoch": 50.22, "learning_rate": 5.1000000000000006e-05, "loss": 0.2248, "step": 2260 }, { "epoch": 50.44, "learning_rate": 5.077272727272727e-05, "loss": 0.175, "step": 2270 }, { "epoch": 50.67, "learning_rate": 5.054545454545455e-05, "loss": 0.2178, "step": 2280 }, { "epoch": 50.89, "learning_rate": 5.031818181818182e-05, "loss": 0.1886, "step": 2290 }, { "epoch": 51.0, "eval_loss": 0.5952860116958618, "eval_runtime": 2.4853, "eval_samples_per_second": 6.84, "eval_steps_per_second": 3.621, "eval_wer": 0.30512514898688914, "step": 2295 }, { "epoch": 51.11, "learning_rate": 5.009090909090909e-05, "loss": 0.1527, "step": 2300 }, { "epoch": 51.33, "learning_rate": 4.986363636363637e-05, "loss": 0.2095, "step": 2310 }, { "epoch": 51.56, "learning_rate": 4.963636363636364e-05, "loss": 0.2404, "step": 2320 }, { "epoch": 51.78, "learning_rate": 4.940909090909091e-05, "loss": 0.2528, "step": 2330 }, { "epoch": 52.0, "learning_rate": 4.9181818181818183e-05, "loss": 0.1748, "step": 2340 }, { "epoch": 52.0, "eval_loss": 0.5761290788650513, "eval_runtime": 2.5169, "eval_samples_per_second": 6.754, "eval_steps_per_second": 3.576, "eval_wer": 0.30870083432657924, "step": 2340 }, { "epoch": 52.22, "learning_rate": 4.8954545454545456e-05, "loss": 0.2298, "step": 2350 }, { "epoch": 52.44, "learning_rate": 4.872727272727273e-05, "loss": 0.2307, "step": 2360 }, { "epoch": 52.67, "learning_rate": 4.85e-05, "loss": 0.1971, "step": 2370 }, { "epoch": 52.89, "learning_rate": 4.827272727272727e-05, "loss": 0.1705, "step": 2380 }, { "epoch": 53.0, "eval_loss": 0.6045453548431396, "eval_runtime": 2.5267, "eval_samples_per_second": 6.728, "eval_steps_per_second": 3.562, "eval_wer": 0.2872467222884386, "step": 2385 }, { "epoch": 53.11, "learning_rate": 4.804545454545455e-05, "loss": 0.2131, "step": 2390 }, { "epoch": 53.33, "learning_rate": 4.781818181818182e-05, "loss": 0.2028, "step": 2400 }, { "epoch": 53.56, "learning_rate": 4.759090909090909e-05, "loss": 0.1936, "step": 2410 }, { "epoch": 53.78, "learning_rate": 4.736363636363637e-05, "loss": 0.1824, "step": 2420 }, { "epoch": 54.0, "learning_rate": 4.713636363636364e-05, "loss": 0.1794, "step": 2430 }, { "epoch": 54.0, "eval_loss": 0.5731208324432373, "eval_runtime": 2.5141, "eval_samples_per_second": 6.762, "eval_steps_per_second": 3.58, "eval_wer": 0.3075089392133492, "step": 2430 }, { "epoch": 54.22, "learning_rate": 4.690909090909091e-05, "loss": 0.205, "step": 2440 }, { "epoch": 54.44, "learning_rate": 4.6681818181818184e-05, "loss": 0.1968, "step": 2450 }, { "epoch": 54.67, "learning_rate": 4.6454545454545456e-05, "loss": 0.211, "step": 2460 }, { "epoch": 54.89, "learning_rate": 4.622727272727273e-05, "loss": 0.1815, "step": 2470 }, { "epoch": 55.0, "eval_loss": 0.594903290271759, "eval_runtime": 2.5112, "eval_samples_per_second": 6.77, "eval_steps_per_second": 3.584, "eval_wer": 0.28486293206197855, "step": 2475 }, { "epoch": 55.11, "learning_rate": 4.600000000000001e-05, "loss": 0.1664, "step": 2480 }, { "epoch": 55.33, "learning_rate": 4.577272727272727e-05, "loss": 0.2192, "step": 2490 }, { "epoch": 55.56, "learning_rate": 4.5545454545454544e-05, "loss": 0.2304, "step": 2500 }, { "epoch": 55.78, "learning_rate": 4.531818181818182e-05, "loss": 0.1865, "step": 2510 }, { "epoch": 56.0, "learning_rate": 4.5090909090909095e-05, "loss": 0.1571, "step": 2520 }, { "epoch": 56.0, "eval_loss": 0.5662998557090759, "eval_runtime": 2.5512, "eval_samples_per_second": 6.664, "eval_steps_per_second": 3.528, "eval_wer": 0.28843861740166865, "step": 2520 }, { "epoch": 56.22, "learning_rate": 4.486363636363636e-05, "loss": 0.2302, "step": 2530 }, { "epoch": 56.44, "learning_rate": 4.463636363636364e-05, "loss": 0.1863, "step": 2540 }, { "epoch": 56.67, "learning_rate": 4.440909090909091e-05, "loss": 0.1897, "step": 2550 }, { "epoch": 56.89, "learning_rate": 4.4181818181818184e-05, "loss": 0.1902, "step": 2560 }, { "epoch": 57.0, "eval_loss": 0.5903468132019043, "eval_runtime": 2.5114, "eval_samples_per_second": 6.769, "eval_steps_per_second": 3.584, "eval_wer": 0.29558998808104886, "step": 2565 }, { "epoch": 57.11, "learning_rate": 4.3954545454545456e-05, "loss": 0.4606, "step": 2570 }, { "epoch": 57.33, "learning_rate": 4.372727272727273e-05, "loss": 0.2324, "step": 2580 }, { "epoch": 57.56, "learning_rate": 4.35e-05, "loss": 0.1489, "step": 2590 }, { "epoch": 57.78, "learning_rate": 4.327272727272728e-05, "loss": 0.1761, "step": 2600 }, { "epoch": 58.0, "learning_rate": 4.304545454545455e-05, "loss": 0.2057, "step": 2610 }, { "epoch": 58.0, "eval_loss": 0.5819745659828186, "eval_runtime": 2.5442, "eval_samples_per_second": 6.682, "eval_steps_per_second": 3.537, "eval_wer": 0.2872467222884386, "step": 2610 }, { "epoch": 58.22, "learning_rate": 4.281818181818182e-05, "loss": 0.1581, "step": 2620 }, { "epoch": 58.44, "learning_rate": 4.2590909090909096e-05, "loss": 0.1782, "step": 2630 }, { "epoch": 58.67, "learning_rate": 4.236363636363637e-05, "loss": 0.2072, "step": 2640 }, { "epoch": 58.89, "learning_rate": 4.213636363636364e-05, "loss": 0.1904, "step": 2650 }, { "epoch": 59.0, "eval_loss": 0.592314600944519, "eval_runtime": 2.4863, "eval_samples_per_second": 6.837, "eval_steps_per_second": 3.62, "eval_wer": 0.2896305125148987, "step": 2655 }, { "epoch": 59.11, "learning_rate": 4.190909090909091e-05, "loss": 0.1978, "step": 2660 }, { "epoch": 59.33, "learning_rate": 4.1681818181818184e-05, "loss": 0.1678, "step": 2670 }, { "epoch": 59.56, "learning_rate": 4.1454545454545456e-05, "loss": 0.2256, "step": 2680 }, { "epoch": 59.78, "learning_rate": 4.122727272727273e-05, "loss": 0.1894, "step": 2690 }, { "epoch": 60.0, "learning_rate": 4.1e-05, "loss": 0.1677, "step": 2700 }, { "epoch": 60.0, "eval_loss": 0.5769378542900085, "eval_runtime": 2.4755, "eval_samples_per_second": 6.867, "eval_steps_per_second": 3.636, "eval_wer": 0.3075089392133492, "step": 2700 }, { "epoch": 60.22, "learning_rate": 4.077272727272727e-05, "loss": 0.2007, "step": 2710 }, { "epoch": 60.44, "learning_rate": 4.0545454545454545e-05, "loss": 0.2135, "step": 2720 }, { "epoch": 60.67, "learning_rate": 4.0318181818181824e-05, "loss": 0.1436, "step": 2730 }, { "epoch": 60.89, "learning_rate": 4.009090909090909e-05, "loss": 0.1859, "step": 2740 }, { "epoch": 61.0, "eval_loss": 0.5566421151161194, "eval_runtime": 2.4891, "eval_samples_per_second": 6.83, "eval_steps_per_second": 3.616, "eval_wer": 0.3146603098927294, "step": 2745 }, { "epoch": 61.11, "learning_rate": 3.986363636363636e-05, "loss": 0.1403, "step": 2750 }, { "epoch": 61.33, "learning_rate": 3.963636363636364e-05, "loss": 0.1937, "step": 2760 }, { "epoch": 61.56, "learning_rate": 3.940909090909091e-05, "loss": 0.1964, "step": 2770 }, { "epoch": 61.78, "learning_rate": 3.9181818181818184e-05, "loss": 0.1689, "step": 2780 }, { "epoch": 62.0, "learning_rate": 3.8954545454545456e-05, "loss": 0.2382, "step": 2790 }, { "epoch": 62.0, "eval_loss": 0.5849183201789856, "eval_runtime": 2.4922, "eval_samples_per_second": 6.821, "eval_steps_per_second": 3.611, "eval_wer": 0.30512514898688914, "step": 2790 }, { "epoch": 62.22, "learning_rate": 3.872727272727273e-05, "loss": 0.1529, "step": 2800 }, { "epoch": 62.44, "learning_rate": 3.85e-05, "loss": 0.2238, "step": 2810 }, { "epoch": 62.67, "learning_rate": 3.827272727272728e-05, "loss": 0.2719, "step": 2820 }, { "epoch": 62.89, "learning_rate": 3.8045454545454545e-05, "loss": 0.1753, "step": 2830 }, { "epoch": 63.0, "eval_loss": 0.5773067474365234, "eval_runtime": 2.4779, "eval_samples_per_second": 6.861, "eval_steps_per_second": 3.632, "eval_wer": 0.3075089392133492, "step": 2835 }, { "epoch": 63.11, "learning_rate": 3.781818181818182e-05, "loss": 0.147, "step": 2840 }, { "epoch": 63.33, "learning_rate": 3.7590909090909096e-05, "loss": 0.2222, "step": 2850 }, { "epoch": 63.56, "learning_rate": 3.736363636363637e-05, "loss": 0.2357, "step": 2860 }, { "epoch": 63.78, "learning_rate": 3.7136363636363633e-05, "loss": 0.1523, "step": 2870 }, { "epoch": 64.0, "learning_rate": 3.690909090909091e-05, "loss": 0.1651, "step": 2880 }, { "epoch": 64.0, "eval_loss": 0.5876759886741638, "eval_runtime": 2.5002, "eval_samples_per_second": 6.8, "eval_steps_per_second": 3.6, "eval_wer": 0.3039332538736591, "step": 2880 }, { "epoch": 64.22, "learning_rate": 3.6681818181818185e-05, "loss": 0.1937, "step": 2890 }, { "epoch": 64.44, "learning_rate": 3.645454545454546e-05, "loss": 0.2159, "step": 2900 }, { "epoch": 64.67, "learning_rate": 3.622727272727273e-05, "loss": 0.1541, "step": 2910 }, { "epoch": 64.89, "learning_rate": 3.6e-05, "loss": 0.1781, "step": 2920 }, { "epoch": 65.0, "eval_loss": 0.590542197227478, "eval_runtime": 2.5017, "eval_samples_per_second": 6.795, "eval_steps_per_second": 3.598, "eval_wer": 0.30274135876042907, "step": 2925 }, { "epoch": 65.11, "learning_rate": 3.577272727272727e-05, "loss": 0.1839, "step": 2930 }, { "epoch": 65.33, "learning_rate": 3.5545454545454545e-05, "loss": 0.1791, "step": 2940 }, { "epoch": 65.56, "learning_rate": 3.5318181818181824e-05, "loss": 0.217, "step": 2950 }, { "epoch": 65.78, "learning_rate": 3.509090909090909e-05, "loss": 0.2183, "step": 2960 }, { "epoch": 66.0, "learning_rate": 3.486363636363637e-05, "loss": 0.1582, "step": 2970 }, { "epoch": 66.0, "eval_loss": 0.5799685716629028, "eval_runtime": 2.4987, "eval_samples_per_second": 6.804, "eval_steps_per_second": 3.602, "eval_wer": 0.30154946364719903, "step": 2970 }, { "epoch": 66.22, "learning_rate": 3.463636363636364e-05, "loss": 0.1884, "step": 2980 }, { "epoch": 66.44, "learning_rate": 3.440909090909091e-05, "loss": 0.1901, "step": 2990 }, { "epoch": 66.67, "learning_rate": 3.4181818181818185e-05, "loss": 0.203, "step": 3000 }, { "epoch": 66.89, "learning_rate": 3.395454545454546e-05, "loss": 0.1538, "step": 3010 }, { "epoch": 67.0, "eval_loss": 0.6025242805480957, "eval_runtime": 2.4909, "eval_samples_per_second": 6.825, "eval_steps_per_second": 3.613, "eval_wer": 0.3075089392133492, "step": 3015 }, { "epoch": 67.11, "learning_rate": 3.372727272727273e-05, "loss": 0.2008, "step": 3020 }, { "epoch": 67.33, "learning_rate": 3.35e-05, "loss": 0.1811, "step": 3030 }, { "epoch": 67.56, "learning_rate": 3.327272727272727e-05, "loss": 0.1651, "step": 3040 }, { "epoch": 67.78, "learning_rate": 3.3045454545454545e-05, "loss": 0.2099, "step": 3050 }, { "epoch": 68.0, "learning_rate": 3.281818181818182e-05, "loss": 0.1606, "step": 3060 }, { "epoch": 68.0, "eval_loss": 0.5758008360862732, "eval_runtime": 2.5288, "eval_samples_per_second": 6.722, "eval_steps_per_second": 3.559, "eval_wer": 0.3039332538736591, "step": 3060 }, { "epoch": 68.22, "learning_rate": 3.2590909090909096e-05, "loss": 0.1881, "step": 3070 }, { "epoch": 68.44, "learning_rate": 3.236363636363636e-05, "loss": 0.2047, "step": 3080 }, { "epoch": 68.67, "learning_rate": 3.2136363636363634e-05, "loss": 0.2077, "step": 3090 }, { "epoch": 68.89, "learning_rate": 3.190909090909091e-05, "loss": 0.1522, "step": 3100 }, { "epoch": 69.0, "eval_loss": 0.5860080718994141, "eval_runtime": 2.5048, "eval_samples_per_second": 6.787, "eval_steps_per_second": 3.593, "eval_wer": 0.2932061978545888, "step": 3105 }, { "epoch": 69.11, "learning_rate": 3.1681818181818185e-05, "loss": 0.1474, "step": 3110 }, { "epoch": 69.33, "learning_rate": 3.145454545454546e-05, "loss": 0.1984, "step": 3120 }, { "epoch": 69.56, "learning_rate": 3.122727272727273e-05, "loss": 0.1927, "step": 3130 }, { "epoch": 69.78, "learning_rate": 3.1e-05, "loss": 0.2024, "step": 3140 }, { "epoch": 70.0, "learning_rate": 3.0772727272727273e-05, "loss": 0.1521, "step": 3150 }, { "epoch": 70.0, "eval_loss": 0.5895945429801941, "eval_runtime": 2.5235, "eval_samples_per_second": 6.737, "eval_steps_per_second": 3.567, "eval_wer": 0.29558998808104886, "step": 3150 }, { "epoch": 70.22, "learning_rate": 3.054545454545455e-05, "loss": 0.1619, "step": 3160 }, { "epoch": 70.44, "learning_rate": 3.0318181818181818e-05, "loss": 0.2155, "step": 3170 }, { "epoch": 70.67, "learning_rate": 3.0090909090909093e-05, "loss": 0.1886, "step": 3180 }, { "epoch": 70.89, "learning_rate": 2.9863636363636365e-05, "loss": 0.1592, "step": 3190 }, { "epoch": 71.0, "eval_loss": 0.5737584233283997, "eval_runtime": 2.5061, "eval_samples_per_second": 6.783, "eval_steps_per_second": 3.591, "eval_wer": 0.30274135876042907, "step": 3195 }, { "epoch": 71.11, "learning_rate": 2.963636363636364e-05, "loss": 0.2001, "step": 3200 }, { "epoch": 71.33, "learning_rate": 2.940909090909091e-05, "loss": 0.1797, "step": 3210 }, { "epoch": 71.56, "learning_rate": 2.9181818181818182e-05, "loss": 0.1987, "step": 3220 }, { "epoch": 71.78, "learning_rate": 2.8954545454545457e-05, "loss": 0.1859, "step": 3230 }, { "epoch": 72.0, "learning_rate": 2.872727272727273e-05, "loss": 0.2245, "step": 3240 }, { "epoch": 72.0, "eval_loss": 0.5781883597373962, "eval_runtime": 2.4952, "eval_samples_per_second": 6.813, "eval_steps_per_second": 3.607, "eval_wer": 0.3039332538736591, "step": 3240 }, { "epoch": 72.22, "learning_rate": 2.8499999999999998e-05, "loss": 0.1712, "step": 3250 }, { "epoch": 72.44, "learning_rate": 2.8272727272727274e-05, "loss": 0.1747, "step": 3260 }, { "epoch": 72.67, "learning_rate": 2.8045454545454546e-05, "loss": 0.1657, "step": 3270 }, { "epoch": 72.89, "learning_rate": 2.781818181818182e-05, "loss": 0.2185, "step": 3280 }, { "epoch": 73.0, "eval_loss": 0.5722064971923828, "eval_runtime": 2.5463, "eval_samples_per_second": 6.676, "eval_steps_per_second": 3.535, "eval_wer": 0.30274135876042907, "step": 3285 }, { "epoch": 73.11, "learning_rate": 2.759090909090909e-05, "loss": 0.1896, "step": 3290 }, { "epoch": 73.33, "learning_rate": 2.7363636363636362e-05, "loss": 0.2156, "step": 3300 }, { "epoch": 73.56, "learning_rate": 2.7136363636363638e-05, "loss": 0.156, "step": 3310 }, { "epoch": 73.78, "learning_rate": 2.6909090909090913e-05, "loss": 0.1841, "step": 3320 }, { "epoch": 74.0, "learning_rate": 2.6681818181818185e-05, "loss": 0.1597, "step": 3330 }, { "epoch": 74.0, "eval_loss": 0.589074432849884, "eval_runtime": 2.4952, "eval_samples_per_second": 6.813, "eval_steps_per_second": 3.607, "eval_wer": 0.300357568533969, "step": 3330 }, { "epoch": 74.22, "learning_rate": 2.6454545454545454e-05, "loss": 0.2157, "step": 3340 }, { "epoch": 74.44, "learning_rate": 2.622727272727273e-05, "loss": 0.1685, "step": 3350 }, { "epoch": 74.67, "learning_rate": 2.6000000000000002e-05, "loss": 0.207, "step": 3360 }, { "epoch": 74.89, "learning_rate": 2.5772727272727277e-05, "loss": 0.1713, "step": 3370 }, { "epoch": 75.0, "eval_loss": 0.5649510622024536, "eval_runtime": 2.4909, "eval_samples_per_second": 6.825, "eval_steps_per_second": 3.613, "eval_wer": 0.30274135876042907, "step": 3375 }, { "epoch": 75.11, "learning_rate": 2.5545454545454546e-05, "loss": 0.1287, "step": 3380 }, { "epoch": 75.33, "learning_rate": 2.5318181818181818e-05, "loss": 0.1519, "step": 3390 }, { "epoch": 75.56, "learning_rate": 2.5090909090909094e-05, "loss": 0.2106, "step": 3400 }, { "epoch": 75.78, "learning_rate": 2.4863636363636362e-05, "loss": 0.1806, "step": 3410 }, { "epoch": 76.0, "learning_rate": 2.4636363636363638e-05, "loss": 0.1464, "step": 3420 }, { "epoch": 76.0, "eval_loss": 0.5860361456871033, "eval_runtime": 2.556, "eval_samples_per_second": 6.651, "eval_steps_per_second": 3.521, "eval_wer": 0.3063170441001192, "step": 3420 }, { "epoch": 76.22, "learning_rate": 2.440909090909091e-05, "loss": 0.1975, "step": 3430 }, { "epoch": 76.44, "learning_rate": 2.4181818181818182e-05, "loss": 0.1766, "step": 3440 }, { "epoch": 76.67, "learning_rate": 2.3954545454545454e-05, "loss": 0.188, "step": 3450 }, { "epoch": 76.89, "learning_rate": 2.372727272727273e-05, "loss": 0.1551, "step": 3460 }, { "epoch": 77.0, "eval_loss": 0.5754880905151367, "eval_runtime": 2.491, "eval_samples_per_second": 6.825, "eval_steps_per_second": 3.613, "eval_wer": 0.30274135876042907, "step": 3465 }, { "epoch": 77.11, "learning_rate": 2.35e-05, "loss": 0.159, "step": 3470 }, { "epoch": 77.33, "learning_rate": 2.3272727272727274e-05, "loss": 0.2088, "step": 3480 }, { "epoch": 77.56, "learning_rate": 2.3045454545454546e-05, "loss": 0.1625, "step": 3490 }, { "epoch": 77.78, "learning_rate": 2.281818181818182e-05, "loss": 0.1743, "step": 3500 }, { "epoch": 78.0, "learning_rate": 2.2590909090909094e-05, "loss": 0.1509, "step": 3510 }, { "epoch": 78.0, "eval_loss": 0.5894579291343689, "eval_runtime": 2.4629, "eval_samples_per_second": 6.902, "eval_steps_per_second": 3.654, "eval_wer": 0.2943980929678188, "step": 3510 }, { "epoch": 78.22, "learning_rate": 2.2363636363636366e-05, "loss": 0.1762, "step": 3520 }, { "epoch": 78.44, "learning_rate": 2.2136363636363638e-05, "loss": 0.154, "step": 3530 }, { "epoch": 78.67, "learning_rate": 2.190909090909091e-05, "loss": 0.2085, "step": 3540 }, { "epoch": 78.89, "learning_rate": 2.1681818181818182e-05, "loss": 0.176, "step": 3550 }, { "epoch": 79.0, "eval_loss": 0.5749766826629639, "eval_runtime": 2.4871, "eval_samples_per_second": 6.835, "eval_steps_per_second": 3.619, "eval_wer": 0.29916567342073896, "step": 3555 }, { "epoch": 79.11, "learning_rate": 2.1454545454545455e-05, "loss": 0.1875, "step": 3560 }, { "epoch": 79.33, "learning_rate": 2.122727272727273e-05, "loss": 0.2078, "step": 3570 }, { "epoch": 79.56, "learning_rate": 2.1e-05, "loss": 0.1798, "step": 3580 }, { "epoch": 79.78, "learning_rate": 2.0772727272727274e-05, "loss": 0.1925, "step": 3590 }, { "epoch": 80.0, "learning_rate": 2.0545454545454546e-05, "loss": 0.1695, "step": 3600 }, { "epoch": 80.0, "eval_loss": 0.5759270191192627, "eval_runtime": 2.5291, "eval_samples_per_second": 6.722, "eval_steps_per_second": 3.559, "eval_wer": 0.300357568533969, "step": 3600 }, { "epoch": 80.22, "learning_rate": 2.031818181818182e-05, "loss": 0.1909, "step": 3610 }, { "epoch": 80.44, "learning_rate": 2.009090909090909e-05, "loss": 0.1797, "step": 3620 }, { "epoch": 80.67, "learning_rate": 1.9863636363636366e-05, "loss": 0.1598, "step": 3630 }, { "epoch": 80.89, "learning_rate": 1.9636363636363635e-05, "loss": 0.1797, "step": 3640 }, { "epoch": 81.0, "eval_loss": 0.5903642773628235, "eval_runtime": 2.5184, "eval_samples_per_second": 6.75, "eval_steps_per_second": 3.574, "eval_wer": 0.29916567342073896, "step": 3645 }, { "epoch": 81.11, "learning_rate": 1.940909090909091e-05, "loss": 0.1543, "step": 3650 }, { "epoch": 81.33, "learning_rate": 1.9181818181818183e-05, "loss": 0.1898, "step": 3660 }, { "epoch": 81.56, "learning_rate": 1.8954545454545455e-05, "loss": 0.2273, "step": 3670 }, { "epoch": 81.78, "learning_rate": 1.872727272727273e-05, "loss": 0.1537, "step": 3680 }, { "epoch": 82.0, "learning_rate": 1.85e-05, "loss": 0.1371, "step": 3690 }, { "epoch": 82.0, "eval_loss": 0.5922932624816895, "eval_runtime": 2.5106, "eval_samples_per_second": 6.771, "eval_steps_per_second": 3.585, "eval_wer": 0.30154946364719903, "step": 3690 }, { "epoch": 82.22, "learning_rate": 1.8272727272727275e-05, "loss": 0.1527, "step": 3700 }, { "epoch": 82.44, "learning_rate": 1.8045454545454547e-05, "loss": 0.1998, "step": 3710 }, { "epoch": 82.67, "learning_rate": 1.781818181818182e-05, "loss": 0.1513, "step": 3720 }, { "epoch": 82.89, "learning_rate": 1.759090909090909e-05, "loss": 0.1798, "step": 3730 }, { "epoch": 83.0, "eval_loss": 0.5864221453666687, "eval_runtime": 2.484, "eval_samples_per_second": 6.844, "eval_steps_per_second": 3.623, "eval_wer": 0.29916567342073896, "step": 3735 }, { "epoch": 83.11, "learning_rate": 1.7363636363636366e-05, "loss": 0.2202, "step": 3740 }, { "epoch": 83.33, "learning_rate": 1.7136363636363635e-05, "loss": 0.2187, "step": 3750 }, { "epoch": 83.56, "learning_rate": 1.690909090909091e-05, "loss": 0.1656, "step": 3760 }, { "epoch": 83.78, "learning_rate": 1.6681818181818183e-05, "loss": 0.1856, "step": 3770 }, { "epoch": 84.0, "learning_rate": 1.6454545454545455e-05, "loss": 0.1386, "step": 3780 }, { "epoch": 84.0, "eval_loss": 0.5732817649841309, "eval_runtime": 2.581, "eval_samples_per_second": 6.587, "eval_steps_per_second": 3.487, "eval_wer": 0.300357568533969, "step": 3780 }, { "epoch": 84.22, "learning_rate": 1.6227272727272727e-05, "loss": 0.1708, "step": 3790 }, { "epoch": 84.44, "learning_rate": 1.6000000000000003e-05, "loss": 0.1599, "step": 3800 }, { "epoch": 84.67, "learning_rate": 1.577272727272727e-05, "loss": 0.148, "step": 3810 }, { "epoch": 84.89, "learning_rate": 1.5545454545454547e-05, "loss": 0.2173, "step": 3820 }, { "epoch": 85.0, "eval_loss": 0.5751131176948547, "eval_runtime": 2.4769, "eval_samples_per_second": 6.864, "eval_steps_per_second": 3.634, "eval_wer": 0.300357568533969, "step": 3825 }, { "epoch": 85.11, "learning_rate": 1.531818181818182e-05, "loss": 0.1754, "step": 3830 }, { "epoch": 85.33, "learning_rate": 1.5090909090909091e-05, "loss": 0.1799, "step": 3840 }, { "epoch": 85.56, "learning_rate": 1.4863636363636365e-05, "loss": 0.1646, "step": 3850 }, { "epoch": 85.78, "learning_rate": 1.4636363636363637e-05, "loss": 0.1937, "step": 3860 }, { "epoch": 86.0, "learning_rate": 1.4409090909090911e-05, "loss": 0.151, "step": 3870 }, { "epoch": 86.0, "eval_loss": 0.5710622072219849, "eval_runtime": 2.5027, "eval_samples_per_second": 6.793, "eval_steps_per_second": 3.596, "eval_wer": 0.2967818831942789, "step": 3870 }, { "epoch": 86.22, "learning_rate": 1.4181818181818181e-05, "loss": 0.184, "step": 3880 }, { "epoch": 86.44, "learning_rate": 1.3954545454545457e-05, "loss": 0.171, "step": 3890 }, { "epoch": 86.67, "learning_rate": 1.3727272727272727e-05, "loss": 0.1646, "step": 3900 }, { "epoch": 86.89, "learning_rate": 1.3500000000000001e-05, "loss": 0.1579, "step": 3910 }, { "epoch": 87.0, "eval_loss": 0.575020968914032, "eval_runtime": 3.0073, "eval_samples_per_second": 5.653, "eval_steps_per_second": 2.993, "eval_wer": 0.29916567342073896, "step": 3915 }, { "epoch": 87.11, "learning_rate": 1.3272727272727273e-05, "loss": 0.1723, "step": 3920 }, { "epoch": 87.33, "learning_rate": 1.3045454545454547e-05, "loss": 0.1412, "step": 3930 }, { "epoch": 87.56, "learning_rate": 1.2818181818181818e-05, "loss": 0.2681, "step": 3940 }, { "epoch": 87.78, "learning_rate": 1.2590909090909091e-05, "loss": 0.1883, "step": 3950 }, { "epoch": 88.0, "learning_rate": 1.2363636363636365e-05, "loss": 0.1328, "step": 3960 }, { "epoch": 88.0, "eval_loss": 0.5764250755310059, "eval_runtime": 2.5237, "eval_samples_per_second": 6.736, "eval_steps_per_second": 3.566, "eval_wer": 0.2943980929678188, "step": 3960 }, { "epoch": 88.22, "learning_rate": 1.2136363636363637e-05, "loss": 0.1863, "step": 3970 }, { "epoch": 88.44, "learning_rate": 1.190909090909091e-05, "loss": 0.1689, "step": 3980 }, { "epoch": 88.67, "learning_rate": 1.1681818181818183e-05, "loss": 0.1521, "step": 3990 }, { "epoch": 88.89, "learning_rate": 1.1454545454545455e-05, "loss": 0.1657, "step": 4000 }, { "epoch": 89.0, "eval_loss": 0.5768557190895081, "eval_runtime": 2.5214, "eval_samples_per_second": 6.742, "eval_steps_per_second": 3.569, "eval_wer": 0.300357568533969, "step": 4005 }, { "epoch": 89.11, "learning_rate": 1.1227272727272728e-05, "loss": 0.2066, "step": 4010 }, { "epoch": 89.33, "learning_rate": 1.1000000000000001e-05, "loss": 0.1696, "step": 4020 }, { "epoch": 89.56, "learning_rate": 1.0772727272727274e-05, "loss": 0.1816, "step": 4030 }, { "epoch": 89.78, "learning_rate": 1.0545454545454546e-05, "loss": 0.1775, "step": 4040 }, { "epoch": 90.0, "learning_rate": 1.0318181818181818e-05, "loss": 0.1353, "step": 4050 }, { "epoch": 90.0, "eval_loss": 0.5714535713195801, "eval_runtime": 2.5276, "eval_samples_per_second": 6.726, "eval_steps_per_second": 3.561, "eval_wer": 0.29558998808104886, "step": 4050 }, { "epoch": 90.22, "learning_rate": 1.0090909090909092e-05, "loss": 0.2057, "step": 4060 }, { "epoch": 90.44, "learning_rate": 9.863636363636364e-06, "loss": 0.1699, "step": 4070 }, { "epoch": 90.67, "learning_rate": 9.636363636363636e-06, "loss": 0.1512, "step": 4080 }, { "epoch": 90.89, "learning_rate": 9.40909090909091e-06, "loss": 0.1982, "step": 4090 }, { "epoch": 91.0, "eval_loss": 0.5753502249717712, "eval_runtime": 2.5311, "eval_samples_per_second": 6.716, "eval_steps_per_second": 3.556, "eval_wer": 0.2967818831942789, "step": 4095 }, { "epoch": 91.11, "learning_rate": 9.181818181818182e-06, "loss": 0.1304, "step": 4100 }, { "epoch": 91.33, "learning_rate": 8.954545454545454e-06, "loss": 0.2255, "step": 4110 }, { "epoch": 91.56, "learning_rate": 8.727272727272728e-06, "loss": 0.1546, "step": 4120 }, { "epoch": 91.78, "learning_rate": 8.500000000000002e-06, "loss": 0.1734, "step": 4130 }, { "epoch": 92.0, "learning_rate": 8.272727272727274e-06, "loss": 0.1687, "step": 4140 }, { "epoch": 92.0, "eval_loss": 0.5725367665290833, "eval_runtime": 2.5116, "eval_samples_per_second": 6.769, "eval_steps_per_second": 3.583, "eval_wer": 0.29797377830750893, "step": 4140 }, { "epoch": 92.22, "learning_rate": 8.045454545454546e-06, "loss": 0.1566, "step": 4150 }, { "epoch": 92.44, "learning_rate": 7.81818181818182e-06, "loss": 0.1922, "step": 4160 }, { "epoch": 92.67, "learning_rate": 7.590909090909092e-06, "loss": 0.1669, "step": 4170 }, { "epoch": 92.89, "learning_rate": 7.363636363636364e-06, "loss": 0.1842, "step": 4180 }, { "epoch": 93.0, "eval_loss": 0.5749579668045044, "eval_runtime": 2.5011, "eval_samples_per_second": 6.797, "eval_steps_per_second": 3.598, "eval_wer": 0.29797377830750893, "step": 4185 }, { "epoch": 93.11, "learning_rate": 7.136363636363637e-06, "loss": 0.1336, "step": 4190 }, { "epoch": 93.33, "learning_rate": 6.909090909090909e-06, "loss": 0.1472, "step": 4200 }, { "epoch": 93.56, "learning_rate": 6.681818181818182e-06, "loss": 0.1875, "step": 4210 }, { "epoch": 93.78, "learning_rate": 6.454545454545455e-06, "loss": 0.169, "step": 4220 }, { "epoch": 94.0, "learning_rate": 6.227272727272727e-06, "loss": 0.1893, "step": 4230 }, { "epoch": 94.0, "eval_loss": 0.5788666009902954, "eval_runtime": 2.5149, "eval_samples_per_second": 6.76, "eval_steps_per_second": 3.579, "eval_wer": 0.2943980929678188, "step": 4230 }, { "epoch": 94.22, "learning_rate": 6e-06, "loss": 0.1958, "step": 4240 }, { "epoch": 94.44, "learning_rate": 5.772727272727272e-06, "loss": 0.175, "step": 4250 }, { "epoch": 94.67, "learning_rate": 5.545454545454546e-06, "loss": 0.1701, "step": 4260 }, { "epoch": 94.89, "learning_rate": 5.318181818181819e-06, "loss": 0.1744, "step": 4270 }, { "epoch": 95.0, "eval_loss": 0.5750417709350586, "eval_runtime": 2.5742, "eval_samples_per_second": 6.604, "eval_steps_per_second": 3.496, "eval_wer": 0.300357568533969, "step": 4275 }, { "epoch": 95.11, "learning_rate": 5.090909090909091e-06, "loss": 0.1389, "step": 4280 }, { "epoch": 95.33, "learning_rate": 4.863636363636364e-06, "loss": 0.1628, "step": 4290 }, { "epoch": 95.56, "learning_rate": 4.636363636363636e-06, "loss": 0.18, "step": 4300 }, { "epoch": 95.78, "learning_rate": 4.409090909090909e-06, "loss": 0.1921, "step": 4310 }, { "epoch": 96.0, "learning_rate": 4.181818181818182e-06, "loss": 0.1745, "step": 4320 }, { "epoch": 96.0, "eval_loss": 0.5794357657432556, "eval_runtime": 2.5187, "eval_samples_per_second": 6.75, "eval_steps_per_second": 3.573, "eval_wer": 0.29797377830750893, "step": 4320 }, { "epoch": 96.22, "learning_rate": 3.954545454545454e-06, "loss": 0.174, "step": 4330 }, { "epoch": 96.44, "learning_rate": 3.727272727272727e-06, "loss": 0.1382, "step": 4340 }, { "epoch": 96.67, "learning_rate": 3.5000000000000004e-06, "loss": 0.252, "step": 4350 }, { "epoch": 96.89, "learning_rate": 3.2727272727272733e-06, "loss": 0.1665, "step": 4360 }, { "epoch": 97.0, "eval_loss": 0.5754532814025879, "eval_runtime": 2.5009, "eval_samples_per_second": 6.798, "eval_steps_per_second": 3.599, "eval_wer": 0.300357568533969, "step": 4365 }, { "epoch": 97.11, "learning_rate": 3.0454545454545455e-06, "loss": 0.2097, "step": 4370 }, { "epoch": 97.33, "learning_rate": 2.8181818181818185e-06, "loss": 0.1816, "step": 4380 }, { "epoch": 97.56, "learning_rate": 2.590909090909091e-06, "loss": 0.1747, "step": 4390 }, { "epoch": 97.78, "learning_rate": 2.3636363636363636e-06, "loss": 0.1905, "step": 4400 }, { "epoch": 98.0, "learning_rate": 2.1363636363636365e-06, "loss": 0.1569, "step": 4410 }, { "epoch": 98.0, "eval_loss": 0.5763238072395325, "eval_runtime": 2.4952, "eval_samples_per_second": 6.813, "eval_steps_per_second": 3.607, "eval_wer": 0.2967818831942789, "step": 4410 }, { "epoch": 98.22, "learning_rate": 1.9090909090909095e-06, "loss": 0.1681, "step": 4420 }, { "epoch": 98.44, "learning_rate": 1.681818181818182e-06, "loss": 0.2023, "step": 4430 }, { "epoch": 98.67, "learning_rate": 1.4545454545454546e-06, "loss": 0.17, "step": 4440 }, { "epoch": 98.89, "learning_rate": 1.2272727272727272e-06, "loss": 0.1449, "step": 4450 }, { "epoch": 99.0, "eval_loss": 0.577908992767334, "eval_runtime": 2.5073, "eval_samples_per_second": 6.78, "eval_steps_per_second": 3.59, "eval_wer": 0.2967818831942789, "step": 4455 }, { "epoch": 99.11, "learning_rate": 1.0000000000000002e-06, "loss": 0.1801, "step": 4460 }, { "epoch": 99.33, "learning_rate": 7.727272727272728e-07, "loss": 0.2012, "step": 4470 }, { "epoch": 99.56, "learning_rate": 5.454545454545455e-07, "loss": 0.1804, "step": 4480 }, { "epoch": 99.78, "learning_rate": 3.181818181818182e-07, "loss": 0.188, "step": 4490 }, { "epoch": 100.0, "learning_rate": 9.090909090909091e-08, "loss": 0.1469, "step": 4500 }, { "epoch": 100.0, "eval_loss": 0.5774157643318176, "eval_runtime": 2.6458, "eval_samples_per_second": 6.425, "eval_steps_per_second": 3.402, "eval_wer": 0.2967818831942789, "step": 4500 }, { "epoch": 100.0, "step": 4500, "total_flos": 1.6941108528500076e+18, "train_loss": 0.2065306097931332, "train_runtime": 4259.6925, "train_samples_per_second": 4.202, "train_steps_per_second": 1.056 } ], "max_steps": 4500, "num_train_epochs": 100, "total_flos": 1.6941108528500076e+18, "trial_name": null, "trial_params": null }