{ "best_metric": 0.526544988155365, "best_model_checkpoint": "ai-light-dance_singing2_ft_wav2vec2-large-xlsr-53-5gram-v3/checkpoint-1120", "epoch": 9.998662505572893, "global_step": 2800, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.04, "learning_rate": 4.000000000000001e-06, "loss": 0.2599, "step": 10 }, { "epoch": 0.07, "learning_rate": 8.000000000000001e-06, "loss": 0.2274, "step": 20 }, { "epoch": 0.11, "learning_rate": 1.2e-05, "loss": 0.2026, "step": 30 }, { "epoch": 0.14, "learning_rate": 1.6000000000000003e-05, "loss": 0.2054, "step": 40 }, { "epoch": 0.18, "learning_rate": 2e-05, "loss": 0.2443, "step": 50 }, { "epoch": 0.21, "learning_rate": 2.4e-05, "loss": 0.22, "step": 60 }, { "epoch": 0.25, "learning_rate": 2.8e-05, "loss": 0.2178, "step": 70 }, { "epoch": 0.29, "learning_rate": 3.2000000000000005e-05, "loss": 0.2146, "step": 80 }, { "epoch": 0.32, "learning_rate": 3.6e-05, "loss": 0.221, "step": 90 }, { "epoch": 0.36, "learning_rate": 4e-05, "loss": 0.2718, "step": 100 }, { "epoch": 0.39, "learning_rate": 3.9851851851851856e-05, "loss": 0.2191, "step": 110 }, { "epoch": 0.43, "learning_rate": 3.970370370370371e-05, "loss": 0.2302, "step": 120 }, { "epoch": 0.46, "learning_rate": 3.955555555555556e-05, "loss": 0.243, "step": 130 }, { "epoch": 0.5, "learning_rate": 3.940740740740741e-05, "loss": 0.2235, "step": 140 }, { "epoch": 0.53, "learning_rate": 3.925925925925926e-05, "loss": 0.2856, "step": 150 }, { "epoch": 0.57, "learning_rate": 3.9111111111111115e-05, "loss": 0.2394, "step": 160 }, { "epoch": 0.61, "learning_rate": 3.896296296296297e-05, "loss": 0.2562, "step": 170 }, { "epoch": 0.64, "learning_rate": 3.8814814814814814e-05, "loss": 0.2313, "step": 180 }, { "epoch": 0.68, "learning_rate": 3.866666666666667e-05, "loss": 0.2232, "step": 190 }, { "epoch": 0.71, "learning_rate": 3.851851851851852e-05, "loss": 0.2711, "step": 200 }, { "epoch": 0.75, "learning_rate": 3.837037037037037e-05, "loss": 0.2356, "step": 210 }, { "epoch": 0.78, "learning_rate": 3.8222222222222226e-05, "loss": 0.2213, "step": 220 }, { "epoch": 0.82, "learning_rate": 3.807407407407408e-05, "loss": 0.2404, "step": 230 }, { "epoch": 0.86, "learning_rate": 3.792592592592593e-05, "loss": 0.2217, "step": 240 }, { "epoch": 0.89, "learning_rate": 3.777777777777778e-05, "loss": 0.2765, "step": 250 }, { "epoch": 0.93, "learning_rate": 3.762962962962963e-05, "loss": 0.221, "step": 260 }, { "epoch": 0.96, "learning_rate": 3.7481481481481484e-05, "loss": 0.2319, "step": 270 }, { "epoch": 1.0, "learning_rate": 3.733333333333334e-05, "loss": 0.2546, "step": 280 }, { "epoch": 1.0, "eval_loss": 0.6003746390342712, "eval_runtime": 230.0992, "eval_samples_per_second": 8.666, "eval_steps_per_second": 1.086, "eval_wer": 0.2795819789166692, "step": 280 }, { "epoch": 1.04, "learning_rate": 3.7185185185185184e-05, "loss": 0.235, "step": 290 }, { "epoch": 1.07, "learning_rate": 3.703703703703704e-05, "loss": 0.21, "step": 300 }, { "epoch": 1.11, "learning_rate": 3.6888888888888896e-05, "loss": 0.2169, "step": 310 }, { "epoch": 1.14, "learning_rate": 3.674074074074074e-05, "loss": 0.2021, "step": 320 }, { "epoch": 1.18, "learning_rate": 3.6592592592592596e-05, "loss": 0.2619, "step": 330 }, { "epoch": 1.21, "learning_rate": 3.644444444444445e-05, "loss": 0.2066, "step": 340 }, { "epoch": 1.25, "learning_rate": 3.62962962962963e-05, "loss": 0.2388, "step": 350 }, { "epoch": 1.29, "learning_rate": 3.614814814814815e-05, "loss": 0.214, "step": 360 }, { "epoch": 1.32, "learning_rate": 3.6e-05, "loss": 0.21, "step": 370 }, { "epoch": 1.36, "learning_rate": 3.5851851851851854e-05, "loss": 0.2413, "step": 380 }, { "epoch": 1.39, "learning_rate": 3.570370370370371e-05, "loss": 0.2171, "step": 390 }, { "epoch": 1.43, "learning_rate": 3.555555555555555e-05, "loss": 0.2071, "step": 400 }, { "epoch": 1.46, "learning_rate": 3.540740740740741e-05, "loss": 0.2209, "step": 410 }, { "epoch": 1.5, "learning_rate": 3.5259259259259266e-05, "loss": 0.2413, "step": 420 }, { "epoch": 1.53, "learning_rate": 3.511111111111111e-05, "loss": 0.2645, "step": 430 }, { "epoch": 1.57, "learning_rate": 3.4962962962962965e-05, "loss": 0.2205, "step": 440 }, { "epoch": 1.61, "learning_rate": 3.481481481481482e-05, "loss": 0.2232, "step": 450 }, { "epoch": 1.64, "learning_rate": 3.466666666666667e-05, "loss": 0.2049, "step": 460 }, { "epoch": 1.68, "learning_rate": 3.451851851851852e-05, "loss": 0.2131, "step": 470 }, { "epoch": 1.71, "learning_rate": 3.437037037037037e-05, "loss": 0.2783, "step": 480 }, { "epoch": 1.75, "learning_rate": 3.4222222222222224e-05, "loss": 0.2198, "step": 490 }, { "epoch": 1.78, "learning_rate": 3.4074074074074077e-05, "loss": 0.2095, "step": 500 }, { "epoch": 1.82, "learning_rate": 3.392592592592593e-05, "loss": 0.2142, "step": 510 }, { "epoch": 1.86, "learning_rate": 3.377777777777778e-05, "loss": 0.2028, "step": 520 }, { "epoch": 1.89, "learning_rate": 3.364444444444445e-05, "loss": 0.2421, "step": 530 }, { "epoch": 1.93, "learning_rate": 3.3496296296296295e-05, "loss": 0.2107, "step": 540 }, { "epoch": 1.96, "learning_rate": 3.3348148148148154e-05, "loss": 0.2087, "step": 550 }, { "epoch": 2.0, "learning_rate": 3.32e-05, "loss": 0.2325, "step": 560 }, { "epoch": 2.0, "eval_loss": 0.6336627006530762, "eval_runtime": 225.109, "eval_samples_per_second": 8.858, "eval_steps_per_second": 1.111, "eval_wer": 0.27289850229364765, "step": 560 }, { "epoch": 2.04, "learning_rate": 3.3051851851851854e-05, "loss": 0.2134, "step": 570 }, { "epoch": 2.07, "learning_rate": 3.290370370370371e-05, "loss": 0.2193, "step": 580 }, { "epoch": 2.11, "learning_rate": 3.275555555555556e-05, "loss": 0.1988, "step": 590 }, { "epoch": 2.14, "learning_rate": 3.260740740740741e-05, "loss": 0.1828, "step": 600 }, { "epoch": 2.18, "learning_rate": 3.245925925925926e-05, "loss": 0.2289, "step": 610 }, { "epoch": 2.21, "learning_rate": 3.231111111111111e-05, "loss": 0.1859, "step": 620 }, { "epoch": 2.25, "learning_rate": 3.2162962962962965e-05, "loss": 0.197, "step": 630 }, { "epoch": 2.29, "learning_rate": 3.201481481481482e-05, "loss": 0.1863, "step": 640 }, { "epoch": 2.32, "learning_rate": 3.186666666666667e-05, "loss": 0.1871, "step": 650 }, { "epoch": 2.36, "learning_rate": 3.1718518518518524e-05, "loss": 0.2339, "step": 660 }, { "epoch": 2.39, "learning_rate": 3.157037037037037e-05, "loss": 0.1992, "step": 670 }, { "epoch": 2.43, "learning_rate": 3.142222222222222e-05, "loss": 0.186, "step": 680 }, { "epoch": 2.46, "learning_rate": 3.1274074074074076e-05, "loss": 0.2001, "step": 690 }, { "epoch": 2.5, "learning_rate": 3.112592592592593e-05, "loss": 0.2037, "step": 700 }, { "epoch": 2.53, "learning_rate": 3.097777777777778e-05, "loss": 0.2373, "step": 710 }, { "epoch": 2.57, "learning_rate": 3.082962962962963e-05, "loss": 0.1834, "step": 720 }, { "epoch": 2.61, "learning_rate": 3.068148148148149e-05, "loss": 0.1828, "step": 730 }, { "epoch": 2.64, "learning_rate": 3.0533333333333335e-05, "loss": 0.1863, "step": 740 }, { "epoch": 2.68, "learning_rate": 3.0385185185185188e-05, "loss": 0.1874, "step": 750 }, { "epoch": 2.71, "learning_rate": 3.0237037037037037e-05, "loss": 0.2413, "step": 760 }, { "epoch": 2.75, "learning_rate": 3.008888888888889e-05, "loss": 0.2026, "step": 770 }, { "epoch": 2.78, "learning_rate": 2.994074074074074e-05, "loss": 0.1928, "step": 780 }, { "epoch": 2.82, "learning_rate": 2.9792592592592596e-05, "loss": 0.1906, "step": 790 }, { "epoch": 2.86, "learning_rate": 2.964444444444445e-05, "loss": 0.1809, "step": 800 }, { "epoch": 2.89, "learning_rate": 2.94962962962963e-05, "loss": 0.2385, "step": 810 }, { "epoch": 2.93, "learning_rate": 2.9348148148148152e-05, "loss": 0.1847, "step": 820 }, { "epoch": 2.96, "learning_rate": 2.92e-05, "loss": 0.1927, "step": 830 }, { "epoch": 3.0, "learning_rate": 2.9051851851851855e-05, "loss": 0.2185, "step": 840 }, { "epoch": 3.0, "eval_loss": 0.5546267628669739, "eval_runtime": 226.3237, "eval_samples_per_second": 8.81, "eval_steps_per_second": 1.105, "eval_wer": 0.2298812163927454, "step": 840 }, { "epoch": 3.04, "learning_rate": 2.8903703703703704e-05, "loss": 0.1902, "step": 850 }, { "epoch": 3.07, "learning_rate": 2.8755555555555557e-05, "loss": 0.1874, "step": 860 }, { "epoch": 3.11, "learning_rate": 2.8607407407407407e-05, "loss": 0.1798, "step": 870 }, { "epoch": 3.14, "learning_rate": 2.8459259259259263e-05, "loss": 0.171, "step": 880 }, { "epoch": 3.18, "learning_rate": 2.8311111111111113e-05, "loss": 0.2333, "step": 890 }, { "epoch": 3.21, "learning_rate": 2.8162962962962966e-05, "loss": 0.1749, "step": 900 }, { "epoch": 3.25, "learning_rate": 2.801481481481482e-05, "loss": 0.1693, "step": 910 }, { "epoch": 3.29, "learning_rate": 2.786666666666667e-05, "loss": 0.1843, "step": 920 }, { "epoch": 3.32, "learning_rate": 2.771851851851852e-05, "loss": 0.1783, "step": 930 }, { "epoch": 3.36, "learning_rate": 2.757037037037037e-05, "loss": 0.2224, "step": 940 }, { "epoch": 3.39, "learning_rate": 2.7422222222222224e-05, "loss": 0.1809, "step": 950 }, { "epoch": 3.43, "learning_rate": 2.7274074074074074e-05, "loss": 0.1664, "step": 960 }, { "epoch": 3.46, "learning_rate": 2.712592592592593e-05, "loss": 0.1757, "step": 970 }, { "epoch": 3.5, "learning_rate": 2.6977777777777777e-05, "loss": 0.1895, "step": 980 }, { "epoch": 3.53, "learning_rate": 2.6829629629629633e-05, "loss": 0.2236, "step": 990 }, { "epoch": 3.57, "learning_rate": 2.6681481481481483e-05, "loss": 0.1918, "step": 1000 }, { "epoch": 3.61, "learning_rate": 2.6533333333333336e-05, "loss": 0.1877, "step": 1010 }, { "epoch": 3.64, "learning_rate": 2.638518518518519e-05, "loss": 0.1983, "step": 1020 }, { "epoch": 3.68, "learning_rate": 2.623703703703704e-05, "loss": 0.187, "step": 1030 }, { "epoch": 3.71, "learning_rate": 2.608888888888889e-05, "loss": 0.2318, "step": 1040 }, { "epoch": 3.75, "learning_rate": 2.594074074074074e-05, "loss": 0.178, "step": 1050 }, { "epoch": 3.78, "learning_rate": 2.5792592592592597e-05, "loss": 0.1702, "step": 1060 }, { "epoch": 3.82, "learning_rate": 2.5644444444444444e-05, "loss": 0.166, "step": 1070 }, { "epoch": 3.86, "learning_rate": 2.54962962962963e-05, "loss": 0.1813, "step": 1080 }, { "epoch": 3.89, "learning_rate": 2.534814814814815e-05, "loss": 0.2244, "step": 1090 }, { "epoch": 3.93, "learning_rate": 2.5200000000000003e-05, "loss": 0.177, "step": 1100 }, { "epoch": 3.96, "learning_rate": 2.5051851851851856e-05, "loss": 0.1963, "step": 1110 }, { "epoch": 4.0, "learning_rate": 2.4903703703703705e-05, "loss": 0.1988, "step": 1120 }, { "epoch": 4.0, "eval_loss": 0.526544988155365, "eval_runtime": 225.7721, "eval_samples_per_second": 8.832, "eval_steps_per_second": 1.107, "eval_wer": 0.22556733602697696, "step": 1120 }, { "epoch": 4.04, "learning_rate": 2.475555555555556e-05, "loss": 0.1857, "step": 1130 }, { "epoch": 4.07, "learning_rate": 2.4607407407407408e-05, "loss": 0.1739, "step": 1140 }, { "epoch": 4.11, "learning_rate": 2.445925925925926e-05, "loss": 0.156, "step": 1150 }, { "epoch": 4.14, "learning_rate": 2.431111111111111e-05, "loss": 0.1673, "step": 1160 }, { "epoch": 4.18, "learning_rate": 2.4162962962962967e-05, "loss": 0.1971, "step": 1170 }, { "epoch": 4.21, "learning_rate": 2.4014814814814817e-05, "loss": 0.1627, "step": 1180 }, { "epoch": 4.25, "learning_rate": 2.386666666666667e-05, "loss": 0.1606, "step": 1190 }, { "epoch": 4.29, "learning_rate": 2.371851851851852e-05, "loss": 0.1633, "step": 1200 }, { "epoch": 4.32, "learning_rate": 2.3570370370370372e-05, "loss": 0.1594, "step": 1210 }, { "epoch": 4.36, "learning_rate": 2.3422222222222225e-05, "loss": 0.196, "step": 1220 }, { "epoch": 4.39, "learning_rate": 2.3274074074074075e-05, "loss": 0.1518, "step": 1230 }, { "epoch": 4.43, "learning_rate": 2.3125925925925928e-05, "loss": 0.1593, "step": 1240 }, { "epoch": 4.46, "learning_rate": 2.2977777777777778e-05, "loss": 0.1455, "step": 1250 }, { "epoch": 4.5, "learning_rate": 2.2829629629629634e-05, "loss": 0.1519, "step": 1260 }, { "epoch": 4.53, "learning_rate": 2.2681481481481484e-05, "loss": 0.1942, "step": 1270 }, { "epoch": 4.57, "learning_rate": 2.2533333333333337e-05, "loss": 0.1552, "step": 1280 }, { "epoch": 4.61, "learning_rate": 2.2385185185185186e-05, "loss": 0.1771, "step": 1290 }, { "epoch": 4.64, "learning_rate": 2.223703703703704e-05, "loss": 0.1638, "step": 1300 }, { "epoch": 4.68, "learning_rate": 2.208888888888889e-05, "loss": 0.156, "step": 1310 }, { "epoch": 4.71, "learning_rate": 2.1940740740740742e-05, "loss": 0.2078, "step": 1320 }, { "epoch": 4.75, "learning_rate": 2.1792592592592595e-05, "loss": 0.1466, "step": 1330 }, { "epoch": 4.78, "learning_rate": 2.1644444444444445e-05, "loss": 0.1682, "step": 1340 }, { "epoch": 4.82, "learning_rate": 2.14962962962963e-05, "loss": 0.1489, "step": 1350 }, { "epoch": 4.86, "learning_rate": 2.1348148148148147e-05, "loss": 0.1647, "step": 1360 }, { "epoch": 4.89, "learning_rate": 2.1200000000000004e-05, "loss": 0.1923, "step": 1370 }, { "epoch": 4.93, "learning_rate": 2.1051851851851853e-05, "loss": 0.1606, "step": 1380 }, { "epoch": 4.96, "learning_rate": 2.0903703703703706e-05, "loss": 0.1519, "step": 1390 }, { "epoch": 5.0, "learning_rate": 2.0755555555555556e-05, "loss": 0.1755, "step": 1400 }, { "epoch": 5.0, "eval_loss": 0.5577098727226257, "eval_runtime": 226.8308, "eval_samples_per_second": 8.791, "eval_steps_per_second": 1.102, "eval_wer": 0.22122307622201295, "step": 1400 }, { "epoch": 5.04, "learning_rate": 2.060740740740741e-05, "loss": 0.1447, "step": 1410 }, { "epoch": 5.07, "learning_rate": 2.0459259259259262e-05, "loss": 0.1422, "step": 1420 }, { "epoch": 5.11, "learning_rate": 2.031111111111111e-05, "loss": 0.1415, "step": 1430 }, { "epoch": 5.14, "learning_rate": 2.0162962962962968e-05, "loss": 0.137, "step": 1440 }, { "epoch": 5.18, "learning_rate": 2.0014814814814814e-05, "loss": 0.1631, "step": 1450 }, { "epoch": 5.21, "learning_rate": 1.9866666666666667e-05, "loss": 0.1369, "step": 1460 }, { "epoch": 5.25, "learning_rate": 1.971851851851852e-05, "loss": 0.1535, "step": 1470 }, { "epoch": 5.29, "learning_rate": 1.9570370370370373e-05, "loss": 0.1511, "step": 1480 }, { "epoch": 5.32, "learning_rate": 1.9422222222222223e-05, "loss": 0.1553, "step": 1490 }, { "epoch": 5.36, "learning_rate": 1.9274074074074076e-05, "loss": 0.1855, "step": 1500 }, { "epoch": 5.39, "learning_rate": 1.912592592592593e-05, "loss": 0.1362, "step": 1510 }, { "epoch": 5.43, "learning_rate": 1.897777777777778e-05, "loss": 0.1562, "step": 1520 }, { "epoch": 5.46, "learning_rate": 1.882962962962963e-05, "loss": 0.1374, "step": 1530 }, { "epoch": 5.5, "learning_rate": 1.868148148148148e-05, "loss": 0.1409, "step": 1540 }, { "epoch": 5.53, "learning_rate": 1.8533333333333334e-05, "loss": 0.1655, "step": 1550 }, { "epoch": 5.57, "learning_rate": 1.8385185185185187e-05, "loss": 0.1362, "step": 1560 }, { "epoch": 5.61, "learning_rate": 1.8237037037037037e-05, "loss": 0.1511, "step": 1570 }, { "epoch": 5.64, "learning_rate": 1.808888888888889e-05, "loss": 0.1366, "step": 1580 }, { "epoch": 5.68, "learning_rate": 1.7940740740740743e-05, "loss": 0.1383, "step": 1590 }, { "epoch": 5.71, "learning_rate": 1.7792592592592596e-05, "loss": 0.1756, "step": 1600 }, { "epoch": 5.75, "learning_rate": 1.7644444444444446e-05, "loss": 0.1441, "step": 1610 }, { "epoch": 5.78, "learning_rate": 1.74962962962963e-05, "loss": 0.145, "step": 1620 }, { "epoch": 5.82, "learning_rate": 1.734814814814815e-05, "loss": 0.1342, "step": 1630 }, { "epoch": 5.86, "learning_rate": 1.72e-05, "loss": 0.1343, "step": 1640 }, { "epoch": 5.89, "learning_rate": 1.7051851851851854e-05, "loss": 0.1805, "step": 1650 }, { "epoch": 5.93, "learning_rate": 1.6903703703703704e-05, "loss": 0.1395, "step": 1660 }, { "epoch": 5.96, "learning_rate": 1.6755555555555557e-05, "loss": 0.1261, "step": 1670 }, { "epoch": 6.0, "learning_rate": 1.660740740740741e-05, "loss": 0.1474, "step": 1680 }, { "epoch": 6.0, "eval_loss": 0.6352665424346924, "eval_runtime": 225.713, "eval_samples_per_second": 8.834, "eval_steps_per_second": 1.108, "eval_wer": 0.22410912294559043, "step": 1680 }, { "epoch": 6.04, "learning_rate": 1.6459259259259263e-05, "loss": 0.1294, "step": 1690 }, { "epoch": 6.07, "learning_rate": 1.6311111111111113e-05, "loss": 0.1248, "step": 1700 }, { "epoch": 6.11, "learning_rate": 1.6162962962962966e-05, "loss": 0.1221, "step": 1710 }, { "epoch": 6.14, "learning_rate": 1.6014814814814815e-05, "loss": 0.1251, "step": 1720 }, { "epoch": 6.18, "learning_rate": 1.586666666666667e-05, "loss": 0.1517, "step": 1730 }, { "epoch": 6.21, "learning_rate": 1.5718518518518518e-05, "loss": 0.116, "step": 1740 }, { "epoch": 6.25, "learning_rate": 1.557037037037037e-05, "loss": 0.1291, "step": 1750 }, { "epoch": 6.29, "learning_rate": 1.5422222222222224e-05, "loss": 0.1209, "step": 1760 }, { "epoch": 6.32, "learning_rate": 1.5274074074074074e-05, "loss": 0.1298, "step": 1770 }, { "epoch": 6.36, "learning_rate": 1.5125925925925927e-05, "loss": 0.1552, "step": 1780 }, { "epoch": 6.39, "learning_rate": 1.497777777777778e-05, "loss": 0.1127, "step": 1790 }, { "epoch": 6.43, "learning_rate": 1.4829629629629631e-05, "loss": 0.1341, "step": 1800 }, { "epoch": 6.46, "learning_rate": 1.4681481481481484e-05, "loss": 0.1249, "step": 1810 }, { "epoch": 6.5, "learning_rate": 1.4533333333333335e-05, "loss": 0.1221, "step": 1820 }, { "epoch": 6.53, "learning_rate": 1.4385185185185187e-05, "loss": 0.1611, "step": 1830 }, { "epoch": 6.57, "learning_rate": 1.4237037037037038e-05, "loss": 0.1324, "step": 1840 }, { "epoch": 6.61, "learning_rate": 1.408888888888889e-05, "loss": 0.1194, "step": 1850 }, { "epoch": 6.64, "learning_rate": 1.394074074074074e-05, "loss": 0.1219, "step": 1860 }, { "epoch": 6.68, "learning_rate": 1.3792592592592594e-05, "loss": 0.1208, "step": 1870 }, { "epoch": 6.71, "learning_rate": 1.3644444444444445e-05, "loss": 0.1627, "step": 1880 }, { "epoch": 6.75, "learning_rate": 1.3496296296296298e-05, "loss": 0.1335, "step": 1890 }, { "epoch": 6.78, "learning_rate": 1.334814814814815e-05, "loss": 0.1172, "step": 1900 }, { "epoch": 6.82, "learning_rate": 1.3200000000000002e-05, "loss": 0.1273, "step": 1910 }, { "epoch": 6.86, "learning_rate": 1.3051851851851854e-05, "loss": 0.1226, "step": 1920 }, { "epoch": 6.89, "learning_rate": 1.2903703703703705e-05, "loss": 0.1572, "step": 1930 }, { "epoch": 6.93, "learning_rate": 1.2755555555555556e-05, "loss": 0.1305, "step": 1940 }, { "epoch": 6.96, "learning_rate": 1.2607407407407408e-05, "loss": 0.1295, "step": 1950 }, { "epoch": 7.0, "learning_rate": 1.2459259259259259e-05, "loss": 0.1498, "step": 1960 }, { "epoch": 7.0, "eval_loss": 0.5758136510848999, "eval_runtime": 226.2345, "eval_samples_per_second": 8.814, "eval_steps_per_second": 1.105, "eval_wer": 0.20864598839505422, "step": 1960 }, { "epoch": 7.04, "learning_rate": 1.2311111111111112e-05, "loss": 0.1103, "step": 1970 }, { "epoch": 7.07, "learning_rate": 1.2162962962962963e-05, "loss": 0.1147, "step": 1980 }, { "epoch": 7.11, "learning_rate": 1.2014814814814815e-05, "loss": 0.1131, "step": 1990 }, { "epoch": 7.14, "learning_rate": 1.186666666666667e-05, "loss": 0.1199, "step": 2000 }, { "epoch": 7.18, "learning_rate": 1.171851851851852e-05, "loss": 0.1462, "step": 2010 }, { "epoch": 7.21, "learning_rate": 1.1570370370370372e-05, "loss": 0.1168, "step": 2020 }, { "epoch": 7.25, "learning_rate": 1.1422222222222223e-05, "loss": 0.1072, "step": 2030 }, { "epoch": 7.29, "learning_rate": 1.1274074074074075e-05, "loss": 0.1193, "step": 2040 }, { "epoch": 7.32, "learning_rate": 1.1125925925925926e-05, "loss": 0.109, "step": 2050 }, { "epoch": 7.36, "learning_rate": 1.0977777777777779e-05, "loss": 0.1455, "step": 2060 }, { "epoch": 7.39, "learning_rate": 1.082962962962963e-05, "loss": 0.1162, "step": 2070 }, { "epoch": 7.43, "learning_rate": 1.0681481481481482e-05, "loss": 0.1129, "step": 2080 }, { "epoch": 7.46, "learning_rate": 1.0533333333333333e-05, "loss": 0.1166, "step": 2090 }, { "epoch": 7.5, "learning_rate": 1.0385185185185188e-05, "loss": 0.1167, "step": 2100 }, { "epoch": 7.53, "learning_rate": 1.0237037037037039e-05, "loss": 0.135, "step": 2110 }, { "epoch": 7.57, "learning_rate": 1.008888888888889e-05, "loss": 0.1117, "step": 2120 }, { "epoch": 7.61, "learning_rate": 9.940740740740742e-06, "loss": 0.1162, "step": 2130 }, { "epoch": 7.64, "learning_rate": 9.792592592592593e-06, "loss": 0.1221, "step": 2140 }, { "epoch": 7.68, "learning_rate": 9.644444444444444e-06, "loss": 0.112, "step": 2150 }, { "epoch": 7.71, "learning_rate": 9.496296296296297e-06, "loss": 0.1394, "step": 2160 }, { "epoch": 7.75, "learning_rate": 9.348148148148149e-06, "loss": 0.1136, "step": 2170 }, { "epoch": 7.78, "learning_rate": 9.200000000000002e-06, "loss": 0.1148, "step": 2180 }, { "epoch": 7.82, "learning_rate": 9.051851851851853e-06, "loss": 0.1192, "step": 2190 }, { "epoch": 7.86, "learning_rate": 8.903703703703704e-06, "loss": 0.1174, "step": 2200 }, { "epoch": 7.89, "learning_rate": 8.755555555555556e-06, "loss": 0.1567, "step": 2210 }, { "epoch": 7.93, "learning_rate": 8.607407407407407e-06, "loss": 0.1097, "step": 2220 }, { "epoch": 7.96, "learning_rate": 8.45925925925926e-06, "loss": 0.1044, "step": 2230 }, { "epoch": 8.0, "learning_rate": 8.311111111111111e-06, "loss": 0.1252, "step": 2240 }, { "epoch": 8.0, "eval_loss": 0.5738044381141663, "eval_runtime": 227.2786, "eval_samples_per_second": 8.773, "eval_steps_per_second": 1.1, "eval_wer": 0.2052131117659568, "step": 2240 }, { "epoch": 8.04, "learning_rate": 8.162962962962964e-06, "loss": 0.1049, "step": 2250 }, { "epoch": 8.07, "learning_rate": 8.014814814814816e-06, "loss": 0.1069, "step": 2260 }, { "epoch": 8.11, "learning_rate": 7.866666666666667e-06, "loss": 0.1081, "step": 2270 }, { "epoch": 8.14, "learning_rate": 7.71851851851852e-06, "loss": 0.1062, "step": 2280 }, { "epoch": 8.18, "learning_rate": 7.570370370370371e-06, "loss": 0.1258, "step": 2290 }, { "epoch": 8.21, "learning_rate": 7.422222222222223e-06, "loss": 0.0965, "step": 2300 }, { "epoch": 8.25, "learning_rate": 7.274074074074075e-06, "loss": 0.1038, "step": 2310 }, { "epoch": 8.29, "learning_rate": 7.125925925925926e-06, "loss": 0.0984, "step": 2320 }, { "epoch": 8.32, "learning_rate": 6.977777777777779e-06, "loss": 0.1028, "step": 2330 }, { "epoch": 8.36, "learning_rate": 6.8296296296296305e-06, "loss": 0.1286, "step": 2340 }, { "epoch": 8.39, "learning_rate": 6.681481481481482e-06, "loss": 0.095, "step": 2350 }, { "epoch": 8.43, "learning_rate": 6.533333333333334e-06, "loss": 0.1056, "step": 2360 }, { "epoch": 8.46, "learning_rate": 6.385185185185185e-06, "loss": 0.1058, "step": 2370 }, { "epoch": 8.5, "learning_rate": 6.237037037037037e-06, "loss": 0.1036, "step": 2380 }, { "epoch": 8.53, "learning_rate": 6.08888888888889e-06, "loss": 0.1357, "step": 2390 }, { "epoch": 8.57, "learning_rate": 5.940740740740741e-06, "loss": 0.1043, "step": 2400 }, { "epoch": 8.61, "learning_rate": 5.792592592592593e-06, "loss": 0.1001, "step": 2410 }, { "epoch": 8.64, "learning_rate": 5.6444444444444445e-06, "loss": 0.1034, "step": 2420 }, { "epoch": 8.68, "learning_rate": 5.496296296296296e-06, "loss": 0.1088, "step": 2430 }, { "epoch": 8.71, "learning_rate": 5.348148148148149e-06, "loss": 0.1303, "step": 2440 }, { "epoch": 8.75, "learning_rate": 5.2e-06, "loss": 0.1042, "step": 2450 }, { "epoch": 8.78, "learning_rate": 5.051851851851852e-06, "loss": 0.1089, "step": 2460 }, { "epoch": 8.82, "learning_rate": 4.903703703703704e-06, "loss": 0.097, "step": 2470 }, { "epoch": 8.86, "learning_rate": 4.755555555555556e-06, "loss": 0.1007, "step": 2480 }, { "epoch": 8.89, "learning_rate": 4.607407407407408e-06, "loss": 0.1445, "step": 2490 }, { "epoch": 8.93, "learning_rate": 4.45925925925926e-06, "loss": 0.0931, "step": 2500 }, { "epoch": 8.96, "learning_rate": 4.3111111111111115e-06, "loss": 0.1075, "step": 2510 }, { "epoch": 9.0, "learning_rate": 4.162962962962963e-06, "loss": 0.1174, "step": 2520 }, { "epoch": 9.0, "eval_loss": 0.5993713140487671, "eval_runtime": 227.5851, "eval_samples_per_second": 8.762, "eval_steps_per_second": 1.098, "eval_wer": 0.2047574201780235, "step": 2520 }, { "epoch": 9.04, "learning_rate": 4.014814814814815e-06, "loss": 0.1068, "step": 2530 }, { "epoch": 9.07, "learning_rate": 3.866666666666667e-06, "loss": 0.0974, "step": 2540 }, { "epoch": 9.11, "learning_rate": 3.718518518518519e-06, "loss": 0.0902, "step": 2550 }, { "epoch": 9.14, "learning_rate": 3.5703703703703707e-06, "loss": 0.0903, "step": 2560 }, { "epoch": 9.18, "learning_rate": 3.4222222222222224e-06, "loss": 0.1347, "step": 2570 }, { "epoch": 9.21, "learning_rate": 3.2740740740740746e-06, "loss": 0.0958, "step": 2580 }, { "epoch": 9.25, "learning_rate": 3.125925925925926e-06, "loss": 0.088, "step": 2590 }, { "epoch": 9.29, "learning_rate": 2.9777777777777777e-06, "loss": 0.0977, "step": 2600 }, { "epoch": 9.32, "learning_rate": 2.82962962962963e-06, "loss": 0.0974, "step": 2610 }, { "epoch": 9.36, "learning_rate": 2.6814814814814816e-06, "loss": 0.1202, "step": 2620 }, { "epoch": 9.39, "learning_rate": 2.5333333333333338e-06, "loss": 0.099, "step": 2630 }, { "epoch": 9.43, "learning_rate": 2.3851851851851855e-06, "loss": 0.0985, "step": 2640 }, { "epoch": 9.46, "learning_rate": 2.2370370370370373e-06, "loss": 0.0904, "step": 2650 }, { "epoch": 9.5, "learning_rate": 2.088888888888889e-06, "loss": 0.0954, "step": 2660 }, { "epoch": 9.53, "learning_rate": 1.9407407407407408e-06, "loss": 0.1285, "step": 2670 }, { "epoch": 9.57, "learning_rate": 1.7925925925925927e-06, "loss": 0.0845, "step": 2680 }, { "epoch": 9.61, "learning_rate": 1.6444444444444447e-06, "loss": 0.0974, "step": 2690 }, { "epoch": 9.64, "learning_rate": 1.4962962962962964e-06, "loss": 0.0942, "step": 2700 }, { "epoch": 9.68, "learning_rate": 1.3481481481481482e-06, "loss": 0.0882, "step": 2710 }, { "epoch": 9.71, "learning_rate": 1.2000000000000002e-06, "loss": 0.1256, "step": 2720 }, { "epoch": 9.75, "learning_rate": 1.051851851851852e-06, "loss": 0.0905, "step": 2730 }, { "epoch": 9.78, "learning_rate": 9.037037037037038e-07, "loss": 0.0967, "step": 2740 }, { "epoch": 9.82, "learning_rate": 7.555555555555556e-07, "loss": 0.0997, "step": 2750 }, { "epoch": 9.86, "learning_rate": 6.074074074074075e-07, "loss": 0.0984, "step": 2760 }, { "epoch": 9.89, "learning_rate": 4.5925925925925927e-07, "loss": 0.1136, "step": 2770 }, { "epoch": 9.93, "learning_rate": 3.259259259259259e-07, "loss": 0.0894, "step": 2780 }, { "epoch": 9.96, "learning_rate": 1.777777777777778e-07, "loss": 0.0979, "step": 2790 }, { "epoch": 10.0, "learning_rate": 2.9629629629629632e-08, "loss": 0.1035, "step": 2800 }, { "epoch": 10.0, "eval_loss": 0.5987938046455383, "eval_runtime": 227.7628, "eval_samples_per_second": 8.755, "eval_steps_per_second": 1.098, "eval_wer": 0.20375489868457028, "step": 2800 }, { "epoch": 10.0, "step": 2800, "total_flos": 5.435692193960383e+19, "train_loss": 0.16274263473493714, "train_runtime": 34090.2009, "train_samples_per_second": 5.262, "train_steps_per_second": 0.082 } ], "max_steps": 2800, "num_train_epochs": 10, "total_flos": 5.435692193960383e+19, "trial_name": null, "trial_params": null }