{ "best_metric": 1.2034047842025757, "best_model_checkpoint": "ai-light-dance_stepmania_ft_wav2vec2-large-xlsr-53/checkpoint-1500", "epoch": 9.997091815538013, "global_step": 1500, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.07, "learning_rate": 8.000000000000001e-07, "loss": 11.702, "step": 10 }, { "epoch": 0.13, "learning_rate": 1.8e-06, "loss": 10.9687, "step": 20 }, { "epoch": 0.2, "learning_rate": 2.8000000000000003e-06, "loss": 9.7514, "step": 30 }, { "epoch": 0.27, "learning_rate": 3.8e-06, "loss": 9.9307, "step": 40 }, { "epoch": 0.33, "learning_rate": 4.800000000000001e-06, "loss": 10.3039, "step": 50 }, { "epoch": 0.4, "learning_rate": 5.8e-06, "loss": 9.273, "step": 60 }, { "epoch": 0.47, "learning_rate": 6.800000000000001e-06, "loss": 8.5606, "step": 70 }, { "epoch": 0.53, "learning_rate": 7.8e-06, "loss": 6.4897, "step": 80 }, { "epoch": 0.6, "learning_rate": 8.8e-06, "loss": 5.3634, "step": 90 }, { "epoch": 0.66, "learning_rate": 9.800000000000001e-06, "loss": 4.0245, "step": 100 }, { "epoch": 0.73, "learning_rate": 1.08e-05, "loss": 3.2108, "step": 110 }, { "epoch": 0.8, "learning_rate": 1.18e-05, "loss": 2.9914, "step": 120 }, { "epoch": 0.86, "learning_rate": 1.2800000000000001e-05, "loss": 2.753, "step": 130 }, { "epoch": 0.93, "learning_rate": 1.3800000000000002e-05, "loss": 3.0158, "step": 140 }, { "epoch": 1.0, "learning_rate": 1.48e-05, "loss": 2.5631, "step": 150 }, { "epoch": 1.0, "eval_loss": 2.48942494392395, "eval_runtime": 354.2668, "eval_samples_per_second": 7.548, "eval_steps_per_second": 0.756, "eval_wer": 1.0, "step": 150 }, { "epoch": 1.07, "learning_rate": 1.58e-05, "loss": 2.6394, "step": 160 }, { "epoch": 1.13, "learning_rate": 1.6800000000000002e-05, "loss": 2.3398, "step": 170 }, { "epoch": 1.2, "learning_rate": 1.78e-05, "loss": 2.3838, "step": 180 }, { "epoch": 1.27, "learning_rate": 1.88e-05, "loss": 2.3224, "step": 190 }, { "epoch": 1.33, "learning_rate": 1.9800000000000004e-05, "loss": 2.2243, "step": 200 }, { "epoch": 1.4, "learning_rate": 2.08e-05, "loss": 2.2158, "step": 210 }, { "epoch": 1.47, "learning_rate": 2.18e-05, "loss": 2.1537, "step": 220 }, { "epoch": 1.53, "learning_rate": 2.2800000000000002e-05, "loss": 2.2192, "step": 230 }, { "epoch": 1.6, "learning_rate": 2.38e-05, "loss": 2.0781, "step": 240 }, { "epoch": 1.66, "learning_rate": 2.48e-05, "loss": 2.0413, "step": 250 }, { "epoch": 1.73, "learning_rate": 2.58e-05, "loss": 2.1157, "step": 260 }, { "epoch": 1.8, "learning_rate": 2.6800000000000004e-05, "loss": 1.9832, "step": 270 }, { "epoch": 1.86, "learning_rate": 2.7800000000000005e-05, "loss": 2.0212, "step": 280 }, { "epoch": 1.93, "learning_rate": 2.88e-05, "loss": 1.9684, "step": 290 }, { "epoch": 2.0, "learning_rate": 2.98e-05, "loss": 1.9443, "step": 300 }, { "epoch": 2.0, "eval_loss": 1.8861066102981567, "eval_runtime": 350.5856, "eval_samples_per_second": 7.627, "eval_steps_per_second": 0.764, "eval_wer": 1.0, "step": 300 }, { "epoch": 2.07, "learning_rate": 3.08e-05, "loss": 2.0769, "step": 310 }, { "epoch": 2.13, "learning_rate": 3.18e-05, "loss": 1.9485, "step": 320 }, { "epoch": 2.2, "learning_rate": 3.2800000000000004e-05, "loss": 1.826, "step": 330 }, { "epoch": 2.27, "learning_rate": 3.38e-05, "loss": 1.9077, "step": 340 }, { "epoch": 2.33, "learning_rate": 3.48e-05, "loss": 1.8716, "step": 350 }, { "epoch": 2.4, "learning_rate": 3.58e-05, "loss": 1.7935, "step": 360 }, { "epoch": 2.47, "learning_rate": 3.68e-05, "loss": 1.882, "step": 370 }, { "epoch": 2.53, "learning_rate": 3.7800000000000004e-05, "loss": 1.8109, "step": 380 }, { "epoch": 2.6, "learning_rate": 3.88e-05, "loss": 1.7526, "step": 390 }, { "epoch": 2.66, "learning_rate": 3.9800000000000005e-05, "loss": 1.7931, "step": 400 }, { "epoch": 2.73, "learning_rate": 4.08e-05, "loss": 1.7584, "step": 410 }, { "epoch": 2.8, "learning_rate": 4.18e-05, "loss": 1.7913, "step": 420 }, { "epoch": 2.86, "learning_rate": 4.2800000000000004e-05, "loss": 1.7738, "step": 430 }, { "epoch": 2.93, "learning_rate": 4.38e-05, "loss": 1.8625, "step": 440 }, { "epoch": 3.0, "learning_rate": 4.4800000000000005e-05, "loss": 1.7618, "step": 450 }, { "epoch": 3.0, "eval_loss": 1.6731115579605103, "eval_runtime": 348.1297, "eval_samples_per_second": 7.681, "eval_steps_per_second": 0.77, "eval_wer": 1.0, "step": 450 }, { "epoch": 3.07, "learning_rate": 4.58e-05, "loss": 1.8866, "step": 460 }, { "epoch": 3.13, "learning_rate": 4.6800000000000006e-05, "loss": 1.5151, "step": 470 }, { "epoch": 3.2, "learning_rate": 4.78e-05, "loss": 1.5033, "step": 480 }, { "epoch": 3.27, "learning_rate": 4.88e-05, "loss": 1.6069, "step": 490 }, { "epoch": 3.33, "learning_rate": 4.9800000000000004e-05, "loss": 1.5053, "step": 500 }, { "epoch": 3.4, "learning_rate": 4.96e-05, "loss": 1.51, "step": 510 }, { "epoch": 3.47, "learning_rate": 4.91e-05, "loss": 1.3992, "step": 520 }, { "epoch": 3.53, "learning_rate": 4.86e-05, "loss": 1.3555, "step": 530 }, { "epoch": 3.6, "learning_rate": 4.8100000000000004e-05, "loss": 1.314, "step": 540 }, { "epoch": 3.66, "learning_rate": 4.76e-05, "loss": 1.3467, "step": 550 }, { "epoch": 3.73, "learning_rate": 4.71e-05, "loss": 1.2924, "step": 560 }, { "epoch": 3.8, "learning_rate": 4.660000000000001e-05, "loss": 1.3308, "step": 570 }, { "epoch": 3.86, "learning_rate": 4.61e-05, "loss": 1.287, "step": 580 }, { "epoch": 3.93, "learning_rate": 4.5600000000000004e-05, "loss": 1.2594, "step": 590 }, { "epoch": 4.0, "learning_rate": 4.5100000000000005e-05, "loss": 1.2354, "step": 600 }, { "epoch": 4.0, "eval_loss": 1.2470651865005493, "eval_runtime": 348.1833, "eval_samples_per_second": 7.68, "eval_steps_per_second": 0.77, "eval_wer": 0.9874748673324764, "step": 600 }, { "epoch": 4.07, "learning_rate": 4.46e-05, "loss": 1.3441, "step": 610 }, { "epoch": 4.13, "learning_rate": 4.41e-05, "loss": 1.244, "step": 620 }, { "epoch": 4.2, "learning_rate": 4.36e-05, "loss": 1.2392, "step": 630 }, { "epoch": 4.27, "learning_rate": 4.3100000000000004e-05, "loss": 1.2611, "step": 640 }, { "epoch": 4.33, "learning_rate": 4.26e-05, "loss": 1.2875, "step": 650 }, { "epoch": 4.4, "learning_rate": 4.21e-05, "loss": 1.2537, "step": 660 }, { "epoch": 4.47, "learning_rate": 4.16e-05, "loss": 1.2268, "step": 670 }, { "epoch": 4.53, "learning_rate": 4.11e-05, "loss": 1.2678, "step": 680 }, { "epoch": 4.6, "learning_rate": 4.0600000000000004e-05, "loss": 1.2417, "step": 690 }, { "epoch": 4.66, "learning_rate": 4.0100000000000006e-05, "loss": 1.2595, "step": 700 }, { "epoch": 4.73, "learning_rate": 3.960000000000001e-05, "loss": 1.2184, "step": 710 }, { "epoch": 4.8, "learning_rate": 3.91e-05, "loss": 1.275, "step": 720 }, { "epoch": 4.86, "learning_rate": 3.86e-05, "loss": 1.2265, "step": 730 }, { "epoch": 4.93, "learning_rate": 3.8100000000000005e-05, "loss": 1.2474, "step": 740 }, { "epoch": 5.0, "learning_rate": 3.76e-05, "loss": 1.2333, "step": 750 }, { "epoch": 5.0, "eval_loss": 1.2252651453018188, "eval_runtime": 350.248, "eval_samples_per_second": 7.635, "eval_steps_per_second": 0.765, "eval_wer": 0.9874748673324764, "step": 750 }, { "epoch": 5.07, "learning_rate": 3.71e-05, "loss": 1.332, "step": 760 }, { "epoch": 5.13, "learning_rate": 3.66e-05, "loss": 1.2276, "step": 770 }, { "epoch": 5.2, "learning_rate": 3.61e-05, "loss": 1.2372, "step": 780 }, { "epoch": 5.27, "learning_rate": 3.56e-05, "loss": 1.2368, "step": 790 }, { "epoch": 5.33, "learning_rate": 3.51e-05, "loss": 1.2508, "step": 800 }, { "epoch": 5.4, "learning_rate": 3.46e-05, "loss": 1.2263, "step": 810 }, { "epoch": 5.47, "learning_rate": 3.41e-05, "loss": 1.2129, "step": 820 }, { "epoch": 5.53, "learning_rate": 3.3600000000000004e-05, "loss": 1.2554, "step": 830 }, { "epoch": 5.6, "learning_rate": 3.3100000000000005e-05, "loss": 1.2452, "step": 840 }, { "epoch": 5.66, "learning_rate": 3.26e-05, "loss": 1.2158, "step": 850 }, { "epoch": 5.73, "learning_rate": 3.21e-05, "loss": 1.214, "step": 860 }, { "epoch": 5.8, "learning_rate": 3.16e-05, "loss": 1.2457, "step": 870 }, { "epoch": 5.86, "learning_rate": 3.1100000000000004e-05, "loss": 1.2069, "step": 880 }, { "epoch": 5.93, "learning_rate": 3.06e-05, "loss": 1.214, "step": 890 }, { "epoch": 6.0, "learning_rate": 3.01e-05, "loss": 1.2037, "step": 900 }, { "epoch": 6.0, "eval_loss": 1.216780185699463, "eval_runtime": 349.4398, "eval_samples_per_second": 7.652, "eval_steps_per_second": 0.767, "eval_wer": 0.9874748673324764, "step": 900 }, { "epoch": 6.07, "learning_rate": 2.96e-05, "loss": 1.2874, "step": 910 }, { "epoch": 6.13, "learning_rate": 2.91e-05, "loss": 1.2136, "step": 920 }, { "epoch": 6.2, "learning_rate": 2.86e-05, "loss": 1.2235, "step": 930 }, { "epoch": 6.27, "learning_rate": 2.8100000000000005e-05, "loss": 1.2094, "step": 940 }, { "epoch": 6.33, "learning_rate": 2.7600000000000003e-05, "loss": 1.2486, "step": 950 }, { "epoch": 6.4, "learning_rate": 2.7100000000000005e-05, "loss": 1.2061, "step": 960 }, { "epoch": 6.47, "learning_rate": 2.6600000000000003e-05, "loss": 1.2071, "step": 970 }, { "epoch": 6.53, "learning_rate": 2.61e-05, "loss": 1.2246, "step": 980 }, { "epoch": 6.6, "learning_rate": 2.5600000000000002e-05, "loss": 1.2058, "step": 990 }, { "epoch": 6.66, "learning_rate": 2.51e-05, "loss": 1.2219, "step": 1000 }, { "epoch": 6.73, "learning_rate": 2.46e-05, "loss": 1.2154, "step": 1010 }, { "epoch": 6.8, "learning_rate": 2.41e-05, "loss": 1.2243, "step": 1020 }, { "epoch": 6.86, "learning_rate": 2.36e-05, "loss": 1.1954, "step": 1030 }, { "epoch": 6.93, "learning_rate": 2.3100000000000002e-05, "loss": 1.2119, "step": 1040 }, { "epoch": 7.0, "learning_rate": 2.26e-05, "loss": 1.2184, "step": 1050 }, { "epoch": 7.0, "eval_loss": 1.2119824886322021, "eval_runtime": 349.477, "eval_samples_per_second": 7.651, "eval_steps_per_second": 0.767, "eval_wer": 0.9874795760289679, "step": 1050 }, { "epoch": 7.07, "learning_rate": 2.2100000000000002e-05, "loss": 1.2809, "step": 1060 }, { "epoch": 7.13, "learning_rate": 2.16e-05, "loss": 1.1977, "step": 1070 }, { "epoch": 7.2, "learning_rate": 2.11e-05, "loss": 1.1931, "step": 1080 }, { "epoch": 7.27, "learning_rate": 2.06e-05, "loss": 1.2054, "step": 1090 }, { "epoch": 7.33, "learning_rate": 2.01e-05, "loss": 1.2307, "step": 1100 }, { "epoch": 7.4, "learning_rate": 1.9600000000000002e-05, "loss": 1.1989, "step": 1110 }, { "epoch": 7.47, "learning_rate": 1.91e-05, "loss": 1.1982, "step": 1120 }, { "epoch": 7.53, "learning_rate": 1.86e-05, "loss": 1.2141, "step": 1130 }, { "epoch": 7.6, "learning_rate": 1.81e-05, "loss": 1.2, "step": 1140 }, { "epoch": 7.66, "learning_rate": 1.76e-05, "loss": 1.1957, "step": 1150 }, { "epoch": 7.73, "learning_rate": 1.7100000000000002e-05, "loss": 1.194, "step": 1160 }, { "epoch": 7.8, "learning_rate": 1.66e-05, "loss": 1.2201, "step": 1170 }, { "epoch": 7.86, "learning_rate": 1.6100000000000002e-05, "loss": 1.186, "step": 1180 }, { "epoch": 7.93, "learning_rate": 1.56e-05, "loss": 1.1822, "step": 1190 }, { "epoch": 8.0, "learning_rate": 1.51e-05, "loss": 1.1932, "step": 1200 }, { "epoch": 8.0, "eval_loss": 1.207992434501648, "eval_runtime": 350.7609, "eval_samples_per_second": 7.623, "eval_steps_per_second": 0.764, "eval_wer": 0.9874795760289679, "step": 1200 }, { "epoch": 8.07, "learning_rate": 1.4599999999999999e-05, "loss": 1.2688, "step": 1210 }, { "epoch": 8.13, "learning_rate": 1.4099999999999999e-05, "loss": 1.1872, "step": 1220 }, { "epoch": 8.2, "learning_rate": 1.3600000000000002e-05, "loss": 1.19, "step": 1230 }, { "epoch": 8.27, "learning_rate": 1.3100000000000002e-05, "loss": 1.2102, "step": 1240 }, { "epoch": 8.33, "learning_rate": 1.2600000000000001e-05, "loss": 1.203, "step": 1250 }, { "epoch": 8.4, "learning_rate": 1.2100000000000001e-05, "loss": 1.1807, "step": 1260 }, { "epoch": 8.47, "learning_rate": 1.16e-05, "loss": 1.1691, "step": 1270 }, { "epoch": 8.53, "learning_rate": 1.11e-05, "loss": 1.2134, "step": 1280 }, { "epoch": 8.6, "learning_rate": 1.06e-05, "loss": 1.1918, "step": 1290 }, { "epoch": 8.66, "learning_rate": 1.0100000000000002e-05, "loss": 1.1963, "step": 1300 }, { "epoch": 8.73, "learning_rate": 9.600000000000001e-06, "loss": 1.1756, "step": 1310 }, { "epoch": 8.8, "learning_rate": 9.100000000000001e-06, "loss": 1.2069, "step": 1320 }, { "epoch": 8.86, "learning_rate": 8.599999999999999e-06, "loss": 1.1816, "step": 1330 }, { "epoch": 8.93, "learning_rate": 8.1e-06, "loss": 1.1738, "step": 1340 }, { "epoch": 9.0, "learning_rate": 7.6e-06, "loss": 1.179, "step": 1350 }, { "epoch": 9.0, "eval_loss": 1.2039426565170288, "eval_runtime": 350.0793, "eval_samples_per_second": 7.638, "eval_steps_per_second": 0.766, "eval_wer": 0.9874795760289679, "step": 1350 }, { "epoch": 9.07, "learning_rate": 7.1e-06, "loss": 1.2694, "step": 1360 }, { "epoch": 9.13, "learning_rate": 6.6e-06, "loss": 1.1817, "step": 1370 }, { "epoch": 9.2, "learning_rate": 6.1e-06, "loss": 1.185, "step": 1380 }, { "epoch": 9.27, "learning_rate": 5.600000000000001e-06, "loss": 1.1811, "step": 1390 }, { "epoch": 9.33, "learning_rate": 5.1e-06, "loss": 1.1886, "step": 1400 }, { "epoch": 9.4, "learning_rate": 4.6e-06, "loss": 1.1752, "step": 1410 }, { "epoch": 9.47, "learning_rate": 4.1000000000000006e-06, "loss": 1.1839, "step": 1420 }, { "epoch": 9.53, "learning_rate": 3.6e-06, "loss": 1.2065, "step": 1430 }, { "epoch": 9.6, "learning_rate": 3.1e-06, "loss": 1.1765, "step": 1440 }, { "epoch": 9.66, "learning_rate": 2.6e-06, "loss": 1.1774, "step": 1450 }, { "epoch": 9.73, "learning_rate": 2.1000000000000002e-06, "loss": 1.165, "step": 1460 }, { "epoch": 9.8, "learning_rate": 1.6000000000000001e-06, "loss": 1.1928, "step": 1470 }, { "epoch": 9.86, "learning_rate": 1.1e-06, "loss": 1.1778, "step": 1480 }, { "epoch": 9.93, "learning_rate": 6.000000000000001e-07, "loss": 1.1757, "step": 1490 }, { "epoch": 10.0, "learning_rate": 1.0000000000000001e-07, "loss": 1.1722, "step": 1500 }, { "epoch": 10.0, "eval_loss": 1.2034047842025757, "eval_runtime": 350.0329, "eval_samples_per_second": 7.639, "eval_steps_per_second": 0.766, "eval_wer": 0.9874701586359848, "step": 1500 }, { "epoch": 10.0, "step": 1500, "total_flos": 7.288767136199884e+19, "train_loss": 1.9466693312327068, "train_runtime": 75996.317, "train_samples_per_second": 3.166, "train_steps_per_second": 0.02 } ], "max_steps": 1500, "num_train_epochs": 10, "total_flos": 7.288767136199884e+19, "trial_name": null, "trial_params": null }