|
{ |
|
"best_metric": 1.2034047842025757, |
|
"best_model_checkpoint": "ai-light-dance_stepmania_ft_wav2vec2-large-xlsr-53/checkpoint-1500", |
|
"epoch": 9.997091815538013, |
|
"global_step": 1500, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 0.07, |
|
"learning_rate": 8.000000000000001e-07, |
|
"loss": 11.702, |
|
"step": 10 |
|
}, |
|
{ |
|
"epoch": 0.13, |
|
"learning_rate": 1.8e-06, |
|
"loss": 10.9687, |
|
"step": 20 |
|
}, |
|
{ |
|
"epoch": 0.2, |
|
"learning_rate": 2.8000000000000003e-06, |
|
"loss": 9.7514, |
|
"step": 30 |
|
}, |
|
{ |
|
"epoch": 0.27, |
|
"learning_rate": 3.8e-06, |
|
"loss": 9.9307, |
|
"step": 40 |
|
}, |
|
{ |
|
"epoch": 0.33, |
|
"learning_rate": 4.800000000000001e-06, |
|
"loss": 10.3039, |
|
"step": 50 |
|
}, |
|
{ |
|
"epoch": 0.4, |
|
"learning_rate": 5.8e-06, |
|
"loss": 9.273, |
|
"step": 60 |
|
}, |
|
{ |
|
"epoch": 0.47, |
|
"learning_rate": 6.800000000000001e-06, |
|
"loss": 8.5606, |
|
"step": 70 |
|
}, |
|
{ |
|
"epoch": 0.53, |
|
"learning_rate": 7.8e-06, |
|
"loss": 6.4897, |
|
"step": 80 |
|
}, |
|
{ |
|
"epoch": 0.6, |
|
"learning_rate": 8.8e-06, |
|
"loss": 5.3634, |
|
"step": 90 |
|
}, |
|
{ |
|
"epoch": 0.66, |
|
"learning_rate": 9.800000000000001e-06, |
|
"loss": 4.0245, |
|
"step": 100 |
|
}, |
|
{ |
|
"epoch": 0.73, |
|
"learning_rate": 1.08e-05, |
|
"loss": 3.2108, |
|
"step": 110 |
|
}, |
|
{ |
|
"epoch": 0.8, |
|
"learning_rate": 1.18e-05, |
|
"loss": 2.9914, |
|
"step": 120 |
|
}, |
|
{ |
|
"epoch": 0.86, |
|
"learning_rate": 1.2800000000000001e-05, |
|
"loss": 2.753, |
|
"step": 130 |
|
}, |
|
{ |
|
"epoch": 0.93, |
|
"learning_rate": 1.3800000000000002e-05, |
|
"loss": 3.0158, |
|
"step": 140 |
|
}, |
|
{ |
|
"epoch": 1.0, |
|
"learning_rate": 1.48e-05, |
|
"loss": 2.5631, |
|
"step": 150 |
|
}, |
|
{ |
|
"epoch": 1.0, |
|
"eval_loss": 2.48942494392395, |
|
"eval_runtime": 354.2668, |
|
"eval_samples_per_second": 7.548, |
|
"eval_steps_per_second": 0.756, |
|
"eval_wer": 1.0, |
|
"step": 150 |
|
}, |
|
{ |
|
"epoch": 1.07, |
|
"learning_rate": 1.58e-05, |
|
"loss": 2.6394, |
|
"step": 160 |
|
}, |
|
{ |
|
"epoch": 1.13, |
|
"learning_rate": 1.6800000000000002e-05, |
|
"loss": 2.3398, |
|
"step": 170 |
|
}, |
|
{ |
|
"epoch": 1.2, |
|
"learning_rate": 1.78e-05, |
|
"loss": 2.3838, |
|
"step": 180 |
|
}, |
|
{ |
|
"epoch": 1.27, |
|
"learning_rate": 1.88e-05, |
|
"loss": 2.3224, |
|
"step": 190 |
|
}, |
|
{ |
|
"epoch": 1.33, |
|
"learning_rate": 1.9800000000000004e-05, |
|
"loss": 2.2243, |
|
"step": 200 |
|
}, |
|
{ |
|
"epoch": 1.4, |
|
"learning_rate": 2.08e-05, |
|
"loss": 2.2158, |
|
"step": 210 |
|
}, |
|
{ |
|
"epoch": 1.47, |
|
"learning_rate": 2.18e-05, |
|
"loss": 2.1537, |
|
"step": 220 |
|
}, |
|
{ |
|
"epoch": 1.53, |
|
"learning_rate": 2.2800000000000002e-05, |
|
"loss": 2.2192, |
|
"step": 230 |
|
}, |
|
{ |
|
"epoch": 1.6, |
|
"learning_rate": 2.38e-05, |
|
"loss": 2.0781, |
|
"step": 240 |
|
}, |
|
{ |
|
"epoch": 1.66, |
|
"learning_rate": 2.48e-05, |
|
"loss": 2.0413, |
|
"step": 250 |
|
}, |
|
{ |
|
"epoch": 1.73, |
|
"learning_rate": 2.58e-05, |
|
"loss": 2.1157, |
|
"step": 260 |
|
}, |
|
{ |
|
"epoch": 1.8, |
|
"learning_rate": 2.6800000000000004e-05, |
|
"loss": 1.9832, |
|
"step": 270 |
|
}, |
|
{ |
|
"epoch": 1.86, |
|
"learning_rate": 2.7800000000000005e-05, |
|
"loss": 2.0212, |
|
"step": 280 |
|
}, |
|
{ |
|
"epoch": 1.93, |
|
"learning_rate": 2.88e-05, |
|
"loss": 1.9684, |
|
"step": 290 |
|
}, |
|
{ |
|
"epoch": 2.0, |
|
"learning_rate": 2.98e-05, |
|
"loss": 1.9443, |
|
"step": 300 |
|
}, |
|
{ |
|
"epoch": 2.0, |
|
"eval_loss": 1.8861066102981567, |
|
"eval_runtime": 350.5856, |
|
"eval_samples_per_second": 7.627, |
|
"eval_steps_per_second": 0.764, |
|
"eval_wer": 1.0, |
|
"step": 300 |
|
}, |
|
{ |
|
"epoch": 2.07, |
|
"learning_rate": 3.08e-05, |
|
"loss": 2.0769, |
|
"step": 310 |
|
}, |
|
{ |
|
"epoch": 2.13, |
|
"learning_rate": 3.18e-05, |
|
"loss": 1.9485, |
|
"step": 320 |
|
}, |
|
{ |
|
"epoch": 2.2, |
|
"learning_rate": 3.2800000000000004e-05, |
|
"loss": 1.826, |
|
"step": 330 |
|
}, |
|
{ |
|
"epoch": 2.27, |
|
"learning_rate": 3.38e-05, |
|
"loss": 1.9077, |
|
"step": 340 |
|
}, |
|
{ |
|
"epoch": 2.33, |
|
"learning_rate": 3.48e-05, |
|
"loss": 1.8716, |
|
"step": 350 |
|
}, |
|
{ |
|
"epoch": 2.4, |
|
"learning_rate": 3.58e-05, |
|
"loss": 1.7935, |
|
"step": 360 |
|
}, |
|
{ |
|
"epoch": 2.47, |
|
"learning_rate": 3.68e-05, |
|
"loss": 1.882, |
|
"step": 370 |
|
}, |
|
{ |
|
"epoch": 2.53, |
|
"learning_rate": 3.7800000000000004e-05, |
|
"loss": 1.8109, |
|
"step": 380 |
|
}, |
|
{ |
|
"epoch": 2.6, |
|
"learning_rate": 3.88e-05, |
|
"loss": 1.7526, |
|
"step": 390 |
|
}, |
|
{ |
|
"epoch": 2.66, |
|
"learning_rate": 3.9800000000000005e-05, |
|
"loss": 1.7931, |
|
"step": 400 |
|
}, |
|
{ |
|
"epoch": 2.73, |
|
"learning_rate": 4.08e-05, |
|
"loss": 1.7584, |
|
"step": 410 |
|
}, |
|
{ |
|
"epoch": 2.8, |
|
"learning_rate": 4.18e-05, |
|
"loss": 1.7913, |
|
"step": 420 |
|
}, |
|
{ |
|
"epoch": 2.86, |
|
"learning_rate": 4.2800000000000004e-05, |
|
"loss": 1.7738, |
|
"step": 430 |
|
}, |
|
{ |
|
"epoch": 2.93, |
|
"learning_rate": 4.38e-05, |
|
"loss": 1.8625, |
|
"step": 440 |
|
}, |
|
{ |
|
"epoch": 3.0, |
|
"learning_rate": 4.4800000000000005e-05, |
|
"loss": 1.7618, |
|
"step": 450 |
|
}, |
|
{ |
|
"epoch": 3.0, |
|
"eval_loss": 1.6731115579605103, |
|
"eval_runtime": 348.1297, |
|
"eval_samples_per_second": 7.681, |
|
"eval_steps_per_second": 0.77, |
|
"eval_wer": 1.0, |
|
"step": 450 |
|
}, |
|
{ |
|
"epoch": 3.07, |
|
"learning_rate": 4.58e-05, |
|
"loss": 1.8866, |
|
"step": 460 |
|
}, |
|
{ |
|
"epoch": 3.13, |
|
"learning_rate": 4.6800000000000006e-05, |
|
"loss": 1.5151, |
|
"step": 470 |
|
}, |
|
{ |
|
"epoch": 3.2, |
|
"learning_rate": 4.78e-05, |
|
"loss": 1.5033, |
|
"step": 480 |
|
}, |
|
{ |
|
"epoch": 3.27, |
|
"learning_rate": 4.88e-05, |
|
"loss": 1.6069, |
|
"step": 490 |
|
}, |
|
{ |
|
"epoch": 3.33, |
|
"learning_rate": 4.9800000000000004e-05, |
|
"loss": 1.5053, |
|
"step": 500 |
|
}, |
|
{ |
|
"epoch": 3.4, |
|
"learning_rate": 4.96e-05, |
|
"loss": 1.51, |
|
"step": 510 |
|
}, |
|
{ |
|
"epoch": 3.47, |
|
"learning_rate": 4.91e-05, |
|
"loss": 1.3992, |
|
"step": 520 |
|
}, |
|
{ |
|
"epoch": 3.53, |
|
"learning_rate": 4.86e-05, |
|
"loss": 1.3555, |
|
"step": 530 |
|
}, |
|
{ |
|
"epoch": 3.6, |
|
"learning_rate": 4.8100000000000004e-05, |
|
"loss": 1.314, |
|
"step": 540 |
|
}, |
|
{ |
|
"epoch": 3.66, |
|
"learning_rate": 4.76e-05, |
|
"loss": 1.3467, |
|
"step": 550 |
|
}, |
|
{ |
|
"epoch": 3.73, |
|
"learning_rate": 4.71e-05, |
|
"loss": 1.2924, |
|
"step": 560 |
|
}, |
|
{ |
|
"epoch": 3.8, |
|
"learning_rate": 4.660000000000001e-05, |
|
"loss": 1.3308, |
|
"step": 570 |
|
}, |
|
{ |
|
"epoch": 3.86, |
|
"learning_rate": 4.61e-05, |
|
"loss": 1.287, |
|
"step": 580 |
|
}, |
|
{ |
|
"epoch": 3.93, |
|
"learning_rate": 4.5600000000000004e-05, |
|
"loss": 1.2594, |
|
"step": 590 |
|
}, |
|
{ |
|
"epoch": 4.0, |
|
"learning_rate": 4.5100000000000005e-05, |
|
"loss": 1.2354, |
|
"step": 600 |
|
}, |
|
{ |
|
"epoch": 4.0, |
|
"eval_loss": 1.2470651865005493, |
|
"eval_runtime": 348.1833, |
|
"eval_samples_per_second": 7.68, |
|
"eval_steps_per_second": 0.77, |
|
"eval_wer": 0.9874748673324764, |
|
"step": 600 |
|
}, |
|
{ |
|
"epoch": 4.07, |
|
"learning_rate": 4.46e-05, |
|
"loss": 1.3441, |
|
"step": 610 |
|
}, |
|
{ |
|
"epoch": 4.13, |
|
"learning_rate": 4.41e-05, |
|
"loss": 1.244, |
|
"step": 620 |
|
}, |
|
{ |
|
"epoch": 4.2, |
|
"learning_rate": 4.36e-05, |
|
"loss": 1.2392, |
|
"step": 630 |
|
}, |
|
{ |
|
"epoch": 4.27, |
|
"learning_rate": 4.3100000000000004e-05, |
|
"loss": 1.2611, |
|
"step": 640 |
|
}, |
|
{ |
|
"epoch": 4.33, |
|
"learning_rate": 4.26e-05, |
|
"loss": 1.2875, |
|
"step": 650 |
|
}, |
|
{ |
|
"epoch": 4.4, |
|
"learning_rate": 4.21e-05, |
|
"loss": 1.2537, |
|
"step": 660 |
|
}, |
|
{ |
|
"epoch": 4.47, |
|
"learning_rate": 4.16e-05, |
|
"loss": 1.2268, |
|
"step": 670 |
|
}, |
|
{ |
|
"epoch": 4.53, |
|
"learning_rate": 4.11e-05, |
|
"loss": 1.2678, |
|
"step": 680 |
|
}, |
|
{ |
|
"epoch": 4.6, |
|
"learning_rate": 4.0600000000000004e-05, |
|
"loss": 1.2417, |
|
"step": 690 |
|
}, |
|
{ |
|
"epoch": 4.66, |
|
"learning_rate": 4.0100000000000006e-05, |
|
"loss": 1.2595, |
|
"step": 700 |
|
}, |
|
{ |
|
"epoch": 4.73, |
|
"learning_rate": 3.960000000000001e-05, |
|
"loss": 1.2184, |
|
"step": 710 |
|
}, |
|
{ |
|
"epoch": 4.8, |
|
"learning_rate": 3.91e-05, |
|
"loss": 1.275, |
|
"step": 720 |
|
}, |
|
{ |
|
"epoch": 4.86, |
|
"learning_rate": 3.86e-05, |
|
"loss": 1.2265, |
|
"step": 730 |
|
}, |
|
{ |
|
"epoch": 4.93, |
|
"learning_rate": 3.8100000000000005e-05, |
|
"loss": 1.2474, |
|
"step": 740 |
|
}, |
|
{ |
|
"epoch": 5.0, |
|
"learning_rate": 3.76e-05, |
|
"loss": 1.2333, |
|
"step": 750 |
|
}, |
|
{ |
|
"epoch": 5.0, |
|
"eval_loss": 1.2252651453018188, |
|
"eval_runtime": 350.248, |
|
"eval_samples_per_second": 7.635, |
|
"eval_steps_per_second": 0.765, |
|
"eval_wer": 0.9874748673324764, |
|
"step": 750 |
|
}, |
|
{ |
|
"epoch": 5.07, |
|
"learning_rate": 3.71e-05, |
|
"loss": 1.332, |
|
"step": 760 |
|
}, |
|
{ |
|
"epoch": 5.13, |
|
"learning_rate": 3.66e-05, |
|
"loss": 1.2276, |
|
"step": 770 |
|
}, |
|
{ |
|
"epoch": 5.2, |
|
"learning_rate": 3.61e-05, |
|
"loss": 1.2372, |
|
"step": 780 |
|
}, |
|
{ |
|
"epoch": 5.27, |
|
"learning_rate": 3.56e-05, |
|
"loss": 1.2368, |
|
"step": 790 |
|
}, |
|
{ |
|
"epoch": 5.33, |
|
"learning_rate": 3.51e-05, |
|
"loss": 1.2508, |
|
"step": 800 |
|
}, |
|
{ |
|
"epoch": 5.4, |
|
"learning_rate": 3.46e-05, |
|
"loss": 1.2263, |
|
"step": 810 |
|
}, |
|
{ |
|
"epoch": 5.47, |
|
"learning_rate": 3.41e-05, |
|
"loss": 1.2129, |
|
"step": 820 |
|
}, |
|
{ |
|
"epoch": 5.53, |
|
"learning_rate": 3.3600000000000004e-05, |
|
"loss": 1.2554, |
|
"step": 830 |
|
}, |
|
{ |
|
"epoch": 5.6, |
|
"learning_rate": 3.3100000000000005e-05, |
|
"loss": 1.2452, |
|
"step": 840 |
|
}, |
|
{ |
|
"epoch": 5.66, |
|
"learning_rate": 3.26e-05, |
|
"loss": 1.2158, |
|
"step": 850 |
|
}, |
|
{ |
|
"epoch": 5.73, |
|
"learning_rate": 3.21e-05, |
|
"loss": 1.214, |
|
"step": 860 |
|
}, |
|
{ |
|
"epoch": 5.8, |
|
"learning_rate": 3.16e-05, |
|
"loss": 1.2457, |
|
"step": 870 |
|
}, |
|
{ |
|
"epoch": 5.86, |
|
"learning_rate": 3.1100000000000004e-05, |
|
"loss": 1.2069, |
|
"step": 880 |
|
}, |
|
{ |
|
"epoch": 5.93, |
|
"learning_rate": 3.06e-05, |
|
"loss": 1.214, |
|
"step": 890 |
|
}, |
|
{ |
|
"epoch": 6.0, |
|
"learning_rate": 3.01e-05, |
|
"loss": 1.2037, |
|
"step": 900 |
|
}, |
|
{ |
|
"epoch": 6.0, |
|
"eval_loss": 1.216780185699463, |
|
"eval_runtime": 349.4398, |
|
"eval_samples_per_second": 7.652, |
|
"eval_steps_per_second": 0.767, |
|
"eval_wer": 0.9874748673324764, |
|
"step": 900 |
|
}, |
|
{ |
|
"epoch": 6.07, |
|
"learning_rate": 2.96e-05, |
|
"loss": 1.2874, |
|
"step": 910 |
|
}, |
|
{ |
|
"epoch": 6.13, |
|
"learning_rate": 2.91e-05, |
|
"loss": 1.2136, |
|
"step": 920 |
|
}, |
|
{ |
|
"epoch": 6.2, |
|
"learning_rate": 2.86e-05, |
|
"loss": 1.2235, |
|
"step": 930 |
|
}, |
|
{ |
|
"epoch": 6.27, |
|
"learning_rate": 2.8100000000000005e-05, |
|
"loss": 1.2094, |
|
"step": 940 |
|
}, |
|
{ |
|
"epoch": 6.33, |
|
"learning_rate": 2.7600000000000003e-05, |
|
"loss": 1.2486, |
|
"step": 950 |
|
}, |
|
{ |
|
"epoch": 6.4, |
|
"learning_rate": 2.7100000000000005e-05, |
|
"loss": 1.2061, |
|
"step": 960 |
|
}, |
|
{ |
|
"epoch": 6.47, |
|
"learning_rate": 2.6600000000000003e-05, |
|
"loss": 1.2071, |
|
"step": 970 |
|
}, |
|
{ |
|
"epoch": 6.53, |
|
"learning_rate": 2.61e-05, |
|
"loss": 1.2246, |
|
"step": 980 |
|
}, |
|
{ |
|
"epoch": 6.6, |
|
"learning_rate": 2.5600000000000002e-05, |
|
"loss": 1.2058, |
|
"step": 990 |
|
}, |
|
{ |
|
"epoch": 6.66, |
|
"learning_rate": 2.51e-05, |
|
"loss": 1.2219, |
|
"step": 1000 |
|
}, |
|
{ |
|
"epoch": 6.73, |
|
"learning_rate": 2.46e-05, |
|
"loss": 1.2154, |
|
"step": 1010 |
|
}, |
|
{ |
|
"epoch": 6.8, |
|
"learning_rate": 2.41e-05, |
|
"loss": 1.2243, |
|
"step": 1020 |
|
}, |
|
{ |
|
"epoch": 6.86, |
|
"learning_rate": 2.36e-05, |
|
"loss": 1.1954, |
|
"step": 1030 |
|
}, |
|
{ |
|
"epoch": 6.93, |
|
"learning_rate": 2.3100000000000002e-05, |
|
"loss": 1.2119, |
|
"step": 1040 |
|
}, |
|
{ |
|
"epoch": 7.0, |
|
"learning_rate": 2.26e-05, |
|
"loss": 1.2184, |
|
"step": 1050 |
|
}, |
|
{ |
|
"epoch": 7.0, |
|
"eval_loss": 1.2119824886322021, |
|
"eval_runtime": 349.477, |
|
"eval_samples_per_second": 7.651, |
|
"eval_steps_per_second": 0.767, |
|
"eval_wer": 0.9874795760289679, |
|
"step": 1050 |
|
}, |
|
{ |
|
"epoch": 7.07, |
|
"learning_rate": 2.2100000000000002e-05, |
|
"loss": 1.2809, |
|
"step": 1060 |
|
}, |
|
{ |
|
"epoch": 7.13, |
|
"learning_rate": 2.16e-05, |
|
"loss": 1.1977, |
|
"step": 1070 |
|
}, |
|
{ |
|
"epoch": 7.2, |
|
"learning_rate": 2.11e-05, |
|
"loss": 1.1931, |
|
"step": 1080 |
|
}, |
|
{ |
|
"epoch": 7.27, |
|
"learning_rate": 2.06e-05, |
|
"loss": 1.2054, |
|
"step": 1090 |
|
}, |
|
{ |
|
"epoch": 7.33, |
|
"learning_rate": 2.01e-05, |
|
"loss": 1.2307, |
|
"step": 1100 |
|
}, |
|
{ |
|
"epoch": 7.4, |
|
"learning_rate": 1.9600000000000002e-05, |
|
"loss": 1.1989, |
|
"step": 1110 |
|
}, |
|
{ |
|
"epoch": 7.47, |
|
"learning_rate": 1.91e-05, |
|
"loss": 1.1982, |
|
"step": 1120 |
|
}, |
|
{ |
|
"epoch": 7.53, |
|
"learning_rate": 1.86e-05, |
|
"loss": 1.2141, |
|
"step": 1130 |
|
}, |
|
{ |
|
"epoch": 7.6, |
|
"learning_rate": 1.81e-05, |
|
"loss": 1.2, |
|
"step": 1140 |
|
}, |
|
{ |
|
"epoch": 7.66, |
|
"learning_rate": 1.76e-05, |
|
"loss": 1.1957, |
|
"step": 1150 |
|
}, |
|
{ |
|
"epoch": 7.73, |
|
"learning_rate": 1.7100000000000002e-05, |
|
"loss": 1.194, |
|
"step": 1160 |
|
}, |
|
{ |
|
"epoch": 7.8, |
|
"learning_rate": 1.66e-05, |
|
"loss": 1.2201, |
|
"step": 1170 |
|
}, |
|
{ |
|
"epoch": 7.86, |
|
"learning_rate": 1.6100000000000002e-05, |
|
"loss": 1.186, |
|
"step": 1180 |
|
}, |
|
{ |
|
"epoch": 7.93, |
|
"learning_rate": 1.56e-05, |
|
"loss": 1.1822, |
|
"step": 1190 |
|
}, |
|
{ |
|
"epoch": 8.0, |
|
"learning_rate": 1.51e-05, |
|
"loss": 1.1932, |
|
"step": 1200 |
|
}, |
|
{ |
|
"epoch": 8.0, |
|
"eval_loss": 1.207992434501648, |
|
"eval_runtime": 350.7609, |
|
"eval_samples_per_second": 7.623, |
|
"eval_steps_per_second": 0.764, |
|
"eval_wer": 0.9874795760289679, |
|
"step": 1200 |
|
}, |
|
{ |
|
"epoch": 8.07, |
|
"learning_rate": 1.4599999999999999e-05, |
|
"loss": 1.2688, |
|
"step": 1210 |
|
}, |
|
{ |
|
"epoch": 8.13, |
|
"learning_rate": 1.4099999999999999e-05, |
|
"loss": 1.1872, |
|
"step": 1220 |
|
}, |
|
{ |
|
"epoch": 8.2, |
|
"learning_rate": 1.3600000000000002e-05, |
|
"loss": 1.19, |
|
"step": 1230 |
|
}, |
|
{ |
|
"epoch": 8.27, |
|
"learning_rate": 1.3100000000000002e-05, |
|
"loss": 1.2102, |
|
"step": 1240 |
|
}, |
|
{ |
|
"epoch": 8.33, |
|
"learning_rate": 1.2600000000000001e-05, |
|
"loss": 1.203, |
|
"step": 1250 |
|
}, |
|
{ |
|
"epoch": 8.4, |
|
"learning_rate": 1.2100000000000001e-05, |
|
"loss": 1.1807, |
|
"step": 1260 |
|
}, |
|
{ |
|
"epoch": 8.47, |
|
"learning_rate": 1.16e-05, |
|
"loss": 1.1691, |
|
"step": 1270 |
|
}, |
|
{ |
|
"epoch": 8.53, |
|
"learning_rate": 1.11e-05, |
|
"loss": 1.2134, |
|
"step": 1280 |
|
}, |
|
{ |
|
"epoch": 8.6, |
|
"learning_rate": 1.06e-05, |
|
"loss": 1.1918, |
|
"step": 1290 |
|
}, |
|
{ |
|
"epoch": 8.66, |
|
"learning_rate": 1.0100000000000002e-05, |
|
"loss": 1.1963, |
|
"step": 1300 |
|
}, |
|
{ |
|
"epoch": 8.73, |
|
"learning_rate": 9.600000000000001e-06, |
|
"loss": 1.1756, |
|
"step": 1310 |
|
}, |
|
{ |
|
"epoch": 8.8, |
|
"learning_rate": 9.100000000000001e-06, |
|
"loss": 1.2069, |
|
"step": 1320 |
|
}, |
|
{ |
|
"epoch": 8.86, |
|
"learning_rate": 8.599999999999999e-06, |
|
"loss": 1.1816, |
|
"step": 1330 |
|
}, |
|
{ |
|
"epoch": 8.93, |
|
"learning_rate": 8.1e-06, |
|
"loss": 1.1738, |
|
"step": 1340 |
|
}, |
|
{ |
|
"epoch": 9.0, |
|
"learning_rate": 7.6e-06, |
|
"loss": 1.179, |
|
"step": 1350 |
|
}, |
|
{ |
|
"epoch": 9.0, |
|
"eval_loss": 1.2039426565170288, |
|
"eval_runtime": 350.0793, |
|
"eval_samples_per_second": 7.638, |
|
"eval_steps_per_second": 0.766, |
|
"eval_wer": 0.9874795760289679, |
|
"step": 1350 |
|
}, |
|
{ |
|
"epoch": 9.07, |
|
"learning_rate": 7.1e-06, |
|
"loss": 1.2694, |
|
"step": 1360 |
|
}, |
|
{ |
|
"epoch": 9.13, |
|
"learning_rate": 6.6e-06, |
|
"loss": 1.1817, |
|
"step": 1370 |
|
}, |
|
{ |
|
"epoch": 9.2, |
|
"learning_rate": 6.1e-06, |
|
"loss": 1.185, |
|
"step": 1380 |
|
}, |
|
{ |
|
"epoch": 9.27, |
|
"learning_rate": 5.600000000000001e-06, |
|
"loss": 1.1811, |
|
"step": 1390 |
|
}, |
|
{ |
|
"epoch": 9.33, |
|
"learning_rate": 5.1e-06, |
|
"loss": 1.1886, |
|
"step": 1400 |
|
}, |
|
{ |
|
"epoch": 9.4, |
|
"learning_rate": 4.6e-06, |
|
"loss": 1.1752, |
|
"step": 1410 |
|
}, |
|
{ |
|
"epoch": 9.47, |
|
"learning_rate": 4.1000000000000006e-06, |
|
"loss": 1.1839, |
|
"step": 1420 |
|
}, |
|
{ |
|
"epoch": 9.53, |
|
"learning_rate": 3.6e-06, |
|
"loss": 1.2065, |
|
"step": 1430 |
|
}, |
|
{ |
|
"epoch": 9.6, |
|
"learning_rate": 3.1e-06, |
|
"loss": 1.1765, |
|
"step": 1440 |
|
}, |
|
{ |
|
"epoch": 9.66, |
|
"learning_rate": 2.6e-06, |
|
"loss": 1.1774, |
|
"step": 1450 |
|
}, |
|
{ |
|
"epoch": 9.73, |
|
"learning_rate": 2.1000000000000002e-06, |
|
"loss": 1.165, |
|
"step": 1460 |
|
}, |
|
{ |
|
"epoch": 9.8, |
|
"learning_rate": 1.6000000000000001e-06, |
|
"loss": 1.1928, |
|
"step": 1470 |
|
}, |
|
{ |
|
"epoch": 9.86, |
|
"learning_rate": 1.1e-06, |
|
"loss": 1.1778, |
|
"step": 1480 |
|
}, |
|
{ |
|
"epoch": 9.93, |
|
"learning_rate": 6.000000000000001e-07, |
|
"loss": 1.1757, |
|
"step": 1490 |
|
}, |
|
{ |
|
"epoch": 10.0, |
|
"learning_rate": 1.0000000000000001e-07, |
|
"loss": 1.1722, |
|
"step": 1500 |
|
}, |
|
{ |
|
"epoch": 10.0, |
|
"eval_loss": 1.2034047842025757, |
|
"eval_runtime": 350.0329, |
|
"eval_samples_per_second": 7.639, |
|
"eval_steps_per_second": 0.766, |
|
"eval_wer": 0.9874701586359848, |
|
"step": 1500 |
|
}, |
|
{ |
|
"epoch": 10.0, |
|
"step": 1500, |
|
"total_flos": 7.288767136199884e+19, |
|
"train_loss": 1.9466693312327068, |
|
"train_runtime": 75996.317, |
|
"train_samples_per_second": 3.166, |
|
"train_steps_per_second": 0.02 |
|
} |
|
], |
|
"max_steps": 1500, |
|
"num_train_epochs": 10, |
|
"total_flos": 7.288767136199884e+19, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|