diff --git "a/checkpoint-10500/trainer_state.json" "b/checkpoint-10500/trainer_state.json" new file mode 100644--- /dev/null +++ "b/checkpoint-10500/trainer_state.json" @@ -0,0 +1,12805 @@ +{ + "best_metric": null, + "best_model_checkpoint": null, + "epoch": 1.9556714471968708, + "global_step": 10500, + "is_hyper_param_search": false, + "is_local_process_zero": true, + "is_world_process_zero": true, + "log_history": [ + { + "epoch": 0.0, + "learning_rate": 2e-09, + "loss": 23.1708, + "step": 5 + }, + { + "epoch": 0.0, + "learning_rate": 1.2e-08, + "loss": 17.4647, + "step": 10 + }, + { + "epoch": 0.0, + "learning_rate": 2.2e-08, + "loss": 16.726, + "step": 15 + }, + { + "epoch": 0.0, + "learning_rate": 3.2e-08, + "loss": 16.6276, + "step": 20 + }, + { + "epoch": 0.0, + "learning_rate": 4.2e-08, + "loss": 14.8649, + "step": 25 + }, + { + "epoch": 0.01, + "learning_rate": 5.1999999999999996e-08, + "loss": 15.1187, + "step": 30 + }, + { + "epoch": 0.01, + "learning_rate": 6.2e-08, + "loss": 14.6901, + "step": 35 + }, + { + "epoch": 0.01, + "learning_rate": 7.2e-08, + "loss": 14.3665, + "step": 40 + }, + { + "epoch": 0.01, + "learning_rate": 8.2e-08, + "loss": 14.6373, + "step": 45 + }, + { + "epoch": 0.01, + "learning_rate": 9.199999999999999e-08, + "loss": 14.0672, + "step": 50 + }, + { + "epoch": 0.01, + "learning_rate": 1.0199999999999999e-07, + "loss": 18.1758, + "step": 55 + }, + { + "epoch": 0.01, + "learning_rate": 1.12e-07, + "loss": 18.3919, + "step": 60 + }, + { + "epoch": 0.01, + "learning_rate": 1.2199999999999998e-07, + "loss": 17.8389, + "step": 65 + }, + { + "epoch": 0.01, + "learning_rate": 1.32e-07, + "loss": 15.098, + "step": 70 + }, + { + "epoch": 0.01, + "learning_rate": 1.4199999999999997e-07, + "loss": 15.2273, + "step": 75 + }, + { + "epoch": 0.01, + "learning_rate": 1.5199999999999998e-07, + "loss": 14.9402, + "step": 80 + }, + { + "epoch": 0.02, + "learning_rate": 1.62e-07, + "loss": 14.2399, + "step": 85 + }, + { + "epoch": 0.02, + "learning_rate": 1.7199999999999998e-07, + "loss": 14.0017, + "step": 90 + }, + { + "epoch": 0.02, + "learning_rate": 1.82e-07, + "loss": 14.2729, + "step": 95 + }, + { + "epoch": 0.02, + "learning_rate": 1.92e-07, + "loss": 14.4501, + "step": 100 + }, + { + "epoch": 0.02, + "learning_rate": 2.02e-07, + "loss": 17.7063, + "step": 105 + }, + { + "epoch": 0.02, + "learning_rate": 2.12e-07, + "loss": 17.2415, + "step": 110 + }, + { + "epoch": 0.02, + "learning_rate": 2.22e-07, + "loss": 17.3164, + "step": 115 + }, + { + "epoch": 0.02, + "learning_rate": 2.32e-07, + "loss": 15.1226, + "step": 120 + }, + { + "epoch": 0.02, + "learning_rate": 2.4199999999999997e-07, + "loss": 14.7632, + "step": 125 + }, + { + "epoch": 0.02, + "learning_rate": 2.52e-07, + "loss": 14.269, + "step": 130 + }, + { + "epoch": 0.03, + "learning_rate": 2.62e-07, + "loss": 14.3178, + "step": 135 + }, + { + "epoch": 0.03, + "learning_rate": 2.72e-07, + "loss": 13.9972, + "step": 140 + }, + { + "epoch": 0.03, + "learning_rate": 2.8199999999999996e-07, + "loss": 14.4335, + "step": 145 + }, + { + "epoch": 0.03, + "learning_rate": 2.9199999999999997e-07, + "loss": 14.1463, + "step": 150 + }, + { + "epoch": 0.03, + "learning_rate": 3.02e-07, + "loss": 16.1839, + "step": 155 + }, + { + "epoch": 0.03, + "learning_rate": 3.12e-07, + "loss": 17.0019, + "step": 160 + }, + { + "epoch": 0.03, + "learning_rate": 3.22e-07, + "loss": 16.061, + "step": 165 + }, + { + "epoch": 0.03, + "learning_rate": 3.32e-07, + "loss": 13.9992, + "step": 170 + }, + { + "epoch": 0.03, + "learning_rate": 3.42e-07, + "loss": 14.0072, + "step": 175 + }, + { + "epoch": 0.03, + "learning_rate": 3.52e-07, + "loss": 13.4026, + "step": 180 + }, + { + "epoch": 0.03, + "learning_rate": 3.62e-07, + "loss": 13.1469, + "step": 185 + }, + { + "epoch": 0.04, + "learning_rate": 3.72e-07, + "loss": 13.2259, + "step": 190 + }, + { + "epoch": 0.04, + "learning_rate": 3.82e-07, + "loss": 13.0371, + "step": 195 + }, + { + "epoch": 0.04, + "learning_rate": 3.8999999999999997e-07, + "loss": 14.4267, + "step": 200 + }, + { + "epoch": 0.04, + "learning_rate": 4e-07, + "loss": 17.5423, + "step": 205 + }, + { + "epoch": 0.04, + "learning_rate": 4.0999999999999994e-07, + "loss": 15.3916, + "step": 210 + }, + { + "epoch": 0.04, + "learning_rate": 4.1999999999999995e-07, + "loss": 14.2848, + "step": 215 + }, + { + "epoch": 0.04, + "learning_rate": 4.2999999999999996e-07, + "loss": 15.4372, + "step": 220 + }, + { + "epoch": 0.04, + "learning_rate": 4.3999999999999997e-07, + "loss": 12.914, + "step": 225 + }, + { + "epoch": 0.04, + "learning_rate": 4.5e-07, + "loss": 12.8913, + "step": 230 + }, + { + "epoch": 0.04, + "learning_rate": 4.6e-07, + "loss": 12.2806, + "step": 235 + }, + { + "epoch": 0.04, + "learning_rate": 4.6999999999999995e-07, + "loss": 11.734, + "step": 240 + }, + { + "epoch": 0.05, + "learning_rate": 4.8e-07, + "loss": 10.8097, + "step": 245 + }, + { + "epoch": 0.05, + "learning_rate": 4.9e-07, + "loss": 11.4272, + "step": 250 + }, + { + "epoch": 0.05, + "learning_rate": 5e-07, + "loss": 14.283, + "step": 255 + }, + { + "epoch": 0.05, + "learning_rate": 5.1e-07, + "loss": 12.6282, + "step": 260 + }, + { + "epoch": 0.05, + "learning_rate": 5.2e-07, + "loss": 13.4567, + "step": 265 + }, + { + "epoch": 0.05, + "learning_rate": 5.3e-07, + "loss": 11.2645, + "step": 270 + }, + { + "epoch": 0.05, + "learning_rate": 5.4e-07, + "loss": 10.2447, + "step": 275 + }, + { + "epoch": 0.05, + "learning_rate": 5.5e-07, + "loss": 10.9771, + "step": 280 + }, + { + "epoch": 0.05, + "learning_rate": 5.6e-07, + "loss": 10.9162, + "step": 285 + }, + { + "epoch": 0.05, + "learning_rate": 5.699999999999999e-07, + "loss": 10.2676, + "step": 290 + }, + { + "epoch": 0.05, + "learning_rate": 5.8e-07, + "loss": 8.9776, + "step": 295 + }, + { + "epoch": 0.06, + "learning_rate": 5.9e-07, + "loss": 9.0533, + "step": 300 + }, + { + "epoch": 0.06, + "learning_rate": 5.979999999999999e-07, + "loss": 14.5471, + "step": 305 + }, + { + "epoch": 0.06, + "learning_rate": 6.079999999999999e-07, + "loss": 12.7666, + "step": 310 + }, + { + "epoch": 0.06, + "learning_rate": 6.18e-07, + "loss": 9.7622, + "step": 315 + }, + { + "epoch": 0.06, + "learning_rate": 6.28e-07, + "loss": 9.0693, + "step": 320 + }, + { + "epoch": 0.06, + "learning_rate": 6.38e-07, + "loss": 9.1909, + "step": 325 + }, + { + "epoch": 0.06, + "learning_rate": 6.48e-07, + "loss": 9.2916, + "step": 330 + }, + { + "epoch": 0.06, + "learning_rate": 6.58e-07, + "loss": 7.4726, + "step": 335 + }, + { + "epoch": 0.06, + "learning_rate": 6.68e-07, + "loss": 9.438, + "step": 340 + }, + { + "epoch": 0.06, + "learning_rate": 6.78e-07, + "loss": 6.7858, + "step": 345 + }, + { + "epoch": 0.07, + "learning_rate": 6.879999999999999e-07, + "loss": 6.6149, + "step": 350 + }, + { + "epoch": 0.07, + "learning_rate": 6.979999999999999e-07, + "loss": 10.9064, + "step": 355 + }, + { + "epoch": 0.07, + "learning_rate": 7.079999999999999e-07, + "loss": 6.9364, + "step": 360 + }, + { + "epoch": 0.07, + "learning_rate": 7.179999999999999e-07, + "loss": 8.5146, + "step": 365 + }, + { + "epoch": 0.07, + "learning_rate": 7.28e-07, + "loss": 5.9193, + "step": 370 + }, + { + "epoch": 0.07, + "learning_rate": 7.38e-07, + "loss": 6.343, + "step": 375 + }, + { + "epoch": 0.07, + "learning_rate": 7.48e-07, + "loss": 4.9407, + "step": 380 + }, + { + "epoch": 0.07, + "learning_rate": 7.58e-07, + "loss": 6.2009, + "step": 385 + }, + { + "epoch": 0.07, + "learning_rate": 7.68e-07, + "loss": 6.2122, + "step": 390 + }, + { + "epoch": 0.07, + "learning_rate": 7.78e-07, + "loss": 6.305, + "step": 395 + }, + { + "epoch": 0.07, + "learning_rate": 7.88e-07, + "loss": 6.0134, + "step": 400 + }, + { + "epoch": 0.08, + "learning_rate": 7.98e-07, + "loss": 6.3882, + "step": 405 + }, + { + "epoch": 0.08, + "learning_rate": 8.08e-07, + "loss": 7.8588, + "step": 410 + }, + { + "epoch": 0.08, + "learning_rate": 8.179999999999999e-07, + "loss": 4.2314, + "step": 415 + }, + { + "epoch": 0.08, + "learning_rate": 8.28e-07, + "loss": 5.1779, + "step": 420 + }, + { + "epoch": 0.08, + "learning_rate": 8.38e-07, + "loss": 3.6178, + "step": 425 + }, + { + "epoch": 0.08, + "learning_rate": 8.48e-07, + "loss": 3.8777, + "step": 430 + }, + { + "epoch": 0.08, + "learning_rate": 8.58e-07, + "loss": 6.0639, + "step": 435 + }, + { + "epoch": 0.08, + "learning_rate": 8.68e-07, + "loss": 4.7344, + "step": 440 + }, + { + "epoch": 0.08, + "learning_rate": 8.78e-07, + "loss": 4.4478, + "step": 445 + }, + { + "epoch": 0.08, + "learning_rate": 8.88e-07, + "loss": 3.6034, + "step": 450 + }, + { + "epoch": 0.08, + "learning_rate": 8.98e-07, + "loss": 3.4378, + "step": 455 + }, + { + "epoch": 0.09, + "learning_rate": 9.08e-07, + "loss": 3.8416, + "step": 460 + }, + { + "epoch": 0.09, + "learning_rate": 9.18e-07, + "loss": 3.3023, + "step": 465 + }, + { + "epoch": 0.09, + "learning_rate": 9.28e-07, + "loss": 3.3863, + "step": 470 + }, + { + "epoch": 0.09, + "learning_rate": 9.379999999999998e-07, + "loss": 3.2869, + "step": 475 + }, + { + "epoch": 0.09, + "learning_rate": 9.479999999999999e-07, + "loss": 3.3075, + "step": 480 + }, + { + "epoch": 0.09, + "learning_rate": 9.58e-07, + "loss": 4.247, + "step": 485 + }, + { + "epoch": 0.09, + "learning_rate": 9.679999999999999e-07, + "loss": 3.5028, + "step": 490 + }, + { + "epoch": 0.09, + "learning_rate": 9.78e-07, + "loss": 5.2398, + "step": 495 + }, + { + "epoch": 0.09, + "learning_rate": 9.88e-07, + "loss": 4.051, + "step": 500 + }, + { + "epoch": 0.09, + "eval_loss": 3.1419003009796143, + "eval_runtime": 101.742, + "eval_samples_per_second": 11.736, + "eval_steps_per_second": 1.474, + "eval_wer": 1.0, + "step": 500 + }, + { + "epoch": 0.09, + "learning_rate": 9.98e-07, + "loss": 4.4604, + "step": 505 + }, + { + "epoch": 0.09, + "learning_rate": 1.008e-06, + "loss": 3.2391, + "step": 510 + }, + { + "epoch": 0.1, + "learning_rate": 1.018e-06, + "loss": 3.1886, + "step": 515 + }, + { + "epoch": 0.1, + "learning_rate": 1.028e-06, + "loss": 3.132, + "step": 520 + }, + { + "epoch": 0.1, + "learning_rate": 1.038e-06, + "loss": 3.2774, + "step": 525 + }, + { + "epoch": 0.1, + "learning_rate": 1.048e-06, + "loss": 3.6977, + "step": 530 + }, + { + "epoch": 0.1, + "learning_rate": 1.058e-06, + "loss": 3.3265, + "step": 535 + }, + { + "epoch": 0.1, + "learning_rate": 1.068e-06, + "loss": 3.095, + "step": 540 + }, + { + "epoch": 0.1, + "learning_rate": 1.078e-06, + "loss": 3.3518, + "step": 545 + }, + { + "epoch": 0.1, + "learning_rate": 1.088e-06, + "loss": 3.1893, + "step": 550 + }, + { + "epoch": 0.1, + "learning_rate": 1.0980000000000001e-06, + "loss": 3.1898, + "step": 555 + }, + { + "epoch": 0.1, + "learning_rate": 1.108e-06, + "loss": 4.1224, + "step": 560 + }, + { + "epoch": 0.11, + "learning_rate": 1.1180000000000001e-06, + "loss": 3.0569, + "step": 565 + }, + { + "epoch": 0.11, + "learning_rate": 1.1279999999999998e-06, + "loss": 5.0761, + "step": 570 + }, + { + "epoch": 0.11, + "learning_rate": 1.138e-06, + "loss": 4.0581, + "step": 575 + }, + { + "epoch": 0.11, + "learning_rate": 1.1479999999999999e-06, + "loss": 3.6377, + "step": 580 + }, + { + "epoch": 0.11, + "learning_rate": 1.158e-06, + "loss": 3.4788, + "step": 585 + }, + { + "epoch": 0.11, + "learning_rate": 1.1679999999999999e-06, + "loss": 3.0537, + "step": 590 + }, + { + "epoch": 0.11, + "learning_rate": 1.178e-06, + "loss": 3.0412, + "step": 595 + }, + { + "epoch": 0.11, + "learning_rate": 1.1879999999999999e-06, + "loss": 3.1245, + "step": 600 + }, + { + "epoch": 0.11, + "learning_rate": 1.1979999999999998e-06, + "loss": 3.2805, + "step": 605 + }, + { + "epoch": 0.11, + "learning_rate": 1.208e-06, + "loss": 2.9896, + "step": 610 + }, + { + "epoch": 0.11, + "learning_rate": 1.2179999999999998e-06, + "loss": 3.5087, + "step": 615 + }, + { + "epoch": 0.12, + "learning_rate": 1.228e-06, + "loss": 3.4038, + "step": 620 + }, + { + "epoch": 0.12, + "learning_rate": 1.2379999999999998e-06, + "loss": 3.5193, + "step": 625 + }, + { + "epoch": 0.12, + "learning_rate": 1.248e-06, + "loss": 3.0089, + "step": 630 + }, + { + "epoch": 0.12, + "learning_rate": 1.2579999999999999e-06, + "loss": 2.9954, + "step": 635 + }, + { + "epoch": 0.12, + "learning_rate": 1.268e-06, + "loss": 3.0579, + "step": 640 + }, + { + "epoch": 0.12, + "learning_rate": 1.2779999999999999e-06, + "loss": 3.8326, + "step": 645 + }, + { + "epoch": 0.12, + "learning_rate": 1.288e-06, + "loss": 3.2384, + "step": 650 + }, + { + "epoch": 0.12, + "learning_rate": 1.298e-06, + "loss": 3.452, + "step": 655 + }, + { + "epoch": 0.12, + "learning_rate": 1.308e-06, + "loss": 3.7447, + "step": 660 + }, + { + "epoch": 0.12, + "learning_rate": 1.318e-06, + "loss": 3.5435, + "step": 665 + }, + { + "epoch": 0.12, + "learning_rate": 1.328e-06, + "loss": 3.0208, + "step": 670 + }, + { + "epoch": 0.13, + "learning_rate": 1.338e-06, + "loss": 3.3091, + "step": 675 + }, + { + "epoch": 0.13, + "learning_rate": 1.348e-06, + "loss": 3.3663, + "step": 680 + }, + { + "epoch": 0.13, + "learning_rate": 1.358e-06, + "loss": 2.9651, + "step": 685 + }, + { + "epoch": 0.13, + "learning_rate": 1.368e-06, + "loss": 2.9384, + "step": 690 + }, + { + "epoch": 0.13, + "learning_rate": 1.3779999999999998e-06, + "loss": 2.9415, + "step": 695 + }, + { + "epoch": 0.13, + "learning_rate": 1.3879999999999999e-06, + "loss": 2.9731, + "step": 700 + }, + { + "epoch": 0.13, + "learning_rate": 1.3979999999999998e-06, + "loss": 3.4581, + "step": 705 + }, + { + "epoch": 0.13, + "learning_rate": 1.408e-06, + "loss": 2.9852, + "step": 710 + }, + { + "epoch": 0.13, + "learning_rate": 1.4179999999999998e-06, + "loss": 2.9559, + "step": 715 + }, + { + "epoch": 0.13, + "learning_rate": 1.428e-06, + "loss": 3.2803, + "step": 720 + }, + { + "epoch": 0.14, + "learning_rate": 1.4379999999999998e-06, + "loss": 2.9441, + "step": 725 + }, + { + "epoch": 0.14, + "learning_rate": 1.448e-06, + "loss": 3.9254, + "step": 730 + }, + { + "epoch": 0.14, + "learning_rate": 1.4579999999999998e-06, + "loss": 3.1551, + "step": 735 + }, + { + "epoch": 0.14, + "learning_rate": 1.468e-06, + "loss": 5.0411, + "step": 740 + }, + { + "epoch": 0.14, + "learning_rate": 1.4779999999999999e-06, + "loss": 2.9128, + "step": 745 + }, + { + "epoch": 0.14, + "learning_rate": 1.488e-06, + "loss": 3.168, + "step": 750 + }, + { + "epoch": 0.14, + "learning_rate": 1.4979999999999999e-06, + "loss": 3.1407, + "step": 755 + }, + { + "epoch": 0.14, + "learning_rate": 1.508e-06, + "loss": 3.2372, + "step": 760 + }, + { + "epoch": 0.14, + "learning_rate": 1.518e-06, + "loss": 3.2442, + "step": 765 + }, + { + "epoch": 0.14, + "learning_rate": 1.528e-06, + "loss": 2.9669, + "step": 770 + }, + { + "epoch": 0.14, + "learning_rate": 1.538e-06, + "loss": 3.0412, + "step": 775 + }, + { + "epoch": 0.15, + "learning_rate": 1.548e-06, + "loss": 2.918, + "step": 780 + }, + { + "epoch": 0.15, + "learning_rate": 1.558e-06, + "loss": 3.2461, + "step": 785 + }, + { + "epoch": 0.15, + "learning_rate": 1.568e-06, + "loss": 2.9181, + "step": 790 + }, + { + "epoch": 0.15, + "learning_rate": 1.578e-06, + "loss": 3.2525, + "step": 795 + }, + { + "epoch": 0.15, + "learning_rate": 1.588e-06, + "loss": 3.3201, + "step": 800 + }, + { + "epoch": 0.15, + "learning_rate": 1.598e-06, + "loss": 3.0265, + "step": 805 + }, + { + "epoch": 0.15, + "learning_rate": 1.608e-06, + "loss": 2.886, + "step": 810 + }, + { + "epoch": 0.15, + "learning_rate": 1.618e-06, + "loss": 3.0627, + "step": 815 + }, + { + "epoch": 0.15, + "learning_rate": 1.628e-06, + "loss": 2.9099, + "step": 820 + }, + { + "epoch": 0.15, + "learning_rate": 1.6379999999999998e-06, + "loss": 2.9201, + "step": 825 + }, + { + "epoch": 0.15, + "learning_rate": 1.648e-06, + "loss": 3.0767, + "step": 830 + }, + { + "epoch": 0.16, + "learning_rate": 1.6579999999999998e-06, + "loss": 2.8778, + "step": 835 + }, + { + "epoch": 0.16, + "learning_rate": 1.668e-06, + "loss": 2.995, + "step": 840 + }, + { + "epoch": 0.16, + "learning_rate": 1.6779999999999999e-06, + "loss": 2.8796, + "step": 845 + }, + { + "epoch": 0.16, + "learning_rate": 1.6879999999999998e-06, + "loss": 2.9054, + "step": 850 + }, + { + "epoch": 0.16, + "learning_rate": 1.6979999999999999e-06, + "loss": 3.3809, + "step": 855 + }, + { + "epoch": 0.16, + "learning_rate": 1.7079999999999998e-06, + "loss": 2.9066, + "step": 860 + }, + { + "epoch": 0.16, + "learning_rate": 1.718e-06, + "loss": 2.9675, + "step": 865 + }, + { + "epoch": 0.16, + "learning_rate": 1.7279999999999998e-06, + "loss": 3.2022, + "step": 870 + }, + { + "epoch": 0.16, + "learning_rate": 1.738e-06, + "loss": 2.9072, + "step": 875 + }, + { + "epoch": 0.16, + "learning_rate": 1.7479999999999998e-06, + "loss": 3.569, + "step": 880 + }, + { + "epoch": 0.16, + "learning_rate": 1.758e-06, + "loss": 3.073, + "step": 885 + }, + { + "epoch": 0.17, + "learning_rate": 1.7679999999999998e-06, + "loss": 3.1634, + "step": 890 + }, + { + "epoch": 0.17, + "learning_rate": 1.778e-06, + "loss": 2.9443, + "step": 895 + }, + { + "epoch": 0.17, + "learning_rate": 1.7879999999999999e-06, + "loss": 2.9246, + "step": 900 + }, + { + "epoch": 0.17, + "learning_rate": 1.798e-06, + "loss": 2.9731, + "step": 905 + }, + { + "epoch": 0.17, + "learning_rate": 1.8079999999999999e-06, + "loss": 2.8715, + "step": 910 + }, + { + "epoch": 0.17, + "learning_rate": 1.818e-06, + "loss": 2.8709, + "step": 915 + }, + { + "epoch": 0.17, + "learning_rate": 1.828e-06, + "loss": 2.8895, + "step": 920 + }, + { + "epoch": 0.17, + "learning_rate": 1.838e-06, + "loss": 2.9853, + "step": 925 + }, + { + "epoch": 0.17, + "learning_rate": 1.848e-06, + "loss": 2.9241, + "step": 930 + }, + { + "epoch": 0.17, + "learning_rate": 1.858e-06, + "loss": 2.8844, + "step": 935 + }, + { + "epoch": 0.18, + "learning_rate": 1.868e-06, + "loss": 2.871, + "step": 940 + }, + { + "epoch": 0.18, + "learning_rate": 1.8779999999999998e-06, + "loss": 2.8814, + "step": 945 + }, + { + "epoch": 0.18, + "learning_rate": 1.8879999999999998e-06, + "loss": 2.8748, + "step": 950 + }, + { + "epoch": 0.18, + "learning_rate": 1.8979999999999999e-06, + "loss": 3.0096, + "step": 955 + }, + { + "epoch": 0.18, + "learning_rate": 1.9079999999999998e-06, + "loss": 2.8701, + "step": 960 + }, + { + "epoch": 0.18, + "learning_rate": 1.9179999999999997e-06, + "loss": 2.8968, + "step": 965 + }, + { + "epoch": 0.18, + "learning_rate": 1.928e-06, + "loss": 3.0461, + "step": 970 + }, + { + "epoch": 0.18, + "learning_rate": 1.938e-06, + "loss": 2.9494, + "step": 975 + }, + { + "epoch": 0.18, + "learning_rate": 1.948e-06, + "loss": 4.5448, + "step": 980 + }, + { + "epoch": 0.18, + "learning_rate": 1.9579999999999997e-06, + "loss": 2.9924, + "step": 985 + }, + { + "epoch": 0.18, + "learning_rate": 1.968e-06, + "loss": 2.9612, + "step": 990 + }, + { + "epoch": 0.19, + "learning_rate": 1.978e-06, + "loss": 3.2622, + "step": 995 + }, + { + "epoch": 0.19, + "learning_rate": 1.988e-06, + "loss": 2.8626, + "step": 1000 + }, + { + "epoch": 0.19, + "eval_loss": 2.8933510780334473, + "eval_runtime": 138.873, + "eval_samples_per_second": 8.598, + "eval_steps_per_second": 1.08, + "eval_wer": 1.0, + "step": 1000 + }, + { + "epoch": 0.19, + "learning_rate": 1.9979999999999998e-06, + "loss": 2.8847, + "step": 1005 + }, + { + "epoch": 0.19, + "learning_rate": 1.9991784760731156e-06, + "loss": 2.8753, + "step": 1010 + }, + { + "epoch": 0.19, + "learning_rate": 1.99815157116451e-06, + "loss": 2.9105, + "step": 1015 + }, + { + "epoch": 0.19, + "learning_rate": 1.9971246662559046e-06, + "loss": 2.9129, + "step": 1020 + }, + { + "epoch": 0.19, + "learning_rate": 1.9960977613472992e-06, + "loss": 3.202, + "step": 1025 + }, + { + "epoch": 0.19, + "learning_rate": 1.995070856438694e-06, + "loss": 3.0123, + "step": 1030 + }, + { + "epoch": 0.19, + "learning_rate": 1.9940439515300882e-06, + "loss": 3.4388, + "step": 1035 + }, + { + "epoch": 0.19, + "learning_rate": 1.993017046621483e-06, + "loss": 2.9159, + "step": 1040 + }, + { + "epoch": 0.19, + "learning_rate": 1.991990141712877e-06, + "loss": 2.9784, + "step": 1045 + }, + { + "epoch": 0.2, + "learning_rate": 1.990963236804272e-06, + "loss": 2.8644, + "step": 1050 + }, + { + "epoch": 0.2, + "learning_rate": 1.989936331895666e-06, + "loss": 2.8842, + "step": 1055 + }, + { + "epoch": 0.2, + "learning_rate": 1.988909426987061e-06, + "loss": 2.9332, + "step": 1060 + }, + { + "epoch": 0.2, + "learning_rate": 1.9878825220784556e-06, + "loss": 2.8966, + "step": 1065 + }, + { + "epoch": 0.2, + "learning_rate": 1.9868556171698503e-06, + "loss": 2.9699, + "step": 1070 + }, + { + "epoch": 0.2, + "learning_rate": 1.9858287122612445e-06, + "loss": 2.8659, + "step": 1075 + }, + { + "epoch": 0.2, + "learning_rate": 1.9848018073526392e-06, + "loss": 2.9186, + "step": 1080 + }, + { + "epoch": 0.2, + "learning_rate": 1.9837749024440335e-06, + "loss": 2.871, + "step": 1085 + }, + { + "epoch": 0.2, + "learning_rate": 1.982747997535428e-06, + "loss": 2.8712, + "step": 1090 + }, + { + "epoch": 0.2, + "learning_rate": 1.9817210926268225e-06, + "loss": 2.839, + "step": 1095 + }, + { + "epoch": 0.2, + "learning_rate": 1.980694187718217e-06, + "loss": 2.9186, + "step": 1100 + }, + { + "epoch": 0.21, + "learning_rate": 1.979667282809612e-06, + "loss": 3.1007, + "step": 1105 + }, + { + "epoch": 0.21, + "learning_rate": 1.9786403779010066e-06, + "loss": 2.8781, + "step": 1110 + }, + { + "epoch": 0.21, + "learning_rate": 1.977613472992401e-06, + "loss": 3.292, + "step": 1115 + }, + { + "epoch": 0.21, + "learning_rate": 1.9765865680837955e-06, + "loss": 3.0817, + "step": 1120 + }, + { + "epoch": 0.21, + "learning_rate": 1.97555966317519e-06, + "loss": 2.9705, + "step": 1125 + }, + { + "epoch": 0.21, + "learning_rate": 1.9745327582665845e-06, + "loss": 2.9304, + "step": 1130 + }, + { + "epoch": 0.21, + "learning_rate": 1.9735058533579788e-06, + "loss": 2.8766, + "step": 1135 + }, + { + "epoch": 0.21, + "learning_rate": 1.9724789484493735e-06, + "loss": 2.8477, + "step": 1140 + }, + { + "epoch": 0.21, + "learning_rate": 1.971452043540768e-06, + "loss": 2.9345, + "step": 1145 + }, + { + "epoch": 0.21, + "learning_rate": 1.9704251386321624e-06, + "loss": 2.9276, + "step": 1150 + }, + { + "epoch": 0.22, + "learning_rate": 1.969398233723557e-06, + "loss": 2.9444, + "step": 1155 + }, + { + "epoch": 0.22, + "learning_rate": 1.968371328814952e-06, + "loss": 2.9099, + "step": 1160 + }, + { + "epoch": 0.22, + "learning_rate": 1.967344423906346e-06, + "loss": 2.8898, + "step": 1165 + }, + { + "epoch": 0.22, + "learning_rate": 1.966317518997741e-06, + "loss": 2.9451, + "step": 1170 + }, + { + "epoch": 0.22, + "learning_rate": 1.965290614089135e-06, + "loss": 2.87, + "step": 1175 + }, + { + "epoch": 0.22, + "learning_rate": 1.9642637091805298e-06, + "loss": 2.9508, + "step": 1180 + }, + { + "epoch": 0.22, + "learning_rate": 1.9632368042719245e-06, + "loss": 2.9362, + "step": 1185 + }, + { + "epoch": 0.22, + "learning_rate": 1.9622098993633187e-06, + "loss": 2.9366, + "step": 1190 + }, + { + "epoch": 0.22, + "learning_rate": 1.9611829944547134e-06, + "loss": 3.0603, + "step": 1195 + }, + { + "epoch": 0.22, + "learning_rate": 1.960156089546108e-06, + "loss": 2.8994, + "step": 1200 + }, + { + "epoch": 0.22, + "learning_rate": 1.9591291846375024e-06, + "loss": 3.0001, + "step": 1205 + }, + { + "epoch": 0.23, + "learning_rate": 1.958102279728897e-06, + "loss": 2.8472, + "step": 1210 + }, + { + "epoch": 0.23, + "learning_rate": 1.9570753748202914e-06, + "loss": 2.9021, + "step": 1215 + }, + { + "epoch": 0.23, + "learning_rate": 1.956048469911686e-06, + "loss": 2.8638, + "step": 1220 + }, + { + "epoch": 0.23, + "learning_rate": 1.9550215650030808e-06, + "loss": 2.8506, + "step": 1225 + }, + { + "epoch": 0.23, + "learning_rate": 1.953994660094475e-06, + "loss": 2.8397, + "step": 1230 + }, + { + "epoch": 0.23, + "learning_rate": 1.9529677551858697e-06, + "loss": 3.468, + "step": 1235 + }, + { + "epoch": 0.23, + "learning_rate": 1.9519408502772644e-06, + "loss": 2.9221, + "step": 1240 + }, + { + "epoch": 0.23, + "learning_rate": 1.9509139453686587e-06, + "loss": 3.2824, + "step": 1245 + }, + { + "epoch": 0.23, + "learning_rate": 1.9498870404600534e-06, + "loss": 2.9593, + "step": 1250 + }, + { + "epoch": 0.23, + "learning_rate": 1.9488601355514477e-06, + "loss": 2.9068, + "step": 1255 + }, + { + "epoch": 0.23, + "learning_rate": 1.9478332306428424e-06, + "loss": 2.8651, + "step": 1260 + }, + { + "epoch": 0.24, + "learning_rate": 1.946806325734237e-06, + "loss": 2.8539, + "step": 1265 + }, + { + "epoch": 0.24, + "learning_rate": 1.9457794208256313e-06, + "loss": 2.955, + "step": 1270 + }, + { + "epoch": 0.24, + "learning_rate": 1.944752515917026e-06, + "loss": 3.0867, + "step": 1275 + }, + { + "epoch": 0.24, + "learning_rate": 1.9437256110084207e-06, + "loss": 2.894, + "step": 1280 + }, + { + "epoch": 0.24, + "learning_rate": 1.942698706099815e-06, + "loss": 2.8836, + "step": 1285 + }, + { + "epoch": 0.24, + "learning_rate": 1.9416718011912097e-06, + "loss": 2.8627, + "step": 1290 + }, + { + "epoch": 0.24, + "learning_rate": 1.940644896282604e-06, + "loss": 2.8886, + "step": 1295 + }, + { + "epoch": 0.24, + "learning_rate": 1.9396179913739987e-06, + "loss": 2.91, + "step": 1300 + }, + { + "epoch": 0.24, + "learning_rate": 1.938591086465393e-06, + "loss": 2.8789, + "step": 1305 + }, + { + "epoch": 0.24, + "learning_rate": 1.9375641815567877e-06, + "loss": 2.9238, + "step": 1310 + }, + { + "epoch": 0.24, + "learning_rate": 1.9365372766481823e-06, + "loss": 2.9038, + "step": 1315 + }, + { + "epoch": 0.25, + "learning_rate": 1.935510371739577e-06, + "loss": 2.8612, + "step": 1320 + }, + { + "epoch": 0.25, + "learning_rate": 1.9344834668309713e-06, + "loss": 2.8983, + "step": 1325 + }, + { + "epoch": 0.25, + "learning_rate": 1.933456561922366e-06, + "loss": 2.878, + "step": 1330 + }, + { + "epoch": 0.25, + "learning_rate": 1.9324296570137603e-06, + "loss": 2.8546, + "step": 1335 + }, + { + "epoch": 0.25, + "learning_rate": 1.931402752105155e-06, + "loss": 3.1733, + "step": 1340 + }, + { + "epoch": 0.25, + "learning_rate": 1.9303758471965493e-06, + "loss": 3.0895, + "step": 1345 + }, + { + "epoch": 0.25, + "learning_rate": 1.929348942287944e-06, + "loss": 2.8654, + "step": 1350 + }, + { + "epoch": 0.25, + "learning_rate": 1.9283220373793387e-06, + "loss": 2.9303, + "step": 1355 + }, + { + "epoch": 0.25, + "learning_rate": 1.9272951324707333e-06, + "loss": 2.9429, + "step": 1360 + }, + { + "epoch": 0.25, + "learning_rate": 1.9262682275621276e-06, + "loss": 2.8373, + "step": 1365 + }, + { + "epoch": 0.26, + "learning_rate": 1.9252413226535223e-06, + "loss": 2.9104, + "step": 1370 + }, + { + "epoch": 0.26, + "learning_rate": 1.9242144177449166e-06, + "loss": 2.8777, + "step": 1375 + }, + { + "epoch": 0.26, + "learning_rate": 1.9231875128363113e-06, + "loss": 3.0137, + "step": 1380 + }, + { + "epoch": 0.26, + "learning_rate": 1.9221606079277056e-06, + "loss": 2.9153, + "step": 1385 + }, + { + "epoch": 0.26, + "learning_rate": 1.9211337030191003e-06, + "loss": 2.8599, + "step": 1390 + }, + { + "epoch": 0.26, + "learning_rate": 1.920106798110495e-06, + "loss": 3.5802, + "step": 1395 + }, + { + "epoch": 0.26, + "learning_rate": 1.9190798932018897e-06, + "loss": 2.8061, + "step": 1400 + }, + { + "epoch": 0.26, + "learning_rate": 1.918052988293284e-06, + "loss": 2.9472, + "step": 1405 + }, + { + "epoch": 0.26, + "learning_rate": 1.9170260833846786e-06, + "loss": 2.8901, + "step": 1410 + }, + { + "epoch": 0.26, + "learning_rate": 1.915999178476073e-06, + "loss": 3.3134, + "step": 1415 + }, + { + "epoch": 0.26, + "learning_rate": 1.9149722735674676e-06, + "loss": 2.8888, + "step": 1420 + }, + { + "epoch": 0.27, + "learning_rate": 1.913945368658862e-06, + "loss": 2.8508, + "step": 1425 + }, + { + "epoch": 0.27, + "learning_rate": 1.9129184637502566e-06, + "loss": 2.8544, + "step": 1430 + }, + { + "epoch": 0.27, + "learning_rate": 1.9118915588416513e-06, + "loss": 2.8625, + "step": 1435 + }, + { + "epoch": 0.27, + "learning_rate": 1.9108646539330455e-06, + "loss": 2.8544, + "step": 1440 + }, + { + "epoch": 0.27, + "learning_rate": 1.9098377490244402e-06, + "loss": 2.8768, + "step": 1445 + }, + { + "epoch": 0.27, + "learning_rate": 1.908810844115835e-06, + "loss": 2.917, + "step": 1450 + }, + { + "epoch": 0.27, + "learning_rate": 1.907783939207229e-06, + "loss": 2.8553, + "step": 1455 + }, + { + "epoch": 0.27, + "learning_rate": 1.906757034298624e-06, + "loss": 2.8264, + "step": 1460 + }, + { + "epoch": 0.27, + "learning_rate": 1.9057301293900184e-06, + "loss": 2.9097, + "step": 1465 + }, + { + "epoch": 0.27, + "learning_rate": 1.9047032244814129e-06, + "loss": 3.0831, + "step": 1470 + }, + { + "epoch": 0.27, + "learning_rate": 1.9036763195728074e-06, + "loss": 2.8505, + "step": 1475 + }, + { + "epoch": 0.28, + "learning_rate": 1.902649414664202e-06, + "loss": 2.9628, + "step": 1480 + }, + { + "epoch": 0.28, + "learning_rate": 1.9016225097555965e-06, + "loss": 3.1449, + "step": 1485 + }, + { + "epoch": 0.28, + "learning_rate": 1.900595604846991e-06, + "loss": 2.8451, + "step": 1490 + }, + { + "epoch": 0.28, + "learning_rate": 1.8995686999383855e-06, + "loss": 2.8117, + "step": 1495 + }, + { + "epoch": 0.28, + "learning_rate": 1.8985417950297802e-06, + "loss": 2.8544, + "step": 1500 + }, + { + "epoch": 0.28, + "eval_loss": 2.8667774200439453, + "eval_runtime": 138.7148, + "eval_samples_per_second": 8.608, + "eval_steps_per_second": 1.081, + "eval_wer": 1.0, + "step": 1500 + }, + { + "epoch": 0.28, + "learning_rate": 1.8975148901211747e-06, + "loss": 2.867, + "step": 1505 + }, + { + "epoch": 0.28, + "learning_rate": 1.8964879852125692e-06, + "loss": 2.8454, + "step": 1510 + }, + { + "epoch": 0.28, + "learning_rate": 1.8954610803039637e-06, + "loss": 2.8422, + "step": 1515 + }, + { + "epoch": 0.28, + "learning_rate": 1.8944341753953584e-06, + "loss": 2.9662, + "step": 1520 + }, + { + "epoch": 0.28, + "learning_rate": 1.8934072704867528e-06, + "loss": 2.9235, + "step": 1525 + }, + { + "epoch": 0.28, + "learning_rate": 1.8923803655781473e-06, + "loss": 2.8577, + "step": 1530 + }, + { + "epoch": 0.29, + "learning_rate": 1.8913534606695418e-06, + "loss": 3.5179, + "step": 1535 + }, + { + "epoch": 0.29, + "learning_rate": 1.8903265557609365e-06, + "loss": 2.8604, + "step": 1540 + }, + { + "epoch": 0.29, + "learning_rate": 1.889299650852331e-06, + "loss": 2.8331, + "step": 1545 + }, + { + "epoch": 0.29, + "learning_rate": 1.8882727459437255e-06, + "loss": 2.8456, + "step": 1550 + }, + { + "epoch": 0.29, + "learning_rate": 1.88724584103512e-06, + "loss": 2.9088, + "step": 1555 + }, + { + "epoch": 0.29, + "learning_rate": 1.8862189361265147e-06, + "loss": 2.9141, + "step": 1560 + }, + { + "epoch": 0.29, + "learning_rate": 1.8851920312179091e-06, + "loss": 2.8593, + "step": 1565 + }, + { + "epoch": 0.29, + "learning_rate": 1.8841651263093036e-06, + "loss": 2.8582, + "step": 1570 + }, + { + "epoch": 0.29, + "learning_rate": 1.8831382214006981e-06, + "loss": 2.8991, + "step": 1575 + }, + { + "epoch": 0.29, + "learning_rate": 1.8821113164920928e-06, + "loss": 2.9633, + "step": 1580 + }, + { + "epoch": 0.3, + "learning_rate": 1.881084411583487e-06, + "loss": 2.8986, + "step": 1585 + }, + { + "epoch": 0.3, + "learning_rate": 1.8800575066748818e-06, + "loss": 2.8375, + "step": 1590 + }, + { + "epoch": 0.3, + "learning_rate": 1.8790306017662763e-06, + "loss": 2.9018, + "step": 1595 + }, + { + "epoch": 0.3, + "learning_rate": 1.878003696857671e-06, + "loss": 2.9049, + "step": 1600 + }, + { + "epoch": 0.3, + "learning_rate": 1.8769767919490652e-06, + "loss": 2.8384, + "step": 1605 + }, + { + "epoch": 0.3, + "learning_rate": 1.87594988704046e-06, + "loss": 2.8415, + "step": 1610 + }, + { + "epoch": 0.3, + "learning_rate": 1.8749229821318544e-06, + "loss": 3.1296, + "step": 1615 + }, + { + "epoch": 0.3, + "learning_rate": 1.8738960772232491e-06, + "loss": 2.9117, + "step": 1620 + }, + { + "epoch": 0.3, + "learning_rate": 1.8728691723146434e-06, + "loss": 2.8328, + "step": 1625 + }, + { + "epoch": 0.3, + "learning_rate": 1.871842267406038e-06, + "loss": 2.8658, + "step": 1630 + }, + { + "epoch": 0.3, + "learning_rate": 1.8708153624974326e-06, + "loss": 2.8803, + "step": 1635 + }, + { + "epoch": 0.31, + "learning_rate": 1.8697884575888273e-06, + "loss": 2.8543, + "step": 1640 + }, + { + "epoch": 0.31, + "learning_rate": 1.8687615526802215e-06, + "loss": 2.8685, + "step": 1645 + }, + { + "epoch": 0.31, + "learning_rate": 1.8677346477716162e-06, + "loss": 2.9056, + "step": 1650 + }, + { + "epoch": 0.31, + "learning_rate": 1.8667077428630107e-06, + "loss": 2.8946, + "step": 1655 + }, + { + "epoch": 0.31, + "learning_rate": 1.8656808379544054e-06, + "loss": 2.9043, + "step": 1660 + }, + { + "epoch": 0.31, + "learning_rate": 1.8646539330457997e-06, + "loss": 3.2464, + "step": 1665 + }, + { + "epoch": 0.31, + "learning_rate": 1.8636270281371944e-06, + "loss": 2.8617, + "step": 1670 + }, + { + "epoch": 0.31, + "learning_rate": 1.8626001232285889e-06, + "loss": 2.8053, + "step": 1675 + }, + { + "epoch": 0.31, + "learning_rate": 1.8615732183199836e-06, + "loss": 2.846, + "step": 1680 + }, + { + "epoch": 0.31, + "learning_rate": 1.860546313411378e-06, + "loss": 2.9291, + "step": 1685 + }, + { + "epoch": 0.31, + "learning_rate": 1.8595194085027725e-06, + "loss": 2.8725, + "step": 1690 + }, + { + "epoch": 0.32, + "learning_rate": 1.8584925035941672e-06, + "loss": 2.86, + "step": 1695 + }, + { + "epoch": 0.32, + "learning_rate": 1.8574655986855617e-06, + "loss": 2.8348, + "step": 1700 + }, + { + "epoch": 0.32, + "learning_rate": 1.8564386937769562e-06, + "loss": 2.899, + "step": 1705 + }, + { + "epoch": 0.32, + "learning_rate": 1.8554117888683507e-06, + "loss": 2.9245, + "step": 1710 + }, + { + "epoch": 0.32, + "learning_rate": 1.8543848839597454e-06, + "loss": 2.8713, + "step": 1715 + }, + { + "epoch": 0.32, + "learning_rate": 1.8533579790511399e-06, + "loss": 2.8944, + "step": 1720 + }, + { + "epoch": 0.32, + "learning_rate": 1.8523310741425344e-06, + "loss": 2.9117, + "step": 1725 + }, + { + "epoch": 0.32, + "learning_rate": 1.8513041692339288e-06, + "loss": 3.192, + "step": 1730 + }, + { + "epoch": 0.32, + "learning_rate": 1.8502772643253235e-06, + "loss": 2.9314, + "step": 1735 + }, + { + "epoch": 0.32, + "learning_rate": 1.8492503594167178e-06, + "loss": 2.8147, + "step": 1740 + }, + { + "epoch": 0.33, + "learning_rate": 1.8482234545081125e-06, + "loss": 2.8892, + "step": 1745 + }, + { + "epoch": 0.33, + "learning_rate": 1.847196549599507e-06, + "loss": 2.8516, + "step": 1750 + }, + { + "epoch": 0.33, + "learning_rate": 1.8461696446909017e-06, + "loss": 2.8361, + "step": 1755 + }, + { + "epoch": 0.33, + "learning_rate": 1.845142739782296e-06, + "loss": 2.8513, + "step": 1760 + }, + { + "epoch": 0.33, + "learning_rate": 1.8441158348736907e-06, + "loss": 2.8812, + "step": 1765 + }, + { + "epoch": 0.33, + "learning_rate": 1.8430889299650851e-06, + "loss": 2.9485, + "step": 1770 + }, + { + "epoch": 0.33, + "learning_rate": 1.8420620250564798e-06, + "loss": 2.8524, + "step": 1775 + }, + { + "epoch": 0.33, + "learning_rate": 1.8410351201478741e-06, + "loss": 3.5713, + "step": 1780 + }, + { + "epoch": 0.33, + "learning_rate": 1.8400082152392688e-06, + "loss": 2.8501, + "step": 1785 + }, + { + "epoch": 0.33, + "learning_rate": 1.8389813103306633e-06, + "loss": 2.8184, + "step": 1790 + }, + { + "epoch": 0.33, + "learning_rate": 1.837954405422058e-06, + "loss": 2.8074, + "step": 1795 + }, + { + "epoch": 0.34, + "learning_rate": 1.8369275005134523e-06, + "loss": 2.8764, + "step": 1800 + }, + { + "epoch": 0.34, + "learning_rate": 1.835900595604847e-06, + "loss": 2.9097, + "step": 1805 + }, + { + "epoch": 0.34, + "learning_rate": 1.8348736906962415e-06, + "loss": 2.8483, + "step": 1810 + }, + { + "epoch": 0.34, + "learning_rate": 1.8338467857876361e-06, + "loss": 2.8487, + "step": 1815 + }, + { + "epoch": 0.34, + "learning_rate": 1.8328198808790304e-06, + "loss": 2.8502, + "step": 1820 + }, + { + "epoch": 0.34, + "learning_rate": 1.8317929759704251e-06, + "loss": 2.838, + "step": 1825 + }, + { + "epoch": 0.34, + "learning_rate": 1.8307660710618196e-06, + "loss": 2.8157, + "step": 1830 + }, + { + "epoch": 0.34, + "learning_rate": 1.8297391661532143e-06, + "loss": 2.8304, + "step": 1835 + }, + { + "epoch": 0.34, + "learning_rate": 1.8287122612446086e-06, + "loss": 2.8154, + "step": 1840 + }, + { + "epoch": 0.34, + "learning_rate": 1.8276853563360033e-06, + "loss": 2.795, + "step": 1845 + }, + { + "epoch": 0.34, + "learning_rate": 1.8266584514273978e-06, + "loss": 2.8491, + "step": 1850 + }, + { + "epoch": 0.35, + "learning_rate": 1.8256315465187925e-06, + "loss": 2.8307, + "step": 1855 + }, + { + "epoch": 0.35, + "learning_rate": 1.8246046416101867e-06, + "loss": 2.8661, + "step": 1860 + }, + { + "epoch": 0.35, + "learning_rate": 1.8235777367015814e-06, + "loss": 2.847, + "step": 1865 + }, + { + "epoch": 0.35, + "learning_rate": 1.822550831792976e-06, + "loss": 2.9903, + "step": 1870 + }, + { + "epoch": 0.35, + "learning_rate": 1.8215239268843706e-06, + "loss": 2.8249, + "step": 1875 + }, + { + "epoch": 0.35, + "learning_rate": 1.8204970219757649e-06, + "loss": 2.8958, + "step": 1880 + }, + { + "epoch": 0.35, + "learning_rate": 1.8194701170671596e-06, + "loss": 2.8271, + "step": 1885 + }, + { + "epoch": 0.35, + "learning_rate": 1.818443212158554e-06, + "loss": 2.7845, + "step": 1890 + }, + { + "epoch": 0.35, + "learning_rate": 1.8174163072499488e-06, + "loss": 2.809, + "step": 1895 + }, + { + "epoch": 0.35, + "learning_rate": 1.816389402341343e-06, + "loss": 2.7484, + "step": 1900 + }, + { + "epoch": 0.35, + "learning_rate": 1.8153624974327377e-06, + "loss": 2.8483, + "step": 1905 + }, + { + "epoch": 0.36, + "learning_rate": 1.8143355925241322e-06, + "loss": 2.793, + "step": 1910 + }, + { + "epoch": 0.36, + "learning_rate": 1.8133086876155267e-06, + "loss": 2.9283, + "step": 1915 + }, + { + "epoch": 0.36, + "learning_rate": 1.8122817827069212e-06, + "loss": 2.8682, + "step": 1920 + }, + { + "epoch": 0.36, + "learning_rate": 1.8112548777983159e-06, + "loss": 3.1691, + "step": 1925 + }, + { + "epoch": 0.36, + "learning_rate": 1.8102279728897104e-06, + "loss": 2.7775, + "step": 1930 + }, + { + "epoch": 0.36, + "learning_rate": 1.8092010679811048e-06, + "loss": 2.7845, + "step": 1935 + }, + { + "epoch": 0.36, + "learning_rate": 1.8081741630724993e-06, + "loss": 2.8187, + "step": 1940 + }, + { + "epoch": 0.36, + "learning_rate": 1.807147258163894e-06, + "loss": 3.2324, + "step": 1945 + }, + { + "epoch": 0.36, + "learning_rate": 1.8061203532552885e-06, + "loss": 2.762, + "step": 1950 + }, + { + "epoch": 0.36, + "learning_rate": 1.805093448346683e-06, + "loss": 2.8946, + "step": 1955 + }, + { + "epoch": 0.37, + "learning_rate": 1.8040665434380775e-06, + "loss": 2.8937, + "step": 1960 + }, + { + "epoch": 0.37, + "learning_rate": 1.8030396385294722e-06, + "loss": 2.8476, + "step": 1965 + }, + { + "epoch": 0.37, + "learning_rate": 1.8020127336208667e-06, + "loss": 2.7975, + "step": 1970 + }, + { + "epoch": 0.37, + "learning_rate": 1.8009858287122612e-06, + "loss": 2.7058, + "step": 1975 + }, + { + "epoch": 0.37, + "learning_rate": 1.7999589238036556e-06, + "loss": 2.7794, + "step": 1980 + }, + { + "epoch": 0.37, + "learning_rate": 1.7989320188950503e-06, + "loss": 2.7986, + "step": 1985 + }, + { + "epoch": 0.37, + "learning_rate": 1.7979051139864448e-06, + "loss": 2.7735, + "step": 1990 + }, + { + "epoch": 0.37, + "learning_rate": 1.7968782090778393e-06, + "loss": 3.2428, + "step": 1995 + }, + { + "epoch": 0.37, + "learning_rate": 1.7958513041692338e-06, + "loss": 2.8012, + "step": 2000 + }, + { + "epoch": 0.37, + "eval_loss": 2.72654390335083, + "eval_runtime": 158.5883, + "eval_samples_per_second": 7.529, + "eval_steps_per_second": 0.946, + "eval_wer": 1.0, + "step": 2000 + }, + { + "epoch": 0.37, + "learning_rate": 1.7948243992606285e-06, + "loss": 2.788, + "step": 2005 + }, + { + "epoch": 0.37, + "learning_rate": 1.793797494352023e-06, + "loss": 2.8242, + "step": 2010 + }, + { + "epoch": 0.38, + "learning_rate": 1.7927705894434175e-06, + "loss": 2.9338, + "step": 2015 + }, + { + "epoch": 0.38, + "learning_rate": 1.791743684534812e-06, + "loss": 2.7148, + "step": 2020 + }, + { + "epoch": 0.38, + "learning_rate": 1.7907167796262066e-06, + "loss": 4.2617, + "step": 2025 + }, + { + "epoch": 0.38, + "learning_rate": 1.7896898747176011e-06, + "loss": 2.6996, + "step": 2030 + }, + { + "epoch": 0.38, + "learning_rate": 1.7886629698089956e-06, + "loss": 2.803, + "step": 2035 + }, + { + "epoch": 0.38, + "learning_rate": 1.78763606490039e-06, + "loss": 2.8994, + "step": 2040 + }, + { + "epoch": 0.38, + "learning_rate": 1.7866091599917848e-06, + "loss": 2.7159, + "step": 2045 + }, + { + "epoch": 0.38, + "learning_rate": 1.785582255083179e-06, + "loss": 2.727, + "step": 2050 + }, + { + "epoch": 0.38, + "learning_rate": 1.7845553501745738e-06, + "loss": 2.748, + "step": 2055 + }, + { + "epoch": 0.38, + "learning_rate": 1.7835284452659682e-06, + "loss": 3.1073, + "step": 2060 + }, + { + "epoch": 0.38, + "learning_rate": 1.782501540357363e-06, + "loss": 2.7317, + "step": 2065 + }, + { + "epoch": 0.39, + "learning_rate": 1.7814746354487572e-06, + "loss": 2.7702, + "step": 2070 + }, + { + "epoch": 0.39, + "learning_rate": 1.780447730540152e-06, + "loss": 2.6403, + "step": 2075 + }, + { + "epoch": 0.39, + "learning_rate": 1.7794208256315464e-06, + "loss": 2.6535, + "step": 2080 + }, + { + "epoch": 0.39, + "learning_rate": 1.778393920722941e-06, + "loss": 2.6274, + "step": 2085 + }, + { + "epoch": 0.39, + "learning_rate": 1.7773670158143354e-06, + "loss": 2.6284, + "step": 2090 + }, + { + "epoch": 0.39, + "learning_rate": 1.77634011090573e-06, + "loss": 2.7832, + "step": 2095 + }, + { + "epoch": 0.39, + "learning_rate": 1.7753132059971246e-06, + "loss": 2.6126, + "step": 2100 + }, + { + "epoch": 0.39, + "learning_rate": 1.7742863010885192e-06, + "loss": 2.6608, + "step": 2105 + }, + { + "epoch": 0.39, + "learning_rate": 1.7732593961799135e-06, + "loss": 2.7854, + "step": 2110 + }, + { + "epoch": 0.39, + "learning_rate": 1.7722324912713082e-06, + "loss": 2.6561, + "step": 2115 + }, + { + "epoch": 0.39, + "learning_rate": 1.7712055863627027e-06, + "loss": 2.5986, + "step": 2120 + }, + { + "epoch": 0.4, + "learning_rate": 1.7701786814540974e-06, + "loss": 2.6772, + "step": 2125 + }, + { + "epoch": 0.4, + "learning_rate": 1.7691517765454917e-06, + "loss": 2.5899, + "step": 2130 + }, + { + "epoch": 0.4, + "learning_rate": 1.7681248716368864e-06, + "loss": 2.6522, + "step": 2135 + }, + { + "epoch": 0.4, + "learning_rate": 1.7670979667282809e-06, + "loss": 2.7009, + "step": 2140 + }, + { + "epoch": 0.4, + "learning_rate": 1.7660710618196756e-06, + "loss": 2.5363, + "step": 2145 + }, + { + "epoch": 0.4, + "learning_rate": 1.7650441569110698e-06, + "loss": 2.5242, + "step": 2150 + }, + { + "epoch": 0.4, + "learning_rate": 1.7640172520024645e-06, + "loss": 2.535, + "step": 2155 + }, + { + "epoch": 0.4, + "learning_rate": 1.762990347093859e-06, + "loss": 2.6498, + "step": 2160 + }, + { + "epoch": 0.4, + "learning_rate": 1.7619634421852537e-06, + "loss": 2.7191, + "step": 2165 + }, + { + "epoch": 0.4, + "learning_rate": 1.760936537276648e-06, + "loss": 2.5465, + "step": 2170 + }, + { + "epoch": 0.41, + "learning_rate": 1.7599096323680427e-06, + "loss": 2.5029, + "step": 2175 + }, + { + "epoch": 0.41, + "learning_rate": 1.7588827274594372e-06, + "loss": 3.0624, + "step": 2180 + }, + { + "epoch": 0.41, + "learning_rate": 1.7578558225508319e-06, + "loss": 2.5327, + "step": 2185 + }, + { + "epoch": 0.41, + "learning_rate": 1.7568289176422261e-06, + "loss": 2.5604, + "step": 2190 + }, + { + "epoch": 0.41, + "learning_rate": 1.7558020127336208e-06, + "loss": 2.6551, + "step": 2195 + }, + { + "epoch": 0.41, + "learning_rate": 1.7547751078250153e-06, + "loss": 2.7544, + "step": 2200 + }, + { + "epoch": 0.41, + "learning_rate": 1.75374820291641e-06, + "loss": 2.8209, + "step": 2205 + }, + { + "epoch": 0.41, + "learning_rate": 1.7527212980078043e-06, + "loss": 2.7117, + "step": 2210 + }, + { + "epoch": 0.41, + "learning_rate": 1.751694393099199e-06, + "loss": 2.563, + "step": 2215 + }, + { + "epoch": 0.41, + "learning_rate": 1.7506674881905935e-06, + "loss": 2.585, + "step": 2220 + }, + { + "epoch": 0.41, + "learning_rate": 1.749640583281988e-06, + "loss": 2.6235, + "step": 2225 + }, + { + "epoch": 0.42, + "learning_rate": 1.7486136783733824e-06, + "loss": 2.5745, + "step": 2230 + }, + { + "epoch": 0.42, + "learning_rate": 1.7475867734647771e-06, + "loss": 2.5579, + "step": 2235 + }, + { + "epoch": 0.42, + "learning_rate": 1.7465598685561716e-06, + "loss": 2.6564, + "step": 2240 + }, + { + "epoch": 0.42, + "learning_rate": 1.745532963647566e-06, + "loss": 2.6688, + "step": 2245 + }, + { + "epoch": 0.42, + "learning_rate": 1.7445060587389606e-06, + "loss": 2.8039, + "step": 2250 + }, + { + "epoch": 0.42, + "learning_rate": 1.7434791538303553e-06, + "loss": 2.6522, + "step": 2255 + }, + { + "epoch": 0.42, + "learning_rate": 1.7424522489217498e-06, + "loss": 3.1135, + "step": 2260 + }, + { + "epoch": 0.42, + "learning_rate": 1.7414253440131443e-06, + "loss": 2.4431, + "step": 2265 + }, + { + "epoch": 0.42, + "learning_rate": 1.7403984391045387e-06, + "loss": 2.4361, + "step": 2270 + }, + { + "epoch": 0.42, + "learning_rate": 1.7393715341959334e-06, + "loss": 2.4744, + "step": 2275 + }, + { + "epoch": 0.42, + "learning_rate": 1.738344629287328e-06, + "loss": 2.4935, + "step": 2280 + }, + { + "epoch": 0.43, + "learning_rate": 1.7373177243787224e-06, + "loss": 2.5459, + "step": 2285 + }, + { + "epoch": 0.43, + "learning_rate": 1.7362908194701169e-06, + "loss": 3.1449, + "step": 2290 + }, + { + "epoch": 0.43, + "learning_rate": 1.7352639145615116e-06, + "loss": 2.9531, + "step": 2295 + }, + { + "epoch": 0.43, + "learning_rate": 1.734237009652906e-06, + "loss": 2.7413, + "step": 2300 + }, + { + "epoch": 0.43, + "learning_rate": 1.7332101047443006e-06, + "loss": 2.5559, + "step": 2305 + }, + { + "epoch": 0.43, + "learning_rate": 1.732183199835695e-06, + "loss": 2.5224, + "step": 2310 + }, + { + "epoch": 0.43, + "learning_rate": 1.7311562949270897e-06, + "loss": 2.355, + "step": 2315 + }, + { + "epoch": 0.43, + "learning_rate": 1.7301293900184842e-06, + "loss": 2.3918, + "step": 2320 + }, + { + "epoch": 0.43, + "learning_rate": 1.7291024851098787e-06, + "loss": 2.5834, + "step": 2325 + }, + { + "epoch": 0.43, + "learning_rate": 1.7280755802012732e-06, + "loss": 2.3767, + "step": 2330 + }, + { + "epoch": 0.43, + "learning_rate": 1.7270486752926679e-06, + "loss": 2.5311, + "step": 2335 + }, + { + "epoch": 0.44, + "learning_rate": 1.7260217703840624e-06, + "loss": 2.3856, + "step": 2340 + }, + { + "epoch": 0.44, + "learning_rate": 1.7249948654754569e-06, + "loss": 3.6706, + "step": 2345 + }, + { + "epoch": 0.44, + "learning_rate": 1.7239679605668513e-06, + "loss": 2.2921, + "step": 2350 + }, + { + "epoch": 0.44, + "learning_rate": 1.722941055658246e-06, + "loss": 2.6198, + "step": 2355 + }, + { + "epoch": 0.44, + "learning_rate": 1.7219141507496403e-06, + "loss": 2.5341, + "step": 2360 + }, + { + "epoch": 0.44, + "learning_rate": 1.720887245841035e-06, + "loss": 2.5211, + "step": 2365 + }, + { + "epoch": 0.44, + "learning_rate": 1.7198603409324295e-06, + "loss": 2.3758, + "step": 2370 + }, + { + "epoch": 0.44, + "learning_rate": 1.7188334360238242e-06, + "loss": 2.3367, + "step": 2375 + }, + { + "epoch": 0.44, + "learning_rate": 1.7178065311152185e-06, + "loss": 2.4326, + "step": 2380 + }, + { + "epoch": 0.44, + "learning_rate": 1.7167796262066132e-06, + "loss": 2.2972, + "step": 2385 + }, + { + "epoch": 0.45, + "learning_rate": 1.7157527212980076e-06, + "loss": 2.4532, + "step": 2390 + }, + { + "epoch": 0.45, + "learning_rate": 1.7147258163894023e-06, + "loss": 2.3251, + "step": 2395 + }, + { + "epoch": 0.45, + "learning_rate": 1.7136989114807966e-06, + "loss": 2.2711, + "step": 2400 + }, + { + "epoch": 0.45, + "learning_rate": 1.7126720065721913e-06, + "loss": 2.4129, + "step": 2405 + }, + { + "epoch": 0.45, + "learning_rate": 1.7116451016635858e-06, + "loss": 2.4588, + "step": 2410 + }, + { + "epoch": 0.45, + "learning_rate": 1.7106181967549805e-06, + "loss": 2.5394, + "step": 2415 + }, + { + "epoch": 0.45, + "learning_rate": 1.7095912918463748e-06, + "loss": 2.3018, + "step": 2420 + }, + { + "epoch": 0.45, + "learning_rate": 1.7085643869377695e-06, + "loss": 2.5115, + "step": 2425 + }, + { + "epoch": 0.45, + "learning_rate": 1.707537482029164e-06, + "loss": 2.259, + "step": 2430 + }, + { + "epoch": 0.45, + "learning_rate": 1.7065105771205587e-06, + "loss": 2.3676, + "step": 2435 + }, + { + "epoch": 0.45, + "learning_rate": 1.705483672211953e-06, + "loss": 2.6998, + "step": 2440 + }, + { + "epoch": 0.46, + "learning_rate": 1.7044567673033476e-06, + "loss": 2.4527, + "step": 2445 + }, + { + "epoch": 0.46, + "learning_rate": 1.703429862394742e-06, + "loss": 2.3832, + "step": 2450 + }, + { + "epoch": 0.46, + "learning_rate": 1.7024029574861368e-06, + "loss": 2.3461, + "step": 2455 + }, + { + "epoch": 0.46, + "learning_rate": 1.701376052577531e-06, + "loss": 2.2367, + "step": 2460 + }, + { + "epoch": 0.46, + "learning_rate": 1.7003491476689258e-06, + "loss": 2.2527, + "step": 2465 + }, + { + "epoch": 0.46, + "learning_rate": 1.6993222427603203e-06, + "loss": 2.2838, + "step": 2470 + }, + { + "epoch": 0.46, + "learning_rate": 1.698295337851715e-06, + "loss": 2.5507, + "step": 2475 + }, + { + "epoch": 0.46, + "learning_rate": 1.6972684329431092e-06, + "loss": 2.3646, + "step": 2480 + }, + { + "epoch": 0.46, + "learning_rate": 1.696241528034504e-06, + "loss": 2.248, + "step": 2485 + }, + { + "epoch": 0.46, + "learning_rate": 1.6952146231258984e-06, + "loss": 2.1861, + "step": 2490 + }, + { + "epoch": 0.46, + "learning_rate": 1.6941877182172931e-06, + "loss": 2.2259, + "step": 2495 + }, + { + "epoch": 0.47, + "learning_rate": 1.6931608133086874e-06, + "loss": 2.3309, + "step": 2500 + }, + { + "epoch": 0.47, + "eval_loss": 2.0526249408721924, + "eval_runtime": 162.7261, + "eval_samples_per_second": 7.337, + "eval_steps_per_second": 0.922, + "eval_wer": 1.0, + "step": 2500 + }, + { + "epoch": 0.47, + "learning_rate": 1.692133908400082e-06, + "loss": 2.2051, + "step": 2505 + }, + { + "epoch": 0.47, + "learning_rate": 1.6911070034914766e-06, + "loss": 2.1754, + "step": 2510 + }, + { + "epoch": 0.47, + "learning_rate": 1.690080098582871e-06, + "loss": 2.2147, + "step": 2515 + }, + { + "epoch": 0.47, + "learning_rate": 1.6890531936742657e-06, + "loss": 2.0856, + "step": 2520 + }, + { + "epoch": 0.47, + "learning_rate": 1.6880262887656602e-06, + "loss": 2.1742, + "step": 2525 + }, + { + "epoch": 0.47, + "learning_rate": 1.686999383857055e-06, + "loss": 2.2649, + "step": 2530 + }, + { + "epoch": 0.47, + "learning_rate": 1.6859724789484492e-06, + "loss": 2.5063, + "step": 2535 + }, + { + "epoch": 0.47, + "learning_rate": 1.684945574039844e-06, + "loss": 2.2344, + "step": 2540 + }, + { + "epoch": 0.47, + "learning_rate": 1.6839186691312384e-06, + "loss": 2.4601, + "step": 2545 + }, + { + "epoch": 0.47, + "learning_rate": 1.682891764222633e-06, + "loss": 2.2304, + "step": 2550 + }, + { + "epoch": 0.48, + "learning_rate": 1.6818648593140274e-06, + "loss": 2.0962, + "step": 2555 + }, + { + "epoch": 0.48, + "learning_rate": 1.680837954405422e-06, + "loss": 2.1322, + "step": 2560 + }, + { + "epoch": 0.48, + "learning_rate": 1.6798110494968165e-06, + "loss": 2.1372, + "step": 2565 + }, + { + "epoch": 0.48, + "learning_rate": 1.6787841445882112e-06, + "loss": 2.1914, + "step": 2570 + }, + { + "epoch": 0.48, + "learning_rate": 1.6777572396796055e-06, + "loss": 2.321, + "step": 2575 + }, + { + "epoch": 0.48, + "learning_rate": 1.6767303347710002e-06, + "loss": 2.1254, + "step": 2580 + }, + { + "epoch": 0.48, + "learning_rate": 1.6757034298623947e-06, + "loss": 2.2112, + "step": 2585 + }, + { + "epoch": 0.48, + "learning_rate": 1.6746765249537894e-06, + "loss": 2.3469, + "step": 2590 + }, + { + "epoch": 0.48, + "learning_rate": 1.6736496200451837e-06, + "loss": 2.8565, + "step": 2595 + }, + { + "epoch": 0.48, + "learning_rate": 1.6726227151365784e-06, + "loss": 2.4071, + "step": 2600 + }, + { + "epoch": 0.49, + "learning_rate": 1.6715958102279728e-06, + "loss": 2.4843, + "step": 2605 + }, + { + "epoch": 0.49, + "learning_rate": 1.6705689053193675e-06, + "loss": 2.2168, + "step": 2610 + }, + { + "epoch": 0.49, + "learning_rate": 1.6695420004107618e-06, + "loss": 2.5841, + "step": 2615 + }, + { + "epoch": 0.49, + "learning_rate": 1.6685150955021565e-06, + "loss": 2.2403, + "step": 2620 + }, + { + "epoch": 0.49, + "learning_rate": 1.667488190593551e-06, + "loss": 2.0698, + "step": 2625 + }, + { + "epoch": 0.49, + "learning_rate": 1.6664612856849457e-06, + "loss": 2.3543, + "step": 2630 + }, + { + "epoch": 0.49, + "learning_rate": 1.66543438077634e-06, + "loss": 2.3407, + "step": 2635 + }, + { + "epoch": 0.49, + "learning_rate": 1.6644074758677347e-06, + "loss": 2.4341, + "step": 2640 + }, + { + "epoch": 0.49, + "learning_rate": 1.6633805709591291e-06, + "loss": 2.2227, + "step": 2645 + }, + { + "epoch": 0.49, + "learning_rate": 1.6623536660505238e-06, + "loss": 2.1824, + "step": 2650 + }, + { + "epoch": 0.49, + "learning_rate": 1.6613267611419181e-06, + "loss": 2.0214, + "step": 2655 + }, + { + "epoch": 0.5, + "learning_rate": 1.6602998562333128e-06, + "loss": 2.0735, + "step": 2660 + }, + { + "epoch": 0.5, + "learning_rate": 1.6592729513247073e-06, + "loss": 2.5132, + "step": 2665 + }, + { + "epoch": 0.5, + "learning_rate": 1.658246046416102e-06, + "loss": 2.3907, + "step": 2670 + }, + { + "epoch": 0.5, + "learning_rate": 1.6572191415074963e-06, + "loss": 2.051, + "step": 2675 + }, + { + "epoch": 0.5, + "learning_rate": 1.656192236598891e-06, + "loss": 2.2869, + "step": 2680 + }, + { + "epoch": 0.5, + "learning_rate": 1.6551653316902854e-06, + "loss": 2.0994, + "step": 2685 + }, + { + "epoch": 0.5, + "learning_rate": 1.65413842678168e-06, + "loss": 2.0096, + "step": 2690 + }, + { + "epoch": 0.5, + "learning_rate": 1.6531115218730744e-06, + "loss": 2.0538, + "step": 2695 + }, + { + "epoch": 0.5, + "learning_rate": 1.6520846169644691e-06, + "loss": 2.2783, + "step": 2700 + }, + { + "epoch": 0.5, + "learning_rate": 1.6510577120558636e-06, + "loss": 2.2621, + "step": 2705 + }, + { + "epoch": 0.5, + "learning_rate": 1.650030807147258e-06, + "loss": 2.152, + "step": 2710 + }, + { + "epoch": 0.51, + "learning_rate": 1.6490039022386526e-06, + "loss": 2.1277, + "step": 2715 + }, + { + "epoch": 0.51, + "learning_rate": 1.6479769973300473e-06, + "loss": 1.9992, + "step": 2720 + }, + { + "epoch": 0.51, + "learning_rate": 1.6469500924214417e-06, + "loss": 2.0336, + "step": 2725 + }, + { + "epoch": 0.51, + "learning_rate": 1.6459231875128362e-06, + "loss": 2.1393, + "step": 2730 + }, + { + "epoch": 0.51, + "learning_rate": 1.6448962826042307e-06, + "loss": 1.9702, + "step": 2735 + }, + { + "epoch": 0.51, + "learning_rate": 1.6438693776956254e-06, + "loss": 2.0614, + "step": 2740 + }, + { + "epoch": 0.51, + "learning_rate": 1.64284247278702e-06, + "loss": 2.0463, + "step": 2745 + }, + { + "epoch": 0.51, + "learning_rate": 1.6418155678784144e-06, + "loss": 2.027, + "step": 2750 + }, + { + "epoch": 0.51, + "learning_rate": 1.6407886629698089e-06, + "loss": 1.9492, + "step": 2755 + }, + { + "epoch": 0.51, + "learning_rate": 1.6397617580612036e-06, + "loss": 2.1043, + "step": 2760 + }, + { + "epoch": 0.51, + "learning_rate": 1.638734853152598e-06, + "loss": 2.0343, + "step": 2765 + }, + { + "epoch": 0.52, + "learning_rate": 1.6377079482439925e-06, + "loss": 2.1734, + "step": 2770 + }, + { + "epoch": 0.52, + "learning_rate": 1.636681043335387e-06, + "loss": 2.2739, + "step": 2775 + }, + { + "epoch": 0.52, + "learning_rate": 1.6356541384267817e-06, + "loss": 1.9545, + "step": 2780 + }, + { + "epoch": 0.52, + "learning_rate": 1.6346272335181762e-06, + "loss": 2.1237, + "step": 2785 + }, + { + "epoch": 0.52, + "learning_rate": 1.6336003286095707e-06, + "loss": 1.9395, + "step": 2790 + }, + { + "epoch": 0.52, + "learning_rate": 1.6325734237009652e-06, + "loss": 2.1862, + "step": 2795 + }, + { + "epoch": 0.52, + "learning_rate": 1.6315465187923599e-06, + "loss": 2.2151, + "step": 2800 + }, + { + "epoch": 0.52, + "learning_rate": 1.6305196138837544e-06, + "loss": 1.9663, + "step": 2805 + }, + { + "epoch": 0.52, + "learning_rate": 1.6294927089751488e-06, + "loss": 1.9221, + "step": 2810 + }, + { + "epoch": 0.52, + "learning_rate": 1.6284658040665433e-06, + "loss": 2.4582, + "step": 2815 + }, + { + "epoch": 0.53, + "learning_rate": 1.627438899157938e-06, + "loss": 2.0649, + "step": 2820 + }, + { + "epoch": 0.53, + "learning_rate": 1.6264119942493323e-06, + "loss": 2.2205, + "step": 2825 + }, + { + "epoch": 0.53, + "learning_rate": 1.625385089340727e-06, + "loss": 2.0404, + "step": 2830 + }, + { + "epoch": 0.53, + "learning_rate": 1.6243581844321215e-06, + "loss": 2.0706, + "step": 2835 + }, + { + "epoch": 0.53, + "learning_rate": 1.6233312795235162e-06, + "loss": 1.9393, + "step": 2840 + }, + { + "epoch": 0.53, + "learning_rate": 1.6223043746149104e-06, + "loss": 1.8826, + "step": 2845 + }, + { + "epoch": 0.53, + "learning_rate": 1.6212774697063051e-06, + "loss": 2.0004, + "step": 2850 + }, + { + "epoch": 0.53, + "learning_rate": 1.6202505647976996e-06, + "loss": 1.7917, + "step": 2855 + }, + { + "epoch": 0.53, + "learning_rate": 1.6192236598890943e-06, + "loss": 2.2027, + "step": 2860 + }, + { + "epoch": 0.53, + "learning_rate": 1.6181967549804886e-06, + "loss": 1.814, + "step": 2865 + }, + { + "epoch": 0.53, + "learning_rate": 1.6171698500718833e-06, + "loss": 2.1004, + "step": 2870 + }, + { + "epoch": 0.54, + "learning_rate": 1.6161429451632778e-06, + "loss": 2.0044, + "step": 2875 + }, + { + "epoch": 0.54, + "learning_rate": 1.6151160402546725e-06, + "loss": 1.9016, + "step": 2880 + }, + { + "epoch": 0.54, + "learning_rate": 1.6140891353460668e-06, + "loss": 1.8864, + "step": 2885 + }, + { + "epoch": 0.54, + "learning_rate": 1.6130622304374615e-06, + "loss": 1.9027, + "step": 2890 + }, + { + "epoch": 0.54, + "learning_rate": 1.612035325528856e-06, + "loss": 2.0984, + "step": 2895 + }, + { + "epoch": 0.54, + "learning_rate": 1.6110084206202506e-06, + "loss": 1.8449, + "step": 2900 + }, + { + "epoch": 0.54, + "learning_rate": 1.609981515711645e-06, + "loss": 1.9141, + "step": 2905 + }, + { + "epoch": 0.54, + "learning_rate": 1.6089546108030396e-06, + "loss": 1.8873, + "step": 2910 + }, + { + "epoch": 0.54, + "learning_rate": 1.607927705894434e-06, + "loss": 2.0334, + "step": 2915 + }, + { + "epoch": 0.54, + "learning_rate": 1.6069008009858288e-06, + "loss": 2.0702, + "step": 2920 + }, + { + "epoch": 0.54, + "learning_rate": 1.605873896077223e-06, + "loss": 2.1452, + "step": 2925 + }, + { + "epoch": 0.55, + "learning_rate": 1.6048469911686178e-06, + "loss": 1.7758, + "step": 2930 + }, + { + "epoch": 0.55, + "learning_rate": 1.6038200862600122e-06, + "loss": 2.2563, + "step": 2935 + }, + { + "epoch": 0.55, + "learning_rate": 1.602793181351407e-06, + "loss": 1.8165, + "step": 2940 + }, + { + "epoch": 0.55, + "learning_rate": 1.6017662764428012e-06, + "loss": 1.8777, + "step": 2945 + }, + { + "epoch": 0.55, + "learning_rate": 1.600739371534196e-06, + "loss": 1.869, + "step": 2950 + }, + { + "epoch": 0.55, + "learning_rate": 1.5997124666255904e-06, + "loss": 2.1495, + "step": 2955 + }, + { + "epoch": 0.55, + "learning_rate": 1.598685561716985e-06, + "loss": 1.7904, + "step": 2960 + }, + { + "epoch": 0.55, + "learning_rate": 1.5976586568083794e-06, + "loss": 2.1359, + "step": 2965 + }, + { + "epoch": 0.55, + "learning_rate": 1.596631751899774e-06, + "loss": 1.73, + "step": 2970 + }, + { + "epoch": 0.55, + "learning_rate": 1.5956048469911685e-06, + "loss": 1.7582, + "step": 2975 + }, + { + "epoch": 0.56, + "learning_rate": 1.594577942082563e-06, + "loss": 1.8494, + "step": 2980 + }, + { + "epoch": 0.56, + "learning_rate": 1.5935510371739575e-06, + "loss": 1.8766, + "step": 2985 + }, + { + "epoch": 0.56, + "learning_rate": 1.5925241322653522e-06, + "loss": 1.8829, + "step": 2990 + }, + { + "epoch": 0.56, + "learning_rate": 1.5914972273567467e-06, + "loss": 1.6666, + "step": 2995 + }, + { + "epoch": 0.56, + "learning_rate": 1.5904703224481412e-06, + "loss": 1.993, + "step": 3000 + }, + { + "epoch": 0.56, + "eval_loss": 1.505236029624939, + "eval_runtime": 167.3686, + "eval_samples_per_second": 7.134, + "eval_steps_per_second": 0.896, + "eval_wer": 1.0, + "step": 3000 + }, + { + "epoch": 0.56, + "learning_rate": 1.5894434175395357e-06, + "loss": 1.6019, + "step": 3005 + }, + { + "epoch": 0.56, + "learning_rate": 1.5884165126309304e-06, + "loss": 2.1837, + "step": 3010 + }, + { + "epoch": 0.56, + "learning_rate": 1.5873896077223248e-06, + "loss": 1.8788, + "step": 3015 + }, + { + "epoch": 0.56, + "learning_rate": 1.5863627028137193e-06, + "loss": 2.2183, + "step": 3020 + }, + { + "epoch": 0.56, + "learning_rate": 1.5853357979051138e-06, + "loss": 1.7065, + "step": 3025 + }, + { + "epoch": 0.56, + "learning_rate": 1.5843088929965085e-06, + "loss": 1.6309, + "step": 3030 + }, + { + "epoch": 0.57, + "learning_rate": 1.583281988087903e-06, + "loss": 1.9461, + "step": 3035 + }, + { + "epoch": 0.57, + "learning_rate": 1.5822550831792975e-06, + "loss": 1.8182, + "step": 3040 + }, + { + "epoch": 0.57, + "learning_rate": 1.581228178270692e-06, + "loss": 1.8182, + "step": 3045 + }, + { + "epoch": 0.57, + "learning_rate": 1.5802012733620867e-06, + "loss": 1.95, + "step": 3050 + }, + { + "epoch": 0.57, + "learning_rate": 1.5791743684534812e-06, + "loss": 1.6864, + "step": 3055 + }, + { + "epoch": 0.57, + "learning_rate": 1.5781474635448756e-06, + "loss": 1.7599, + "step": 3060 + }, + { + "epoch": 0.57, + "learning_rate": 1.5771205586362701e-06, + "loss": 1.9663, + "step": 3065 + }, + { + "epoch": 0.57, + "learning_rate": 1.5760936537276648e-06, + "loss": 1.8025, + "step": 3070 + }, + { + "epoch": 0.57, + "learning_rate": 1.5750667488190593e-06, + "loss": 2.1133, + "step": 3075 + }, + { + "epoch": 0.57, + "learning_rate": 1.5740398439104538e-06, + "loss": 1.928, + "step": 3080 + }, + { + "epoch": 0.57, + "learning_rate": 1.5730129390018483e-06, + "loss": 1.6224, + "step": 3085 + }, + { + "epoch": 0.58, + "learning_rate": 1.571986034093243e-06, + "loss": 1.6727, + "step": 3090 + }, + { + "epoch": 0.58, + "learning_rate": 1.5709591291846375e-06, + "loss": 1.7127, + "step": 3095 + }, + { + "epoch": 0.58, + "learning_rate": 1.569932224276032e-06, + "loss": 1.6791, + "step": 3100 + }, + { + "epoch": 0.58, + "learning_rate": 1.5689053193674264e-06, + "loss": 1.9341, + "step": 3105 + }, + { + "epoch": 0.58, + "learning_rate": 1.5678784144588211e-06, + "loss": 1.9801, + "step": 3110 + }, + { + "epoch": 0.58, + "learning_rate": 1.5668515095502154e-06, + "loss": 2.084, + "step": 3115 + }, + { + "epoch": 0.58, + "learning_rate": 1.56582460464161e-06, + "loss": 1.7563, + "step": 3120 + }, + { + "epoch": 0.58, + "learning_rate": 1.5647976997330046e-06, + "loss": 1.6595, + "step": 3125 + }, + { + "epoch": 0.58, + "learning_rate": 1.5637707948243993e-06, + "loss": 1.5875, + "step": 3130 + }, + { + "epoch": 0.58, + "learning_rate": 1.5627438899157935e-06, + "loss": 2.1124, + "step": 3135 + }, + { + "epoch": 0.58, + "learning_rate": 1.5617169850071882e-06, + "loss": 1.8638, + "step": 3140 + }, + { + "epoch": 0.59, + "learning_rate": 1.5606900800985827e-06, + "loss": 1.6619, + "step": 3145 + }, + { + "epoch": 0.59, + "learning_rate": 1.5596631751899774e-06, + "loss": 1.7096, + "step": 3150 + }, + { + "epoch": 0.59, + "learning_rate": 1.5586362702813717e-06, + "loss": 1.796, + "step": 3155 + }, + { + "epoch": 0.59, + "learning_rate": 1.5576093653727664e-06, + "loss": 1.6431, + "step": 3160 + }, + { + "epoch": 0.59, + "learning_rate": 1.5565824604641609e-06, + "loss": 1.6813, + "step": 3165 + }, + { + "epoch": 0.59, + "learning_rate": 1.5555555555555556e-06, + "loss": 1.6838, + "step": 3170 + }, + { + "epoch": 0.59, + "learning_rate": 1.5545286506469499e-06, + "loss": 1.7729, + "step": 3175 + }, + { + "epoch": 0.59, + "learning_rate": 1.5535017457383445e-06, + "loss": 1.8684, + "step": 3180 + }, + { + "epoch": 0.59, + "learning_rate": 1.552474840829739e-06, + "loss": 1.6152, + "step": 3185 + }, + { + "epoch": 0.59, + "learning_rate": 1.5514479359211337e-06, + "loss": 1.8852, + "step": 3190 + }, + { + "epoch": 0.6, + "learning_rate": 1.550421031012528e-06, + "loss": 1.638, + "step": 3195 + }, + { + "epoch": 0.6, + "learning_rate": 1.5493941261039227e-06, + "loss": 1.7184, + "step": 3200 + }, + { + "epoch": 0.6, + "learning_rate": 1.5483672211953172e-06, + "loss": 1.8423, + "step": 3205 + }, + { + "epoch": 0.6, + "learning_rate": 1.5473403162867119e-06, + "loss": 1.996, + "step": 3210 + }, + { + "epoch": 0.6, + "learning_rate": 1.5463134113781062e-06, + "loss": 1.6101, + "step": 3215 + }, + { + "epoch": 0.6, + "learning_rate": 1.5452865064695009e-06, + "loss": 1.6341, + "step": 3220 + }, + { + "epoch": 0.6, + "learning_rate": 1.5442596015608953e-06, + "loss": 1.7689, + "step": 3225 + }, + { + "epoch": 0.6, + "learning_rate": 1.54323269665229e-06, + "loss": 1.5537, + "step": 3230 + }, + { + "epoch": 0.6, + "learning_rate": 1.5422057917436843e-06, + "loss": 1.6625, + "step": 3235 + }, + { + "epoch": 0.6, + "learning_rate": 1.541178886835079e-06, + "loss": 2.0027, + "step": 3240 + }, + { + "epoch": 0.6, + "learning_rate": 1.5401519819264735e-06, + "loss": 1.5174, + "step": 3245 + }, + { + "epoch": 0.61, + "learning_rate": 1.5391250770178682e-06, + "loss": 1.7209, + "step": 3250 + }, + { + "epoch": 0.61, + "learning_rate": 1.5380981721092625e-06, + "loss": 1.6119, + "step": 3255 + }, + { + "epoch": 0.61, + "learning_rate": 1.5370712672006572e-06, + "loss": 1.5694, + "step": 3260 + }, + { + "epoch": 0.61, + "learning_rate": 1.5360443622920516e-06, + "loss": 1.8602, + "step": 3265 + }, + { + "epoch": 0.61, + "learning_rate": 1.5350174573834463e-06, + "loss": 1.5486, + "step": 3270 + }, + { + "epoch": 0.61, + "learning_rate": 1.5339905524748406e-06, + "loss": 2.5045, + "step": 3275 + }, + { + "epoch": 0.61, + "learning_rate": 1.5329636475662353e-06, + "loss": 1.6657, + "step": 3280 + }, + { + "epoch": 0.61, + "learning_rate": 1.5319367426576298e-06, + "loss": 1.8253, + "step": 3285 + }, + { + "epoch": 0.61, + "learning_rate": 1.5309098377490243e-06, + "loss": 1.7489, + "step": 3290 + }, + { + "epoch": 0.61, + "learning_rate": 1.5298829328404188e-06, + "loss": 2.0765, + "step": 3295 + }, + { + "epoch": 0.61, + "learning_rate": 1.5288560279318135e-06, + "loss": 1.7706, + "step": 3300 + }, + { + "epoch": 0.62, + "learning_rate": 1.527829123023208e-06, + "loss": 1.6185, + "step": 3305 + }, + { + "epoch": 0.62, + "learning_rate": 1.5268022181146024e-06, + "loss": 1.4862, + "step": 3310 + }, + { + "epoch": 0.62, + "learning_rate": 1.525775313205997e-06, + "loss": 1.4534, + "step": 3315 + }, + { + "epoch": 0.62, + "learning_rate": 1.5247484082973916e-06, + "loss": 1.7926, + "step": 3320 + }, + { + "epoch": 0.62, + "learning_rate": 1.523721503388786e-06, + "loss": 1.9686, + "step": 3325 + }, + { + "epoch": 0.62, + "learning_rate": 1.5226945984801806e-06, + "loss": 1.7371, + "step": 3330 + }, + { + "epoch": 0.62, + "learning_rate": 1.521667693571575e-06, + "loss": 1.8109, + "step": 3335 + }, + { + "epoch": 0.62, + "learning_rate": 1.5206407886629698e-06, + "loss": 1.835, + "step": 3340 + }, + { + "epoch": 0.62, + "learning_rate": 1.5196138837543643e-06, + "loss": 1.4894, + "step": 3345 + }, + { + "epoch": 0.62, + "learning_rate": 1.5185869788457587e-06, + "loss": 1.8841, + "step": 3350 + }, + { + "epoch": 0.62, + "learning_rate": 1.5175600739371532e-06, + "loss": 1.3907, + "step": 3355 + }, + { + "epoch": 0.63, + "learning_rate": 1.516533169028548e-06, + "loss": 1.7033, + "step": 3360 + }, + { + "epoch": 0.63, + "learning_rate": 1.5155062641199426e-06, + "loss": 1.5871, + "step": 3365 + }, + { + "epoch": 0.63, + "learning_rate": 1.5144793592113369e-06, + "loss": 1.7982, + "step": 3370 + }, + { + "epoch": 0.63, + "learning_rate": 1.5134524543027316e-06, + "loss": 1.4018, + "step": 3375 + }, + { + "epoch": 0.63, + "learning_rate": 1.512425549394126e-06, + "loss": 1.8385, + "step": 3380 + }, + { + "epoch": 0.63, + "learning_rate": 1.5113986444855208e-06, + "loss": 1.7863, + "step": 3385 + }, + { + "epoch": 0.63, + "learning_rate": 1.510371739576915e-06, + "loss": 1.7658, + "step": 3390 + }, + { + "epoch": 0.63, + "learning_rate": 1.5093448346683097e-06, + "loss": 1.9278, + "step": 3395 + }, + { + "epoch": 0.63, + "learning_rate": 1.5083179297597042e-06, + "loss": 1.523, + "step": 3400 + }, + { + "epoch": 0.63, + "learning_rate": 1.507291024851099e-06, + "loss": 3.4477, + "step": 3405 + }, + { + "epoch": 0.64, + "learning_rate": 1.5062641199424932e-06, + "loss": 2.0776, + "step": 3410 + }, + { + "epoch": 0.64, + "learning_rate": 1.5052372150338879e-06, + "loss": 1.6868, + "step": 3415 + }, + { + "epoch": 0.64, + "learning_rate": 1.5042103101252824e-06, + "loss": 1.3986, + "step": 3420 + }, + { + "epoch": 0.64, + "learning_rate": 1.503183405216677e-06, + "loss": 1.5797, + "step": 3425 + }, + { + "epoch": 0.64, + "learning_rate": 1.5021565003080713e-06, + "loss": 1.7646, + "step": 3430 + }, + { + "epoch": 0.64, + "learning_rate": 1.501129595399466e-06, + "loss": 1.761, + "step": 3435 + }, + { + "epoch": 0.64, + "learning_rate": 1.5001026904908605e-06, + "loss": 1.4129, + "step": 3440 + }, + { + "epoch": 0.64, + "learning_rate": 1.499075785582255e-06, + "loss": 1.9737, + "step": 3445 + }, + { + "epoch": 0.64, + "learning_rate": 1.4980488806736495e-06, + "loss": 1.8094, + "step": 3450 + }, + { + "epoch": 0.64, + "learning_rate": 1.4970219757650442e-06, + "loss": 1.4816, + "step": 3455 + }, + { + "epoch": 0.64, + "learning_rate": 1.4959950708564387e-06, + "loss": 1.492, + "step": 3460 + }, + { + "epoch": 0.65, + "learning_rate": 1.4949681659478332e-06, + "loss": 1.5756, + "step": 3465 + }, + { + "epoch": 0.65, + "learning_rate": 1.4939412610392276e-06, + "loss": 1.6382, + "step": 3470 + }, + { + "epoch": 0.65, + "learning_rate": 1.4929143561306223e-06, + "loss": 1.5102, + "step": 3475 + }, + { + "epoch": 0.65, + "learning_rate": 1.4918874512220168e-06, + "loss": 1.4742, + "step": 3480 + }, + { + "epoch": 0.65, + "learning_rate": 1.4908605463134113e-06, + "loss": 1.8775, + "step": 3485 + }, + { + "epoch": 0.65, + "learning_rate": 1.4898336414048058e-06, + "loss": 1.4767, + "step": 3490 + }, + { + "epoch": 0.65, + "learning_rate": 1.4888067364962005e-06, + "loss": 1.3756, + "step": 3495 + }, + { + "epoch": 0.65, + "learning_rate": 1.487779831587595e-06, + "loss": 1.374, + "step": 3500 + }, + { + "epoch": 0.65, + "eval_loss": 1.0981903076171875, + "eval_runtime": 166.6258, + "eval_samples_per_second": 7.166, + "eval_steps_per_second": 0.9, + "eval_wer": 0.9991021036428938, + "step": 3500 + }, + { + "epoch": 0.65, + "learning_rate": 1.4867529266789895e-06, + "loss": 1.3723, + "step": 3505 + }, + { + "epoch": 0.65, + "learning_rate": 1.485726021770384e-06, + "loss": 1.4567, + "step": 3510 + }, + { + "epoch": 0.65, + "learning_rate": 1.4846991168617786e-06, + "loss": 1.7109, + "step": 3515 + }, + { + "epoch": 0.66, + "learning_rate": 1.4836722119531731e-06, + "loss": 1.6903, + "step": 3520 + }, + { + "epoch": 0.66, + "learning_rate": 1.4826453070445676e-06, + "loss": 1.6524, + "step": 3525 + }, + { + "epoch": 0.66, + "learning_rate": 1.481618402135962e-06, + "loss": 1.6053, + "step": 3530 + }, + { + "epoch": 0.66, + "learning_rate": 1.4805914972273568e-06, + "loss": 1.842, + "step": 3535 + }, + { + "epoch": 0.66, + "learning_rate": 1.4795645923187513e-06, + "loss": 1.5981, + "step": 3540 + }, + { + "epoch": 0.66, + "learning_rate": 1.4785376874101458e-06, + "loss": 1.6901, + "step": 3545 + }, + { + "epoch": 0.66, + "learning_rate": 1.4775107825015403e-06, + "loss": 1.3535, + "step": 3550 + }, + { + "epoch": 0.66, + "learning_rate": 1.476483877592935e-06, + "loss": 1.3337, + "step": 3555 + }, + { + "epoch": 0.66, + "learning_rate": 1.4754569726843294e-06, + "loss": 1.9106, + "step": 3560 + }, + { + "epoch": 0.66, + "learning_rate": 1.474430067775724e-06, + "loss": 1.3896, + "step": 3565 + }, + { + "epoch": 0.66, + "learning_rate": 1.4734031628671184e-06, + "loss": 1.5954, + "step": 3570 + }, + { + "epoch": 0.67, + "learning_rate": 1.472376257958513e-06, + "loss": 1.5729, + "step": 3575 + }, + { + "epoch": 0.67, + "learning_rate": 1.4713493530499074e-06, + "loss": 1.4061, + "step": 3580 + }, + { + "epoch": 0.67, + "learning_rate": 1.470322448141302e-06, + "loss": 1.3232, + "step": 3585 + }, + { + "epoch": 0.67, + "learning_rate": 1.4692955432326966e-06, + "loss": 1.4051, + "step": 3590 + }, + { + "epoch": 0.67, + "learning_rate": 1.4682686383240913e-06, + "loss": 1.3958, + "step": 3595 + }, + { + "epoch": 0.67, + "learning_rate": 1.4672417334154855e-06, + "loss": 2.2725, + "step": 3600 + }, + { + "epoch": 0.67, + "learning_rate": 1.4662148285068802e-06, + "loss": 1.627, + "step": 3605 + }, + { + "epoch": 0.67, + "learning_rate": 1.4651879235982747e-06, + "loss": 1.7266, + "step": 3610 + }, + { + "epoch": 0.67, + "learning_rate": 1.4641610186896694e-06, + "loss": 1.4118, + "step": 3615 + }, + { + "epoch": 0.67, + "learning_rate": 1.4631341137810637e-06, + "loss": 1.6395, + "step": 3620 + }, + { + "epoch": 0.68, + "learning_rate": 1.4621072088724584e-06, + "loss": 1.5691, + "step": 3625 + }, + { + "epoch": 0.68, + "learning_rate": 1.4610803039638529e-06, + "loss": 1.3964, + "step": 3630 + }, + { + "epoch": 0.68, + "learning_rate": 1.4600533990552476e-06, + "loss": 1.3778, + "step": 3635 + }, + { + "epoch": 0.68, + "learning_rate": 1.4590264941466418e-06, + "loss": 1.6348, + "step": 3640 + }, + { + "epoch": 0.68, + "learning_rate": 1.4579995892380365e-06, + "loss": 1.2501, + "step": 3645 + }, + { + "epoch": 0.68, + "learning_rate": 1.456972684329431e-06, + "loss": 1.2765, + "step": 3650 + }, + { + "epoch": 0.68, + "learning_rate": 1.4559457794208257e-06, + "loss": 1.8279, + "step": 3655 + }, + { + "epoch": 0.68, + "learning_rate": 1.45491887451222e-06, + "loss": 1.3734, + "step": 3660 + }, + { + "epoch": 0.68, + "learning_rate": 1.4538919696036147e-06, + "loss": 1.8975, + "step": 3665 + }, + { + "epoch": 0.68, + "learning_rate": 1.4528650646950092e-06, + "loss": 1.3493, + "step": 3670 + }, + { + "epoch": 0.68, + "learning_rate": 1.4518381597864039e-06, + "loss": 1.6834, + "step": 3675 + }, + { + "epoch": 0.69, + "learning_rate": 1.4508112548777981e-06, + "loss": 1.2842, + "step": 3680 + }, + { + "epoch": 0.69, + "learning_rate": 1.4497843499691928e-06, + "loss": 1.5672, + "step": 3685 + }, + { + "epoch": 0.69, + "learning_rate": 1.4487574450605873e-06, + "loss": 1.415, + "step": 3690 + }, + { + "epoch": 0.69, + "learning_rate": 1.447730540151982e-06, + "loss": 1.7638, + "step": 3695 + }, + { + "epoch": 0.69, + "learning_rate": 1.4467036352433763e-06, + "loss": 2.0034, + "step": 3700 + }, + { + "epoch": 0.69, + "learning_rate": 1.445676730334771e-06, + "loss": 1.2874, + "step": 3705 + }, + { + "epoch": 0.69, + "learning_rate": 1.4446498254261655e-06, + "loss": 1.5264, + "step": 3710 + }, + { + "epoch": 0.69, + "learning_rate": 1.4436229205175602e-06, + "loss": 1.5826, + "step": 3715 + }, + { + "epoch": 0.69, + "learning_rate": 1.4425960156089544e-06, + "loss": 1.4389, + "step": 3720 + }, + { + "epoch": 0.69, + "learning_rate": 1.4415691107003491e-06, + "loss": 1.3155, + "step": 3725 + }, + { + "epoch": 0.69, + "learning_rate": 1.4405422057917436e-06, + "loss": 1.229, + "step": 3730 + }, + { + "epoch": 0.7, + "learning_rate": 1.4395153008831383e-06, + "loss": 1.5056, + "step": 3735 + }, + { + "epoch": 0.7, + "learning_rate": 1.4384883959745326e-06, + "loss": 1.7682, + "step": 3740 + }, + { + "epoch": 0.7, + "learning_rate": 1.4374614910659273e-06, + "loss": 1.5526, + "step": 3745 + }, + { + "epoch": 0.7, + "learning_rate": 1.4364345861573218e-06, + "loss": 1.6273, + "step": 3750 + }, + { + "epoch": 0.7, + "learning_rate": 1.4354076812487163e-06, + "loss": 1.1467, + "step": 3755 + }, + { + "epoch": 0.7, + "learning_rate": 1.4343807763401107e-06, + "loss": 1.3847, + "step": 3760 + }, + { + "epoch": 0.7, + "learning_rate": 1.4333538714315054e-06, + "loss": 1.3596, + "step": 3765 + }, + { + "epoch": 0.7, + "learning_rate": 1.4323269665229e-06, + "loss": 1.5988, + "step": 3770 + }, + { + "epoch": 0.7, + "learning_rate": 1.4313000616142944e-06, + "loss": 1.5569, + "step": 3775 + }, + { + "epoch": 0.7, + "learning_rate": 1.430273156705689e-06, + "loss": 1.4909, + "step": 3780 + }, + { + "epoch": 0.7, + "learning_rate": 1.4292462517970836e-06, + "loss": 1.1364, + "step": 3785 + }, + { + "epoch": 0.71, + "learning_rate": 1.428219346888478e-06, + "loss": 1.4173, + "step": 3790 + }, + { + "epoch": 0.71, + "learning_rate": 1.4271924419798726e-06, + "loss": 1.4494, + "step": 3795 + }, + { + "epoch": 0.71, + "learning_rate": 1.426165537071267e-06, + "loss": 1.8525, + "step": 3800 + }, + { + "epoch": 0.71, + "learning_rate": 1.4251386321626617e-06, + "loss": 1.6446, + "step": 3805 + }, + { + "epoch": 0.71, + "learning_rate": 1.4241117272540562e-06, + "loss": 1.5038, + "step": 3810 + }, + { + "epoch": 0.71, + "learning_rate": 1.4230848223454507e-06, + "loss": 1.4557, + "step": 3815 + }, + { + "epoch": 0.71, + "learning_rate": 1.4220579174368452e-06, + "loss": 1.1329, + "step": 3820 + }, + { + "epoch": 0.71, + "learning_rate": 1.42103101252824e-06, + "loss": 1.4263, + "step": 3825 + }, + { + "epoch": 0.71, + "learning_rate": 1.4200041076196344e-06, + "loss": 1.1607, + "step": 3830 + }, + { + "epoch": 0.71, + "learning_rate": 1.4189772027110289e-06, + "loss": 1.5083, + "step": 3835 + }, + { + "epoch": 0.72, + "learning_rate": 1.4179502978024234e-06, + "loss": 1.6398, + "step": 3840 + }, + { + "epoch": 0.72, + "learning_rate": 1.416923392893818e-06, + "loss": 1.1638, + "step": 3845 + }, + { + "epoch": 0.72, + "learning_rate": 1.4158964879852125e-06, + "loss": 1.5206, + "step": 3850 + }, + { + "epoch": 0.72, + "learning_rate": 1.414869583076607e-06, + "loss": 1.4404, + "step": 3855 + }, + { + "epoch": 0.72, + "learning_rate": 1.4138426781680015e-06, + "loss": 1.4838, + "step": 3860 + }, + { + "epoch": 0.72, + "learning_rate": 1.4128157732593962e-06, + "loss": 1.3232, + "step": 3865 + }, + { + "epoch": 0.72, + "learning_rate": 1.4117888683507907e-06, + "loss": 1.4703, + "step": 3870 + }, + { + "epoch": 0.72, + "learning_rate": 1.4107619634421852e-06, + "loss": 1.2905, + "step": 3875 + }, + { + "epoch": 0.72, + "learning_rate": 1.4097350585335797e-06, + "loss": 1.4413, + "step": 3880 + }, + { + "epoch": 0.72, + "learning_rate": 1.4087081536249744e-06, + "loss": 1.1968, + "step": 3885 + }, + { + "epoch": 0.72, + "learning_rate": 1.4076812487163686e-06, + "loss": 1.3222, + "step": 3890 + }, + { + "epoch": 0.73, + "learning_rate": 1.4066543438077633e-06, + "loss": 1.1413, + "step": 3895 + }, + { + "epoch": 0.73, + "learning_rate": 1.4056274388991578e-06, + "loss": 1.5517, + "step": 3900 + }, + { + "epoch": 0.73, + "learning_rate": 1.4046005339905525e-06, + "loss": 1.1597, + "step": 3905 + }, + { + "epoch": 0.73, + "learning_rate": 1.4035736290819468e-06, + "loss": 1.2781, + "step": 3910 + }, + { + "epoch": 0.73, + "learning_rate": 1.4025467241733415e-06, + "loss": 1.1736, + "step": 3915 + }, + { + "epoch": 0.73, + "learning_rate": 1.401519819264736e-06, + "loss": 1.3079, + "step": 3920 + }, + { + "epoch": 0.73, + "learning_rate": 1.4004929143561307e-06, + "loss": 1.2027, + "step": 3925 + }, + { + "epoch": 0.73, + "learning_rate": 1.399466009447525e-06, + "loss": 1.2086, + "step": 3930 + }, + { + "epoch": 0.73, + "learning_rate": 1.3984391045389196e-06, + "loss": 1.243, + "step": 3935 + }, + { + "epoch": 0.73, + "learning_rate": 1.3974121996303141e-06, + "loss": 1.6102, + "step": 3940 + }, + { + "epoch": 0.73, + "learning_rate": 1.3963852947217088e-06, + "loss": 1.2809, + "step": 3945 + }, + { + "epoch": 0.74, + "learning_rate": 1.395358389813103e-06, + "loss": 1.1862, + "step": 3950 + }, + { + "epoch": 0.74, + "learning_rate": 1.3943314849044978e-06, + "loss": 1.274, + "step": 3955 + }, + { + "epoch": 0.74, + "learning_rate": 1.3933045799958923e-06, + "loss": 1.6845, + "step": 3960 + }, + { + "epoch": 0.74, + "learning_rate": 1.392277675087287e-06, + "loss": 1.8259, + "step": 3965 + }, + { + "epoch": 0.74, + "learning_rate": 1.3912507701786812e-06, + "loss": 1.5038, + "step": 3970 + }, + { + "epoch": 0.74, + "learning_rate": 1.390223865270076e-06, + "loss": 1.3773, + "step": 3975 + }, + { + "epoch": 0.74, + "learning_rate": 1.3891969603614704e-06, + "loss": 1.2645, + "step": 3980 + }, + { + "epoch": 0.74, + "learning_rate": 1.3881700554528651e-06, + "loss": 1.2258, + "step": 3985 + }, + { + "epoch": 0.74, + "learning_rate": 1.3871431505442594e-06, + "loss": 1.2284, + "step": 3990 + }, + { + "epoch": 0.74, + "learning_rate": 1.386116245635654e-06, + "loss": 1.4279, + "step": 3995 + }, + { + "epoch": 0.75, + "learning_rate": 1.3850893407270486e-06, + "loss": 1.4324, + "step": 4000 + }, + { + "epoch": 0.75, + "eval_loss": 0.871010959148407, + "eval_runtime": 165.2205, + "eval_samples_per_second": 7.227, + "eval_steps_per_second": 0.908, + "eval_wer": 0.9969214982042073, + "step": 4000 + }, + { + "epoch": 0.75, + "learning_rate": 1.3840624358184433e-06, + "loss": 1.4432, + "step": 4005 + }, + { + "epoch": 0.75, + "learning_rate": 1.3830355309098375e-06, + "loss": 1.1459, + "step": 4010 + }, + { + "epoch": 0.75, + "learning_rate": 1.3820086260012322e-06, + "loss": 1.8922, + "step": 4015 + }, + { + "epoch": 0.75, + "learning_rate": 1.3809817210926267e-06, + "loss": 1.5279, + "step": 4020 + }, + { + "epoch": 0.75, + "learning_rate": 1.3799548161840214e-06, + "loss": 1.4555, + "step": 4025 + }, + { + "epoch": 0.75, + "learning_rate": 1.3789279112754157e-06, + "loss": 1.255, + "step": 4030 + }, + { + "epoch": 0.75, + "learning_rate": 1.3779010063668104e-06, + "loss": 1.0926, + "step": 4035 + }, + { + "epoch": 0.75, + "learning_rate": 1.3768741014582049e-06, + "loss": 1.423, + "step": 4040 + }, + { + "epoch": 0.75, + "learning_rate": 1.3758471965495994e-06, + "loss": 1.0813, + "step": 4045 + }, + { + "epoch": 0.75, + "learning_rate": 1.3748202916409938e-06, + "loss": 1.3814, + "step": 4050 + }, + { + "epoch": 0.76, + "learning_rate": 1.3737933867323885e-06, + "loss": 1.2505, + "step": 4055 + }, + { + "epoch": 0.76, + "learning_rate": 1.372766481823783e-06, + "loss": 2.0445, + "step": 4060 + }, + { + "epoch": 0.76, + "learning_rate": 1.3717395769151775e-06, + "loss": 1.3996, + "step": 4065 + }, + { + "epoch": 0.76, + "learning_rate": 1.370712672006572e-06, + "loss": 1.3825, + "step": 4070 + }, + { + "epoch": 0.76, + "learning_rate": 1.3696857670979667e-06, + "loss": 1.5115, + "step": 4075 + }, + { + "epoch": 0.76, + "learning_rate": 1.3686588621893612e-06, + "loss": 1.3877, + "step": 4080 + }, + { + "epoch": 0.76, + "learning_rate": 1.3676319572807557e-06, + "loss": 1.0905, + "step": 4085 + }, + { + "epoch": 0.76, + "learning_rate": 1.3666050523721501e-06, + "loss": 1.3608, + "step": 4090 + }, + { + "epoch": 0.76, + "learning_rate": 1.3655781474635448e-06, + "loss": 1.3166, + "step": 4095 + }, + { + "epoch": 0.76, + "learning_rate": 1.3645512425549393e-06, + "loss": 1.0832, + "step": 4100 + }, + { + "epoch": 0.76, + "learning_rate": 1.3635243376463338e-06, + "loss": 1.248, + "step": 4105 + }, + { + "epoch": 0.77, + "learning_rate": 1.3624974327377283e-06, + "loss": 1.1094, + "step": 4110 + }, + { + "epoch": 0.77, + "learning_rate": 1.361470527829123e-06, + "loss": 1.1145, + "step": 4115 + }, + { + "epoch": 0.77, + "learning_rate": 1.3604436229205175e-06, + "loss": 1.5423, + "step": 4120 + }, + { + "epoch": 0.77, + "learning_rate": 1.359416718011912e-06, + "loss": 1.1091, + "step": 4125 + }, + { + "epoch": 0.77, + "learning_rate": 1.3583898131033065e-06, + "loss": 1.3596, + "step": 4130 + }, + { + "epoch": 0.77, + "learning_rate": 1.3573629081947012e-06, + "loss": 1.1707, + "step": 4135 + }, + { + "epoch": 0.77, + "learning_rate": 1.3563360032860956e-06, + "loss": 1.3573, + "step": 4140 + }, + { + "epoch": 0.77, + "learning_rate": 1.3553090983774901e-06, + "loss": 1.4772, + "step": 4145 + }, + { + "epoch": 0.77, + "learning_rate": 1.3542821934688846e-06, + "loss": 1.1288, + "step": 4150 + }, + { + "epoch": 0.77, + "learning_rate": 1.3532552885602793e-06, + "loss": 1.1474, + "step": 4155 + }, + { + "epoch": 0.77, + "learning_rate": 1.3522283836516738e-06, + "loss": 1.2226, + "step": 4160 + }, + { + "epoch": 0.78, + "learning_rate": 1.3512014787430683e-06, + "loss": 1.6267, + "step": 4165 + }, + { + "epoch": 0.78, + "learning_rate": 1.3501745738344628e-06, + "loss": 1.4794, + "step": 4170 + }, + { + "epoch": 0.78, + "learning_rate": 1.3491476689258575e-06, + "loss": 1.2631, + "step": 4175 + }, + { + "epoch": 0.78, + "learning_rate": 1.3481207640172517e-06, + "loss": 1.4549, + "step": 4180 + }, + { + "epoch": 0.78, + "learning_rate": 1.3470938591086464e-06, + "loss": 1.434, + "step": 4185 + }, + { + "epoch": 0.78, + "learning_rate": 1.346066954200041e-06, + "loss": 1.2872, + "step": 4190 + }, + { + "epoch": 0.78, + "learning_rate": 1.3450400492914356e-06, + "loss": 1.3279, + "step": 4195 + }, + { + "epoch": 0.78, + "learning_rate": 1.3440131443828303e-06, + "loss": 1.3805, + "step": 4200 + }, + { + "epoch": 0.78, + "learning_rate": 1.3429862394742246e-06, + "loss": 1.1369, + "step": 4205 + }, + { + "epoch": 0.78, + "learning_rate": 1.3419593345656193e-06, + "loss": 1.1013, + "step": 4210 + }, + { + "epoch": 0.79, + "learning_rate": 1.3409324296570138e-06, + "loss": 0.9662, + "step": 4215 + }, + { + "epoch": 0.79, + "learning_rate": 1.3399055247484082e-06, + "loss": 1.093, + "step": 4220 + }, + { + "epoch": 0.79, + "learning_rate": 1.3388786198398027e-06, + "loss": 1.2849, + "step": 4225 + }, + { + "epoch": 0.79, + "learning_rate": 1.3378517149311974e-06, + "loss": 1.0428, + "step": 4230 + }, + { + "epoch": 0.79, + "learning_rate": 1.336824810022592e-06, + "loss": 1.083, + "step": 4235 + }, + { + "epoch": 0.79, + "learning_rate": 1.3357979051139864e-06, + "loss": 1.3622, + "step": 4240 + }, + { + "epoch": 0.79, + "learning_rate": 1.3347710002053809e-06, + "loss": 1.1327, + "step": 4245 + }, + { + "epoch": 0.79, + "learning_rate": 1.3337440952967756e-06, + "loss": 1.0384, + "step": 4250 + }, + { + "epoch": 0.79, + "learning_rate": 1.33271719038817e-06, + "loss": 0.9773, + "step": 4255 + }, + { + "epoch": 0.79, + "learning_rate": 1.3316902854795645e-06, + "loss": 1.2673, + "step": 4260 + }, + { + "epoch": 0.79, + "learning_rate": 1.330663380570959e-06, + "loss": 1.3151, + "step": 4265 + }, + { + "epoch": 0.8, + "learning_rate": 1.3296364756623537e-06, + "loss": 1.4965, + "step": 4270 + }, + { + "epoch": 0.8, + "learning_rate": 1.3286095707537482e-06, + "loss": 1.3185, + "step": 4275 + }, + { + "epoch": 0.8, + "learning_rate": 1.3275826658451427e-06, + "loss": 1.6872, + "step": 4280 + }, + { + "epoch": 0.8, + "learning_rate": 1.3265557609365372e-06, + "loss": 1.6085, + "step": 4285 + }, + { + "epoch": 0.8, + "learning_rate": 1.3255288560279319e-06, + "loss": 1.3537, + "step": 4290 + }, + { + "epoch": 0.8, + "learning_rate": 1.3245019511193264e-06, + "loss": 1.1366, + "step": 4295 + }, + { + "epoch": 0.8, + "learning_rate": 1.3234750462107209e-06, + "loss": 1.1825, + "step": 4300 + }, + { + "epoch": 0.8, + "learning_rate": 1.3224481413021153e-06, + "loss": 1.3218, + "step": 4305 + }, + { + "epoch": 0.8, + "learning_rate": 1.32142123639351e-06, + "loss": 1.1001, + "step": 4310 + }, + { + "epoch": 0.8, + "learning_rate": 1.3203943314849045e-06, + "loss": 1.0751, + "step": 4315 + }, + { + "epoch": 0.8, + "learning_rate": 1.319367426576299e-06, + "loss": 1.3475, + "step": 4320 + }, + { + "epoch": 0.81, + "learning_rate": 1.3183405216676935e-06, + "loss": 1.0859, + "step": 4325 + }, + { + "epoch": 0.81, + "learning_rate": 1.3173136167590882e-06, + "loss": 1.4619, + "step": 4330 + }, + { + "epoch": 0.81, + "learning_rate": 1.3162867118504827e-06, + "loss": 1.1734, + "step": 4335 + }, + { + "epoch": 0.81, + "learning_rate": 1.3152598069418772e-06, + "loss": 1.0587, + "step": 4340 + }, + { + "epoch": 0.81, + "learning_rate": 1.3142329020332716e-06, + "loss": 1.0159, + "step": 4345 + }, + { + "epoch": 0.81, + "learning_rate": 1.3132059971246663e-06, + "loss": 0.9952, + "step": 4350 + }, + { + "epoch": 0.81, + "learning_rate": 1.3121790922160606e-06, + "loss": 0.9823, + "step": 4355 + }, + { + "epoch": 0.81, + "learning_rate": 1.3111521873074553e-06, + "loss": 1.209, + "step": 4360 + }, + { + "epoch": 0.81, + "learning_rate": 1.3101252823988498e-06, + "loss": 1.5698, + "step": 4365 + }, + { + "epoch": 0.81, + "learning_rate": 1.3090983774902445e-06, + "loss": 1.3529, + "step": 4370 + }, + { + "epoch": 0.81, + "learning_rate": 1.3080714725816388e-06, + "loss": 1.2588, + "step": 4375 + }, + { + "epoch": 0.82, + "learning_rate": 1.3070445676730335e-06, + "loss": 1.6183, + "step": 4380 + }, + { + "epoch": 0.82, + "learning_rate": 1.306017662764428e-06, + "loss": 1.0698, + "step": 4385 + }, + { + "epoch": 0.82, + "learning_rate": 1.3049907578558226e-06, + "loss": 1.0928, + "step": 4390 + }, + { + "epoch": 0.82, + "learning_rate": 1.303963852947217e-06, + "loss": 1.027, + "step": 4395 + }, + { + "epoch": 0.82, + "learning_rate": 1.3029369480386116e-06, + "loss": 1.2732, + "step": 4400 + }, + { + "epoch": 0.82, + "learning_rate": 1.301910043130006e-06, + "loss": 1.0801, + "step": 4405 + }, + { + "epoch": 0.82, + "learning_rate": 1.3008831382214008e-06, + "loss": 1.6345, + "step": 4410 + }, + { + "epoch": 0.82, + "learning_rate": 1.299856233312795e-06, + "loss": 1.228, + "step": 4415 + }, + { + "epoch": 0.82, + "learning_rate": 1.2988293284041898e-06, + "loss": 1.1848, + "step": 4420 + }, + { + "epoch": 0.82, + "learning_rate": 1.2978024234955842e-06, + "loss": 1.0078, + "step": 4425 + }, + { + "epoch": 0.83, + "learning_rate": 1.296775518586979e-06, + "loss": 1.0556, + "step": 4430 + }, + { + "epoch": 0.83, + "learning_rate": 1.2957486136783732e-06, + "loss": 1.0646, + "step": 4435 + }, + { + "epoch": 0.83, + "learning_rate": 1.294721708769768e-06, + "loss": 1.1601, + "step": 4440 + }, + { + "epoch": 0.83, + "learning_rate": 1.2936948038611624e-06, + "loss": 1.0673, + "step": 4445 + }, + { + "epoch": 0.83, + "learning_rate": 1.292667898952557e-06, + "loss": 1.4266, + "step": 4450 + }, + { + "epoch": 0.83, + "learning_rate": 1.2916409940439514e-06, + "loss": 1.0005, + "step": 4455 + }, + { + "epoch": 0.83, + "learning_rate": 1.290614089135346e-06, + "loss": 1.0665, + "step": 4460 + }, + { + "epoch": 0.83, + "learning_rate": 1.2895871842267406e-06, + "loss": 1.7098, + "step": 4465 + }, + { + "epoch": 0.83, + "learning_rate": 1.2885602793181353e-06, + "loss": 1.0159, + "step": 4470 + }, + { + "epoch": 0.83, + "learning_rate": 1.2875333744095295e-06, + "loss": 1.0682, + "step": 4475 + }, + { + "epoch": 0.83, + "learning_rate": 1.2865064695009242e-06, + "loss": 1.029, + "step": 4480 + }, + { + "epoch": 0.84, + "learning_rate": 1.2854795645923187e-06, + "loss": 1.2077, + "step": 4485 + }, + { + "epoch": 0.84, + "learning_rate": 1.2844526596837134e-06, + "loss": 1.1243, + "step": 4490 + }, + { + "epoch": 0.84, + "learning_rate": 1.2834257547751077e-06, + "loss": 0.8508, + "step": 4495 + }, + { + "epoch": 0.84, + "learning_rate": 1.2823988498665024e-06, + "loss": 1.5273, + "step": 4500 + }, + { + "epoch": 0.84, + "eval_loss": 0.7541612386703491, + "eval_runtime": 160.776, + "eval_samples_per_second": 7.426, + "eval_steps_per_second": 0.933, + "eval_wer": 0.9961518727552591, + "step": 4500 + }, + { + "epoch": 0.84, + "learning_rate": 1.2813719449578969e-06, + "loss": 1.4633, + "step": 4505 + }, + { + "epoch": 0.84, + "learning_rate": 1.2803450400492913e-06, + "loss": 1.0911, + "step": 4510 + }, + { + "epoch": 0.84, + "learning_rate": 1.2793181351406858e-06, + "loss": 1.039, + "step": 4515 + }, + { + "epoch": 0.84, + "learning_rate": 1.2782912302320805e-06, + "loss": 1.1547, + "step": 4520 + }, + { + "epoch": 0.84, + "learning_rate": 1.277264325323475e-06, + "loss": 0.9209, + "step": 4525 + }, + { + "epoch": 0.84, + "learning_rate": 1.2762374204148695e-06, + "loss": 0.9886, + "step": 4530 + }, + { + "epoch": 0.84, + "learning_rate": 1.275210515506264e-06, + "loss": 1.0997, + "step": 4535 + }, + { + "epoch": 0.85, + "learning_rate": 1.2741836105976587e-06, + "loss": 1.9769, + "step": 4540 + }, + { + "epoch": 0.85, + "learning_rate": 1.2731567056890532e-06, + "loss": 0.9819, + "step": 4545 + }, + { + "epoch": 0.85, + "learning_rate": 1.2721298007804476e-06, + "loss": 1.8481, + "step": 4550 + }, + { + "epoch": 0.85, + "learning_rate": 1.2711028958718421e-06, + "loss": 1.2041, + "step": 4555 + }, + { + "epoch": 0.85, + "learning_rate": 1.2700759909632368e-06, + "loss": 1.3081, + "step": 4560 + }, + { + "epoch": 0.85, + "learning_rate": 1.2690490860546313e-06, + "loss": 1.3219, + "step": 4565 + }, + { + "epoch": 0.85, + "learning_rate": 1.2680221811460258e-06, + "loss": 1.3714, + "step": 4570 + }, + { + "epoch": 0.85, + "learning_rate": 1.2669952762374203e-06, + "loss": 0.9208, + "step": 4575 + }, + { + "epoch": 0.85, + "learning_rate": 1.265968371328815e-06, + "loss": 1.0268, + "step": 4580 + }, + { + "epoch": 0.85, + "learning_rate": 1.2649414664202095e-06, + "loss": 0.9589, + "step": 4585 + }, + { + "epoch": 0.85, + "learning_rate": 1.263914561511604e-06, + "loss": 1.1938, + "step": 4590 + }, + { + "epoch": 0.86, + "learning_rate": 1.2628876566029984e-06, + "loss": 1.0504, + "step": 4595 + }, + { + "epoch": 0.86, + "learning_rate": 1.2618607516943931e-06, + "loss": 1.4992, + "step": 4600 + }, + { + "epoch": 0.86, + "learning_rate": 1.2608338467857876e-06, + "loss": 1.0982, + "step": 4605 + }, + { + "epoch": 0.86, + "learning_rate": 1.259806941877182e-06, + "loss": 1.1808, + "step": 4610 + }, + { + "epoch": 0.86, + "learning_rate": 1.2587800369685766e-06, + "loss": 0.9891, + "step": 4615 + }, + { + "epoch": 0.86, + "learning_rate": 1.2577531320599713e-06, + "loss": 0.9634, + "step": 4620 + }, + { + "epoch": 0.86, + "learning_rate": 1.2567262271513658e-06, + "loss": 1.253, + "step": 4625 + }, + { + "epoch": 0.86, + "learning_rate": 1.2556993222427603e-06, + "loss": 0.9934, + "step": 4630 + }, + { + "epoch": 0.86, + "learning_rate": 1.2546724173341547e-06, + "loss": 0.99, + "step": 4635 + }, + { + "epoch": 0.86, + "learning_rate": 1.2536455124255494e-06, + "loss": 1.1702, + "step": 4640 + }, + { + "epoch": 0.87, + "learning_rate": 1.2526186075169437e-06, + "loss": 1.2641, + "step": 4645 + }, + { + "epoch": 0.87, + "learning_rate": 1.2515917026083384e-06, + "loss": 0.9113, + "step": 4650 + }, + { + "epoch": 0.87, + "learning_rate": 1.2505647976997329e-06, + "loss": 0.8693, + "step": 4655 + }, + { + "epoch": 0.87, + "learning_rate": 1.2495378927911276e-06, + "loss": 1.0559, + "step": 4660 + }, + { + "epoch": 0.87, + "learning_rate": 1.2485109878825219e-06, + "loss": 1.177, + "step": 4665 + }, + { + "epoch": 0.87, + "learning_rate": 1.2474840829739166e-06, + "loss": 1.0942, + "step": 4670 + }, + { + "epoch": 0.87, + "learning_rate": 1.246457178065311e-06, + "loss": 1.0034, + "step": 4675 + }, + { + "epoch": 0.87, + "learning_rate": 1.2454302731567057e-06, + "loss": 0.8607, + "step": 4680 + }, + { + "epoch": 0.87, + "learning_rate": 1.2444033682481e-06, + "loss": 1.5524, + "step": 4685 + }, + { + "epoch": 0.87, + "learning_rate": 1.2433764633394947e-06, + "loss": 1.2187, + "step": 4690 + }, + { + "epoch": 0.87, + "learning_rate": 1.2423495584308892e-06, + "loss": 1.05, + "step": 4695 + }, + { + "epoch": 0.88, + "learning_rate": 1.2413226535222839e-06, + "loss": 1.1299, + "step": 4700 + }, + { + "epoch": 0.88, + "learning_rate": 1.2402957486136782e-06, + "loss": 1.0083, + "step": 4705 + }, + { + "epoch": 0.88, + "learning_rate": 1.2392688437050729e-06, + "loss": 1.0147, + "step": 4710 + }, + { + "epoch": 0.88, + "learning_rate": 1.2382419387964673e-06, + "loss": 1.1144, + "step": 4715 + }, + { + "epoch": 0.88, + "learning_rate": 1.237215033887862e-06, + "loss": 0.9494, + "step": 4720 + }, + { + "epoch": 0.88, + "learning_rate": 1.2361881289792563e-06, + "loss": 0.8921, + "step": 4725 + }, + { + "epoch": 0.88, + "learning_rate": 1.235161224070651e-06, + "loss": 0.9891, + "step": 4730 + }, + { + "epoch": 0.88, + "learning_rate": 1.2341343191620455e-06, + "loss": 1.0606, + "step": 4735 + }, + { + "epoch": 0.88, + "learning_rate": 1.2331074142534402e-06, + "loss": 1.1937, + "step": 4740 + }, + { + "epoch": 0.88, + "learning_rate": 1.2320805093448345e-06, + "loss": 0.9862, + "step": 4745 + }, + { + "epoch": 0.88, + "learning_rate": 1.2310536044362292e-06, + "loss": 1.3468, + "step": 4750 + }, + { + "epoch": 0.89, + "learning_rate": 1.2300266995276237e-06, + "loss": 0.8859, + "step": 4755 + }, + { + "epoch": 0.89, + "learning_rate": 1.2289997946190183e-06, + "loss": 0.9742, + "step": 4760 + }, + { + "epoch": 0.89, + "learning_rate": 1.2279728897104126e-06, + "loss": 0.898, + "step": 4765 + }, + { + "epoch": 0.89, + "learning_rate": 1.2269459848018073e-06, + "loss": 1.799, + "step": 4770 + }, + { + "epoch": 0.89, + "learning_rate": 1.2259190798932018e-06, + "loss": 0.8833, + "step": 4775 + }, + { + "epoch": 0.89, + "learning_rate": 1.2248921749845965e-06, + "loss": 1.2739, + "step": 4780 + }, + { + "epoch": 0.89, + "learning_rate": 1.2238652700759908e-06, + "loss": 0.9587, + "step": 4785 + }, + { + "epoch": 0.89, + "learning_rate": 1.2228383651673855e-06, + "loss": 1.0981, + "step": 4790 + }, + { + "epoch": 0.89, + "learning_rate": 1.22181146025878e-06, + "loss": 1.0444, + "step": 4795 + }, + { + "epoch": 0.89, + "learning_rate": 1.2207845553501747e-06, + "loss": 1.3144, + "step": 4800 + }, + { + "epoch": 0.89, + "learning_rate": 1.219757650441569e-06, + "loss": 0.8613, + "step": 4805 + }, + { + "epoch": 0.9, + "learning_rate": 1.2187307455329636e-06, + "loss": 0.9722, + "step": 4810 + }, + { + "epoch": 0.9, + "learning_rate": 1.2177038406243581e-06, + "loss": 1.3232, + "step": 4815 + }, + { + "epoch": 0.9, + "learning_rate": 1.2166769357157526e-06, + "loss": 1.3468, + "step": 4820 + }, + { + "epoch": 0.9, + "learning_rate": 1.215650030807147e-06, + "loss": 0.9843, + "step": 4825 + }, + { + "epoch": 0.9, + "learning_rate": 1.2146231258985418e-06, + "loss": 1.0025, + "step": 4830 + }, + { + "epoch": 0.9, + "learning_rate": 1.2135962209899363e-06, + "loss": 1.192, + "step": 4835 + }, + { + "epoch": 0.9, + "learning_rate": 1.2125693160813307e-06, + "loss": 1.1494, + "step": 4840 + }, + { + "epoch": 0.9, + "learning_rate": 1.2115424111727252e-06, + "loss": 1.2217, + "step": 4845 + }, + { + "epoch": 0.9, + "learning_rate": 1.21051550626412e-06, + "loss": 1.058, + "step": 4850 + }, + { + "epoch": 0.9, + "learning_rate": 1.2094886013555144e-06, + "loss": 0.8975, + "step": 4855 + }, + { + "epoch": 0.91, + "learning_rate": 1.208461696446909e-06, + "loss": 1.0316, + "step": 4860 + }, + { + "epoch": 0.91, + "learning_rate": 1.2074347915383034e-06, + "loss": 1.3582, + "step": 4865 + }, + { + "epoch": 0.91, + "learning_rate": 1.206407886629698e-06, + "loss": 1.1331, + "step": 4870 + }, + { + "epoch": 0.91, + "learning_rate": 1.2053809817210926e-06, + "loss": 1.0301, + "step": 4875 + }, + { + "epoch": 0.91, + "learning_rate": 1.204354076812487e-06, + "loss": 0.9586, + "step": 4880 + }, + { + "epoch": 0.91, + "learning_rate": 1.2033271719038815e-06, + "loss": 0.8966, + "step": 4885 + }, + { + "epoch": 0.91, + "learning_rate": 1.2023002669952762e-06, + "loss": 1.3665, + "step": 4890 + }, + { + "epoch": 0.91, + "learning_rate": 1.2012733620866707e-06, + "loss": 1.1276, + "step": 4895 + }, + { + "epoch": 0.91, + "learning_rate": 1.2002464571780652e-06, + "loss": 1.4535, + "step": 4900 + }, + { + "epoch": 0.91, + "learning_rate": 1.1992195522694597e-06, + "loss": 0.8732, + "step": 4905 + }, + { + "epoch": 0.91, + "learning_rate": 1.1981926473608544e-06, + "loss": 1.1848, + "step": 4910 + }, + { + "epoch": 0.92, + "learning_rate": 1.1971657424522489e-06, + "loss": 0.976, + "step": 4915 + }, + { + "epoch": 0.92, + "learning_rate": 1.1961388375436434e-06, + "loss": 1.2866, + "step": 4920 + }, + { + "epoch": 0.92, + "learning_rate": 1.1951119326350378e-06, + "loss": 0.8825, + "step": 4925 + }, + { + "epoch": 0.92, + "learning_rate": 1.1940850277264325e-06, + "loss": 0.8137, + "step": 4930 + }, + { + "epoch": 0.92, + "learning_rate": 1.193058122817827e-06, + "loss": 1.1454, + "step": 4935 + }, + { + "epoch": 0.92, + "learning_rate": 1.1920312179092215e-06, + "loss": 0.9308, + "step": 4940 + }, + { + "epoch": 0.92, + "learning_rate": 1.191004313000616e-06, + "loss": 0.9336, + "step": 4945 + }, + { + "epoch": 0.92, + "learning_rate": 1.1899774080920107e-06, + "loss": 0.9893, + "step": 4950 + }, + { + "epoch": 0.92, + "learning_rate": 1.188950503183405e-06, + "loss": 1.312, + "step": 4955 + }, + { + "epoch": 0.92, + "learning_rate": 1.1879235982747997e-06, + "loss": 1.1768, + "step": 4960 + }, + { + "epoch": 0.92, + "learning_rate": 1.1868966933661941e-06, + "loss": 1.1879, + "step": 4965 + }, + { + "epoch": 0.93, + "learning_rate": 1.1858697884575888e-06, + "loss": 0.8554, + "step": 4970 + }, + { + "epoch": 0.93, + "learning_rate": 1.1848428835489831e-06, + "loss": 1.1773, + "step": 4975 + }, + { + "epoch": 0.93, + "learning_rate": 1.1838159786403778e-06, + "loss": 1.2384, + "step": 4980 + }, + { + "epoch": 0.93, + "learning_rate": 1.1827890737317723e-06, + "loss": 1.0867, + "step": 4985 + }, + { + "epoch": 0.93, + "learning_rate": 1.181762168823167e-06, + "loss": 0.9638, + "step": 4990 + }, + { + "epoch": 0.93, + "learning_rate": 1.1807352639145613e-06, + "loss": 0.9975, + "step": 4995 + }, + { + "epoch": 0.93, + "learning_rate": 1.179708359005956e-06, + "loss": 1.6983, + "step": 5000 + }, + { + "epoch": 0.93, + "eval_loss": 0.6864951848983765, + "eval_runtime": 158.2129, + "eval_samples_per_second": 7.547, + "eval_steps_per_second": 0.948, + "eval_wer": 0.9917906618778861, + "step": 5000 + }, + { + "epoch": 0.93, + "learning_rate": 1.1786814540973504e-06, + "loss": 1.3032, + "step": 5005 + }, + { + "epoch": 0.93, + "learning_rate": 1.1776545491887451e-06, + "loss": 0.8693, + "step": 5010 + }, + { + "epoch": 0.93, + "learning_rate": 1.1766276442801394e-06, + "loss": 1.4751, + "step": 5015 + }, + { + "epoch": 0.93, + "learning_rate": 1.1756007393715341e-06, + "loss": 1.2441, + "step": 5020 + }, + { + "epoch": 0.94, + "learning_rate": 1.1745738344629286e-06, + "loss": 0.9813, + "step": 5025 + }, + { + "epoch": 0.94, + "learning_rate": 1.1735469295543233e-06, + "loss": 0.9869, + "step": 5030 + }, + { + "epoch": 0.94, + "learning_rate": 1.1725200246457176e-06, + "loss": 1.0416, + "step": 5035 + }, + { + "epoch": 0.94, + "learning_rate": 1.1714931197371123e-06, + "loss": 1.0176, + "step": 5040 + }, + { + "epoch": 0.94, + "learning_rate": 1.170466214828507e-06, + "loss": 0.9778, + "step": 5045 + }, + { + "epoch": 0.94, + "learning_rate": 1.1694393099199014e-06, + "loss": 0.9427, + "step": 5050 + }, + { + "epoch": 0.94, + "learning_rate": 1.168412405011296e-06, + "loss": 1.2824, + "step": 5055 + }, + { + "epoch": 0.94, + "learning_rate": 1.1673855001026904e-06, + "loss": 1.0722, + "step": 5060 + }, + { + "epoch": 0.94, + "learning_rate": 1.1663585951940851e-06, + "loss": 0.8688, + "step": 5065 + }, + { + "epoch": 0.94, + "learning_rate": 1.1653316902854796e-06, + "loss": 0.8749, + "step": 5070 + }, + { + "epoch": 0.95, + "learning_rate": 1.164304785376874e-06, + "loss": 1.1906, + "step": 5075 + }, + { + "epoch": 0.95, + "learning_rate": 1.1632778804682686e-06, + "loss": 1.2363, + "step": 5080 + }, + { + "epoch": 0.95, + "learning_rate": 1.1622509755596633e-06, + "loss": 1.2716, + "step": 5085 + }, + { + "epoch": 0.95, + "learning_rate": 1.1612240706510578e-06, + "loss": 1.2981, + "step": 5090 + }, + { + "epoch": 0.95, + "learning_rate": 1.1601971657424522e-06, + "loss": 1.1415, + "step": 5095 + }, + { + "epoch": 0.95, + "learning_rate": 1.1591702608338467e-06, + "loss": 0.9733, + "step": 5100 + }, + { + "epoch": 0.95, + "learning_rate": 1.1581433559252414e-06, + "loss": 1.0701, + "step": 5105 + }, + { + "epoch": 0.95, + "learning_rate": 1.1571164510166357e-06, + "loss": 1.2484, + "step": 5110 + }, + { + "epoch": 0.95, + "learning_rate": 1.1560895461080304e-06, + "loss": 1.1807, + "step": 5115 + }, + { + "epoch": 0.95, + "learning_rate": 1.1550626411994249e-06, + "loss": 1.4136, + "step": 5120 + }, + { + "epoch": 0.95, + "learning_rate": 1.1540357362908196e-06, + "loss": 0.888, + "step": 5125 + }, + { + "epoch": 0.96, + "learning_rate": 1.1530088313822138e-06, + "loss": 1.2419, + "step": 5130 + }, + { + "epoch": 0.96, + "learning_rate": 1.1519819264736085e-06, + "loss": 1.2136, + "step": 5135 + }, + { + "epoch": 0.96, + "learning_rate": 1.150955021565003e-06, + "loss": 1.1895, + "step": 5140 + }, + { + "epoch": 0.96, + "learning_rate": 1.1499281166563977e-06, + "loss": 0.895, + "step": 5145 + }, + { + "epoch": 0.96, + "learning_rate": 1.148901211747792e-06, + "loss": 1.2032, + "step": 5150 + }, + { + "epoch": 0.96, + "learning_rate": 1.1478743068391867e-06, + "loss": 0.9632, + "step": 5155 + }, + { + "epoch": 0.96, + "learning_rate": 1.1468474019305812e-06, + "loss": 1.2399, + "step": 5160 + }, + { + "epoch": 0.96, + "learning_rate": 1.1458204970219759e-06, + "loss": 1.0117, + "step": 5165 + }, + { + "epoch": 0.96, + "learning_rate": 1.1447935921133701e-06, + "loss": 1.2522, + "step": 5170 + }, + { + "epoch": 0.96, + "learning_rate": 1.1437666872047648e-06, + "loss": 0.915, + "step": 5175 + }, + { + "epoch": 0.96, + "learning_rate": 1.1427397822961593e-06, + "loss": 1.1109, + "step": 5180 + }, + { + "epoch": 0.97, + "learning_rate": 1.141712877387554e-06, + "loss": 1.1202, + "step": 5185 + }, + { + "epoch": 0.97, + "learning_rate": 1.1406859724789483e-06, + "loss": 1.1674, + "step": 5190 + }, + { + "epoch": 0.97, + "learning_rate": 1.139659067570343e-06, + "loss": 1.0151, + "step": 5195 + }, + { + "epoch": 0.97, + "learning_rate": 1.1386321626617375e-06, + "loss": 1.1584, + "step": 5200 + }, + { + "epoch": 0.97, + "learning_rate": 1.1376052577531322e-06, + "loss": 1.1947, + "step": 5205 + }, + { + "epoch": 0.97, + "learning_rate": 1.1365783528445265e-06, + "loss": 1.4659, + "step": 5210 + }, + { + "epoch": 0.97, + "learning_rate": 1.1355514479359211e-06, + "loss": 1.3269, + "step": 5215 + }, + { + "epoch": 0.97, + "learning_rate": 1.1345245430273156e-06, + "loss": 0.8676, + "step": 5220 + }, + { + "epoch": 0.97, + "learning_rate": 1.1334976381187103e-06, + "loss": 1.4621, + "step": 5225 + }, + { + "epoch": 0.97, + "learning_rate": 1.1324707332101046e-06, + "loss": 1.1258, + "step": 5230 + }, + { + "epoch": 0.98, + "learning_rate": 1.1314438283014993e-06, + "loss": 0.9158, + "step": 5235 + }, + { + "epoch": 0.98, + "learning_rate": 1.1304169233928938e-06, + "loss": 1.1497, + "step": 5240 + }, + { + "epoch": 0.98, + "learning_rate": 1.1293900184842885e-06, + "loss": 1.1792, + "step": 5245 + }, + { + "epoch": 0.98, + "learning_rate": 1.1283631135756828e-06, + "loss": 0.9564, + "step": 5250 + }, + { + "epoch": 0.98, + "learning_rate": 1.1273362086670775e-06, + "loss": 1.108, + "step": 5255 + }, + { + "epoch": 0.98, + "learning_rate": 1.126309303758472e-06, + "loss": 0.9212, + "step": 5260 + }, + { + "epoch": 0.98, + "learning_rate": 1.1252823988498666e-06, + "loss": 0.9636, + "step": 5265 + }, + { + "epoch": 0.98, + "learning_rate": 1.124255493941261e-06, + "loss": 0.8813, + "step": 5270 + }, + { + "epoch": 0.98, + "learning_rate": 1.1232285890326556e-06, + "loss": 0.9706, + "step": 5275 + }, + { + "epoch": 0.98, + "learning_rate": 1.12220168412405e-06, + "loss": 1.3708, + "step": 5280 + }, + { + "epoch": 0.98, + "learning_rate": 1.1211747792154446e-06, + "loss": 1.3527, + "step": 5285 + }, + { + "epoch": 0.99, + "learning_rate": 1.120147874306839e-06, + "loss": 0.897, + "step": 5290 + }, + { + "epoch": 0.99, + "learning_rate": 1.1191209693982338e-06, + "loss": 1.1322, + "step": 5295 + }, + { + "epoch": 0.99, + "learning_rate": 1.1180940644896282e-06, + "loss": 1.3505, + "step": 5300 + }, + { + "epoch": 0.99, + "learning_rate": 1.1170671595810227e-06, + "loss": 0.815, + "step": 5305 + }, + { + "epoch": 0.99, + "learning_rate": 1.1160402546724172e-06, + "loss": 0.9654, + "step": 5310 + }, + { + "epoch": 0.99, + "learning_rate": 1.115013349763812e-06, + "loss": 0.9672, + "step": 5315 + }, + { + "epoch": 0.99, + "learning_rate": 1.1139864448552064e-06, + "loss": 1.0071, + "step": 5320 + }, + { + "epoch": 0.99, + "learning_rate": 1.1129595399466009e-06, + "loss": 0.8848, + "step": 5325 + }, + { + "epoch": 0.99, + "learning_rate": 1.1119326350379954e-06, + "loss": 0.8209, + "step": 5330 + }, + { + "epoch": 0.99, + "learning_rate": 1.11090573012939e-06, + "loss": 0.8231, + "step": 5335 + }, + { + "epoch": 0.99, + "learning_rate": 1.1098788252207845e-06, + "loss": 0.9784, + "step": 5340 + }, + { + "epoch": 1.0, + "learning_rate": 1.108851920312179e-06, + "loss": 1.1011, + "step": 5345 + }, + { + "epoch": 1.0, + "learning_rate": 1.1078250154035735e-06, + "loss": 0.8685, + "step": 5350 + }, + { + "epoch": 1.0, + "learning_rate": 1.1067981104949682e-06, + "loss": 1.1179, + "step": 5355 + }, + { + "epoch": 1.0, + "learning_rate": 1.1057712055863627e-06, + "loss": 0.9418, + "step": 5360 + }, + { + "epoch": 1.0, + "learning_rate": 1.1047443006777572e-06, + "loss": 0.8272, + "step": 5365 + }, + { + "epoch": 1.0, + "learning_rate": 1.1037173957691517e-06, + "loss": 1.1035, + "step": 5370 + }, + { + "epoch": 1.0, + "learning_rate": 1.1026904908605464e-06, + "loss": 1.1308, + "step": 5375 + }, + { + "epoch": 1.0, + "learning_rate": 1.1016635859519409e-06, + "loss": 1.3084, + "step": 5380 + }, + { + "epoch": 1.0, + "learning_rate": 1.1006366810433353e-06, + "loss": 1.1212, + "step": 5385 + }, + { + "epoch": 1.0, + "learning_rate": 1.0996097761347298e-06, + "loss": 1.1658, + "step": 5390 + }, + { + "epoch": 1.0, + "learning_rate": 1.0985828712261245e-06, + "loss": 1.0412, + "step": 5395 + }, + { + "epoch": 1.01, + "learning_rate": 1.097555966317519e-06, + "loss": 0.9328, + "step": 5400 + }, + { + "epoch": 1.01, + "learning_rate": 1.0965290614089135e-06, + "loss": 1.2895, + "step": 5405 + }, + { + "epoch": 1.01, + "learning_rate": 1.095502156500308e-06, + "loss": 0.865, + "step": 5410 + }, + { + "epoch": 1.01, + "learning_rate": 1.0944752515917027e-06, + "loss": 0.8867, + "step": 5415 + }, + { + "epoch": 1.01, + "learning_rate": 1.093448346683097e-06, + "loss": 1.02, + "step": 5420 + }, + { + "epoch": 1.01, + "learning_rate": 1.0924214417744916e-06, + "loss": 1.03, + "step": 5425 + }, + { + "epoch": 1.01, + "learning_rate": 1.0913945368658861e-06, + "loss": 1.2617, + "step": 5430 + }, + { + "epoch": 1.01, + "learning_rate": 1.0903676319572808e-06, + "loss": 1.2242, + "step": 5435 + }, + { + "epoch": 1.01, + "learning_rate": 1.089340727048675e-06, + "loss": 0.9322, + "step": 5440 + }, + { + "epoch": 1.01, + "learning_rate": 1.0883138221400698e-06, + "loss": 1.1522, + "step": 5445 + }, + { + "epoch": 1.02, + "learning_rate": 1.0872869172314643e-06, + "loss": 1.1224, + "step": 5450 + }, + { + "epoch": 1.02, + "learning_rate": 1.086260012322859e-06, + "loss": 1.2487, + "step": 5455 + }, + { + "epoch": 1.02, + "learning_rate": 1.0852331074142532e-06, + "loss": 0.9581, + "step": 5460 + }, + { + "epoch": 1.02, + "learning_rate": 1.084206202505648e-06, + "loss": 1.442, + "step": 5465 + }, + { + "epoch": 1.02, + "learning_rate": 1.0831792975970424e-06, + "loss": 1.3162, + "step": 5470 + }, + { + "epoch": 1.02, + "learning_rate": 1.0821523926884371e-06, + "loss": 0.9452, + "step": 5475 + }, + { + "epoch": 1.02, + "learning_rate": 1.0811254877798314e-06, + "loss": 0.8652, + "step": 5480 + }, + { + "epoch": 1.02, + "learning_rate": 1.080098582871226e-06, + "loss": 1.0966, + "step": 5485 + }, + { + "epoch": 1.02, + "learning_rate": 1.0790716779626206e-06, + "loss": 0.8736, + "step": 5490 + }, + { + "epoch": 1.02, + "learning_rate": 1.0780447730540153e-06, + "loss": 0.8189, + "step": 5495 + }, + { + "epoch": 1.02, + "learning_rate": 1.0770178681454096e-06, + "loss": 1.3183, + "step": 5500 + }, + { + "epoch": 1.02, + "eval_loss": 0.657252311706543, + "eval_runtime": 155.1549, + "eval_samples_per_second": 7.696, + "eval_steps_per_second": 0.967, + "eval_wer": 0.9889687018984095, + "step": 5500 + }, + { + "epoch": 1.03, + "learning_rate": 1.0759909632368042e-06, + "loss": 1.0584, + "step": 5505 + }, + { + "epoch": 1.03, + "learning_rate": 1.0749640583281987e-06, + "loss": 1.2603, + "step": 5510 + }, + { + "epoch": 1.03, + "learning_rate": 1.0739371534195934e-06, + "loss": 1.2782, + "step": 5515 + }, + { + "epoch": 1.03, + "learning_rate": 1.0729102485109877e-06, + "loss": 0.9035, + "step": 5520 + }, + { + "epoch": 1.03, + "learning_rate": 1.0718833436023824e-06, + "loss": 0.8609, + "step": 5525 + }, + { + "epoch": 1.03, + "learning_rate": 1.0708564386937769e-06, + "loss": 1.2478, + "step": 5530 + }, + { + "epoch": 1.03, + "learning_rate": 1.0698295337851716e-06, + "loss": 0.9603, + "step": 5535 + }, + { + "epoch": 1.03, + "learning_rate": 1.0688026288765659e-06, + "loss": 0.8891, + "step": 5540 + }, + { + "epoch": 1.03, + "learning_rate": 1.0677757239679606e-06, + "loss": 1.302, + "step": 5545 + }, + { + "epoch": 1.03, + "learning_rate": 1.066748819059355e-06, + "loss": 1.0154, + "step": 5550 + }, + { + "epoch": 1.03, + "learning_rate": 1.0657219141507497e-06, + "loss": 1.2031, + "step": 5555 + }, + { + "epoch": 1.04, + "learning_rate": 1.064695009242144e-06, + "loss": 1.3591, + "step": 5560 + }, + { + "epoch": 1.04, + "learning_rate": 1.0636681043335387e-06, + "loss": 1.8304, + "step": 5565 + }, + { + "epoch": 1.04, + "learning_rate": 1.0626411994249332e-06, + "loss": 0.8764, + "step": 5570 + }, + { + "epoch": 1.04, + "learning_rate": 1.0616142945163277e-06, + "loss": 0.8704, + "step": 5575 + }, + { + "epoch": 1.04, + "learning_rate": 1.0605873896077222e-06, + "loss": 0.9308, + "step": 5580 + }, + { + "epoch": 1.04, + "learning_rate": 1.0595604846991169e-06, + "loss": 0.8924, + "step": 5585 + }, + { + "epoch": 1.04, + "learning_rate": 1.0585335797905113e-06, + "loss": 0.8275, + "step": 5590 + }, + { + "epoch": 1.04, + "learning_rate": 1.0575066748819058e-06, + "loss": 0.9068, + "step": 5595 + }, + { + "epoch": 1.04, + "learning_rate": 1.0564797699733003e-06, + "loss": 1.1158, + "step": 5600 + }, + { + "epoch": 1.04, + "learning_rate": 1.055452865064695e-06, + "loss": 0.8869, + "step": 5605 + }, + { + "epoch": 1.04, + "learning_rate": 1.0544259601560895e-06, + "loss": 0.9003, + "step": 5610 + }, + { + "epoch": 1.05, + "learning_rate": 1.053399055247484e-06, + "loss": 1.0639, + "step": 5615 + }, + { + "epoch": 1.05, + "learning_rate": 1.0523721503388785e-06, + "loss": 1.3936, + "step": 5620 + }, + { + "epoch": 1.05, + "learning_rate": 1.0513452454302732e-06, + "loss": 1.2128, + "step": 5625 + }, + { + "epoch": 1.05, + "learning_rate": 1.0503183405216676e-06, + "loss": 1.1496, + "step": 5630 + }, + { + "epoch": 1.05, + "learning_rate": 1.0492914356130621e-06, + "loss": 1.1112, + "step": 5635 + }, + { + "epoch": 1.05, + "learning_rate": 1.0482645307044566e-06, + "loss": 1.406, + "step": 5640 + }, + { + "epoch": 1.05, + "learning_rate": 1.0472376257958513e-06, + "loss": 0.9241, + "step": 5645 + }, + { + "epoch": 1.05, + "learning_rate": 1.0462107208872458e-06, + "loss": 0.9112, + "step": 5650 + }, + { + "epoch": 1.05, + "learning_rate": 1.0451838159786403e-06, + "loss": 1.1099, + "step": 5655 + }, + { + "epoch": 1.05, + "learning_rate": 1.0441569110700348e-06, + "loss": 1.0678, + "step": 5660 + }, + { + "epoch": 1.06, + "learning_rate": 1.0431300061614295e-06, + "loss": 1.6929, + "step": 5665 + }, + { + "epoch": 1.06, + "learning_rate": 1.042103101252824e-06, + "loss": 0.8691, + "step": 5670 + }, + { + "epoch": 1.06, + "learning_rate": 1.0410761963442184e-06, + "loss": 0.7781, + "step": 5675 + }, + { + "epoch": 1.06, + "learning_rate": 1.040049291435613e-06, + "loss": 0.7718, + "step": 5680 + }, + { + "epoch": 1.06, + "learning_rate": 1.0390223865270076e-06, + "loss": 0.8345, + "step": 5685 + }, + { + "epoch": 1.06, + "learning_rate": 1.037995481618402e-06, + "loss": 0.8584, + "step": 5690 + }, + { + "epoch": 1.06, + "learning_rate": 1.0369685767097966e-06, + "loss": 0.8594, + "step": 5695 + }, + { + "epoch": 1.06, + "learning_rate": 1.035941671801191e-06, + "loss": 1.1204, + "step": 5700 + }, + { + "epoch": 1.06, + "learning_rate": 1.0349147668925858e-06, + "loss": 1.0265, + "step": 5705 + }, + { + "epoch": 1.06, + "learning_rate": 1.03388786198398e-06, + "loss": 0.7591, + "step": 5710 + }, + { + "epoch": 1.06, + "learning_rate": 1.0328609570753747e-06, + "loss": 0.8985, + "step": 5715 + }, + { + "epoch": 1.07, + "learning_rate": 1.0318340521667692e-06, + "loss": 1.3364, + "step": 5720 + }, + { + "epoch": 1.07, + "learning_rate": 1.030807147258164e-06, + "loss": 0.89, + "step": 5725 + }, + { + "epoch": 1.07, + "learning_rate": 1.0297802423495582e-06, + "loss": 1.0093, + "step": 5730 + }, + { + "epoch": 1.07, + "learning_rate": 1.0287533374409529e-06, + "loss": 0.7526, + "step": 5735 + }, + { + "epoch": 1.07, + "learning_rate": 1.0277264325323474e-06, + "loss": 0.8598, + "step": 5740 + }, + { + "epoch": 1.07, + "learning_rate": 1.026699527623742e-06, + "loss": 0.8158, + "step": 5745 + }, + { + "epoch": 1.07, + "learning_rate": 1.0256726227151363e-06, + "loss": 0.9379, + "step": 5750 + }, + { + "epoch": 1.07, + "learning_rate": 1.024645717806531e-06, + "loss": 1.0578, + "step": 5755 + }, + { + "epoch": 1.07, + "learning_rate": 1.0236188128979255e-06, + "loss": 0.9005, + "step": 5760 + }, + { + "epoch": 1.07, + "learning_rate": 1.0225919079893202e-06, + "loss": 0.7995, + "step": 5765 + }, + { + "epoch": 1.07, + "learning_rate": 1.0215650030807145e-06, + "loss": 1.4633, + "step": 5770 + }, + { + "epoch": 1.08, + "learning_rate": 1.0205380981721092e-06, + "loss": 0.9068, + "step": 5775 + }, + { + "epoch": 1.08, + "learning_rate": 1.0195111932635037e-06, + "loss": 1.0527, + "step": 5780 + }, + { + "epoch": 1.08, + "learning_rate": 1.0184842883548984e-06, + "loss": 1.186, + "step": 5785 + }, + { + "epoch": 1.08, + "learning_rate": 1.0174573834462926e-06, + "loss": 0.8254, + "step": 5790 + }, + { + "epoch": 1.08, + "learning_rate": 1.0164304785376873e-06, + "loss": 1.1384, + "step": 5795 + }, + { + "epoch": 1.08, + "learning_rate": 1.0154035736290818e-06, + "loss": 0.9161, + "step": 5800 + }, + { + "epoch": 1.08, + "learning_rate": 1.0143766687204765e-06, + "loss": 1.0261, + "step": 5805 + }, + { + "epoch": 1.08, + "learning_rate": 1.0133497638118708e-06, + "loss": 0.8808, + "step": 5810 + }, + { + "epoch": 1.08, + "learning_rate": 1.0123228589032655e-06, + "loss": 0.9922, + "step": 5815 + }, + { + "epoch": 1.08, + "learning_rate": 1.01129595399466e-06, + "loss": 1.5194, + "step": 5820 + }, + { + "epoch": 1.08, + "learning_rate": 1.0102690490860547e-06, + "loss": 0.7695, + "step": 5825 + }, + { + "epoch": 1.09, + "learning_rate": 1.009242144177449e-06, + "loss": 1.1249, + "step": 5830 + }, + { + "epoch": 1.09, + "learning_rate": 1.0082152392688437e-06, + "loss": 0.9865, + "step": 5835 + }, + { + "epoch": 1.09, + "learning_rate": 1.0071883343602381e-06, + "loss": 1.1333, + "step": 5840 + }, + { + "epoch": 1.09, + "learning_rate": 1.0061614294516328e-06, + "loss": 0.7846, + "step": 5845 + }, + { + "epoch": 1.09, + "learning_rate": 1.005134524543027e-06, + "loss": 1.7098, + "step": 5850 + }, + { + "epoch": 1.09, + "learning_rate": 1.0041076196344218e-06, + "loss": 1.1977, + "step": 5855 + }, + { + "epoch": 1.09, + "learning_rate": 1.0030807147258163e-06, + "loss": 1.0122, + "step": 5860 + }, + { + "epoch": 1.09, + "learning_rate": 1.002053809817211e-06, + "loss": 0.926, + "step": 5865 + }, + { + "epoch": 1.09, + "learning_rate": 1.0010269049086053e-06, + "loss": 0.9618, + "step": 5870 + }, + { + "epoch": 1.09, + "learning_rate": 1e-06, + "loss": 1.3674, + "step": 5875 + }, + { + "epoch": 1.1, + "learning_rate": 9.989730950913944e-07, + "loss": 1.2644, + "step": 5880 + }, + { + "epoch": 1.1, + "learning_rate": 9.97946190182789e-07, + "loss": 0.9674, + "step": 5885 + }, + { + "epoch": 1.1, + "learning_rate": 9.969192852741836e-07, + "loss": 1.0945, + "step": 5890 + }, + { + "epoch": 1.1, + "learning_rate": 9.958923803655781e-07, + "loss": 0.7358, + "step": 5895 + }, + { + "epoch": 1.1, + "learning_rate": 9.948654754569726e-07, + "loss": 1.0663, + "step": 5900 + }, + { + "epoch": 1.1, + "learning_rate": 9.93838570548367e-07, + "loss": 1.1117, + "step": 5905 + }, + { + "epoch": 1.1, + "learning_rate": 9.928116656397618e-07, + "loss": 0.8097, + "step": 5910 + }, + { + "epoch": 1.1, + "learning_rate": 9.917847607311563e-07, + "loss": 0.9344, + "step": 5915 + }, + { + "epoch": 1.1, + "learning_rate": 9.907578558225507e-07, + "loss": 0.9088, + "step": 5920 + }, + { + "epoch": 1.1, + "learning_rate": 9.897309509139452e-07, + "loss": 0.7678, + "step": 5925 + }, + { + "epoch": 1.1, + "learning_rate": 9.8870404600534e-07, + "loss": 0.8153, + "step": 5930 + }, + { + "epoch": 1.11, + "learning_rate": 9.876771410967344e-07, + "loss": 1.0027, + "step": 5935 + }, + { + "epoch": 1.11, + "learning_rate": 9.86650236188129e-07, + "loss": 0.8837, + "step": 5940 + }, + { + "epoch": 1.11, + "learning_rate": 9.856233312795234e-07, + "loss": 0.837, + "step": 5945 + }, + { + "epoch": 1.11, + "learning_rate": 9.84596426370918e-07, + "loss": 1.0137, + "step": 5950 + }, + { + "epoch": 1.11, + "learning_rate": 9.835695214623126e-07, + "loss": 1.3639, + "step": 5955 + }, + { + "epoch": 1.11, + "learning_rate": 9.82542616553707e-07, + "loss": 1.2383, + "step": 5960 + }, + { + "epoch": 1.11, + "learning_rate": 9.815157116451015e-07, + "loss": 0.8519, + "step": 5965 + }, + { + "epoch": 1.11, + "learning_rate": 9.804888067364962e-07, + "loss": 0.8987, + "step": 5970 + }, + { + "epoch": 1.11, + "learning_rate": 9.794619018278907e-07, + "loss": 0.7677, + "step": 5975 + }, + { + "epoch": 1.11, + "learning_rate": 9.784349969192852e-07, + "loss": 0.7758, + "step": 5980 + }, + { + "epoch": 1.11, + "learning_rate": 9.774080920106797e-07, + "loss": 0.7488, + "step": 5985 + }, + { + "epoch": 1.12, + "learning_rate": 9.763811871020744e-07, + "loss": 1.3031, + "step": 5990 + }, + { + "epoch": 1.12, + "learning_rate": 9.753542821934689e-07, + "loss": 0.9354, + "step": 5995 + }, + { + "epoch": 1.12, + "learning_rate": 9.743273772848634e-07, + "loss": 0.8463, + "step": 6000 + }, + { + "epoch": 1.12, + "eval_loss": 0.6284204125404358, + "eval_runtime": 159.2114, + "eval_samples_per_second": 7.499, + "eval_steps_per_second": 0.942, + "eval_wer": 0.9790918419702411, + "step": 6000 + }, + { + "epoch": 1.12, + "learning_rate": 9.733004723762578e-07, + "loss": 1.0615, + "step": 6005 + }, + { + "epoch": 1.12, + "learning_rate": 9.722735674676525e-07, + "loss": 0.7658, + "step": 6010 + }, + { + "epoch": 1.12, + "learning_rate": 9.71246662559047e-07, + "loss": 0.7916, + "step": 6015 + }, + { + "epoch": 1.12, + "learning_rate": 9.702197576504415e-07, + "loss": 0.8727, + "step": 6020 + }, + { + "epoch": 1.12, + "learning_rate": 9.69192852741836e-07, + "loss": 1.3318, + "step": 6025 + }, + { + "epoch": 1.12, + "learning_rate": 9.681659478332305e-07, + "loss": 0.9762, + "step": 6030 + }, + { + "epoch": 1.12, + "learning_rate": 9.671390429246252e-07, + "loss": 1.13, + "step": 6035 + }, + { + "epoch": 1.12, + "learning_rate": 9.661121380160197e-07, + "loss": 0.9907, + "step": 6040 + }, + { + "epoch": 1.13, + "learning_rate": 9.650852331074141e-07, + "loss": 0.8157, + "step": 6045 + }, + { + "epoch": 1.13, + "learning_rate": 9.640583281988086e-07, + "loss": 1.3409, + "step": 6050 + }, + { + "epoch": 1.13, + "learning_rate": 9.630314232902033e-07, + "loss": 0.7981, + "step": 6055 + }, + { + "epoch": 1.13, + "learning_rate": 9.620045183815978e-07, + "loss": 1.1387, + "step": 6060 + }, + { + "epoch": 1.13, + "learning_rate": 9.609776134729923e-07, + "loss": 1.3179, + "step": 6065 + }, + { + "epoch": 1.13, + "learning_rate": 9.599507085643868e-07, + "loss": 1.3169, + "step": 6070 + }, + { + "epoch": 1.13, + "learning_rate": 9.589238036557815e-07, + "loss": 0.859, + "step": 6075 + }, + { + "epoch": 1.13, + "learning_rate": 9.57896898747176e-07, + "loss": 0.8268, + "step": 6080 + }, + { + "epoch": 1.13, + "learning_rate": 9.568699938385704e-07, + "loss": 0.8662, + "step": 6085 + }, + { + "epoch": 1.13, + "learning_rate": 9.55843088929965e-07, + "loss": 1.1457, + "step": 6090 + }, + { + "epoch": 1.14, + "learning_rate": 9.548161840213596e-07, + "loss": 0.884, + "step": 6095 + }, + { + "epoch": 1.14, + "learning_rate": 9.537892791127541e-07, + "loss": 1.0815, + "step": 6100 + }, + { + "epoch": 1.14, + "learning_rate": 9.527623742041486e-07, + "loss": 0.8797, + "step": 6105 + }, + { + "epoch": 1.14, + "learning_rate": 9.517354692955432e-07, + "loss": 0.9832, + "step": 6110 + }, + { + "epoch": 1.14, + "learning_rate": 9.507085643869377e-07, + "loss": 1.0398, + "step": 6115 + }, + { + "epoch": 1.14, + "learning_rate": 9.496816594783323e-07, + "loss": 0.9358, + "step": 6120 + }, + { + "epoch": 1.14, + "learning_rate": 9.486547545697267e-07, + "loss": 0.7413, + "step": 6125 + }, + { + "epoch": 1.14, + "learning_rate": 9.476278496611213e-07, + "loss": 0.8723, + "step": 6130 + }, + { + "epoch": 1.14, + "learning_rate": 9.466009447525158e-07, + "loss": 0.8005, + "step": 6135 + }, + { + "epoch": 1.14, + "learning_rate": 9.455740398439104e-07, + "loss": 1.2658, + "step": 6140 + }, + { + "epoch": 1.14, + "learning_rate": 9.445471349353049e-07, + "loss": 0.7385, + "step": 6145 + }, + { + "epoch": 1.15, + "learning_rate": 9.435202300266995e-07, + "loss": 1.0049, + "step": 6150 + }, + { + "epoch": 1.15, + "learning_rate": 9.42493325118094e-07, + "loss": 0.9273, + "step": 6155 + }, + { + "epoch": 1.15, + "learning_rate": 9.414664202094886e-07, + "loss": 0.8961, + "step": 6160 + }, + { + "epoch": 1.15, + "learning_rate": 9.404395153008831e-07, + "loss": 0.9023, + "step": 6165 + }, + { + "epoch": 1.15, + "learning_rate": 9.394126103922776e-07, + "loss": 0.9846, + "step": 6170 + }, + { + "epoch": 1.15, + "learning_rate": 9.383857054836721e-07, + "loss": 0.8104, + "step": 6175 + }, + { + "epoch": 1.15, + "learning_rate": 9.373588005750666e-07, + "loss": 1.1124, + "step": 6180 + }, + { + "epoch": 1.15, + "learning_rate": 9.363318956664612e-07, + "loss": 0.9646, + "step": 6185 + }, + { + "epoch": 1.15, + "learning_rate": 9.353049907578557e-07, + "loss": 1.0231, + "step": 6190 + }, + { + "epoch": 1.15, + "learning_rate": 9.342780858492503e-07, + "loss": 1.2962, + "step": 6195 + }, + { + "epoch": 1.15, + "learning_rate": 9.332511809406448e-07, + "loss": 0.8414, + "step": 6200 + }, + { + "epoch": 1.16, + "learning_rate": 9.322242760320394e-07, + "loss": 0.7878, + "step": 6205 + }, + { + "epoch": 1.16, + "learning_rate": 9.311973711234338e-07, + "loss": 0.944, + "step": 6210 + }, + { + "epoch": 1.16, + "learning_rate": 9.301704662148284e-07, + "loss": 0.942, + "step": 6215 + }, + { + "epoch": 1.16, + "learning_rate": 9.291435613062229e-07, + "loss": 1.3707, + "step": 6220 + }, + { + "epoch": 1.16, + "learning_rate": 9.281166563976175e-07, + "loss": 0.8415, + "step": 6225 + }, + { + "epoch": 1.16, + "learning_rate": 9.27089751489012e-07, + "loss": 0.8805, + "step": 6230 + }, + { + "epoch": 1.16, + "learning_rate": 9.260628465804066e-07, + "loss": 0.891, + "step": 6235 + }, + { + "epoch": 1.16, + "learning_rate": 9.250359416718011e-07, + "loss": 0.7415, + "step": 6240 + }, + { + "epoch": 1.16, + "learning_rate": 9.240090367631957e-07, + "loss": 0.8968, + "step": 6245 + }, + { + "epoch": 1.16, + "learning_rate": 9.229821318545901e-07, + "loss": 0.7583, + "step": 6250 + }, + { + "epoch": 1.17, + "learning_rate": 9.219552269459847e-07, + "loss": 0.7122, + "step": 6255 + }, + { + "epoch": 1.17, + "learning_rate": 9.209283220373792e-07, + "loss": 1.2121, + "step": 6260 + }, + { + "epoch": 1.17, + "learning_rate": 9.199014171287738e-07, + "loss": 1.0367, + "step": 6265 + }, + { + "epoch": 1.17, + "learning_rate": 9.188745122201683e-07, + "loss": 0.7003, + "step": 6270 + }, + { + "epoch": 1.17, + "learning_rate": 9.178476073115629e-07, + "loss": 1.0541, + "step": 6275 + }, + { + "epoch": 1.17, + "learning_rate": 9.168207024029574e-07, + "loss": 0.9233, + "step": 6280 + }, + { + "epoch": 1.17, + "learning_rate": 9.15793797494352e-07, + "loss": 1.0809, + "step": 6285 + }, + { + "epoch": 1.17, + "learning_rate": 9.147668925857465e-07, + "loss": 0.7956, + "step": 6290 + }, + { + "epoch": 1.17, + "learning_rate": 9.137399876771411e-07, + "loss": 0.9461, + "step": 6295 + }, + { + "epoch": 1.17, + "learning_rate": 9.127130827685356e-07, + "loss": 1.3418, + "step": 6300 + }, + { + "epoch": 1.17, + "learning_rate": 9.116861778599302e-07, + "loss": 0.785, + "step": 6305 + }, + { + "epoch": 1.18, + "learning_rate": 9.106592729513247e-07, + "loss": 0.8314, + "step": 6310 + }, + { + "epoch": 1.18, + "learning_rate": 9.096323680427193e-07, + "loss": 0.8523, + "step": 6315 + }, + { + "epoch": 1.18, + "learning_rate": 9.086054631341138e-07, + "loss": 1.278, + "step": 6320 + }, + { + "epoch": 1.18, + "learning_rate": 9.075785582255084e-07, + "loss": 1.2236, + "step": 6325 + }, + { + "epoch": 1.18, + "learning_rate": 9.065516533169029e-07, + "loss": 0.9903, + "step": 6330 + }, + { + "epoch": 1.18, + "learning_rate": 9.055247484082975e-07, + "loss": 1.452, + "step": 6335 + }, + { + "epoch": 1.18, + "learning_rate": 9.044978434996919e-07, + "loss": 1.2451, + "step": 6340 + }, + { + "epoch": 1.18, + "learning_rate": 9.034709385910864e-07, + "loss": 1.02, + "step": 6345 + }, + { + "epoch": 1.18, + "learning_rate": 9.02444033682481e-07, + "loss": 1.0055, + "step": 6350 + }, + { + "epoch": 1.18, + "learning_rate": 9.014171287738755e-07, + "loss": 0.8727, + "step": 6355 + }, + { + "epoch": 1.18, + "learning_rate": 9.003902238652701e-07, + "loss": 0.8138, + "step": 6360 + }, + { + "epoch": 1.19, + "learning_rate": 8.993633189566646e-07, + "loss": 0.8879, + "step": 6365 + }, + { + "epoch": 1.19, + "learning_rate": 8.983364140480592e-07, + "loss": 1.0248, + "step": 6370 + }, + { + "epoch": 1.19, + "learning_rate": 8.973095091394536e-07, + "loss": 0.8572, + "step": 6375 + }, + { + "epoch": 1.19, + "learning_rate": 8.962826042308482e-07, + "loss": 0.7173, + "step": 6380 + }, + { + "epoch": 1.19, + "learning_rate": 8.952556993222427e-07, + "loss": 0.8795, + "step": 6385 + }, + { + "epoch": 1.19, + "learning_rate": 8.942287944136373e-07, + "loss": 1.6804, + "step": 6390 + }, + { + "epoch": 1.19, + "learning_rate": 8.932018895050318e-07, + "loss": 1.1026, + "step": 6395 + }, + { + "epoch": 1.19, + "learning_rate": 8.921749845964264e-07, + "loss": 0.8339, + "step": 6400 + }, + { + "epoch": 1.19, + "learning_rate": 8.911480796878209e-07, + "loss": 1.3447, + "step": 6405 + }, + { + "epoch": 1.19, + "learning_rate": 8.901211747792155e-07, + "loss": 0.9072, + "step": 6410 + }, + { + "epoch": 1.19, + "learning_rate": 8.8909426987061e-07, + "loss": 1.6232, + "step": 6415 + }, + { + "epoch": 1.2, + "learning_rate": 8.880673649620045e-07, + "loss": 0.7329, + "step": 6420 + }, + { + "epoch": 1.2, + "learning_rate": 8.87040460053399e-07, + "loss": 0.8971, + "step": 6425 + }, + { + "epoch": 1.2, + "learning_rate": 8.860135551447936e-07, + "loss": 0.8014, + "step": 6430 + }, + { + "epoch": 1.2, + "learning_rate": 8.849866502361881e-07, + "loss": 0.902, + "step": 6435 + }, + { + "epoch": 1.2, + "learning_rate": 8.839597453275827e-07, + "loss": 0.9787, + "step": 6440 + }, + { + "epoch": 1.2, + "learning_rate": 8.829328404189772e-07, + "loss": 1.3367, + "step": 6445 + }, + { + "epoch": 1.2, + "learning_rate": 8.819059355103718e-07, + "loss": 1.0189, + "step": 6450 + }, + { + "epoch": 1.2, + "learning_rate": 8.808790306017663e-07, + "loss": 0.8373, + "step": 6455 + }, + { + "epoch": 1.2, + "learning_rate": 8.798521256931608e-07, + "loss": 0.8355, + "step": 6460 + }, + { + "epoch": 1.2, + "learning_rate": 8.788252207845553e-07, + "loss": 0.8937, + "step": 6465 + }, + { + "epoch": 1.21, + "learning_rate": 8.777983158759499e-07, + "loss": 1.0145, + "step": 6470 + }, + { + "epoch": 1.21, + "learning_rate": 8.767714109673444e-07, + "loss": 0.8532, + "step": 6475 + }, + { + "epoch": 1.21, + "learning_rate": 8.75744506058739e-07, + "loss": 1.2985, + "step": 6480 + }, + { + "epoch": 1.21, + "learning_rate": 8.747176011501335e-07, + "loss": 0.9596, + "step": 6485 + }, + { + "epoch": 1.21, + "learning_rate": 8.736906962415281e-07, + "loss": 1.1915, + "step": 6490 + }, + { + "epoch": 1.21, + "learning_rate": 8.726637913329226e-07, + "loss": 0.7417, + "step": 6495 + }, + { + "epoch": 1.21, + "learning_rate": 8.71636886424317e-07, + "loss": 0.8899, + "step": 6500 + }, + { + "epoch": 1.21, + "eval_loss": 0.6119966506958008, + "eval_runtime": 161.8006, + "eval_samples_per_second": 7.379, + "eval_steps_per_second": 0.927, + "eval_wer": 0.9730631092868137, + "step": 6500 + }, + { + "epoch": 1.21, + "learning_rate": 8.706099815157116e-07, + "loss": 1.0632, + "step": 6505 + }, + { + "epoch": 1.21, + "learning_rate": 8.695830766071061e-07, + "loss": 0.9989, + "step": 6510 + }, + { + "epoch": 1.21, + "learning_rate": 8.685561716985007e-07, + "loss": 1.0238, + "step": 6515 + }, + { + "epoch": 1.21, + "learning_rate": 8.675292667898952e-07, + "loss": 0.9555, + "step": 6520 + }, + { + "epoch": 1.22, + "learning_rate": 8.665023618812898e-07, + "loss": 0.9623, + "step": 6525 + }, + { + "epoch": 1.22, + "learning_rate": 8.654754569726843e-07, + "loss": 0.6852, + "step": 6530 + }, + { + "epoch": 1.22, + "learning_rate": 8.644485520640789e-07, + "loss": 0.9969, + "step": 6535 + }, + { + "epoch": 1.22, + "learning_rate": 8.634216471554734e-07, + "loss": 0.8759, + "step": 6540 + }, + { + "epoch": 1.22, + "learning_rate": 8.623947422468679e-07, + "loss": 0.972, + "step": 6545 + }, + { + "epoch": 1.22, + "learning_rate": 8.613678373382624e-07, + "loss": 0.7837, + "step": 6550 + }, + { + "epoch": 1.22, + "learning_rate": 8.60340932429657e-07, + "loss": 1.3972, + "step": 6555 + }, + { + "epoch": 1.22, + "learning_rate": 8.593140275210515e-07, + "loss": 0.9475, + "step": 6560 + }, + { + "epoch": 1.22, + "learning_rate": 8.582871226124461e-07, + "loss": 0.9438, + "step": 6565 + }, + { + "epoch": 1.22, + "learning_rate": 8.572602177038406e-07, + "loss": 0.848, + "step": 6570 + }, + { + "epoch": 1.22, + "learning_rate": 8.562333127952352e-07, + "loss": 0.9746, + "step": 6575 + }, + { + "epoch": 1.23, + "learning_rate": 8.552064078866297e-07, + "loss": 0.859, + "step": 6580 + }, + { + "epoch": 1.23, + "learning_rate": 8.541795029780242e-07, + "loss": 1.0748, + "step": 6585 + }, + { + "epoch": 1.23, + "learning_rate": 8.531525980694187e-07, + "loss": 0.8909, + "step": 6590 + }, + { + "epoch": 1.23, + "learning_rate": 8.521256931608133e-07, + "loss": 0.7974, + "step": 6595 + }, + { + "epoch": 1.23, + "learning_rate": 8.510987882522078e-07, + "loss": 0.9178, + "step": 6600 + }, + { + "epoch": 1.23, + "learning_rate": 8.500718833436024e-07, + "loss": 0.8336, + "step": 6605 + }, + { + "epoch": 1.23, + "learning_rate": 8.490449784349969e-07, + "loss": 0.9486, + "step": 6610 + }, + { + "epoch": 1.23, + "learning_rate": 8.480180735263915e-07, + "loss": 0.8703, + "step": 6615 + }, + { + "epoch": 1.23, + "learning_rate": 8.46991168617786e-07, + "loss": 1.1615, + "step": 6620 + }, + { + "epoch": 1.23, + "learning_rate": 8.459642637091806e-07, + "loss": 0.8364, + "step": 6625 + }, + { + "epoch": 1.23, + "learning_rate": 8.44937358800575e-07, + "loss": 0.9219, + "step": 6630 + }, + { + "epoch": 1.24, + "learning_rate": 8.439104538919696e-07, + "loss": 0.8983, + "step": 6635 + }, + { + "epoch": 1.24, + "learning_rate": 8.428835489833641e-07, + "loss": 1.0514, + "step": 6640 + }, + { + "epoch": 1.24, + "learning_rate": 8.418566440747586e-07, + "loss": 0.7211, + "step": 6645 + }, + { + "epoch": 1.24, + "learning_rate": 8.408297391661532e-07, + "loss": 0.9361, + "step": 6650 + }, + { + "epoch": 1.24, + "learning_rate": 8.398028342575477e-07, + "loss": 0.818, + "step": 6655 + }, + { + "epoch": 1.24, + "learning_rate": 8.387759293489423e-07, + "loss": 0.8167, + "step": 6660 + }, + { + "epoch": 1.24, + "learning_rate": 8.377490244403367e-07, + "loss": 0.9332, + "step": 6665 + }, + { + "epoch": 1.24, + "learning_rate": 8.367221195317313e-07, + "loss": 1.3069, + "step": 6670 + }, + { + "epoch": 1.24, + "learning_rate": 8.356952146231258e-07, + "loss": 0.8066, + "step": 6675 + }, + { + "epoch": 1.24, + "learning_rate": 8.346683097145204e-07, + "loss": 0.7699, + "step": 6680 + }, + { + "epoch": 1.25, + "learning_rate": 8.336414048059149e-07, + "loss": 1.1784, + "step": 6685 + }, + { + "epoch": 1.25, + "learning_rate": 8.326144998973095e-07, + "loss": 0.9819, + "step": 6690 + }, + { + "epoch": 1.25, + "learning_rate": 8.31587594988704e-07, + "loss": 0.7979, + "step": 6695 + }, + { + "epoch": 1.25, + "learning_rate": 8.305606900800986e-07, + "loss": 0.8063, + "step": 6700 + }, + { + "epoch": 1.25, + "learning_rate": 8.29533785171493e-07, + "loss": 0.7892, + "step": 6705 + }, + { + "epoch": 1.25, + "learning_rate": 8.285068802628876e-07, + "loss": 0.8912, + "step": 6710 + }, + { + "epoch": 1.25, + "learning_rate": 8.274799753542821e-07, + "loss": 0.9465, + "step": 6715 + }, + { + "epoch": 1.25, + "learning_rate": 8.264530704456767e-07, + "loss": 0.7973, + "step": 6720 + }, + { + "epoch": 1.25, + "learning_rate": 8.254261655370712e-07, + "loss": 0.7016, + "step": 6725 + }, + { + "epoch": 1.25, + "learning_rate": 8.243992606284658e-07, + "loss": 1.0314, + "step": 6730 + }, + { + "epoch": 1.25, + "learning_rate": 8.233723557198603e-07, + "loss": 0.837, + "step": 6735 + }, + { + "epoch": 1.26, + "learning_rate": 8.223454508112549e-07, + "loss": 1.0261, + "step": 6740 + }, + { + "epoch": 1.26, + "learning_rate": 8.213185459026494e-07, + "loss": 0.907, + "step": 6745 + }, + { + "epoch": 1.26, + "learning_rate": 8.20291640994044e-07, + "loss": 1.3548, + "step": 6750 + }, + { + "epoch": 1.26, + "learning_rate": 8.192647360854384e-07, + "loss": 0.6939, + "step": 6755 + }, + { + "epoch": 1.26, + "learning_rate": 8.18237831176833e-07, + "loss": 0.642, + "step": 6760 + }, + { + "epoch": 1.26, + "learning_rate": 8.172109262682275e-07, + "loss": 0.7524, + "step": 6765 + }, + { + "epoch": 1.26, + "learning_rate": 8.161840213596221e-07, + "loss": 1.3072, + "step": 6770 + }, + { + "epoch": 1.26, + "learning_rate": 8.151571164510166e-07, + "loss": 0.9227, + "step": 6775 + }, + { + "epoch": 1.26, + "learning_rate": 8.141302115424112e-07, + "loss": 1.0372, + "step": 6780 + }, + { + "epoch": 1.26, + "learning_rate": 8.131033066338057e-07, + "loss": 1.0262, + "step": 6785 + }, + { + "epoch": 1.26, + "learning_rate": 8.120764017252003e-07, + "loss": 0.7881, + "step": 6790 + }, + { + "epoch": 1.27, + "learning_rate": 8.110494968165947e-07, + "loss": 1.0526, + "step": 6795 + }, + { + "epoch": 1.27, + "learning_rate": 8.100225919079892e-07, + "loss": 1.1853, + "step": 6800 + }, + { + "epoch": 1.27, + "learning_rate": 8.089956869993838e-07, + "loss": 0.7666, + "step": 6805 + }, + { + "epoch": 1.27, + "learning_rate": 8.079687820907783e-07, + "loss": 0.8543, + "step": 6810 + }, + { + "epoch": 1.27, + "learning_rate": 8.069418771821729e-07, + "loss": 0.8792, + "step": 6815 + }, + { + "epoch": 1.27, + "learning_rate": 8.059149722735674e-07, + "loss": 0.8891, + "step": 6820 + }, + { + "epoch": 1.27, + "learning_rate": 8.04888067364962e-07, + "loss": 0.6812, + "step": 6825 + }, + { + "epoch": 1.27, + "learning_rate": 8.038611624563565e-07, + "loss": 0.9066, + "step": 6830 + }, + { + "epoch": 1.27, + "learning_rate": 8.02834257547751e-07, + "loss": 0.951, + "step": 6835 + }, + { + "epoch": 1.27, + "learning_rate": 8.018073526391455e-07, + "loss": 1.108, + "step": 6840 + }, + { + "epoch": 1.27, + "learning_rate": 8.007804477305401e-07, + "loss": 0.7586, + "step": 6845 + }, + { + "epoch": 1.28, + "learning_rate": 7.997535428219346e-07, + "loss": 0.8866, + "step": 6850 + }, + { + "epoch": 1.28, + "learning_rate": 7.987266379133292e-07, + "loss": 0.7629, + "step": 6855 + }, + { + "epoch": 1.28, + "learning_rate": 7.976997330047237e-07, + "loss": 0.8082, + "step": 6860 + }, + { + "epoch": 1.28, + "learning_rate": 7.966728280961183e-07, + "loss": 0.8103, + "step": 6865 + }, + { + "epoch": 1.28, + "learning_rate": 7.956459231875128e-07, + "loss": 0.8515, + "step": 6870 + }, + { + "epoch": 1.28, + "learning_rate": 7.946190182789073e-07, + "loss": 0.971, + "step": 6875 + }, + { + "epoch": 1.28, + "learning_rate": 7.935921133703018e-07, + "loss": 0.8346, + "step": 6880 + }, + { + "epoch": 1.28, + "learning_rate": 7.925652084616964e-07, + "loss": 0.9302, + "step": 6885 + }, + { + "epoch": 1.28, + "learning_rate": 7.915383035530909e-07, + "loss": 0.9843, + "step": 6890 + }, + { + "epoch": 1.28, + "learning_rate": 7.905113986444855e-07, + "loss": 1.0542, + "step": 6895 + }, + { + "epoch": 1.29, + "learning_rate": 7.8948449373588e-07, + "loss": 1.1789, + "step": 6900 + }, + { + "epoch": 1.29, + "learning_rate": 7.884575888272746e-07, + "loss": 0.9403, + "step": 6905 + }, + { + "epoch": 1.29, + "learning_rate": 7.874306839186691e-07, + "loss": 0.9338, + "step": 6910 + }, + { + "epoch": 1.29, + "learning_rate": 7.864037790100636e-07, + "loss": 0.8633, + "step": 6915 + }, + { + "epoch": 1.29, + "learning_rate": 7.853768741014581e-07, + "loss": 0.8621, + "step": 6920 + }, + { + "epoch": 1.29, + "learning_rate": 7.843499691928527e-07, + "loss": 0.8301, + "step": 6925 + }, + { + "epoch": 1.29, + "learning_rate": 7.833230642842472e-07, + "loss": 0.8555, + "step": 6930 + }, + { + "epoch": 1.29, + "learning_rate": 7.822961593756418e-07, + "loss": 0.8075, + "step": 6935 + }, + { + "epoch": 1.29, + "learning_rate": 7.812692544670363e-07, + "loss": 1.0482, + "step": 6940 + }, + { + "epoch": 1.29, + "learning_rate": 7.802423495584308e-07, + "loss": 1.2927, + "step": 6945 + }, + { + "epoch": 1.29, + "learning_rate": 7.792154446498254e-07, + "loss": 0.7703, + "step": 6950 + }, + { + "epoch": 1.3, + "learning_rate": 7.781885397412198e-07, + "loss": 1.0229, + "step": 6955 + }, + { + "epoch": 1.3, + "learning_rate": 7.771616348326144e-07, + "loss": 0.6933, + "step": 6960 + }, + { + "epoch": 1.3, + "learning_rate": 7.761347299240089e-07, + "loss": 0.8685, + "step": 6965 + }, + { + "epoch": 1.3, + "learning_rate": 7.751078250154035e-07, + "loss": 0.9672, + "step": 6970 + }, + { + "epoch": 1.3, + "learning_rate": 7.74080920106798e-07, + "loss": 1.1863, + "step": 6975 + }, + { + "epoch": 1.3, + "learning_rate": 7.730540151981926e-07, + "loss": 0.7385, + "step": 6980 + }, + { + "epoch": 1.3, + "learning_rate": 7.720271102895871e-07, + "loss": 0.9416, + "step": 6985 + }, + { + "epoch": 1.3, + "learning_rate": 7.710002053809817e-07, + "loss": 0.9813, + "step": 6990 + }, + { + "epoch": 1.3, + "learning_rate": 7.699733004723762e-07, + "loss": 1.1032, + "step": 6995 + }, + { + "epoch": 1.3, + "learning_rate": 7.689463955637707e-07, + "loss": 0.9412, + "step": 7000 + }, + { + "epoch": 1.3, + "eval_loss": 0.5923011898994446, + "eval_runtime": 153.2623, + "eval_samples_per_second": 7.791, + "eval_steps_per_second": 0.979, + "eval_wer": 0.952539763981529, + "step": 7000 + }, + { + "epoch": 1.3, + "learning_rate": 7.679194906551652e-07, + "loss": 0.7374, + "step": 7005 + }, + { + "epoch": 1.31, + "learning_rate": 7.668925857465598e-07, + "loss": 0.9419, + "step": 7010 + }, + { + "epoch": 1.31, + "learning_rate": 7.658656808379543e-07, + "loss": 0.8655, + "step": 7015 + }, + { + "epoch": 1.31, + "learning_rate": 7.648387759293489e-07, + "loss": 1.0748, + "step": 7020 + }, + { + "epoch": 1.31, + "learning_rate": 7.638118710207434e-07, + "loss": 0.9836, + "step": 7025 + }, + { + "epoch": 1.31, + "learning_rate": 7.62784966112138e-07, + "loss": 0.7297, + "step": 7030 + }, + { + "epoch": 1.31, + "learning_rate": 7.617580612035325e-07, + "loss": 1.3443, + "step": 7035 + }, + { + "epoch": 1.31, + "learning_rate": 7.60731156294927e-07, + "loss": 0.894, + "step": 7040 + }, + { + "epoch": 1.31, + "learning_rate": 7.597042513863215e-07, + "loss": 1.1128, + "step": 7045 + }, + { + "epoch": 1.31, + "learning_rate": 7.586773464777161e-07, + "loss": 0.7503, + "step": 7050 + }, + { + "epoch": 1.31, + "learning_rate": 7.576504415691106e-07, + "loss": 0.8865, + "step": 7055 + }, + { + "epoch": 1.31, + "learning_rate": 7.566235366605052e-07, + "loss": 0.8906, + "step": 7060 + }, + { + "epoch": 1.32, + "learning_rate": 7.555966317518997e-07, + "loss": 0.8262, + "step": 7065 + }, + { + "epoch": 1.32, + "learning_rate": 7.545697268432943e-07, + "loss": 0.9334, + "step": 7070 + }, + { + "epoch": 1.32, + "learning_rate": 7.535428219346888e-07, + "loss": 0.7228, + "step": 7075 + }, + { + "epoch": 1.32, + "learning_rate": 7.525159170260834e-07, + "loss": 0.6956, + "step": 7080 + }, + { + "epoch": 1.32, + "learning_rate": 7.514890121174778e-07, + "loss": 0.8124, + "step": 7085 + }, + { + "epoch": 1.32, + "learning_rate": 7.504621072088724e-07, + "loss": 1.0577, + "step": 7090 + }, + { + "epoch": 1.32, + "learning_rate": 7.494352023002669e-07, + "loss": 1.0066, + "step": 7095 + }, + { + "epoch": 1.32, + "learning_rate": 7.484082973916614e-07, + "loss": 1.1995, + "step": 7100 + }, + { + "epoch": 1.32, + "learning_rate": 7.47381392483056e-07, + "loss": 0.7794, + "step": 7105 + }, + { + "epoch": 1.32, + "learning_rate": 7.463544875744505e-07, + "loss": 0.9095, + "step": 7110 + }, + { + "epoch": 1.33, + "learning_rate": 7.453275826658451e-07, + "loss": 0.8585, + "step": 7115 + }, + { + "epoch": 1.33, + "learning_rate": 7.443006777572395e-07, + "loss": 1.0227, + "step": 7120 + }, + { + "epoch": 1.33, + "learning_rate": 7.432737728486341e-07, + "loss": 0.7072, + "step": 7125 + }, + { + "epoch": 1.33, + "learning_rate": 7.422468679400286e-07, + "loss": 0.765, + "step": 7130 + }, + { + "epoch": 1.33, + "learning_rate": 7.412199630314233e-07, + "loss": 0.7863, + "step": 7135 + }, + { + "epoch": 1.33, + "learning_rate": 7.401930581228178e-07, + "loss": 0.7918, + "step": 7140 + }, + { + "epoch": 1.33, + "learning_rate": 7.391661532142124e-07, + "loss": 1.0758, + "step": 7145 + }, + { + "epoch": 1.33, + "learning_rate": 7.381392483056069e-07, + "loss": 0.7628, + "step": 7150 + }, + { + "epoch": 1.33, + "learning_rate": 7.371123433970015e-07, + "loss": 0.9962, + "step": 7155 + }, + { + "epoch": 1.33, + "learning_rate": 7.36085438488396e-07, + "loss": 1.0403, + "step": 7160 + }, + { + "epoch": 1.33, + "learning_rate": 7.350585335797905e-07, + "loss": 0.775, + "step": 7165 + }, + { + "epoch": 1.34, + "learning_rate": 7.34031628671185e-07, + "loss": 0.8383, + "step": 7170 + }, + { + "epoch": 1.34, + "learning_rate": 7.330047237625796e-07, + "loss": 0.8059, + "step": 7175 + }, + { + "epoch": 1.34, + "learning_rate": 7.319778188539741e-07, + "loss": 0.715, + "step": 7180 + }, + { + "epoch": 1.34, + "learning_rate": 7.309509139453687e-07, + "loss": 0.7442, + "step": 7185 + }, + { + "epoch": 1.34, + "learning_rate": 7.299240090367632e-07, + "loss": 0.7807, + "step": 7190 + }, + { + "epoch": 1.34, + "learning_rate": 7.288971041281578e-07, + "loss": 0.8463, + "step": 7195 + }, + { + "epoch": 1.34, + "learning_rate": 7.278701992195523e-07, + "loss": 0.8495, + "step": 7200 + }, + { + "epoch": 1.34, + "learning_rate": 7.268432943109469e-07, + "loss": 0.8013, + "step": 7205 + }, + { + "epoch": 1.34, + "learning_rate": 7.258163894023413e-07, + "loss": 1.0864, + "step": 7210 + }, + { + "epoch": 1.34, + "learning_rate": 7.247894844937359e-07, + "loss": 1.1016, + "step": 7215 + }, + { + "epoch": 1.34, + "learning_rate": 7.237625795851304e-07, + "loss": 0.917, + "step": 7220 + }, + { + "epoch": 1.35, + "learning_rate": 7.22735674676525e-07, + "loss": 0.7113, + "step": 7225 + }, + { + "epoch": 1.35, + "learning_rate": 7.217087697679195e-07, + "loss": 1.215, + "step": 7230 + }, + { + "epoch": 1.35, + "learning_rate": 7.206818648593141e-07, + "loss": 0.9089, + "step": 7235 + }, + { + "epoch": 1.35, + "learning_rate": 7.196549599507086e-07, + "loss": 1.0031, + "step": 7240 + }, + { + "epoch": 1.35, + "learning_rate": 7.186280550421032e-07, + "loss": 0.9265, + "step": 7245 + }, + { + "epoch": 1.35, + "learning_rate": 7.176011501334976e-07, + "loss": 0.7035, + "step": 7250 + }, + { + "epoch": 1.35, + "learning_rate": 7.165742452248922e-07, + "loss": 0.8049, + "step": 7255 + }, + { + "epoch": 1.35, + "learning_rate": 7.155473403162867e-07, + "loss": 0.87, + "step": 7260 + }, + { + "epoch": 1.35, + "learning_rate": 7.145204354076812e-07, + "loss": 0.9135, + "step": 7265 + }, + { + "epoch": 1.35, + "learning_rate": 7.134935304990758e-07, + "loss": 0.9293, + "step": 7270 + }, + { + "epoch": 1.36, + "learning_rate": 7.124666255904703e-07, + "loss": 0.8794, + "step": 7275 + }, + { + "epoch": 1.36, + "learning_rate": 7.114397206818649e-07, + "loss": 0.7732, + "step": 7280 + }, + { + "epoch": 1.36, + "learning_rate": 7.104128157732594e-07, + "loss": 0.784, + "step": 7285 + }, + { + "epoch": 1.36, + "learning_rate": 7.093859108646539e-07, + "loss": 1.573, + "step": 7290 + }, + { + "epoch": 1.36, + "learning_rate": 7.083590059560484e-07, + "loss": 0.956, + "step": 7295 + }, + { + "epoch": 1.36, + "learning_rate": 7.07332101047443e-07, + "loss": 1.0869, + "step": 7300 + }, + { + "epoch": 1.36, + "learning_rate": 7.063051961388375e-07, + "loss": 0.8412, + "step": 7305 + }, + { + "epoch": 1.36, + "learning_rate": 7.052782912302321e-07, + "loss": 1.2126, + "step": 7310 + }, + { + "epoch": 1.36, + "learning_rate": 7.042513863216266e-07, + "loss": 0.8477, + "step": 7315 + }, + { + "epoch": 1.36, + "learning_rate": 7.032244814130212e-07, + "loss": 1.3195, + "step": 7320 + }, + { + "epoch": 1.36, + "learning_rate": 7.021975765044157e-07, + "loss": 0.7801, + "step": 7325 + }, + { + "epoch": 1.37, + "learning_rate": 7.011706715958103e-07, + "loss": 0.8952, + "step": 7330 + }, + { + "epoch": 1.37, + "learning_rate": 7.001437666872047e-07, + "loss": 0.9682, + "step": 7335 + }, + { + "epoch": 1.37, + "learning_rate": 6.991168617785993e-07, + "loss": 0.7288, + "step": 7340 + }, + { + "epoch": 1.37, + "learning_rate": 6.980899568699938e-07, + "loss": 0.855, + "step": 7345 + }, + { + "epoch": 1.37, + "learning_rate": 6.970630519613884e-07, + "loss": 0.9398, + "step": 7350 + }, + { + "epoch": 1.37, + "learning_rate": 6.960361470527829e-07, + "loss": 0.9362, + "step": 7355 + }, + { + "epoch": 1.37, + "learning_rate": 6.950092421441775e-07, + "loss": 0.9882, + "step": 7360 + }, + { + "epoch": 1.37, + "learning_rate": 6.93982337235572e-07, + "loss": 1.0757, + "step": 7365 + }, + { + "epoch": 1.37, + "learning_rate": 6.929554323269666e-07, + "loss": 0.8157, + "step": 7370 + }, + { + "epoch": 1.37, + "learning_rate": 6.91928527418361e-07, + "loss": 0.8172, + "step": 7375 + }, + { + "epoch": 1.37, + "learning_rate": 6.909016225097556e-07, + "loss": 0.737, + "step": 7380 + }, + { + "epoch": 1.38, + "learning_rate": 6.898747176011501e-07, + "loss": 0.7614, + "step": 7385 + }, + { + "epoch": 1.38, + "learning_rate": 6.888478126925447e-07, + "loss": 1.1501, + "step": 7390 + }, + { + "epoch": 1.38, + "learning_rate": 6.878209077839392e-07, + "loss": 0.6488, + "step": 7395 + }, + { + "epoch": 1.38, + "learning_rate": 6.867940028753338e-07, + "loss": 1.0218, + "step": 7400 + }, + { + "epoch": 1.38, + "learning_rate": 6.857670979667283e-07, + "loss": 0.7974, + "step": 7405 + }, + { + "epoch": 1.38, + "learning_rate": 6.847401930581228e-07, + "loss": 0.9662, + "step": 7410 + }, + { + "epoch": 1.38, + "learning_rate": 6.837132881495173e-07, + "loss": 0.7973, + "step": 7415 + }, + { + "epoch": 1.38, + "learning_rate": 6.826863832409118e-07, + "loss": 1.1172, + "step": 7420 + }, + { + "epoch": 1.38, + "learning_rate": 6.816594783323064e-07, + "loss": 1.118, + "step": 7425 + }, + { + "epoch": 1.38, + "learning_rate": 6.806325734237009e-07, + "loss": 1.2301, + "step": 7430 + }, + { + "epoch": 1.38, + "learning_rate": 6.796056685150955e-07, + "loss": 1.0008, + "step": 7435 + }, + { + "epoch": 1.39, + "learning_rate": 6.7857876360649e-07, + "loss": 0.9601, + "step": 7440 + }, + { + "epoch": 1.39, + "learning_rate": 6.775518586978846e-07, + "loss": 0.7135, + "step": 7445 + }, + { + "epoch": 1.39, + "learning_rate": 6.765249537892791e-07, + "loss": 0.8211, + "step": 7450 + }, + { + "epoch": 1.39, + "learning_rate": 6.754980488806736e-07, + "loss": 1.1097, + "step": 7455 + }, + { + "epoch": 1.39, + "learning_rate": 6.744711439720681e-07, + "loss": 1.0741, + "step": 7460 + }, + { + "epoch": 1.39, + "learning_rate": 6.734442390634627e-07, + "loss": 1.2393, + "step": 7465 + }, + { + "epoch": 1.39, + "learning_rate": 6.724173341548572e-07, + "loss": 0.8408, + "step": 7470 + }, + { + "epoch": 1.39, + "learning_rate": 6.713904292462518e-07, + "loss": 0.7914, + "step": 7475 + }, + { + "epoch": 1.39, + "learning_rate": 6.703635243376463e-07, + "loss": 0.7918, + "step": 7480 + }, + { + "epoch": 1.39, + "learning_rate": 6.693366194290409e-07, + "loss": 0.9031, + "step": 7485 + }, + { + "epoch": 1.4, + "learning_rate": 6.683097145204354e-07, + "loss": 0.7893, + "step": 7490 + }, + { + "epoch": 1.4, + "learning_rate": 6.6728280961183e-07, + "loss": 0.7198, + "step": 7495 + }, + { + "epoch": 1.4, + "learning_rate": 6.662559047032244e-07, + "loss": 0.8052, + "step": 7500 + }, + { + "epoch": 1.4, + "eval_loss": 0.5810225009918213, + "eval_runtime": 145.8096, + "eval_samples_per_second": 8.189, + "eval_steps_per_second": 1.029, + "eval_wer": 0.9427911749615188, + "step": 7500 + }, + { + "epoch": 1.4, + "learning_rate": 6.65228999794619e-07, + "loss": 1.2298, + "step": 7505 + }, + { + "epoch": 1.4, + "learning_rate": 6.642020948860135e-07, + "loss": 0.7371, + "step": 7510 + }, + { + "epoch": 1.4, + "learning_rate": 6.631751899774081e-07, + "loss": 1.2392, + "step": 7515 + }, + { + "epoch": 1.4, + "learning_rate": 6.621482850688026e-07, + "loss": 0.7397, + "step": 7520 + }, + { + "epoch": 1.4, + "learning_rate": 6.611213801601972e-07, + "loss": 0.8519, + "step": 7525 + }, + { + "epoch": 1.4, + "learning_rate": 6.600944752515917e-07, + "loss": 1.2469, + "step": 7530 + }, + { + "epoch": 1.4, + "learning_rate": 6.590675703429863e-07, + "loss": 0.7008, + "step": 7535 + }, + { + "epoch": 1.4, + "learning_rate": 6.580406654343807e-07, + "loss": 0.8012, + "step": 7540 + }, + { + "epoch": 1.41, + "learning_rate": 6.570137605257753e-07, + "loss": 1.1256, + "step": 7545 + }, + { + "epoch": 1.41, + "learning_rate": 6.559868556171698e-07, + "loss": 0.7622, + "step": 7550 + }, + { + "epoch": 1.41, + "learning_rate": 6.549599507085644e-07, + "loss": 0.8032, + "step": 7555 + }, + { + "epoch": 1.41, + "learning_rate": 6.539330457999589e-07, + "loss": 0.8004, + "step": 7560 + }, + { + "epoch": 1.41, + "learning_rate": 6.529061408913534e-07, + "loss": 0.7468, + "step": 7565 + }, + { + "epoch": 1.41, + "learning_rate": 6.51879235982748e-07, + "loss": 0.8619, + "step": 7570 + }, + { + "epoch": 1.41, + "learning_rate": 6.508523310741425e-07, + "loss": 0.7856, + "step": 7575 + }, + { + "epoch": 1.41, + "learning_rate": 6.49825426165537e-07, + "loss": 0.7295, + "step": 7580 + }, + { + "epoch": 1.41, + "learning_rate": 6.487985212569315e-07, + "loss": 0.9886, + "step": 7585 + }, + { + "epoch": 1.41, + "learning_rate": 6.477716163483261e-07, + "loss": 0.9888, + "step": 7590 + }, + { + "epoch": 1.41, + "learning_rate": 6.467447114397206e-07, + "loss": 0.9019, + "step": 7595 + }, + { + "epoch": 1.42, + "learning_rate": 6.457178065311152e-07, + "loss": 0.7629, + "step": 7600 + }, + { + "epoch": 1.42, + "learning_rate": 6.446909016225097e-07, + "loss": 0.8729, + "step": 7605 + }, + { + "epoch": 1.42, + "learning_rate": 6.436639967139043e-07, + "loss": 0.8466, + "step": 7610 + }, + { + "epoch": 1.42, + "learning_rate": 6.426370918052988e-07, + "loss": 0.7365, + "step": 7615 + }, + { + "epoch": 1.42, + "learning_rate": 6.416101868966933e-07, + "loss": 1.0247, + "step": 7620 + }, + { + "epoch": 1.42, + "learning_rate": 6.405832819880878e-07, + "loss": 1.0193, + "step": 7625 + }, + { + "epoch": 1.42, + "learning_rate": 6.395563770794824e-07, + "loss": 1.3307, + "step": 7630 + }, + { + "epoch": 1.42, + "learning_rate": 6.385294721708769e-07, + "loss": 0.9158, + "step": 7635 + }, + { + "epoch": 1.42, + "learning_rate": 6.375025672622715e-07, + "loss": 1.2267, + "step": 7640 + }, + { + "epoch": 1.42, + "learning_rate": 6.36475662353666e-07, + "loss": 1.0363, + "step": 7645 + }, + { + "epoch": 1.42, + "learning_rate": 6.354487574450606e-07, + "loss": 0.9707, + "step": 7650 + }, + { + "epoch": 1.43, + "learning_rate": 6.344218525364551e-07, + "loss": 0.8471, + "step": 7655 + }, + { + "epoch": 1.43, + "learning_rate": 6.336003286095707e-07, + "loss": 2.2894, + "step": 7660 + }, + { + "epoch": 1.43, + "learning_rate": 6.325734237009652e-07, + "loss": 1.0268, + "step": 7665 + }, + { + "epoch": 1.43, + "learning_rate": 6.315465187923598e-07, + "loss": 0.7682, + "step": 7670 + }, + { + "epoch": 1.43, + "learning_rate": 6.305196138837543e-07, + "loss": 0.6118, + "step": 7675 + }, + { + "epoch": 1.43, + "learning_rate": 6.294927089751488e-07, + "loss": 0.877, + "step": 7680 + }, + { + "epoch": 1.43, + "learning_rate": 6.284658040665434e-07, + "loss": 0.6714, + "step": 7685 + }, + { + "epoch": 1.43, + "learning_rate": 6.274388991579379e-07, + "loss": 1.2271, + "step": 7690 + }, + { + "epoch": 1.43, + "learning_rate": 6.264119942493324e-07, + "loss": 0.7157, + "step": 7695 + }, + { + "epoch": 1.43, + "learning_rate": 6.253850893407269e-07, + "loss": 0.649, + "step": 7700 + }, + { + "epoch": 1.44, + "learning_rate": 6.243581844321215e-07, + "loss": 0.9921, + "step": 7705 + }, + { + "epoch": 1.44, + "learning_rate": 6.23331279523516e-07, + "loss": 0.8691, + "step": 7710 + }, + { + "epoch": 1.44, + "learning_rate": 6.223043746149106e-07, + "loss": 1.0678, + "step": 7715 + }, + { + "epoch": 1.44, + "learning_rate": 6.212774697063051e-07, + "loss": 0.7666, + "step": 7720 + }, + { + "epoch": 1.44, + "learning_rate": 6.202505647976997e-07, + "loss": 0.8856, + "step": 7725 + }, + { + "epoch": 1.44, + "learning_rate": 6.192236598890942e-07, + "loss": 1.169, + "step": 7730 + }, + { + "epoch": 1.44, + "learning_rate": 6.181967549804888e-07, + "loss": 0.8315, + "step": 7735 + }, + { + "epoch": 1.44, + "learning_rate": 6.171698500718832e-07, + "loss": 0.9041, + "step": 7740 + }, + { + "epoch": 1.44, + "learning_rate": 6.161429451632778e-07, + "loss": 0.7837, + "step": 7745 + }, + { + "epoch": 1.44, + "learning_rate": 6.151160402546723e-07, + "loss": 0.8858, + "step": 7750 + }, + { + "epoch": 1.44, + "learning_rate": 6.140891353460669e-07, + "loss": 0.9944, + "step": 7755 + }, + { + "epoch": 1.45, + "learning_rate": 6.130622304374614e-07, + "loss": 1.438, + "step": 7760 + }, + { + "epoch": 1.45, + "learning_rate": 6.12035325528856e-07, + "loss": 0.7522, + "step": 7765 + }, + { + "epoch": 1.45, + "learning_rate": 6.110084206202505e-07, + "loss": 1.161, + "step": 7770 + }, + { + "epoch": 1.45, + "learning_rate": 6.099815157116451e-07, + "loss": 0.8066, + "step": 7775 + }, + { + "epoch": 1.45, + "learning_rate": 6.089546108030395e-07, + "loss": 0.8732, + "step": 7780 + }, + { + "epoch": 1.45, + "learning_rate": 6.079277058944341e-07, + "loss": 0.8681, + "step": 7785 + }, + { + "epoch": 1.45, + "learning_rate": 6.069008009858286e-07, + "loss": 0.6792, + "step": 7790 + }, + { + "epoch": 1.45, + "learning_rate": 6.058738960772232e-07, + "loss": 0.7122, + "step": 7795 + }, + { + "epoch": 1.45, + "learning_rate": 6.048469911686177e-07, + "loss": 1.1585, + "step": 7800 + }, + { + "epoch": 1.45, + "learning_rate": 6.038200862600123e-07, + "loss": 0.8072, + "step": 7805 + }, + { + "epoch": 1.45, + "learning_rate": 6.027931813514069e-07, + "loss": 0.9174, + "step": 7810 + }, + { + "epoch": 1.46, + "learning_rate": 6.017662764428015e-07, + "loss": 0.9088, + "step": 7815 + }, + { + "epoch": 1.46, + "learning_rate": 6.00739371534196e-07, + "loss": 0.817, + "step": 7820 + }, + { + "epoch": 1.46, + "learning_rate": 5.997124666255905e-07, + "loss": 0.849, + "step": 7825 + }, + { + "epoch": 1.46, + "learning_rate": 5.98685561716985e-07, + "loss": 0.9686, + "step": 7830 + }, + { + "epoch": 1.46, + "learning_rate": 5.976586568083796e-07, + "loss": 0.9308, + "step": 7835 + }, + { + "epoch": 1.46, + "learning_rate": 5.966317518997741e-07, + "loss": 0.8584, + "step": 7840 + }, + { + "epoch": 1.46, + "learning_rate": 5.956048469911686e-07, + "loss": 0.8181, + "step": 7845 + }, + { + "epoch": 1.46, + "learning_rate": 5.945779420825632e-07, + "loss": 0.7327, + "step": 7850 + }, + { + "epoch": 1.46, + "learning_rate": 5.935510371739577e-07, + "loss": 0.6989, + "step": 7855 + }, + { + "epoch": 1.46, + "learning_rate": 5.925241322653523e-07, + "loss": 0.7766, + "step": 7860 + }, + { + "epoch": 1.46, + "learning_rate": 5.914972273567467e-07, + "loss": 1.4259, + "step": 7865 + }, + { + "epoch": 1.47, + "learning_rate": 5.904703224481413e-07, + "loss": 0.9504, + "step": 7870 + }, + { + "epoch": 1.47, + "learning_rate": 5.894434175395358e-07, + "loss": 0.8883, + "step": 7875 + }, + { + "epoch": 1.47, + "learning_rate": 5.884165126309304e-07, + "loss": 0.8198, + "step": 7880 + }, + { + "epoch": 1.47, + "learning_rate": 5.873896077223249e-07, + "loss": 1.1042, + "step": 7885 + }, + { + "epoch": 1.47, + "learning_rate": 5.863627028137195e-07, + "loss": 0.761, + "step": 7890 + }, + { + "epoch": 1.47, + "learning_rate": 5.85335797905114e-07, + "loss": 0.7181, + "step": 7895 + }, + { + "epoch": 1.47, + "learning_rate": 5.843088929965086e-07, + "loss": 0.7321, + "step": 7900 + }, + { + "epoch": 1.47, + "learning_rate": 5.83281988087903e-07, + "loss": 0.8182, + "step": 7905 + }, + { + "epoch": 1.47, + "learning_rate": 5.822550831792976e-07, + "loss": 0.8529, + "step": 7910 + }, + { + "epoch": 1.47, + "learning_rate": 5.812281782706921e-07, + "loss": 0.9153, + "step": 7915 + }, + { + "epoch": 1.48, + "learning_rate": 5.802012733620867e-07, + "loss": 1.3715, + "step": 7920 + }, + { + "epoch": 1.48, + "learning_rate": 5.791743684534812e-07, + "loss": 0.7765, + "step": 7925 + }, + { + "epoch": 1.48, + "learning_rate": 5.781474635448758e-07, + "loss": 0.7273, + "step": 7930 + }, + { + "epoch": 1.48, + "learning_rate": 5.771205586362703e-07, + "loss": 1.0647, + "step": 7935 + }, + { + "epoch": 1.48, + "learning_rate": 5.760936537276649e-07, + "loss": 0.7211, + "step": 7940 + }, + { + "epoch": 1.48, + "learning_rate": 5.750667488190593e-07, + "loss": 1.1039, + "step": 7945 + }, + { + "epoch": 1.48, + "learning_rate": 5.740398439104539e-07, + "loss": 0.9831, + "step": 7950 + }, + { + "epoch": 1.48, + "learning_rate": 5.730129390018484e-07, + "loss": 0.7514, + "step": 7955 + }, + { + "epoch": 1.48, + "learning_rate": 5.71986034093243e-07, + "loss": 0.9246, + "step": 7960 + }, + { + "epoch": 1.48, + "learning_rate": 5.709591291846375e-07, + "loss": 1.0028, + "step": 7965 + }, + { + "epoch": 1.48, + "learning_rate": 5.699322242760321e-07, + "loss": 0.9095, + "step": 7970 + }, + { + "epoch": 1.49, + "learning_rate": 5.689053193674266e-07, + "loss": 0.7569, + "step": 7975 + }, + { + "epoch": 1.49, + "learning_rate": 5.678784144588212e-07, + "loss": 0.6962, + "step": 7980 + }, + { + "epoch": 1.49, + "learning_rate": 5.668515095502157e-07, + "loss": 0.8134, + "step": 7985 + }, + { + "epoch": 1.49, + "learning_rate": 5.658246046416102e-07, + "loss": 1.0712, + "step": 7990 + }, + { + "epoch": 1.49, + "learning_rate": 5.647976997330047e-07, + "loss": 0.6945, + "step": 7995 + }, + { + "epoch": 1.49, + "learning_rate": 5.637707948243992e-07, + "loss": 0.9881, + "step": 8000 + }, + { + "epoch": 1.49, + "eval_loss": 0.5700684189796448, + "eval_runtime": 138.9442, + "eval_samples_per_second": 8.593, + "eval_steps_per_second": 1.08, + "eval_wer": 0.9295792714212416, + "step": 8000 + }, + { + "epoch": 1.49, + "learning_rate": 5.627438899157938e-07, + "loss": 1.0634, + "step": 8005 + }, + { + "epoch": 1.49, + "learning_rate": 5.617169850071883e-07, + "loss": 0.7482, + "step": 8010 + }, + { + "epoch": 1.49, + "learning_rate": 5.606900800985829e-07, + "loss": 0.8581, + "step": 8015 + }, + { + "epoch": 1.49, + "learning_rate": 5.596631751899774e-07, + "loss": 1.0777, + "step": 8020 + }, + { + "epoch": 1.49, + "learning_rate": 5.58636270281372e-07, + "loss": 0.75, + "step": 8025 + }, + { + "epoch": 1.5, + "learning_rate": 5.576093653727664e-07, + "loss": 0.8893, + "step": 8030 + }, + { + "epoch": 1.5, + "learning_rate": 5.56582460464161e-07, + "loss": 0.7469, + "step": 8035 + }, + { + "epoch": 1.5, + "learning_rate": 5.555555555555555e-07, + "loss": 0.7758, + "step": 8040 + }, + { + "epoch": 1.5, + "learning_rate": 5.545286506469501e-07, + "loss": 1.1137, + "step": 8045 + }, + { + "epoch": 1.5, + "learning_rate": 5.535017457383446e-07, + "loss": 0.8816, + "step": 8050 + }, + { + "epoch": 1.5, + "learning_rate": 5.524748408297392e-07, + "loss": 0.8427, + "step": 8055 + }, + { + "epoch": 1.5, + "learning_rate": 5.514479359211337e-07, + "loss": 0.8506, + "step": 8060 + }, + { + "epoch": 1.5, + "learning_rate": 5.504210310125283e-07, + "loss": 0.9094, + "step": 8065 + }, + { + "epoch": 1.5, + "learning_rate": 5.493941261039227e-07, + "loss": 0.9327, + "step": 8070 + }, + { + "epoch": 1.5, + "learning_rate": 5.483672211953173e-07, + "loss": 0.7259, + "step": 8075 + }, + { + "epoch": 1.5, + "learning_rate": 5.473403162867118e-07, + "loss": 0.8508, + "step": 8080 + }, + { + "epoch": 1.51, + "learning_rate": 5.463134113781064e-07, + "loss": 0.9925, + "step": 8085 + }, + { + "epoch": 1.51, + "learning_rate": 5.452865064695009e-07, + "loss": 0.855, + "step": 8090 + }, + { + "epoch": 1.51, + "learning_rate": 5.442596015608955e-07, + "loss": 0.7268, + "step": 8095 + }, + { + "epoch": 1.51, + "learning_rate": 5.4323269665229e-07, + "loss": 0.7489, + "step": 8100 + }, + { + "epoch": 1.51, + "learning_rate": 5.422057917436846e-07, + "loss": 0.8293, + "step": 8105 + }, + { + "epoch": 1.51, + "learning_rate": 5.41178886835079e-07, + "loss": 0.8503, + "step": 8110 + }, + { + "epoch": 1.51, + "learning_rate": 5.401519819264736e-07, + "loss": 1.0528, + "step": 8115 + }, + { + "epoch": 1.51, + "learning_rate": 5.391250770178681e-07, + "loss": 1.0937, + "step": 8120 + }, + { + "epoch": 1.51, + "learning_rate": 5.380981721092627e-07, + "loss": 0.733, + "step": 8125 + }, + { + "epoch": 1.51, + "learning_rate": 5.370712672006572e-07, + "loss": 1.0224, + "step": 8130 + }, + { + "epoch": 1.52, + "learning_rate": 5.360443622920518e-07, + "loss": 0.8198, + "step": 8135 + }, + { + "epoch": 1.52, + "learning_rate": 5.350174573834463e-07, + "loss": 0.7389, + "step": 8140 + }, + { + "epoch": 1.52, + "learning_rate": 5.339905524748408e-07, + "loss": 0.9084, + "step": 8145 + }, + { + "epoch": 1.52, + "learning_rate": 5.329636475662354e-07, + "loss": 0.661, + "step": 8150 + }, + { + "epoch": 1.52, + "learning_rate": 5.319367426576298e-07, + "loss": 0.7891, + "step": 8155 + }, + { + "epoch": 1.52, + "learning_rate": 5.309098377490244e-07, + "loss": 0.8624, + "step": 8160 + }, + { + "epoch": 1.52, + "learning_rate": 5.298829328404189e-07, + "loss": 0.8217, + "step": 8165 + }, + { + "epoch": 1.52, + "learning_rate": 5.288560279318135e-07, + "loss": 0.7959, + "step": 8170 + }, + { + "epoch": 1.52, + "learning_rate": 5.27829123023208e-07, + "loss": 1.0279, + "step": 8175 + }, + { + "epoch": 1.52, + "learning_rate": 5.268022181146026e-07, + "loss": 0.7266, + "step": 8180 + }, + { + "epoch": 1.52, + "learning_rate": 5.257753132059971e-07, + "loss": 0.9282, + "step": 8185 + }, + { + "epoch": 1.53, + "learning_rate": 5.247484082973917e-07, + "loss": 0.8392, + "step": 8190 + }, + { + "epoch": 1.53, + "learning_rate": 5.237215033887861e-07, + "loss": 0.8131, + "step": 8195 + }, + { + "epoch": 1.53, + "learning_rate": 5.226945984801807e-07, + "loss": 0.8858, + "step": 8200 + }, + { + "epoch": 1.53, + "learning_rate": 5.216676935715752e-07, + "loss": 0.786, + "step": 8205 + }, + { + "epoch": 1.53, + "learning_rate": 5.206407886629698e-07, + "loss": 0.918, + "step": 8210 + }, + { + "epoch": 1.53, + "learning_rate": 5.196138837543643e-07, + "loss": 0.7505, + "step": 8215 + }, + { + "epoch": 1.53, + "learning_rate": 5.185869788457589e-07, + "loss": 0.7523, + "step": 8220 + }, + { + "epoch": 1.53, + "learning_rate": 5.175600739371534e-07, + "loss": 0.9177, + "step": 8225 + }, + { + "epoch": 1.53, + "learning_rate": 5.16533169028548e-07, + "loss": 0.9611, + "step": 8230 + }, + { + "epoch": 1.53, + "learning_rate": 5.155062641199424e-07, + "loss": 0.8993, + "step": 8235 + }, + { + "epoch": 1.53, + "learning_rate": 5.14479359211337e-07, + "loss": 0.9785, + "step": 8240 + }, + { + "epoch": 1.54, + "learning_rate": 5.134524543027315e-07, + "loss": 0.9, + "step": 8245 + }, + { + "epoch": 1.54, + "learning_rate": 5.124255493941261e-07, + "loss": 0.7835, + "step": 8250 + }, + { + "epoch": 1.54, + "learning_rate": 5.113986444855206e-07, + "loss": 1.0824, + "step": 8255 + }, + { + "epoch": 1.54, + "learning_rate": 5.103717395769152e-07, + "loss": 1.0807, + "step": 8260 + }, + { + "epoch": 1.54, + "learning_rate": 5.093448346683097e-07, + "loss": 0.9891, + "step": 8265 + }, + { + "epoch": 1.54, + "learning_rate": 5.083179297597043e-07, + "loss": 0.8318, + "step": 8270 + }, + { + "epoch": 1.54, + "learning_rate": 5.072910248510988e-07, + "loss": 0.7792, + "step": 8275 + }, + { + "epoch": 1.54, + "learning_rate": 5.062641199424933e-07, + "loss": 0.8312, + "step": 8280 + }, + { + "epoch": 1.54, + "learning_rate": 5.052372150338878e-07, + "loss": 0.6618, + "step": 8285 + }, + { + "epoch": 1.54, + "learning_rate": 5.042103101252824e-07, + "loss": 0.7102, + "step": 8290 + }, + { + "epoch": 1.54, + "learning_rate": 5.031834052166769e-07, + "loss": 0.9409, + "step": 8295 + }, + { + "epoch": 1.55, + "learning_rate": 5.021565003080714e-07, + "loss": 1.1354, + "step": 8300 + }, + { + "epoch": 1.55, + "learning_rate": 5.01129595399466e-07, + "loss": 0.7533, + "step": 8305 + }, + { + "epoch": 1.55, + "learning_rate": 5.001026904908605e-07, + "loss": 1.0336, + "step": 8310 + }, + { + "epoch": 1.55, + "learning_rate": 4.990757855822551e-07, + "loss": 0.8046, + "step": 8315 + }, + { + "epoch": 1.55, + "learning_rate": 4.980488806736495e-07, + "loss": 1.3911, + "step": 8320 + }, + { + "epoch": 1.55, + "learning_rate": 4.970219757650441e-07, + "loss": 0.7045, + "step": 8325 + }, + { + "epoch": 1.55, + "learning_rate": 4.959950708564386e-07, + "loss": 0.8076, + "step": 8330 + }, + { + "epoch": 1.55, + "learning_rate": 4.949681659478332e-07, + "loss": 0.9713, + "step": 8335 + }, + { + "epoch": 1.55, + "learning_rate": 4.939412610392277e-07, + "loss": 0.8131, + "step": 8340 + }, + { + "epoch": 1.55, + "learning_rate": 4.929143561306223e-07, + "loss": 0.683, + "step": 8345 + }, + { + "epoch": 1.56, + "learning_rate": 4.918874512220168e-07, + "loss": 1.0491, + "step": 8350 + }, + { + "epoch": 1.56, + "learning_rate": 4.908605463134114e-07, + "loss": 0.9126, + "step": 8355 + }, + { + "epoch": 1.56, + "learning_rate": 4.898336414048058e-07, + "loss": 0.7582, + "step": 8360 + }, + { + "epoch": 1.56, + "learning_rate": 4.888067364962004e-07, + "loss": 1.0113, + "step": 8365 + }, + { + "epoch": 1.56, + "learning_rate": 4.877798315875949e-07, + "loss": 0.7116, + "step": 8370 + }, + { + "epoch": 1.56, + "learning_rate": 4.867529266789895e-07, + "loss": 0.9096, + "step": 8375 + }, + { + "epoch": 1.56, + "learning_rate": 4.85726021770384e-07, + "loss": 0.795, + "step": 8380 + }, + { + "epoch": 1.56, + "learning_rate": 4.846991168617786e-07, + "loss": 0.6889, + "step": 8385 + }, + { + "epoch": 1.56, + "learning_rate": 4.836722119531731e-07, + "loss": 1.0997, + "step": 8390 + }, + { + "epoch": 1.56, + "learning_rate": 4.826453070445677e-07, + "loss": 0.7957, + "step": 8395 + }, + { + "epoch": 1.56, + "learning_rate": 4.816184021359621e-07, + "loss": 0.8872, + "step": 8400 + }, + { + "epoch": 1.57, + "learning_rate": 4.805914972273567e-07, + "loss": 0.8239, + "step": 8405 + }, + { + "epoch": 1.57, + "learning_rate": 4.795645923187512e-07, + "loss": 0.7891, + "step": 8410 + }, + { + "epoch": 1.57, + "learning_rate": 4.785376874101458e-07, + "loss": 1.098, + "step": 8415 + }, + { + "epoch": 1.57, + "learning_rate": 4.775107825015403e-07, + "loss": 0.9928, + "step": 8420 + }, + { + "epoch": 1.57, + "learning_rate": 4.7648387759293484e-07, + "loss": 0.7261, + "step": 8425 + }, + { + "epoch": 1.57, + "learning_rate": 4.754569726843294e-07, + "loss": 0.9117, + "step": 8430 + }, + { + "epoch": 1.57, + "learning_rate": 4.744300677757239e-07, + "loss": 0.7395, + "step": 8435 + }, + { + "epoch": 1.57, + "learning_rate": 4.734031628671185e-07, + "loss": 0.8122, + "step": 8440 + }, + { + "epoch": 1.57, + "learning_rate": 4.7237625795851304e-07, + "loss": 0.6871, + "step": 8445 + }, + { + "epoch": 1.57, + "learning_rate": 4.713493530499076e-07, + "loss": 0.8141, + "step": 8450 + }, + { + "epoch": 1.57, + "learning_rate": 4.703224481413021e-07, + "loss": 0.7518, + "step": 8455 + }, + { + "epoch": 1.58, + "learning_rate": 4.6929554323269666e-07, + "loss": 0.9715, + "step": 8460 + }, + { + "epoch": 1.58, + "learning_rate": 4.682686383240912e-07, + "loss": 0.9768, + "step": 8465 + }, + { + "epoch": 1.58, + "learning_rate": 4.6724173341548573e-07, + "loss": 0.7381, + "step": 8470 + }, + { + "epoch": 1.58, + "learning_rate": 4.6621482850688027e-07, + "loss": 1.0727, + "step": 8475 + }, + { + "epoch": 1.58, + "learning_rate": 4.651879235982748e-07, + "loss": 0.9019, + "step": 8480 + }, + { + "epoch": 1.58, + "learning_rate": 4.6416101868966935e-07, + "loss": 1.1234, + "step": 8485 + }, + { + "epoch": 1.58, + "learning_rate": 4.631341137810639e-07, + "loss": 0.9862, + "step": 8490 + }, + { + "epoch": 1.58, + "learning_rate": 4.621072088724584e-07, + "loss": 0.9288, + "step": 8495 + }, + { + "epoch": 1.58, + "learning_rate": 4.6108030396385296e-07, + "loss": 0.7656, + "step": 8500 + }, + { + "epoch": 1.58, + "eval_loss": 0.5572460889816284, + "eval_runtime": 135.2315, + "eval_samples_per_second": 8.829, + "eval_steps_per_second": 1.109, + "eval_wer": 0.9211133914828117, + "step": 8500 + }, + { + "epoch": 1.58, + "learning_rate": 4.600533990552475e-07, + "loss": 1.2769, + "step": 8505 + }, + { + "epoch": 1.59, + "learning_rate": 4.5902649414664204e-07, + "loss": 0.7621, + "step": 8510 + }, + { + "epoch": 1.59, + "learning_rate": 4.579995892380366e-07, + "loss": 0.8506, + "step": 8515 + }, + { + "epoch": 1.59, + "learning_rate": 4.569726843294311e-07, + "loss": 0.8792, + "step": 8520 + }, + { + "epoch": 1.59, + "learning_rate": 4.5594577942082565e-07, + "loss": 0.8107, + "step": 8525 + }, + { + "epoch": 1.59, + "learning_rate": 4.5491887451222014e-07, + "loss": 0.7621, + "step": 8530 + }, + { + "epoch": 1.59, + "learning_rate": 4.538919696036147e-07, + "loss": 0.7552, + "step": 8535 + }, + { + "epoch": 1.59, + "learning_rate": 4.528650646950092e-07, + "loss": 0.6921, + "step": 8540 + }, + { + "epoch": 1.59, + "learning_rate": 4.5183815978640375e-07, + "loss": 0.614, + "step": 8545 + }, + { + "epoch": 1.59, + "learning_rate": 4.508112548777983e-07, + "loss": 0.7925, + "step": 8550 + }, + { + "epoch": 1.59, + "learning_rate": 4.4978434996919283e-07, + "loss": 0.8397, + "step": 8555 + }, + { + "epoch": 1.59, + "learning_rate": 4.4875744506058737e-07, + "loss": 0.9498, + "step": 8560 + }, + { + "epoch": 1.6, + "learning_rate": 4.477305401519819e-07, + "loss": 0.7446, + "step": 8565 + }, + { + "epoch": 1.6, + "learning_rate": 4.4670363524337644e-07, + "loss": 0.9555, + "step": 8570 + }, + { + "epoch": 1.6, + "learning_rate": 4.45676730334771e-07, + "loss": 0.8588, + "step": 8575 + }, + { + "epoch": 1.6, + "learning_rate": 4.446498254261655e-07, + "loss": 0.9522, + "step": 8580 + }, + { + "epoch": 1.6, + "learning_rate": 4.4362292051756006e-07, + "loss": 0.716, + "step": 8585 + }, + { + "epoch": 1.6, + "learning_rate": 4.425960156089546e-07, + "loss": 0.7492, + "step": 8590 + }, + { + "epoch": 1.6, + "learning_rate": 4.4156911070034913e-07, + "loss": 0.9591, + "step": 8595 + }, + { + "epoch": 1.6, + "learning_rate": 4.4054220579174367e-07, + "loss": 0.6838, + "step": 8600 + }, + { + "epoch": 1.6, + "learning_rate": 4.395153008831382e-07, + "loss": 0.6971, + "step": 8605 + }, + { + "epoch": 1.6, + "learning_rate": 4.3848839597453275e-07, + "loss": 0.7055, + "step": 8610 + }, + { + "epoch": 1.6, + "learning_rate": 4.374614910659273e-07, + "loss": 0.7494, + "step": 8615 + }, + { + "epoch": 1.61, + "learning_rate": 4.364345861573218e-07, + "loss": 0.7243, + "step": 8620 + }, + { + "epoch": 1.61, + "learning_rate": 4.3540768124871636e-07, + "loss": 0.8597, + "step": 8625 + }, + { + "epoch": 1.61, + "learning_rate": 4.343807763401109e-07, + "loss": 0.739, + "step": 8630 + }, + { + "epoch": 1.61, + "learning_rate": 4.3335387143150544e-07, + "loss": 0.838, + "step": 8635 + }, + { + "epoch": 1.61, + "learning_rate": 4.323269665229e-07, + "loss": 0.8557, + "step": 8640 + }, + { + "epoch": 1.61, + "learning_rate": 4.313000616142945e-07, + "loss": 0.6209, + "step": 8645 + }, + { + "epoch": 1.61, + "learning_rate": 4.3027315670568905e-07, + "loss": 0.7521, + "step": 8650 + }, + { + "epoch": 1.61, + "learning_rate": 4.292462517970836e-07, + "loss": 0.6777, + "step": 8655 + }, + { + "epoch": 1.61, + "learning_rate": 4.282193468884781e-07, + "loss": 0.7345, + "step": 8660 + }, + { + "epoch": 1.61, + "learning_rate": 4.2719244197987266e-07, + "loss": 0.7864, + "step": 8665 + }, + { + "epoch": 1.61, + "learning_rate": 4.261655370712672e-07, + "loss": 0.6808, + "step": 8670 + }, + { + "epoch": 1.62, + "learning_rate": 4.2513863216266174e-07, + "loss": 0.7143, + "step": 8675 + }, + { + "epoch": 1.62, + "learning_rate": 4.241117272540562e-07, + "loss": 1.0389, + "step": 8680 + }, + { + "epoch": 1.62, + "learning_rate": 4.2308482234545076e-07, + "loss": 0.7213, + "step": 8685 + }, + { + "epoch": 1.62, + "learning_rate": 4.220579174368453e-07, + "loss": 0.789, + "step": 8690 + }, + { + "epoch": 1.62, + "learning_rate": 4.2103101252823984e-07, + "loss": 0.6796, + "step": 8695 + }, + { + "epoch": 1.62, + "learning_rate": 4.200041076196344e-07, + "loss": 0.7828, + "step": 8700 + }, + { + "epoch": 1.62, + "learning_rate": 4.189772027110289e-07, + "loss": 0.7098, + "step": 8705 + }, + { + "epoch": 1.62, + "learning_rate": 4.1795029780242345e-07, + "loss": 0.7801, + "step": 8710 + }, + { + "epoch": 1.62, + "learning_rate": 4.16923392893818e-07, + "loss": 0.8762, + "step": 8715 + }, + { + "epoch": 1.62, + "learning_rate": 4.1589648798521253e-07, + "loss": 1.2351, + "step": 8720 + }, + { + "epoch": 1.63, + "learning_rate": 4.1486958307660707e-07, + "loss": 0.8635, + "step": 8725 + }, + { + "epoch": 1.63, + "learning_rate": 4.138426781680016e-07, + "loss": 0.7581, + "step": 8730 + }, + { + "epoch": 1.63, + "learning_rate": 4.1281577325939614e-07, + "loss": 0.7198, + "step": 8735 + }, + { + "epoch": 1.63, + "learning_rate": 4.117888683507907e-07, + "loss": 0.7464, + "step": 8740 + }, + { + "epoch": 1.63, + "learning_rate": 4.107619634421852e-07, + "loss": 0.7753, + "step": 8745 + }, + { + "epoch": 1.63, + "learning_rate": 4.0973505853357976e-07, + "loss": 0.7831, + "step": 8750 + }, + { + "epoch": 1.63, + "learning_rate": 4.087081536249743e-07, + "loss": 0.8637, + "step": 8755 + }, + { + "epoch": 1.63, + "learning_rate": 4.0768124871636883e-07, + "loss": 0.7104, + "step": 8760 + }, + { + "epoch": 1.63, + "learning_rate": 4.0665434380776337e-07, + "loss": 1.1407, + "step": 8765 + }, + { + "epoch": 1.63, + "learning_rate": 4.056274388991579e-07, + "loss": 1.8111, + "step": 8770 + }, + { + "epoch": 1.63, + "learning_rate": 4.0460053399055245e-07, + "loss": 0.9607, + "step": 8775 + }, + { + "epoch": 1.64, + "learning_rate": 4.03573629081947e-07, + "loss": 0.7323, + "step": 8780 + }, + { + "epoch": 1.64, + "learning_rate": 4.025467241733415e-07, + "loss": 0.7853, + "step": 8785 + }, + { + "epoch": 1.64, + "learning_rate": 4.0151981926473606e-07, + "loss": 1.0725, + "step": 8790 + }, + { + "epoch": 1.64, + "learning_rate": 4.004929143561306e-07, + "loss": 1.0457, + "step": 8795 + }, + { + "epoch": 1.64, + "learning_rate": 3.9946600944752514e-07, + "loss": 0.8052, + "step": 8800 + }, + { + "epoch": 1.64, + "learning_rate": 3.984391045389197e-07, + "loss": 0.9338, + "step": 8805 + }, + { + "epoch": 1.64, + "learning_rate": 3.974121996303142e-07, + "loss": 1.0658, + "step": 8810 + }, + { + "epoch": 1.64, + "learning_rate": 3.9638529472170875e-07, + "loss": 1.1294, + "step": 8815 + }, + { + "epoch": 1.64, + "learning_rate": 3.953583898131033e-07, + "loss": 0.8306, + "step": 8820 + }, + { + "epoch": 1.64, + "learning_rate": 3.9433148490449783e-07, + "loss": 0.9354, + "step": 8825 + }, + { + "epoch": 1.64, + "learning_rate": 3.933045799958923e-07, + "loss": 0.901, + "step": 8830 + }, + { + "epoch": 1.65, + "learning_rate": 3.9227767508728685e-07, + "loss": 0.888, + "step": 8835 + }, + { + "epoch": 1.65, + "learning_rate": 3.912507701786814e-07, + "loss": 0.8643, + "step": 8840 + }, + { + "epoch": 1.65, + "learning_rate": 3.9022386527007593e-07, + "loss": 0.8769, + "step": 8845 + }, + { + "epoch": 1.65, + "learning_rate": 3.8919696036147046e-07, + "loss": 0.7751, + "step": 8850 + }, + { + "epoch": 1.65, + "learning_rate": 3.88170055452865e-07, + "loss": 0.9784, + "step": 8855 + }, + { + "epoch": 1.65, + "learning_rate": 3.871431505442596e-07, + "loss": 0.6873, + "step": 8860 + }, + { + "epoch": 1.65, + "learning_rate": 3.8611624563565413e-07, + "loss": 0.8287, + "step": 8865 + }, + { + "epoch": 1.65, + "learning_rate": 3.8508934072704867e-07, + "loss": 1.0599, + "step": 8870 + }, + { + "epoch": 1.65, + "learning_rate": 3.840624358184432e-07, + "loss": 0.7779, + "step": 8875 + }, + { + "epoch": 1.65, + "learning_rate": 3.8303553090983775e-07, + "loss": 0.8061, + "step": 8880 + }, + { + "epoch": 1.65, + "learning_rate": 3.820086260012323e-07, + "loss": 0.7412, + "step": 8885 + }, + { + "epoch": 1.66, + "learning_rate": 3.809817210926268e-07, + "loss": 0.9013, + "step": 8890 + }, + { + "epoch": 1.66, + "learning_rate": 3.7995481618402136e-07, + "loss": 1.071, + "step": 8895 + }, + { + "epoch": 1.66, + "learning_rate": 3.789279112754159e-07, + "loss": 1.1361, + "step": 8900 + }, + { + "epoch": 1.66, + "learning_rate": 3.7790100636681044e-07, + "loss": 0.7694, + "step": 8905 + }, + { + "epoch": 1.66, + "learning_rate": 3.76874101458205e-07, + "loss": 0.9759, + "step": 8910 + }, + { + "epoch": 1.66, + "learning_rate": 3.758471965495995e-07, + "loss": 0.9244, + "step": 8915 + }, + { + "epoch": 1.66, + "learning_rate": 3.7482029164099405e-07, + "loss": 0.6793, + "step": 8920 + }, + { + "epoch": 1.66, + "learning_rate": 3.737933867323886e-07, + "loss": 0.7158, + "step": 8925 + }, + { + "epoch": 1.66, + "learning_rate": 3.727664818237831e-07, + "loss": 0.8618, + "step": 8930 + }, + { + "epoch": 1.66, + "learning_rate": 3.7173957691517766e-07, + "loss": 0.7628, + "step": 8935 + }, + { + "epoch": 1.67, + "learning_rate": 3.707126720065722e-07, + "loss": 0.7349, + "step": 8940 + }, + { + "epoch": 1.67, + "learning_rate": 3.6968576709796674e-07, + "loss": 0.7003, + "step": 8945 + }, + { + "epoch": 1.67, + "learning_rate": 3.686588621893613e-07, + "loss": 0.6532, + "step": 8950 + }, + { + "epoch": 1.67, + "learning_rate": 3.676319572807558e-07, + "loss": 0.9775, + "step": 8955 + }, + { + "epoch": 1.67, + "learning_rate": 3.6660505237215035e-07, + "loss": 0.8026, + "step": 8960 + }, + { + "epoch": 1.67, + "learning_rate": 3.655781474635449e-07, + "loss": 0.8922, + "step": 8965 + }, + { + "epoch": 1.67, + "learning_rate": 3.6455124255493943e-07, + "loss": 0.9833, + "step": 8970 + }, + { + "epoch": 1.67, + "learning_rate": 3.6352433764633397e-07, + "loss": 0.9331, + "step": 8975 + }, + { + "epoch": 1.67, + "learning_rate": 3.624974327377285e-07, + "loss": 0.6908, + "step": 8980 + }, + { + "epoch": 1.67, + "learning_rate": 3.6147052782912304e-07, + "loss": 0.7091, + "step": 8985 + }, + { + "epoch": 1.67, + "learning_rate": 3.6044362292051753e-07, + "loss": 0.9287, + "step": 8990 + }, + { + "epoch": 1.68, + "learning_rate": 3.5941671801191207e-07, + "loss": 0.9938, + "step": 8995 + }, + { + "epoch": 1.68, + "learning_rate": 3.583898131033066e-07, + "loss": 1.0478, + "step": 9000 + }, + { + "epoch": 1.68, + "eval_loss": 0.548711895942688, + "eval_runtime": 135.1827, + "eval_samples_per_second": 8.832, + "eval_steps_per_second": 1.11, + "eval_wer": 0.9168804515135968, + "step": 9000 + }, + { + "epoch": 1.68, + "learning_rate": 3.5736290819470114e-07, + "loss": 0.8037, + "step": 9005 + }, + { + "epoch": 1.68, + "learning_rate": 3.563360032860957e-07, + "loss": 0.7756, + "step": 9010 + }, + { + "epoch": 1.68, + "learning_rate": 3.553090983774902e-07, + "loss": 0.9559, + "step": 9015 + }, + { + "epoch": 1.68, + "learning_rate": 3.5428219346888476e-07, + "loss": 0.979, + "step": 9020 + }, + { + "epoch": 1.68, + "learning_rate": 3.532552885602793e-07, + "loss": 0.5972, + "step": 9025 + }, + { + "epoch": 1.68, + "learning_rate": 3.5222838365167383e-07, + "loss": 0.7141, + "step": 9030 + }, + { + "epoch": 1.68, + "learning_rate": 3.5120147874306837e-07, + "loss": 1.1511, + "step": 9035 + }, + { + "epoch": 1.68, + "learning_rate": 3.501745738344629e-07, + "loss": 1.0922, + "step": 9040 + }, + { + "epoch": 1.68, + "learning_rate": 3.4914766892585745e-07, + "loss": 0.9412, + "step": 9045 + }, + { + "epoch": 1.69, + "learning_rate": 3.48120764017252e-07, + "loss": 0.9679, + "step": 9050 + }, + { + "epoch": 1.69, + "learning_rate": 3.470938591086465e-07, + "loss": 0.7127, + "step": 9055 + }, + { + "epoch": 1.69, + "learning_rate": 3.4606695420004106e-07, + "loss": 0.7559, + "step": 9060 + }, + { + "epoch": 1.69, + "learning_rate": 3.450400492914356e-07, + "loss": 0.894, + "step": 9065 + }, + { + "epoch": 1.69, + "learning_rate": 3.4401314438283014e-07, + "loss": 0.8835, + "step": 9070 + }, + { + "epoch": 1.69, + "learning_rate": 3.429862394742247e-07, + "loss": 0.9195, + "step": 9075 + }, + { + "epoch": 1.69, + "learning_rate": 3.419593345656192e-07, + "loss": 0.7117, + "step": 9080 + }, + { + "epoch": 1.69, + "learning_rate": 3.4093242965701375e-07, + "loss": 1.1162, + "step": 9085 + }, + { + "epoch": 1.69, + "learning_rate": 3.399055247484083e-07, + "loss": 0.7655, + "step": 9090 + }, + { + "epoch": 1.69, + "learning_rate": 3.3887861983980283e-07, + "loss": 0.9353, + "step": 9095 + }, + { + "epoch": 1.69, + "learning_rate": 3.3785171493119737e-07, + "loss": 0.8058, + "step": 9100 + }, + { + "epoch": 1.7, + "learning_rate": 3.368248100225919e-07, + "loss": 0.7053, + "step": 9105 + }, + { + "epoch": 1.7, + "learning_rate": 3.3579790511398644e-07, + "loss": 1.4235, + "step": 9110 + }, + { + "epoch": 1.7, + "learning_rate": 3.34771000205381e-07, + "loss": 0.7978, + "step": 9115 + }, + { + "epoch": 1.7, + "learning_rate": 3.337440952967755e-07, + "loss": 0.9128, + "step": 9120 + }, + { + "epoch": 1.7, + "learning_rate": 3.3271719038817006e-07, + "loss": 0.6848, + "step": 9125 + }, + { + "epoch": 1.7, + "learning_rate": 3.316902854795646e-07, + "loss": 0.6636, + "step": 9130 + }, + { + "epoch": 1.7, + "learning_rate": 3.3066338057095913e-07, + "loss": 0.9091, + "step": 9135 + }, + { + "epoch": 1.7, + "learning_rate": 3.296364756623536e-07, + "loss": 0.6772, + "step": 9140 + }, + { + "epoch": 1.7, + "learning_rate": 3.2860957075374815e-07, + "loss": 0.732, + "step": 9145 + }, + { + "epoch": 1.7, + "learning_rate": 3.275826658451427e-07, + "loss": 0.9508, + "step": 9150 + }, + { + "epoch": 1.71, + "learning_rate": 3.2655576093653723e-07, + "loss": 0.9088, + "step": 9155 + }, + { + "epoch": 1.71, + "learning_rate": 3.2552885602793177e-07, + "loss": 0.7601, + "step": 9160 + }, + { + "epoch": 1.71, + "learning_rate": 3.245019511193263e-07, + "loss": 1.1497, + "step": 9165 + }, + { + "epoch": 1.71, + "learning_rate": 3.2347504621072084e-07, + "loss": 1.4884, + "step": 9170 + }, + { + "epoch": 1.71, + "learning_rate": 3.224481413021154e-07, + "loss": 1.0249, + "step": 9175 + }, + { + "epoch": 1.71, + "learning_rate": 3.214212363935099e-07, + "loss": 0.6794, + "step": 9180 + }, + { + "epoch": 1.71, + "learning_rate": 3.2039433148490446e-07, + "loss": 0.792, + "step": 9185 + }, + { + "epoch": 1.71, + "learning_rate": 3.19367426576299e-07, + "loss": 0.8582, + "step": 9190 + }, + { + "epoch": 1.71, + "learning_rate": 3.1834052166769353e-07, + "loss": 0.7575, + "step": 9195 + }, + { + "epoch": 1.71, + "learning_rate": 3.1731361675908807e-07, + "loss": 0.8361, + "step": 9200 + }, + { + "epoch": 1.71, + "learning_rate": 3.162867118504826e-07, + "loss": 1.4164, + "step": 9205 + }, + { + "epoch": 1.72, + "learning_rate": 3.1525980694187715e-07, + "loss": 0.8392, + "step": 9210 + }, + { + "epoch": 1.72, + "learning_rate": 3.142329020332717e-07, + "loss": 0.6588, + "step": 9215 + }, + { + "epoch": 1.72, + "learning_rate": 3.132059971246662e-07, + "loss": 0.7318, + "step": 9220 + }, + { + "epoch": 1.72, + "learning_rate": 3.1217909221606076e-07, + "loss": 1.029, + "step": 9225 + }, + { + "epoch": 1.72, + "learning_rate": 3.111521873074553e-07, + "loss": 0.9353, + "step": 9230 + }, + { + "epoch": 1.72, + "learning_rate": 3.1012528239884984e-07, + "loss": 1.1036, + "step": 9235 + }, + { + "epoch": 1.72, + "learning_rate": 3.090983774902444e-07, + "loss": 0.8916, + "step": 9240 + }, + { + "epoch": 1.72, + "learning_rate": 3.080714725816389e-07, + "loss": 0.7161, + "step": 9245 + }, + { + "epoch": 1.72, + "learning_rate": 3.0704456767303345e-07, + "loss": 0.7532, + "step": 9250 + }, + { + "epoch": 1.72, + "learning_rate": 3.06017662764428e-07, + "loss": 0.9709, + "step": 9255 + }, + { + "epoch": 1.72, + "learning_rate": 3.0499075785582253e-07, + "loss": 1.0166, + "step": 9260 + }, + { + "epoch": 1.73, + "learning_rate": 3.0396385294721707e-07, + "loss": 1.0056, + "step": 9265 + }, + { + "epoch": 1.73, + "learning_rate": 3.029369480386116e-07, + "loss": 0.7948, + "step": 9270 + }, + { + "epoch": 1.73, + "learning_rate": 3.0191004313000614e-07, + "loss": 0.7811, + "step": 9275 + }, + { + "epoch": 1.73, + "learning_rate": 3.0088313822140073e-07, + "loss": 0.6995, + "step": 9280 + }, + { + "epoch": 1.73, + "learning_rate": 2.9985623331279527e-07, + "loss": 0.8626, + "step": 9285 + }, + { + "epoch": 1.73, + "learning_rate": 2.988293284041898e-07, + "loss": 1.0764, + "step": 9290 + }, + { + "epoch": 1.73, + "learning_rate": 2.978024234955843e-07, + "loss": 1.33, + "step": 9295 + }, + { + "epoch": 1.73, + "learning_rate": 2.9677551858697883e-07, + "loss": 0.8439, + "step": 9300 + }, + { + "epoch": 1.73, + "learning_rate": 2.9574861367837337e-07, + "loss": 0.7295, + "step": 9305 + }, + { + "epoch": 1.73, + "learning_rate": 2.947217087697679e-07, + "loss": 0.7173, + "step": 9310 + }, + { + "epoch": 1.73, + "learning_rate": 2.9369480386116245e-07, + "loss": 0.9574, + "step": 9315 + }, + { + "epoch": 1.74, + "learning_rate": 2.92667898952557e-07, + "loss": 1.0192, + "step": 9320 + }, + { + "epoch": 1.74, + "learning_rate": 2.916409940439515e-07, + "loss": 0.8545, + "step": 9325 + }, + { + "epoch": 1.74, + "learning_rate": 2.9061408913534606e-07, + "loss": 1.3505, + "step": 9330 + }, + { + "epoch": 1.74, + "learning_rate": 2.895871842267406e-07, + "loss": 0.7252, + "step": 9335 + }, + { + "epoch": 1.74, + "learning_rate": 2.8856027931813514e-07, + "loss": 0.7729, + "step": 9340 + }, + { + "epoch": 1.74, + "learning_rate": 2.875333744095297e-07, + "loss": 0.7349, + "step": 9345 + }, + { + "epoch": 1.74, + "learning_rate": 2.865064695009242e-07, + "loss": 0.7728, + "step": 9350 + }, + { + "epoch": 1.74, + "learning_rate": 2.8547956459231875e-07, + "loss": 0.8057, + "step": 9355 + }, + { + "epoch": 1.74, + "learning_rate": 2.844526596837133e-07, + "loss": 0.7852, + "step": 9360 + }, + { + "epoch": 1.74, + "learning_rate": 2.8342575477510783e-07, + "loss": 0.9283, + "step": 9365 + }, + { + "epoch": 1.75, + "learning_rate": 2.8239884986650236e-07, + "loss": 0.7183, + "step": 9370 + }, + { + "epoch": 1.75, + "learning_rate": 2.813719449578969e-07, + "loss": 1.1469, + "step": 9375 + }, + { + "epoch": 1.75, + "learning_rate": 2.8034504004929144e-07, + "loss": 0.7638, + "step": 9380 + }, + { + "epoch": 1.75, + "learning_rate": 2.79318135140686e-07, + "loss": 0.9751, + "step": 9385 + }, + { + "epoch": 1.75, + "learning_rate": 2.782912302320805e-07, + "loss": 0.8638, + "step": 9390 + }, + { + "epoch": 1.75, + "learning_rate": 2.7726432532347505e-07, + "loss": 0.6055, + "step": 9395 + }, + { + "epoch": 1.75, + "learning_rate": 2.762374204148696e-07, + "loss": 0.7411, + "step": 9400 + }, + { + "epoch": 1.75, + "learning_rate": 2.7521051550626413e-07, + "loss": 0.9885, + "step": 9405 + }, + { + "epoch": 1.75, + "learning_rate": 2.7418361059765867e-07, + "loss": 0.8003, + "step": 9410 + }, + { + "epoch": 1.75, + "learning_rate": 2.731567056890532e-07, + "loss": 1.071, + "step": 9415 + }, + { + "epoch": 1.75, + "learning_rate": 2.7212980078044774e-07, + "loss": 0.8145, + "step": 9420 + }, + { + "epoch": 1.76, + "learning_rate": 2.711028958718423e-07, + "loss": 0.6303, + "step": 9425 + }, + { + "epoch": 1.76, + "learning_rate": 2.700759909632368e-07, + "loss": 0.9826, + "step": 9430 + }, + { + "epoch": 1.76, + "learning_rate": 2.6904908605463136e-07, + "loss": 0.7654, + "step": 9435 + }, + { + "epoch": 1.76, + "learning_rate": 2.680221811460259e-07, + "loss": 1.1978, + "step": 9440 + }, + { + "epoch": 1.76, + "learning_rate": 2.669952762374204e-07, + "loss": 1.0603, + "step": 9445 + }, + { + "epoch": 1.76, + "learning_rate": 2.659683713288149e-07, + "loss": 0.8834, + "step": 9450 + }, + { + "epoch": 1.76, + "learning_rate": 2.6494146642020946e-07, + "loss": 0.7221, + "step": 9455 + }, + { + "epoch": 1.76, + "learning_rate": 2.63914561511604e-07, + "loss": 0.8836, + "step": 9460 + }, + { + "epoch": 1.76, + "learning_rate": 2.6288765660299853e-07, + "loss": 0.7714, + "step": 9465 + }, + { + "epoch": 1.76, + "learning_rate": 2.6186075169439307e-07, + "loss": 0.8994, + "step": 9470 + }, + { + "epoch": 1.76, + "learning_rate": 2.608338467857876e-07, + "loss": 0.6029, + "step": 9475 + }, + { + "epoch": 1.77, + "learning_rate": 2.5980694187718215e-07, + "loss": 1.0004, + "step": 9480 + }, + { + "epoch": 1.77, + "learning_rate": 2.587800369685767e-07, + "loss": 0.8633, + "step": 9485 + }, + { + "epoch": 1.77, + "learning_rate": 2.577531320599712e-07, + "loss": 0.8298, + "step": 9490 + }, + { + "epoch": 1.77, + "learning_rate": 2.5672622715136576e-07, + "loss": 0.7246, + "step": 9495 + }, + { + "epoch": 1.77, + "learning_rate": 2.556993222427603e-07, + "loss": 0.8339, + "step": 9500 + }, + { + "epoch": 1.77, + "eval_loss": 0.5449791550636292, + "eval_runtime": 132.473, + "eval_samples_per_second": 9.013, + "eval_steps_per_second": 1.132, + "eval_wer": 0.9112365315546435, + "step": 9500 + }, + { + "epoch": 1.77, + "learning_rate": 2.5467241733415484e-07, + "loss": 1.1769, + "step": 9505 + }, + { + "epoch": 1.77, + "learning_rate": 2.536455124255494e-07, + "loss": 0.795, + "step": 9510 + }, + { + "epoch": 1.77, + "learning_rate": 2.526186075169439e-07, + "loss": 0.9244, + "step": 9515 + }, + { + "epoch": 1.77, + "learning_rate": 2.5159170260833845e-07, + "loss": 0.7642, + "step": 9520 + }, + { + "epoch": 1.77, + "learning_rate": 2.50564797699733e-07, + "loss": 1.0131, + "step": 9525 + }, + { + "epoch": 1.78, + "learning_rate": 2.4953789279112753e-07, + "loss": 0.7834, + "step": 9530 + }, + { + "epoch": 1.78, + "learning_rate": 2.4851098788252207e-07, + "loss": 0.9238, + "step": 9535 + }, + { + "epoch": 1.78, + "learning_rate": 2.474840829739166e-07, + "loss": 0.7334, + "step": 9540 + }, + { + "epoch": 1.78, + "learning_rate": 2.4645717806531114e-07, + "loss": 0.7504, + "step": 9545 + }, + { + "epoch": 1.78, + "learning_rate": 2.454302731567057e-07, + "loss": 0.6311, + "step": 9550 + }, + { + "epoch": 1.78, + "learning_rate": 2.444033682481002e-07, + "loss": 1.1449, + "step": 9555 + }, + { + "epoch": 1.78, + "learning_rate": 2.4337646333949476e-07, + "loss": 1.0693, + "step": 9560 + }, + { + "epoch": 1.78, + "learning_rate": 2.423495584308893e-07, + "loss": 0.8986, + "step": 9565 + }, + { + "epoch": 1.78, + "learning_rate": 2.4132265352228383e-07, + "loss": 1.0381, + "step": 9570 + }, + { + "epoch": 1.78, + "learning_rate": 2.4029574861367837e-07, + "loss": 0.9385, + "step": 9575 + }, + { + "epoch": 1.78, + "learning_rate": 2.392688437050729e-07, + "loss": 0.6327, + "step": 9580 + }, + { + "epoch": 1.79, + "learning_rate": 2.3824193879646742e-07, + "loss": 0.6624, + "step": 9585 + }, + { + "epoch": 1.79, + "learning_rate": 2.3721503388786196e-07, + "loss": 0.7345, + "step": 9590 + }, + { + "epoch": 1.79, + "learning_rate": 2.3618812897925652e-07, + "loss": 0.7158, + "step": 9595 + }, + { + "epoch": 1.79, + "learning_rate": 2.3516122407065106e-07, + "loss": 0.7815, + "step": 9600 + }, + { + "epoch": 1.79, + "learning_rate": 2.341343191620456e-07, + "loss": 1.0816, + "step": 9605 + }, + { + "epoch": 1.79, + "learning_rate": 2.3310741425344014e-07, + "loss": 0.8828, + "step": 9610 + }, + { + "epoch": 1.79, + "learning_rate": 2.3208050934483467e-07, + "loss": 0.9075, + "step": 9615 + }, + { + "epoch": 1.79, + "learning_rate": 2.310536044362292e-07, + "loss": 1.6703, + "step": 9620 + }, + { + "epoch": 1.79, + "learning_rate": 2.3002669952762375e-07, + "loss": 0.7218, + "step": 9625 + }, + { + "epoch": 1.79, + "learning_rate": 2.289997946190183e-07, + "loss": 0.7332, + "step": 9630 + }, + { + "epoch": 1.79, + "learning_rate": 2.2797288971041283e-07, + "loss": 0.6355, + "step": 9635 + }, + { + "epoch": 1.8, + "learning_rate": 2.2694598480180734e-07, + "loss": 0.8792, + "step": 9640 + }, + { + "epoch": 1.8, + "learning_rate": 2.2591907989320188e-07, + "loss": 0.7534, + "step": 9645 + }, + { + "epoch": 1.8, + "learning_rate": 2.2489217498459641e-07, + "loss": 0.738, + "step": 9650 + }, + { + "epoch": 1.8, + "learning_rate": 2.2386527007599095e-07, + "loss": 0.7342, + "step": 9655 + }, + { + "epoch": 1.8, + "learning_rate": 2.228383651673855e-07, + "loss": 0.7395, + "step": 9660 + }, + { + "epoch": 1.8, + "learning_rate": 2.2181146025878003e-07, + "loss": 0.6329, + "step": 9665 + }, + { + "epoch": 1.8, + "learning_rate": 2.2078455535017457e-07, + "loss": 0.8756, + "step": 9670 + }, + { + "epoch": 1.8, + "learning_rate": 2.197576504415691e-07, + "loss": 0.6017, + "step": 9675 + }, + { + "epoch": 1.8, + "learning_rate": 2.1873074553296364e-07, + "loss": 0.6754, + "step": 9680 + }, + { + "epoch": 1.8, + "learning_rate": 2.1770384062435818e-07, + "loss": 0.6871, + "step": 9685 + }, + { + "epoch": 1.8, + "learning_rate": 2.1667693571575272e-07, + "loss": 0.7573, + "step": 9690 + }, + { + "epoch": 1.81, + "learning_rate": 2.1565003080714726e-07, + "loss": 1.0602, + "step": 9695 + }, + { + "epoch": 1.81, + "learning_rate": 2.146231258985418e-07, + "loss": 0.8002, + "step": 9700 + }, + { + "epoch": 1.81, + "learning_rate": 2.1359622098993633e-07, + "loss": 0.9188, + "step": 9705 + }, + { + "epoch": 1.81, + "learning_rate": 2.1256931608133087e-07, + "loss": 0.8239, + "step": 9710 + }, + { + "epoch": 1.81, + "learning_rate": 2.1154241117272538e-07, + "loss": 0.7205, + "step": 9715 + }, + { + "epoch": 1.81, + "learning_rate": 2.1051550626411992e-07, + "loss": 0.9943, + "step": 9720 + }, + { + "epoch": 1.81, + "learning_rate": 2.0948860135551446e-07, + "loss": 0.7139, + "step": 9725 + }, + { + "epoch": 1.81, + "learning_rate": 2.08461696446909e-07, + "loss": 1.0076, + "step": 9730 + }, + { + "epoch": 1.81, + "learning_rate": 2.0743479153830353e-07, + "loss": 0.8668, + "step": 9735 + }, + { + "epoch": 1.81, + "learning_rate": 2.0640788662969807e-07, + "loss": 0.7373, + "step": 9740 + }, + { + "epoch": 1.82, + "learning_rate": 2.053809817210926e-07, + "loss": 0.92, + "step": 9745 + }, + { + "epoch": 1.82, + "learning_rate": 2.0435407681248715e-07, + "loss": 0.7847, + "step": 9750 + }, + { + "epoch": 1.82, + "learning_rate": 2.0332717190388169e-07, + "loss": 0.7019, + "step": 9755 + }, + { + "epoch": 1.82, + "learning_rate": 2.0230026699527622e-07, + "loss": 1.3355, + "step": 9760 + }, + { + "epoch": 1.82, + "learning_rate": 2.0127336208667076e-07, + "loss": 0.8364, + "step": 9765 + }, + { + "epoch": 1.82, + "learning_rate": 2.002464571780653e-07, + "loss": 1.0353, + "step": 9770 + }, + { + "epoch": 1.82, + "learning_rate": 1.9921955226945984e-07, + "loss": 0.799, + "step": 9775 + }, + { + "epoch": 1.82, + "learning_rate": 1.9819264736085438e-07, + "loss": 1.0127, + "step": 9780 + }, + { + "epoch": 1.82, + "learning_rate": 1.9716574245224891e-07, + "loss": 0.5976, + "step": 9785 + }, + { + "epoch": 1.82, + "learning_rate": 1.9613883754364343e-07, + "loss": 0.816, + "step": 9790 + }, + { + "epoch": 1.82, + "learning_rate": 1.9511193263503796e-07, + "loss": 0.8324, + "step": 9795 + }, + { + "epoch": 1.83, + "learning_rate": 1.940850277264325e-07, + "loss": 0.7665, + "step": 9800 + }, + { + "epoch": 1.83, + "learning_rate": 1.9305812281782707e-07, + "loss": 0.7966, + "step": 9805 + }, + { + "epoch": 1.83, + "learning_rate": 1.920312179092216e-07, + "loss": 0.8726, + "step": 9810 + }, + { + "epoch": 1.83, + "learning_rate": 1.9100431300061614e-07, + "loss": 0.7403, + "step": 9815 + }, + { + "epoch": 1.83, + "learning_rate": 1.8997740809201068e-07, + "loss": 0.9103, + "step": 9820 + }, + { + "epoch": 1.83, + "learning_rate": 1.8895050318340522e-07, + "loss": 0.6655, + "step": 9825 + }, + { + "epoch": 1.83, + "learning_rate": 1.8792359827479976e-07, + "loss": 0.6775, + "step": 9830 + }, + { + "epoch": 1.83, + "learning_rate": 1.868966933661943e-07, + "loss": 0.9323, + "step": 9835 + }, + { + "epoch": 1.83, + "learning_rate": 1.8586978845758883e-07, + "loss": 0.6396, + "step": 9840 + }, + { + "epoch": 1.83, + "learning_rate": 1.8484288354898337e-07, + "loss": 0.5921, + "step": 9845 + }, + { + "epoch": 1.83, + "learning_rate": 1.838159786403779e-07, + "loss": 0.8523, + "step": 9850 + }, + { + "epoch": 1.84, + "learning_rate": 1.8278907373177245e-07, + "loss": 0.7539, + "step": 9855 + }, + { + "epoch": 1.84, + "learning_rate": 1.8176216882316698e-07, + "loss": 0.7188, + "step": 9860 + }, + { + "epoch": 1.84, + "learning_rate": 1.8073526391456152e-07, + "loss": 0.9111, + "step": 9865 + }, + { + "epoch": 1.84, + "learning_rate": 1.7970835900595603e-07, + "loss": 0.9562, + "step": 9870 + }, + { + "epoch": 1.84, + "learning_rate": 1.7868145409735057e-07, + "loss": 0.6707, + "step": 9875 + }, + { + "epoch": 1.84, + "learning_rate": 1.776545491887451e-07, + "loss": 0.674, + "step": 9880 + }, + { + "epoch": 1.84, + "learning_rate": 1.7662764428013965e-07, + "loss": 0.7727, + "step": 9885 + }, + { + "epoch": 1.84, + "learning_rate": 1.7560073937153419e-07, + "loss": 0.9508, + "step": 9890 + }, + { + "epoch": 1.84, + "learning_rate": 1.7457383446292872e-07, + "loss": 1.0723, + "step": 9895 + }, + { + "epoch": 1.84, + "learning_rate": 1.7354692955432326e-07, + "loss": 0.9362, + "step": 9900 + }, + { + "epoch": 1.84, + "learning_rate": 1.725200246457178e-07, + "loss": 0.8443, + "step": 9905 + }, + { + "epoch": 1.85, + "learning_rate": 1.7149311973711234e-07, + "loss": 1.0858, + "step": 9910 + }, + { + "epoch": 1.85, + "learning_rate": 1.7046621482850688e-07, + "loss": 0.8252, + "step": 9915 + }, + { + "epoch": 1.85, + "learning_rate": 1.6943930991990141e-07, + "loss": 1.1394, + "step": 9920 + }, + { + "epoch": 1.85, + "learning_rate": 1.6841240501129595e-07, + "loss": 0.9659, + "step": 9925 + }, + { + "epoch": 1.85, + "learning_rate": 1.673855001026905e-07, + "loss": 0.8237, + "step": 9930 + }, + { + "epoch": 1.85, + "learning_rate": 1.6635859519408503e-07, + "loss": 1.0135, + "step": 9935 + }, + { + "epoch": 1.85, + "learning_rate": 1.6533169028547957e-07, + "loss": 0.5366, + "step": 9940 + }, + { + "epoch": 1.85, + "learning_rate": 1.6430478537687408e-07, + "loss": 0.7087, + "step": 9945 + }, + { + "epoch": 1.85, + "learning_rate": 1.6327788046826862e-07, + "loss": 0.7841, + "step": 9950 + }, + { + "epoch": 1.85, + "learning_rate": 1.6225097555966315e-07, + "loss": 0.7555, + "step": 9955 + }, + { + "epoch": 1.86, + "learning_rate": 1.612240706510577e-07, + "loss": 1.0564, + "step": 9960 + }, + { + "epoch": 1.86, + "learning_rate": 1.6019716574245223e-07, + "loss": 1.1673, + "step": 9965 + }, + { + "epoch": 1.86, + "learning_rate": 1.5917026083384677e-07, + "loss": 1.2251, + "step": 9970 + }, + { + "epoch": 1.86, + "learning_rate": 1.581433559252413e-07, + "loss": 0.6291, + "step": 9975 + }, + { + "epoch": 1.86, + "learning_rate": 1.5711645101663584e-07, + "loss": 0.9839, + "step": 9980 + }, + { + "epoch": 1.86, + "learning_rate": 1.5608954610803038e-07, + "loss": 0.6658, + "step": 9985 + }, + { + "epoch": 1.86, + "learning_rate": 1.5506264119942492e-07, + "loss": 0.6988, + "step": 9990 + }, + { + "epoch": 1.86, + "learning_rate": 1.5403573629081946e-07, + "loss": 1.0948, + "step": 9995 + }, + { + "epoch": 1.86, + "learning_rate": 1.53008831382214e-07, + "loss": 0.8519, + "step": 10000 + }, + { + "epoch": 1.86, + "eval_loss": 0.5432996153831482, + "eval_runtime": 131.7393, + "eval_samples_per_second": 9.063, + "eval_steps_per_second": 1.139, + "eval_wer": 0.9117496151872755, + "step": 10000 + }, + { + "epoch": 1.86, + "learning_rate": 1.5198192647360853e-07, + "loss": 0.8205, + "step": 10005 + }, + { + "epoch": 1.86, + "learning_rate": 1.5095502156500307e-07, + "loss": 0.7684, + "step": 10010 + }, + { + "epoch": 1.87, + "learning_rate": 1.4992811665639764e-07, + "loss": 0.6792, + "step": 10015 + }, + { + "epoch": 1.87, + "learning_rate": 1.4890121174779215e-07, + "loss": 1.3194, + "step": 10020 + }, + { + "epoch": 1.87, + "learning_rate": 1.4787430683918669e-07, + "loss": 0.6639, + "step": 10025 + }, + { + "epoch": 1.87, + "learning_rate": 1.4684740193058122e-07, + "loss": 0.9946, + "step": 10030 + }, + { + "epoch": 1.87, + "learning_rate": 1.4582049702197576e-07, + "loss": 0.7518, + "step": 10035 + }, + { + "epoch": 1.87, + "learning_rate": 1.447935921133703e-07, + "loss": 0.6756, + "step": 10040 + }, + { + "epoch": 1.87, + "learning_rate": 1.4376668720476484e-07, + "loss": 0.8861, + "step": 10045 + }, + { + "epoch": 1.87, + "learning_rate": 1.4273978229615938e-07, + "loss": 0.7895, + "step": 10050 + }, + { + "epoch": 1.87, + "learning_rate": 1.4171287738755391e-07, + "loss": 0.7307, + "step": 10055 + }, + { + "epoch": 1.87, + "learning_rate": 1.4068597247894845e-07, + "loss": 0.752, + "step": 10060 + }, + { + "epoch": 1.87, + "learning_rate": 1.39659067570343e-07, + "loss": 0.809, + "step": 10065 + }, + { + "epoch": 1.88, + "learning_rate": 1.3863216266173753e-07, + "loss": 0.7542, + "step": 10070 + }, + { + "epoch": 1.88, + "learning_rate": 1.3760525775313207e-07, + "loss": 0.6403, + "step": 10075 + }, + { + "epoch": 1.88, + "learning_rate": 1.365783528445266e-07, + "loss": 0.6063, + "step": 10080 + }, + { + "epoch": 1.88, + "learning_rate": 1.3555144793592114e-07, + "loss": 0.8263, + "step": 10085 + }, + { + "epoch": 1.88, + "learning_rate": 1.3452454302731568e-07, + "loss": 0.7645, + "step": 10090 + }, + { + "epoch": 1.88, + "learning_rate": 1.334976381187102e-07, + "loss": 0.999, + "step": 10095 + }, + { + "epoch": 1.88, + "learning_rate": 1.3247073321010473e-07, + "loss": 0.6707, + "step": 10100 + }, + { + "epoch": 1.88, + "learning_rate": 1.3144382830149927e-07, + "loss": 0.729, + "step": 10105 + }, + { + "epoch": 1.88, + "learning_rate": 1.304169233928938e-07, + "loss": 0.8524, + "step": 10110 + }, + { + "epoch": 1.88, + "learning_rate": 1.2939001848428834e-07, + "loss": 0.8057, + "step": 10115 + }, + { + "epoch": 1.88, + "learning_rate": 1.2836311357568288e-07, + "loss": 0.7858, + "step": 10120 + }, + { + "epoch": 1.89, + "learning_rate": 1.2733620866707742e-07, + "loss": 0.7812, + "step": 10125 + }, + { + "epoch": 1.89, + "learning_rate": 1.2630930375847196e-07, + "loss": 1.0849, + "step": 10130 + }, + { + "epoch": 1.89, + "learning_rate": 1.252823988498665e-07, + "loss": 1.1582, + "step": 10135 + }, + { + "epoch": 1.89, + "learning_rate": 1.2425549394126103e-07, + "loss": 0.6071, + "step": 10140 + }, + { + "epoch": 1.89, + "learning_rate": 1.2322858903265557e-07, + "loss": 0.6861, + "step": 10145 + }, + { + "epoch": 1.89, + "learning_rate": 1.222016841240501e-07, + "loss": 0.9519, + "step": 10150 + }, + { + "epoch": 1.89, + "learning_rate": 1.2117477921544465e-07, + "loss": 1.1016, + "step": 10155 + }, + { + "epoch": 1.89, + "learning_rate": 1.2014787430683919e-07, + "loss": 0.8019, + "step": 10160 + }, + { + "epoch": 1.89, + "learning_rate": 1.1912096939823371e-07, + "loss": 0.7285, + "step": 10165 + }, + { + "epoch": 1.89, + "learning_rate": 1.1809406448962826e-07, + "loss": 0.7394, + "step": 10170 + }, + { + "epoch": 1.9, + "learning_rate": 1.170671595810228e-07, + "loss": 0.6223, + "step": 10175 + }, + { + "epoch": 1.9, + "learning_rate": 1.1604025467241734e-07, + "loss": 1.2768, + "step": 10180 + }, + { + "epoch": 1.9, + "learning_rate": 1.1501334976381188e-07, + "loss": 0.9095, + "step": 10185 + }, + { + "epoch": 1.9, + "learning_rate": 1.1398644485520641e-07, + "loss": 0.6809, + "step": 10190 + }, + { + "epoch": 1.9, + "learning_rate": 1.1295953994660094e-07, + "loss": 0.7896, + "step": 10195 + }, + { + "epoch": 1.9, + "learning_rate": 1.1193263503799548e-07, + "loss": 0.7618, + "step": 10200 + }, + { + "epoch": 1.9, + "learning_rate": 1.1090573012939001e-07, + "loss": 0.9294, + "step": 10205 + }, + { + "epoch": 1.9, + "learning_rate": 1.0987882522078455e-07, + "loss": 0.9262, + "step": 10210 + }, + { + "epoch": 1.9, + "learning_rate": 1.0885192031217909e-07, + "loss": 0.8909, + "step": 10215 + }, + { + "epoch": 1.9, + "learning_rate": 1.0782501540357363e-07, + "loss": 0.9056, + "step": 10220 + }, + { + "epoch": 1.9, + "learning_rate": 1.0679811049496817e-07, + "loss": 0.8504, + "step": 10225 + }, + { + "epoch": 1.91, + "learning_rate": 1.0577120558636269e-07, + "loss": 0.6755, + "step": 10230 + }, + { + "epoch": 1.91, + "learning_rate": 1.0474430067775723e-07, + "loss": 1.085, + "step": 10235 + }, + { + "epoch": 1.91, + "learning_rate": 1.0371739576915177e-07, + "loss": 0.9311, + "step": 10240 + }, + { + "epoch": 1.91, + "learning_rate": 1.026904908605463e-07, + "loss": 0.9027, + "step": 10245 + }, + { + "epoch": 1.91, + "learning_rate": 1.0166358595194084e-07, + "loss": 1.0461, + "step": 10250 + }, + { + "epoch": 1.91, + "learning_rate": 1.0063668104333538e-07, + "loss": 0.9348, + "step": 10255 + }, + { + "epoch": 1.91, + "learning_rate": 9.960977613472992e-08, + "loss": 0.7014, + "step": 10260 + }, + { + "epoch": 1.91, + "learning_rate": 9.858287122612446e-08, + "loss": 0.8754, + "step": 10265 + }, + { + "epoch": 1.91, + "learning_rate": 9.755596631751898e-08, + "loss": 0.9965, + "step": 10270 + }, + { + "epoch": 1.91, + "learning_rate": 9.652906140891353e-08, + "loss": 0.7866, + "step": 10275 + }, + { + "epoch": 1.91, + "learning_rate": 9.550215650030807e-08, + "loss": 0.7955, + "step": 10280 + }, + { + "epoch": 1.92, + "learning_rate": 9.447525159170261e-08, + "loss": 0.9339, + "step": 10285 + }, + { + "epoch": 1.92, + "learning_rate": 9.344834668309715e-08, + "loss": 0.8488, + "step": 10290 + }, + { + "epoch": 1.92, + "learning_rate": 9.242144177449168e-08, + "loss": 0.6844, + "step": 10295 + }, + { + "epoch": 1.92, + "learning_rate": 9.139453686588622e-08, + "loss": 0.9284, + "step": 10300 + }, + { + "epoch": 1.92, + "learning_rate": 9.036763195728076e-08, + "loss": 0.8021, + "step": 10305 + }, + { + "epoch": 1.92, + "learning_rate": 8.934072704867529e-08, + "loss": 0.7857, + "step": 10310 + }, + { + "epoch": 1.92, + "learning_rate": 8.831382214006982e-08, + "loss": 0.8231, + "step": 10315 + }, + { + "epoch": 1.92, + "learning_rate": 8.728691723146436e-08, + "loss": 1.037, + "step": 10320 + }, + { + "epoch": 1.92, + "learning_rate": 8.62600123228589e-08, + "loss": 0.7272, + "step": 10325 + }, + { + "epoch": 1.92, + "learning_rate": 8.523310741425344e-08, + "loss": 0.9758, + "step": 10330 + }, + { + "epoch": 1.92, + "learning_rate": 8.420620250564798e-08, + "loss": 0.8089, + "step": 10335 + }, + { + "epoch": 1.93, + "learning_rate": 8.317929759704251e-08, + "loss": 0.6783, + "step": 10340 + }, + { + "epoch": 1.93, + "learning_rate": 8.215239268843704e-08, + "loss": 0.8336, + "step": 10345 + }, + { + "epoch": 1.93, + "learning_rate": 8.112548777983158e-08, + "loss": 0.8419, + "step": 10350 + }, + { + "epoch": 1.93, + "learning_rate": 8.009858287122611e-08, + "loss": 0.8973, + "step": 10355 + }, + { + "epoch": 1.93, + "learning_rate": 7.907167796262065e-08, + "loss": 0.738, + "step": 10360 + }, + { + "epoch": 1.93, + "learning_rate": 7.804477305401519e-08, + "loss": 0.7383, + "step": 10365 + }, + { + "epoch": 1.93, + "learning_rate": 7.701786814540973e-08, + "loss": 0.922, + "step": 10370 + }, + { + "epoch": 1.93, + "learning_rate": 7.599096323680427e-08, + "loss": 0.7351, + "step": 10375 + }, + { + "epoch": 1.93, + "learning_rate": 7.496405832819882e-08, + "loss": 0.863, + "step": 10380 + }, + { + "epoch": 1.93, + "learning_rate": 7.393715341959334e-08, + "loss": 0.752, + "step": 10385 + }, + { + "epoch": 1.94, + "learning_rate": 7.291024851098788e-08, + "loss": 0.6388, + "step": 10390 + }, + { + "epoch": 1.94, + "learning_rate": 7.188334360238242e-08, + "loss": 0.7757, + "step": 10395 + }, + { + "epoch": 1.94, + "learning_rate": 7.085643869377696e-08, + "loss": 0.6121, + "step": 10400 + }, + { + "epoch": 1.94, + "learning_rate": 6.98295337851715e-08, + "loss": 0.7088, + "step": 10405 + }, + { + "epoch": 1.94, + "learning_rate": 6.880262887656603e-08, + "loss": 0.8861, + "step": 10410 + }, + { + "epoch": 1.94, + "learning_rate": 6.777572396796057e-08, + "loss": 0.7993, + "step": 10415 + }, + { + "epoch": 1.94, + "learning_rate": 6.67488190593551e-08, + "loss": 1.3591, + "step": 10420 + }, + { + "epoch": 1.94, + "learning_rate": 6.572191415074963e-08, + "loss": 0.7474, + "step": 10425 + }, + { + "epoch": 1.94, + "learning_rate": 6.469500924214417e-08, + "loss": 0.7211, + "step": 10430 + }, + { + "epoch": 1.94, + "learning_rate": 6.366810433353871e-08, + "loss": 0.7035, + "step": 10435 + }, + { + "epoch": 1.94, + "learning_rate": 6.264119942493325e-08, + "loss": 0.7559, + "step": 10440 + }, + { + "epoch": 1.95, + "learning_rate": 6.161429451632779e-08, + "loss": 1.0432, + "step": 10445 + }, + { + "epoch": 1.95, + "learning_rate": 6.058738960772232e-08, + "loss": 0.9067, + "step": 10450 + }, + { + "epoch": 1.95, + "learning_rate": 5.9560484699116855e-08, + "loss": 0.7133, + "step": 10455 + }, + { + "epoch": 1.95, + "learning_rate": 5.85335797905114e-08, + "loss": 0.9685, + "step": 10460 + }, + { + "epoch": 1.95, + "learning_rate": 5.750667488190594e-08, + "loss": 0.8897, + "step": 10465 + }, + { + "epoch": 1.95, + "learning_rate": 5.647976997330047e-08, + "loss": 0.9995, + "step": 10470 + }, + { + "epoch": 1.95, + "learning_rate": 5.545286506469501e-08, + "loss": 0.863, + "step": 10475 + }, + { + "epoch": 1.95, + "learning_rate": 5.4425960156089545e-08, + "loss": 0.7476, + "step": 10480 + }, + { + "epoch": 1.95, + "learning_rate": 5.339905524748408e-08, + "loss": 0.9257, + "step": 10485 + }, + { + "epoch": 1.95, + "learning_rate": 5.2372150338878614e-08, + "loss": 0.8702, + "step": 10490 + }, + { + "epoch": 1.95, + "learning_rate": 5.134524543027315e-08, + "loss": 0.6936, + "step": 10495 + }, + { + "epoch": 1.96, + "learning_rate": 5.031834052166769e-08, + "loss": 0.7054, + "step": 10500 + }, + { + "epoch": 1.96, + "eval_loss": 0.5424375534057617, + "eval_runtime": 130.6279, + "eval_samples_per_second": 9.14, + "eval_steps_per_second": 1.148, + "eval_wer": 0.9084145715751668, + "step": 10500 + } + ], + "max_steps": 10738, + "num_train_epochs": 2, + "total_flos": 9.684670186971503e+17, + "trial_name": null, + "trial_params": null +}