{ "best_metric": null, "best_model_checkpoint": null, "epoch": 19.007506666666668, "global_step": 20000, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.0, "learning_rate": 8.000000000000001e-07, "loss": 25.0773, "step": 10 }, { "epoch": 0.0, "learning_rate": 1.8e-06, "loss": 23.2187, "step": 20 }, { "epoch": 0.0, "learning_rate": 2.7e-06, "loss": 21.7996, "step": 30 }, { "epoch": 0.0, "learning_rate": 3.7e-06, "loss": 25.2934, "step": 40 }, { "epoch": 0.0, "learning_rate": 4.7e-06, "loss": 22.8354, "step": 50 }, { "epoch": 0.0, "learning_rate": 5.7000000000000005e-06, "loss": 22.4447, "step": 60 }, { "epoch": 0.0, "learning_rate": 6.700000000000001e-06, "loss": 21.4096, "step": 70 }, { "epoch": 0.0, "learning_rate": 7.7e-06, "loss": 19.6356, "step": 80 }, { "epoch": 0.0, "learning_rate": 8.7e-06, "loss": 15.8806, "step": 90 }, { "epoch": 0.0, "learning_rate": 9.7e-06, "loss": 11.4753, "step": 100 }, { "epoch": 0.0, "learning_rate": 1.0700000000000001e-05, "loss": 9.7256, "step": 110 }, { "epoch": 0.0, "learning_rate": 1.1700000000000001e-05, "loss": 8.5749, "step": 120 }, { "epoch": 0.0, "learning_rate": 1.27e-05, "loss": 8.3531, "step": 130 }, { "epoch": 0.0, "learning_rate": 1.3700000000000001e-05, "loss": 6.8619, "step": 140 }, { "epoch": 0.0, "learning_rate": 1.47e-05, "loss": 6.455, "step": 150 }, { "epoch": 0.0, "learning_rate": 1.5700000000000002e-05, "loss": 5.6672, "step": 160 }, { "epoch": 0.0, "learning_rate": 1.66e-05, "loss": 8.8545, "step": 170 }, { "epoch": 0.0, "learning_rate": 1.76e-05, "loss": 6.4555, "step": 180 }, { "epoch": 0.0, "learning_rate": 1.86e-05, "loss": 4.5403, "step": 190 }, { "epoch": 0.0, "learning_rate": 1.9600000000000002e-05, "loss": 4.691, "step": 200 }, { "epoch": 0.0, "learning_rate": 2.06e-05, "loss": 4.8806, "step": 210 }, { "epoch": 0.0, "learning_rate": 2.15e-05, "loss": 7.4317, "step": 220 }, { "epoch": 0.0, "learning_rate": 2.25e-05, "loss": 4.6169, "step": 230 }, { "epoch": 0.0, "learning_rate": 2.35e-05, "loss": 4.576, "step": 240 }, { "epoch": 0.0, "learning_rate": 2.45e-05, "loss": 7.4582, "step": 250 }, { "epoch": 0.0, "learning_rate": 2.5500000000000003e-05, "loss": 4.4076, "step": 260 }, { "epoch": 0.0, "learning_rate": 2.6500000000000004e-05, "loss": 4.7133, "step": 270 }, { "epoch": 0.0, "learning_rate": 2.7500000000000004e-05, "loss": 4.1636, "step": 280 }, { "epoch": 0.0, "learning_rate": 2.8499999999999998e-05, "loss": 3.8869, "step": 290 }, { "epoch": 0.0, "learning_rate": 2.95e-05, "loss": 3.8318, "step": 300 }, { "epoch": 0.0, "learning_rate": 3.05e-05, "loss": 3.597, "step": 310 }, { "epoch": 0.0, "learning_rate": 3.15e-05, "loss": 3.7072, "step": 320 }, { "epoch": 0.0, "learning_rate": 3.2500000000000004e-05, "loss": 3.465, "step": 330 }, { "epoch": 0.0, "learning_rate": 3.35e-05, "loss": 3.3834, "step": 340 }, { "epoch": 0.0, "learning_rate": 3.45e-05, "loss": 3.3522, "step": 350 }, { "epoch": 0.0, "learning_rate": 3.55e-05, "loss": 3.2943, "step": 360 }, { "epoch": 0.0, "learning_rate": 3.65e-05, "loss": 3.3241, "step": 370 }, { "epoch": 0.01, "learning_rate": 3.7500000000000003e-05, "loss": 3.1516, "step": 380 }, { "epoch": 0.01, "learning_rate": 3.85e-05, "loss": 3.208, "step": 390 }, { "epoch": 0.01, "learning_rate": 3.9500000000000005e-05, "loss": 3.0941, "step": 400 }, { "epoch": 0.01, "learning_rate": 4.05e-05, "loss": 3.0473, "step": 410 }, { "epoch": 0.01, "learning_rate": 4.15e-05, "loss": 3.0403, "step": 420 }, { "epoch": 0.01, "learning_rate": 4.25e-05, "loss": 3.0143, "step": 430 }, { "epoch": 0.01, "learning_rate": 4.35e-05, "loss": 3.0391, "step": 440 }, { "epoch": 0.01, "learning_rate": 4.4500000000000004e-05, "loss": 3.0252, "step": 450 }, { "epoch": 0.01, "learning_rate": 4.55e-05, "loss": 2.9525, "step": 460 }, { "epoch": 0.01, "learning_rate": 4.6500000000000005e-05, "loss": 2.998, "step": 470 }, { "epoch": 0.01, "learning_rate": 4.75e-05, "loss": 2.9662, "step": 480 }, { "epoch": 0.01, "learning_rate": 4.85e-05, "loss": 2.9385, "step": 490 }, { "epoch": 0.01, "learning_rate": 4.9500000000000004e-05, "loss": 2.9413, "step": 500 }, { "epoch": 0.01, "eval_loss": 2.9435229301452637, "eval_runtime": 132.4889, "eval_samples_per_second": 27.232, "eval_steps_per_second": 3.404, "eval_wer": 1.0, "step": 500 }, { "epoch": 0.01, "learning_rate": 5.05e-05, "loss": 2.9855, "step": 510 }, { "epoch": 0.01, "learning_rate": 5.1500000000000005e-05, "loss": 2.9853, "step": 520 }, { "epoch": 0.01, "learning_rate": 5.25e-05, "loss": 2.9712, "step": 530 }, { "epoch": 0.01, "learning_rate": 5.3500000000000006e-05, "loss": 2.9441, "step": 540 }, { "epoch": 0.01, "learning_rate": 5.45e-05, "loss": 2.9308, "step": 550 }, { "epoch": 0.01, "learning_rate": 5.550000000000001e-05, "loss": 2.8991, "step": 560 }, { "epoch": 0.01, "learning_rate": 5.65e-05, "loss": 2.889, "step": 570 }, { "epoch": 0.01, "learning_rate": 5.7499999999999995e-05, "loss": 2.895, "step": 580 }, { "epoch": 0.01, "learning_rate": 5.85e-05, "loss": 2.885, "step": 590 }, { "epoch": 0.01, "learning_rate": 5.95e-05, "loss": 2.8786, "step": 600 }, { "epoch": 0.01, "learning_rate": 6.05e-05, "loss": 2.8689, "step": 610 }, { "epoch": 0.01, "learning_rate": 6.15e-05, "loss": 2.8977, "step": 620 }, { "epoch": 0.01, "learning_rate": 6.25e-05, "loss": 2.895, "step": 630 }, { "epoch": 0.01, "learning_rate": 6.35e-05, "loss": 2.9192, "step": 640 }, { "epoch": 0.01, "learning_rate": 6.450000000000001e-05, "loss": 2.8868, "step": 650 }, { "epoch": 0.01, "learning_rate": 6.55e-05, "loss": 2.8669, "step": 660 }, { "epoch": 0.01, "learning_rate": 6.65e-05, "loss": 2.8769, "step": 670 }, { "epoch": 0.01, "learning_rate": 6.750000000000001e-05, "loss": 2.8739, "step": 680 }, { "epoch": 0.01, "learning_rate": 6.850000000000001e-05, "loss": 2.8588, "step": 690 }, { "epoch": 0.01, "learning_rate": 6.95e-05, "loss": 2.8773, "step": 700 }, { "epoch": 0.01, "learning_rate": 7.05e-05, "loss": 2.8926, "step": 710 }, { "epoch": 0.01, "learning_rate": 7.15e-05, "loss": 2.8817, "step": 720 }, { "epoch": 0.01, "learning_rate": 7.25e-05, "loss": 2.8898, "step": 730 }, { "epoch": 0.01, "learning_rate": 7.35e-05, "loss": 2.8643, "step": 740 }, { "epoch": 0.01, "learning_rate": 7.450000000000001e-05, "loss": 2.8421, "step": 750 }, { "epoch": 0.01, "learning_rate": 7.55e-05, "loss": 2.8708, "step": 760 }, { "epoch": 0.01, "learning_rate": 7.65e-05, "loss": 2.8801, "step": 770 }, { "epoch": 0.01, "learning_rate": 7.75e-05, "loss": 2.8684, "step": 780 }, { "epoch": 0.01, "learning_rate": 7.850000000000001e-05, "loss": 2.895, "step": 790 }, { "epoch": 0.01, "learning_rate": 7.950000000000001e-05, "loss": 2.8718, "step": 800 }, { "epoch": 0.01, "learning_rate": 8.05e-05, "loss": 2.8518, "step": 810 }, { "epoch": 0.01, "learning_rate": 8.15e-05, "loss": 2.8382, "step": 820 }, { "epoch": 0.01, "learning_rate": 8.25e-05, "loss": 2.8486, "step": 830 }, { "epoch": 0.01, "learning_rate": 8.35e-05, "loss": 2.8428, "step": 840 }, { "epoch": 0.01, "learning_rate": 8.450000000000001e-05, "loss": 2.8661, "step": 850 }, { "epoch": 0.01, "learning_rate": 8.55e-05, "loss": 2.891, "step": 860 }, { "epoch": 0.01, "learning_rate": 8.65e-05, "loss": 2.8411, "step": 870 }, { "epoch": 0.01, "learning_rate": 8.75e-05, "loss": 2.8477, "step": 880 }, { "epoch": 0.01, "learning_rate": 8.850000000000001e-05, "loss": 2.8434, "step": 890 }, { "epoch": 0.01, "learning_rate": 8.950000000000001e-05, "loss": 2.8309, "step": 900 }, { "epoch": 0.01, "learning_rate": 9.05e-05, "loss": 2.9248, "step": 910 }, { "epoch": 0.01, "learning_rate": 9.15e-05, "loss": 2.88, "step": 920 }, { "epoch": 0.01, "learning_rate": 9.250000000000001e-05, "loss": 2.8496, "step": 930 }, { "epoch": 0.01, "learning_rate": 9.350000000000001e-05, "loss": 2.9916, "step": 940 }, { "epoch": 0.01, "learning_rate": 9.449999999999999e-05, "loss": 3.3497, "step": 950 }, { "epoch": 0.01, "learning_rate": 9.55e-05, "loss": 3.1128, "step": 960 }, { "epoch": 0.01, "learning_rate": 9.65e-05, "loss": 3.0954, "step": 970 }, { "epoch": 0.01, "learning_rate": 9.75e-05, "loss": 2.9393, "step": 980 }, { "epoch": 0.01, "learning_rate": 9.850000000000001e-05, "loss": 2.9254, "step": 990 }, { "epoch": 0.01, "learning_rate": 9.95e-05, "loss": 2.9653, "step": 1000 }, { "epoch": 0.01, "eval_loss": 2.8854753971099854, "eval_runtime": 130.8403, "eval_samples_per_second": 27.576, "eval_steps_per_second": 3.447, "eval_wer": 1.0, "step": 1000 }, { "epoch": 0.01, "learning_rate": 9.999324324324325e-05, "loss": 2.981, "step": 1010 }, { "epoch": 0.01, "learning_rate": 9.997972972972973e-05, "loss": 2.934, "step": 1020 }, { "epoch": 1.0, "learning_rate": 9.996621621621622e-05, "loss": 2.981, "step": 1030 }, { "epoch": 1.0, "learning_rate": 9.99527027027027e-05, "loss": 2.869, "step": 1040 }, { "epoch": 1.0, "learning_rate": 9.99391891891892e-05, "loss": 2.8468, "step": 1050 }, { "epoch": 1.0, "learning_rate": 9.992567567567568e-05, "loss": 2.8198, "step": 1060 }, { "epoch": 1.0, "learning_rate": 9.991216216216217e-05, "loss": 2.8201, "step": 1070 }, { "epoch": 1.0, "learning_rate": 9.989864864864865e-05, "loss": 2.7722, "step": 1080 }, { "epoch": 1.0, "learning_rate": 9.988513513513515e-05, "loss": 2.8039, "step": 1090 }, { "epoch": 1.0, "learning_rate": 9.987162162162163e-05, "loss": 2.6876, "step": 1100 }, { "epoch": 1.0, "learning_rate": 9.985810810810812e-05, "loss": 2.6774, "step": 1110 }, { "epoch": 1.0, "learning_rate": 9.98445945945946e-05, "loss": 2.5588, "step": 1120 }, { "epoch": 1.0, "learning_rate": 9.983108108108109e-05, "loss": 2.4457, "step": 1130 }, { "epoch": 1.0, "learning_rate": 9.981756756756757e-05, "loss": 2.4035, "step": 1140 }, { "epoch": 1.0, "learning_rate": 9.980405405405406e-05, "loss": 2.3212, "step": 1150 }, { "epoch": 1.0, "learning_rate": 9.979054054054054e-05, "loss": 1.9928, "step": 1160 }, { "epoch": 1.0, "learning_rate": 9.977702702702704e-05, "loss": 1.8027, "step": 1170 }, { "epoch": 1.0, "learning_rate": 9.976351351351352e-05, "loss": 1.5632, "step": 1180 }, { "epoch": 1.0, "learning_rate": 9.975000000000001e-05, "loss": 2.5438, "step": 1190 }, { "epoch": 1.0, "learning_rate": 9.97364864864865e-05, "loss": 2.4939, "step": 1200 }, { "epoch": 1.0, "learning_rate": 9.972297297297297e-05, "loss": 3.0732, "step": 1210 }, { "epoch": 1.0, "learning_rate": 9.970945945945947e-05, "loss": 3.0607, "step": 1220 }, { "epoch": 1.0, "learning_rate": 9.969594594594595e-05, "loss": 2.9608, "step": 1230 }, { "epoch": 1.0, "learning_rate": 9.968243243243243e-05, "loss": 3.4062, "step": 1240 }, { "epoch": 1.0, "learning_rate": 9.966891891891891e-05, "loss": 3.2387, "step": 1250 }, { "epoch": 1.0, "learning_rate": 9.96554054054054e-05, "loss": 3.2496, "step": 1260 }, { "epoch": 1.0, "learning_rate": 9.964189189189189e-05, "loss": 3.7039, "step": 1270 }, { "epoch": 1.0, "learning_rate": 9.962837837837838e-05, "loss": 1.7503, "step": 1280 }, { "epoch": 1.0, "learning_rate": 9.961486486486486e-05, "loss": 1.6555, "step": 1290 }, { "epoch": 1.0, "learning_rate": 9.960135135135136e-05, "loss": 1.4705, "step": 1300 }, { "epoch": 1.0, "learning_rate": 9.958783783783784e-05, "loss": 1.7588, "step": 1310 }, { "epoch": 1.0, "learning_rate": 9.957432432432433e-05, "loss": 1.6669, "step": 1320 }, { "epoch": 1.0, "learning_rate": 9.956081081081081e-05, "loss": 1.5781, "step": 1330 }, { "epoch": 1.0, "learning_rate": 9.954729729729731e-05, "loss": 1.3074, "step": 1340 }, { "epoch": 1.0, "learning_rate": 9.953378378378379e-05, "loss": 1.2246, "step": 1350 }, { "epoch": 1.0, "learning_rate": 9.952027027027027e-05, "loss": 1.3054, "step": 1360 }, { "epoch": 1.0, "learning_rate": 9.950675675675675e-05, "loss": 1.367, "step": 1370 }, { "epoch": 1.0, "learning_rate": 9.949324324324325e-05, "loss": 1.3456, "step": 1380 }, { "epoch": 1.0, "learning_rate": 9.947972972972973e-05, "loss": 1.2367, "step": 1390 }, { "epoch": 1.01, "learning_rate": 9.946621621621622e-05, "loss": 1.0744, "step": 1400 }, { "epoch": 1.01, "learning_rate": 9.94527027027027e-05, "loss": 0.8936, "step": 1410 }, { "epoch": 1.01, "learning_rate": 9.94391891891892e-05, "loss": 0.849, "step": 1420 }, { "epoch": 1.01, "learning_rate": 9.942567567567568e-05, "loss": 1.1023, "step": 1430 }, { "epoch": 1.01, "learning_rate": 9.941216216216217e-05, "loss": 0.8972, "step": 1440 }, { "epoch": 1.01, "learning_rate": 9.939864864864865e-05, "loss": 0.9644, "step": 1450 }, { "epoch": 1.01, "learning_rate": 9.938513513513515e-05, "loss": 1.1211, "step": 1460 }, { "epoch": 1.01, "learning_rate": 9.937162162162163e-05, "loss": 1.1737, "step": 1470 }, { "epoch": 1.01, "learning_rate": 9.935810810810811e-05, "loss": 0.9672, "step": 1480 }, { "epoch": 1.01, "learning_rate": 9.934459459459459e-05, "loss": 1.3306, "step": 1490 }, { "epoch": 1.01, "learning_rate": 9.933108108108109e-05, "loss": 1.2461, "step": 1500 }, { "epoch": 1.01, "eval_loss": 0.6979973912239075, "eval_runtime": 131.1426, "eval_samples_per_second": 27.512, "eval_steps_per_second": 3.439, "eval_wer": 0.6363043376974328, "step": 1500 }, { "epoch": 1.01, "learning_rate": 9.931756756756757e-05, "loss": 1.3426, "step": 1510 }, { "epoch": 1.01, "learning_rate": 9.930405405405406e-05, "loss": 1.2723, "step": 1520 }, { "epoch": 1.01, "learning_rate": 9.929054054054054e-05, "loss": 1.0486, "step": 1530 }, { "epoch": 1.01, "learning_rate": 9.927702702702704e-05, "loss": 1.4819, "step": 1540 }, { "epoch": 1.01, "learning_rate": 9.926351351351352e-05, "loss": 1.5356, "step": 1550 }, { "epoch": 1.01, "learning_rate": 9.925000000000001e-05, "loss": 1.2206, "step": 1560 }, { "epoch": 1.01, "learning_rate": 9.92364864864865e-05, "loss": 0.7306, "step": 1570 }, { "epoch": 1.01, "learning_rate": 9.922297297297299e-05, "loss": 0.984, "step": 1580 }, { "epoch": 1.01, "learning_rate": 9.920945945945947e-05, "loss": 0.9026, "step": 1590 }, { "epoch": 1.01, "learning_rate": 9.919594594594595e-05, "loss": 0.7881, "step": 1600 }, { "epoch": 1.01, "learning_rate": 9.918243243243243e-05, "loss": 0.7499, "step": 1610 }, { "epoch": 1.01, "learning_rate": 9.916891891891891e-05, "loss": 0.7193, "step": 1620 }, { "epoch": 1.01, "learning_rate": 9.915540540540541e-05, "loss": 0.696, "step": 1630 }, { "epoch": 1.01, "learning_rate": 9.914189189189189e-05, "loss": 1.0071, "step": 1640 }, { "epoch": 1.01, "learning_rate": 9.912837837837838e-05, "loss": 1.0987, "step": 1650 }, { "epoch": 1.01, "learning_rate": 9.911486486486486e-05, "loss": 1.1242, "step": 1660 }, { "epoch": 1.01, "learning_rate": 9.910135135135136e-05, "loss": 1.0103, "step": 1670 }, { "epoch": 1.01, "learning_rate": 9.908783783783784e-05, "loss": 1.23, "step": 1680 }, { "epoch": 1.01, "learning_rate": 9.907432432432433e-05, "loss": 1.3467, "step": 1690 }, { "epoch": 1.01, "learning_rate": 9.906081081081082e-05, "loss": 0.885, "step": 1700 }, { "epoch": 1.01, "learning_rate": 9.90472972972973e-05, "loss": 0.8155, "step": 1710 }, { "epoch": 1.01, "learning_rate": 9.903378378378378e-05, "loss": 0.9426, "step": 1720 }, { "epoch": 1.01, "learning_rate": 9.902027027027027e-05, "loss": 1.0731, "step": 1730 }, { "epoch": 1.01, "learning_rate": 9.900675675675675e-05, "loss": 1.1934, "step": 1740 }, { "epoch": 1.01, "learning_rate": 9.899324324324325e-05, "loss": 0.9935, "step": 1750 }, { "epoch": 1.01, "learning_rate": 9.897972972972973e-05, "loss": 0.9233, "step": 1760 }, { "epoch": 1.01, "learning_rate": 9.896621621621622e-05, "loss": 0.9416, "step": 1770 }, { "epoch": 1.01, "learning_rate": 9.89527027027027e-05, "loss": 0.783, "step": 1780 }, { "epoch": 1.01, "learning_rate": 9.89391891891892e-05, "loss": 0.8706, "step": 1790 }, { "epoch": 1.01, "learning_rate": 9.892567567567568e-05, "loss": 0.5307, "step": 1800 }, { "epoch": 1.01, "learning_rate": 9.891216216216217e-05, "loss": 0.8379, "step": 1810 }, { "epoch": 1.01, "learning_rate": 9.889864864864866e-05, "loss": 1.0918, "step": 1820 }, { "epoch": 1.01, "learning_rate": 9.888513513513514e-05, "loss": 1.3653, "step": 1830 }, { "epoch": 1.01, "learning_rate": 9.887162162162162e-05, "loss": 0.6974, "step": 1840 }, { "epoch": 1.01, "learning_rate": 9.885810810810811e-05, "loss": 0.7898, "step": 1850 }, { "epoch": 1.01, "learning_rate": 9.88445945945946e-05, "loss": 0.858, "step": 1860 }, { "epoch": 1.01, "learning_rate": 9.883108108108109e-05, "loss": 0.9756, "step": 1870 }, { "epoch": 1.01, "learning_rate": 9.881756756756757e-05, "loss": 0.9081, "step": 1880 }, { "epoch": 1.01, "learning_rate": 9.880405405405406e-05, "loss": 1.1205, "step": 1890 }, { "epoch": 1.01, "learning_rate": 9.879054054054054e-05, "loss": 0.795, "step": 1900 }, { "epoch": 1.01, "learning_rate": 9.877702702702704e-05, "loss": 0.7786, "step": 1910 }, { "epoch": 1.01, "learning_rate": 9.876351351351352e-05, "loss": 0.8629, "step": 1920 }, { "epoch": 1.01, "learning_rate": 9.875000000000002e-05, "loss": 1.0116, "step": 1930 }, { "epoch": 1.01, "learning_rate": 9.87364864864865e-05, "loss": 1.1012, "step": 1940 }, { "epoch": 1.01, "learning_rate": 9.872297297297298e-05, "loss": 1.2204, "step": 1950 }, { "epoch": 1.01, "learning_rate": 9.870945945945946e-05, "loss": 1.1798, "step": 1960 }, { "epoch": 1.01, "learning_rate": 9.869594594594595e-05, "loss": 1.5934, "step": 1970 }, { "epoch": 1.01, "learning_rate": 9.868243243243243e-05, "loss": 1.4101, "step": 1980 }, { "epoch": 1.01, "learning_rate": 9.866891891891893e-05, "loss": 1.5677, "step": 1990 }, { "epoch": 1.01, "learning_rate": 9.865540540540541e-05, "loss": 1.3429, "step": 2000 }, { "epoch": 1.01, "eval_loss": 0.4242011606693268, "eval_runtime": 129.994, "eval_samples_per_second": 27.755, "eval_steps_per_second": 3.469, "eval_wer": 0.4358197828821693, "step": 2000 }, { "epoch": 1.01, "learning_rate": 9.86418918918919e-05, "loss": 1.1514, "step": 2010 }, { "epoch": 1.01, "learning_rate": 9.862837837837838e-05, "loss": 1.089, "step": 2020 }, { "epoch": 1.01, "learning_rate": 9.861486486486487e-05, "loss": 1.1957, "step": 2030 }, { "epoch": 1.01, "learning_rate": 9.860135135135136e-05, "loss": 1.0991, "step": 2040 }, { "epoch": 2.0, "learning_rate": 9.858783783783784e-05, "loss": 1.314, "step": 2050 }, { "epoch": 2.0, "learning_rate": 9.857432432432434e-05, "loss": 1.0875, "step": 2060 }, { "epoch": 2.0, "learning_rate": 9.856081081081082e-05, "loss": 1.022, "step": 2070 }, { "epoch": 2.0, "learning_rate": 9.85472972972973e-05, "loss": 0.9634, "step": 2080 }, { "epoch": 2.0, "learning_rate": 9.853378378378378e-05, "loss": 0.9339, "step": 2090 }, { "epoch": 2.0, "learning_rate": 9.852027027027027e-05, "loss": 0.9281, "step": 2100 }, { "epoch": 2.0, "learning_rate": 9.850675675675675e-05, "loss": 1.1117, "step": 2110 }, { "epoch": 2.0, "learning_rate": 9.849324324324325e-05, "loss": 1.0056, "step": 2120 }, { "epoch": 2.0, "learning_rate": 9.847972972972973e-05, "loss": 0.8432, "step": 2130 }, { "epoch": 2.0, "learning_rate": 9.846621621621623e-05, "loss": 0.9083, "step": 2140 }, { "epoch": 2.0, "learning_rate": 9.84527027027027e-05, "loss": 0.9065, "step": 2150 }, { "epoch": 2.0, "learning_rate": 9.84391891891892e-05, "loss": 0.8697, "step": 2160 }, { "epoch": 2.0, "learning_rate": 9.842567567567568e-05, "loss": 0.6629, "step": 2170 }, { "epoch": 2.0, "learning_rate": 9.841216216216216e-05, "loss": 0.5975, "step": 2180 }, { "epoch": 2.0, "learning_rate": 9.839864864864864e-05, "loss": 0.5513, "step": 2190 }, { "epoch": 2.0, "learning_rate": 9.838513513513514e-05, "loss": 0.5223, "step": 2200 }, { "epoch": 2.0, "learning_rate": 9.837162162162162e-05, "loss": 1.5895, "step": 2210 }, { "epoch": 2.0, "learning_rate": 9.835810810810811e-05, "loss": 1.5385, "step": 2220 }, { "epoch": 2.0, "learning_rate": 9.83445945945946e-05, "loss": 3.1014, "step": 2230 }, { "epoch": 2.0, "learning_rate": 9.833108108108109e-05, "loss": 2.9294, "step": 2240 }, { "epoch": 2.0, "learning_rate": 9.831756756756757e-05, "loss": 2.8178, "step": 2250 }, { "epoch": 2.0, "learning_rate": 9.830405405405407e-05, "loss": 2.8213, "step": 2260 }, { "epoch": 2.0, "learning_rate": 9.829054054054055e-05, "loss": 2.4418, "step": 2270 }, { "epoch": 2.0, "learning_rate": 9.827702702702704e-05, "loss": 2.3031, "step": 2280 }, { "epoch": 2.0, "learning_rate": 9.826351351351352e-05, "loss": 1.603, "step": 2290 }, { "epoch": 2.0, "learning_rate": 9.825e-05, "loss": 0.7931, "step": 2300 }, { "epoch": 2.0, "learning_rate": 9.823648648648648e-05, "loss": 0.4881, "step": 2310 }, { "epoch": 2.0, "learning_rate": 9.822297297297298e-05, "loss": 0.726, "step": 2320 }, { "epoch": 2.0, "learning_rate": 9.820945945945946e-05, "loss": 0.837, "step": 2330 }, { "epoch": 2.0, "learning_rate": 9.819594594594595e-05, "loss": 0.8695, "step": 2340 }, { "epoch": 2.0, "learning_rate": 9.818243243243244e-05, "loss": 0.8938, "step": 2350 }, { "epoch": 2.0, "learning_rate": 9.816891891891893e-05, "loss": 0.7126, "step": 2360 }, { "epoch": 2.0, "learning_rate": 9.815540540540541e-05, "loss": 0.4902, "step": 2370 }, { "epoch": 2.0, "learning_rate": 9.81418918918919e-05, "loss": 0.7078, "step": 2380 }, { "epoch": 2.0, "learning_rate": 9.812837837837839e-05, "loss": 0.6085, "step": 2390 }, { "epoch": 2.0, "learning_rate": 9.811486486486488e-05, "loss": 0.7467, "step": 2400 }, { "epoch": 2.0, "learning_rate": 9.810135135135136e-05, "loss": 0.713, "step": 2410 }, { "epoch": 2.0, "learning_rate": 9.808783783783784e-05, "loss": 0.5773, "step": 2420 }, { "epoch": 2.01, "learning_rate": 9.807432432432432e-05, "loss": 0.4913, "step": 2430 }, { "epoch": 2.01, "learning_rate": 9.80608108108108e-05, "loss": 0.3871, "step": 2440 }, { "epoch": 2.01, "learning_rate": 9.80472972972973e-05, "loss": 0.5749, "step": 2450 }, { "epoch": 2.01, "learning_rate": 9.803378378378378e-05, "loss": 0.5486, "step": 2460 }, { "epoch": 2.01, "learning_rate": 9.802027027027028e-05, "loss": 0.5363, "step": 2470 }, { "epoch": 2.01, "learning_rate": 9.800675675675676e-05, "loss": 0.5494, "step": 2480 }, { "epoch": 2.01, "learning_rate": 9.799324324324325e-05, "loss": 0.8499, "step": 2490 }, { "epoch": 2.01, "learning_rate": 9.797972972972973e-05, "loss": 0.6022, "step": 2500 }, { "epoch": 2.01, "eval_loss": 0.2851092219352722, "eval_runtime": 130.4093, "eval_samples_per_second": 27.667, "eval_steps_per_second": 3.458, "eval_wer": 0.29646368168475984, "step": 2500 }, { "epoch": 2.01, "learning_rate": 9.796621621621623e-05, "loss": 0.7779, "step": 2510 }, { "epoch": 2.01, "learning_rate": 9.795270270270271e-05, "loss": 0.8424, "step": 2520 }, { "epoch": 2.01, "learning_rate": 9.79391891891892e-05, "loss": 0.8125, "step": 2530 }, { "epoch": 2.01, "learning_rate": 9.792567567567568e-05, "loss": 0.9425, "step": 2540 }, { "epoch": 2.01, "learning_rate": 9.791216216216216e-05, "loss": 0.7634, "step": 2550 }, { "epoch": 2.01, "learning_rate": 9.789864864864865e-05, "loss": 0.8989, "step": 2560 }, { "epoch": 2.01, "learning_rate": 9.788513513513514e-05, "loss": 1.2156, "step": 2570 }, { "epoch": 2.01, "learning_rate": 9.787162162162162e-05, "loss": 1.0036, "step": 2580 }, { "epoch": 2.01, "learning_rate": 9.785810810810812e-05, "loss": 0.4826, "step": 2590 }, { "epoch": 2.01, "learning_rate": 9.78445945945946e-05, "loss": 0.5392, "step": 2600 }, { "epoch": 2.01, "learning_rate": 9.783108108108109e-05, "loss": 0.5652, "step": 2610 }, { "epoch": 2.01, "learning_rate": 9.781756756756757e-05, "loss": 0.5725, "step": 2620 }, { "epoch": 2.01, "learning_rate": 9.780405405405407e-05, "loss": 0.5181, "step": 2630 }, { "epoch": 2.01, "learning_rate": 9.779054054054055e-05, "loss": 0.4747, "step": 2640 }, { "epoch": 2.01, "learning_rate": 9.777702702702703e-05, "loss": 0.4435, "step": 2650 }, { "epoch": 2.01, "learning_rate": 9.776351351351351e-05, "loss": 0.5251, "step": 2660 }, { "epoch": 2.01, "learning_rate": 9.775e-05, "loss": 0.9123, "step": 2670 }, { "epoch": 2.01, "learning_rate": 9.773648648648649e-05, "loss": 0.7849, "step": 2680 }, { "epoch": 2.01, "learning_rate": 9.772297297297298e-05, "loss": 0.7774, "step": 2690 }, { "epoch": 2.01, "learning_rate": 9.770945945945946e-05, "loss": 0.8067, "step": 2700 }, { "epoch": 2.01, "learning_rate": 9.769594594594596e-05, "loss": 1.1449, "step": 2710 }, { "epoch": 2.01, "learning_rate": 9.768243243243244e-05, "loss": 0.648, "step": 2720 }, { "epoch": 2.01, "learning_rate": 9.766891891891893e-05, "loss": 0.6251, "step": 2730 }, { "epoch": 2.01, "learning_rate": 9.765540540540541e-05, "loss": 0.7056, "step": 2740 }, { "epoch": 2.01, "learning_rate": 9.76418918918919e-05, "loss": 0.8207, "step": 2750 }, { "epoch": 2.01, "learning_rate": 9.762837837837839e-05, "loss": 0.7726, "step": 2760 }, { "epoch": 2.01, "learning_rate": 9.761486486486487e-05, "loss": 0.7331, "step": 2770 }, { "epoch": 2.01, "learning_rate": 9.760135135135135e-05, "loss": 0.6371, "step": 2780 }, { "epoch": 2.01, "learning_rate": 9.758783783783784e-05, "loss": 0.7216, "step": 2790 }, { "epoch": 2.01, "learning_rate": 9.757432432432433e-05, "loss": 0.5996, "step": 2800 }, { "epoch": 2.01, "learning_rate": 9.756081081081082e-05, "loss": 0.6228, "step": 2810 }, { "epoch": 2.01, "learning_rate": 9.75472972972973e-05, "loss": 0.4125, "step": 2820 }, { "epoch": 2.01, "learning_rate": 9.753378378378378e-05, "loss": 0.4194, "step": 2830 }, { "epoch": 2.01, "learning_rate": 9.752027027027028e-05, "loss": 0.7482, "step": 2840 }, { "epoch": 2.01, "learning_rate": 9.750675675675676e-05, "loss": 1.3029, "step": 2850 }, { "epoch": 2.01, "learning_rate": 9.749324324324325e-05, "loss": 0.5155, "step": 2860 }, { "epoch": 2.01, "learning_rate": 9.747972972972973e-05, "loss": 0.505, "step": 2870 }, { "epoch": 2.01, "learning_rate": 9.746621621621623e-05, "loss": 0.6677, "step": 2880 }, { "epoch": 2.01, "learning_rate": 9.745270270270271e-05, "loss": 0.6703, "step": 2890 }, { "epoch": 2.01, "learning_rate": 9.743918918918919e-05, "loss": 0.6367, "step": 2900 }, { "epoch": 2.01, "learning_rate": 9.742567567567567e-05, "loss": 0.7566, "step": 2910 }, { "epoch": 2.01, "learning_rate": 9.741216216216217e-05, "loss": 0.7535, "step": 2920 }, { "epoch": 2.01, "learning_rate": 9.739864864864865e-05, "loss": 0.5089, "step": 2930 }, { "epoch": 2.01, "learning_rate": 9.738513513513514e-05, "loss": 0.6852, "step": 2940 }, { "epoch": 2.01, "learning_rate": 9.737162162162162e-05, "loss": 0.7436, "step": 2950 }, { "epoch": 2.01, "learning_rate": 9.735810810810812e-05, "loss": 0.8595, "step": 2960 }, { "epoch": 2.01, "learning_rate": 9.73445945945946e-05, "loss": 0.9633, "step": 2970 }, { "epoch": 2.01, "learning_rate": 9.733108108108109e-05, "loss": 0.8152, "step": 2980 }, { "epoch": 2.01, "learning_rate": 9.731756756756757e-05, "loss": 1.4212, "step": 2990 }, { "epoch": 2.01, "learning_rate": 9.730405405405407e-05, "loss": 1.122, "step": 3000 }, { "epoch": 2.01, "eval_loss": 0.28004416823387146, "eval_runtime": 131.1266, "eval_samples_per_second": 27.515, "eval_steps_per_second": 3.439, "eval_wer": 0.2964170898755999, "step": 3000 }, { "epoch": 2.01, "learning_rate": 9.729054054054055e-05, "loss": 1.2432, "step": 3010 }, { "epoch": 2.01, "learning_rate": 9.727702702702703e-05, "loss": 1.1417, "step": 3020 }, { "epoch": 2.01, "learning_rate": 9.726351351351351e-05, "loss": 0.9486, "step": 3030 }, { "epoch": 2.01, "learning_rate": 9.725e-05, "loss": 0.9525, "step": 3040 }, { "epoch": 2.01, "learning_rate": 9.723648648648649e-05, "loss": 0.9115, "step": 3050 }, { "epoch": 2.01, "learning_rate": 9.722297297297298e-05, "loss": 0.9061, "step": 3060 }, { "epoch": 3.0, "learning_rate": 9.720945945945946e-05, "loss": 1.2054, "step": 3070 }, { "epoch": 3.0, "learning_rate": 9.719594594594596e-05, "loss": 0.9302, "step": 3080 }, { "epoch": 3.0, "learning_rate": 9.718243243243244e-05, "loss": 0.8261, "step": 3090 }, { "epoch": 3.0, "learning_rate": 9.716891891891893e-05, "loss": 0.8536, "step": 3100 }, { "epoch": 3.0, "learning_rate": 9.715540540540541e-05, "loss": 0.7331, "step": 3110 }, { "epoch": 3.0, "learning_rate": 9.71418918918919e-05, "loss": 0.7779, "step": 3120 }, { "epoch": 3.0, "learning_rate": 9.712837837837838e-05, "loss": 0.8313, "step": 3130 }, { "epoch": 3.0, "learning_rate": 9.711486486486487e-05, "loss": 0.9463, "step": 3140 }, { "epoch": 3.0, "learning_rate": 9.710135135135135e-05, "loss": 0.7132, "step": 3150 }, { "epoch": 3.0, "learning_rate": 9.708783783783785e-05, "loss": 0.7794, "step": 3160 }, { "epoch": 3.0, "learning_rate": 9.707432432432433e-05, "loss": 0.76, "step": 3170 }, { "epoch": 3.0, "learning_rate": 9.706081081081082e-05, "loss": 0.6919, "step": 3180 }, { "epoch": 3.0, "learning_rate": 9.70472972972973e-05, "loss": 0.6651, "step": 3190 }, { "epoch": 3.0, "learning_rate": 9.70337837837838e-05, "loss": 0.5285, "step": 3200 }, { "epoch": 3.0, "learning_rate": 9.702027027027028e-05, "loss": 0.487, "step": 3210 }, { "epoch": 3.0, "learning_rate": 9.700675675675676e-05, "loss": 0.4728, "step": 3220 }, { "epoch": 3.0, "learning_rate": 9.699324324324325e-05, "loss": 1.0522, "step": 3230 }, { "epoch": 3.0, "learning_rate": 9.697972972972973e-05, "loss": 1.6241, "step": 3240 }, { "epoch": 3.0, "learning_rate": 9.696621621621622e-05, "loss": 2.5393, "step": 3250 }, { "epoch": 3.0, "learning_rate": 9.69527027027027e-05, "loss": 2.7714, "step": 3260 }, { "epoch": 3.0, "learning_rate": 9.693918918918919e-05, "loss": 2.7379, "step": 3270 }, { "epoch": 3.0, "learning_rate": 9.692567567567567e-05, "loss": 2.7175, "step": 3280 }, { "epoch": 3.0, "learning_rate": 9.691216216216217e-05, "loss": 2.8519, "step": 3290 }, { "epoch": 3.0, "learning_rate": 9.689864864864865e-05, "loss": 2.0362, "step": 3300 }, { "epoch": 3.0, "learning_rate": 9.688513513513514e-05, "loss": 1.632, "step": 3310 }, { "epoch": 3.0, "learning_rate": 9.687162162162162e-05, "loss": 0.8863, "step": 3320 }, { "epoch": 3.0, "learning_rate": 9.685810810810812e-05, "loss": 0.3847, "step": 3330 }, { "epoch": 3.0, "learning_rate": 9.68445945945946e-05, "loss": 0.5786, "step": 3340 }, { "epoch": 3.0, "learning_rate": 9.68310810810811e-05, "loss": 0.5712, "step": 3350 }, { "epoch": 3.0, "learning_rate": 9.681756756756757e-05, "loss": 0.6195, "step": 3360 }, { "epoch": 3.0, "learning_rate": 9.680405405405406e-05, "loss": 0.8676, "step": 3370 }, { "epoch": 3.0, "learning_rate": 9.679054054054054e-05, "loss": 0.6014, "step": 3380 }, { "epoch": 3.0, "learning_rate": 9.677702702702703e-05, "loss": 0.3997, "step": 3390 }, { "epoch": 3.0, "learning_rate": 9.676351351351351e-05, "loss": 0.5864, "step": 3400 }, { "epoch": 3.0, "learning_rate": 9.675000000000001e-05, "loss": 0.4978, "step": 3410 }, { "epoch": 3.0, "learning_rate": 9.673648648648649e-05, "loss": 0.6212, "step": 3420 }, { "epoch": 3.0, "learning_rate": 9.672297297297298e-05, "loss": 0.6282, "step": 3430 }, { "epoch": 3.0, "learning_rate": 9.670945945945946e-05, "loss": 0.4602, "step": 3440 }, { "epoch": 3.01, "learning_rate": 9.669594594594596e-05, "loss": 0.4737, "step": 3450 }, { "epoch": 3.01, "learning_rate": 9.668243243243244e-05, "loss": 0.2953, "step": 3460 }, { "epoch": 3.01, "learning_rate": 9.666891891891892e-05, "loss": 0.4169, "step": 3470 }, { "epoch": 3.01, "learning_rate": 9.66554054054054e-05, "loss": 0.4744, "step": 3480 }, { "epoch": 3.01, "learning_rate": 9.66418918918919e-05, "loss": 0.3556, "step": 3490 }, { "epoch": 3.01, "learning_rate": 9.662837837837838e-05, "loss": 0.5454, "step": 3500 }, { "epoch": 3.01, "eval_loss": 0.22373759746551514, "eval_runtime": 128.9953, "eval_samples_per_second": 27.97, "eval_steps_per_second": 3.496, "eval_wer": 0.23309882122722825, "step": 3500 }, { "epoch": 3.01, "learning_rate": 9.661486486486487e-05, "loss": 0.7028, "step": 3510 }, { "epoch": 3.01, "learning_rate": 9.660135135135135e-05, "loss": 0.612, "step": 3520 }, { "epoch": 3.01, "learning_rate": 9.658783783783785e-05, "loss": 0.5407, "step": 3530 }, { "epoch": 3.01, "learning_rate": 9.657432432432433e-05, "loss": 0.7179, "step": 3540 }, { "epoch": 3.01, "learning_rate": 9.656081081081082e-05, "loss": 0.6747, "step": 3550 }, { "epoch": 3.01, "learning_rate": 9.65472972972973e-05, "loss": 0.8762, "step": 3560 }, { "epoch": 3.01, "learning_rate": 9.65337837837838e-05, "loss": 0.707, "step": 3570 }, { "epoch": 3.01, "learning_rate": 9.652027027027028e-05, "loss": 0.5785, "step": 3580 }, { "epoch": 3.01, "learning_rate": 9.650675675675676e-05, "loss": 1.1534, "step": 3590 }, { "epoch": 3.01, "learning_rate": 9.649324324324324e-05, "loss": 0.9941, "step": 3600 }, { "epoch": 3.01, "learning_rate": 9.647972972972974e-05, "loss": 0.5391, "step": 3610 }, { "epoch": 3.01, "learning_rate": 9.646621621621622e-05, "loss": 0.3983, "step": 3620 }, { "epoch": 3.01, "learning_rate": 9.64527027027027e-05, "loss": 0.5865, "step": 3630 }, { "epoch": 3.01, "learning_rate": 9.643918918918919e-05, "loss": 0.4461, "step": 3640 }, { "epoch": 3.01, "learning_rate": 9.642567567567567e-05, "loss": 0.4761, "step": 3650 }, { "epoch": 3.01, "learning_rate": 9.641216216216217e-05, "loss": 0.3955, "step": 3660 }, { "epoch": 3.01, "learning_rate": 9.639864864864865e-05, "loss": 0.3828, "step": 3670 }, { "epoch": 3.01, "learning_rate": 9.638513513513514e-05, "loss": 0.4001, "step": 3680 }, { "epoch": 3.01, "learning_rate": 9.637162162162163e-05, "loss": 0.7754, "step": 3690 }, { "epoch": 3.01, "learning_rate": 9.635810810810812e-05, "loss": 0.7455, "step": 3700 }, { "epoch": 3.01, "learning_rate": 9.63445945945946e-05, "loss": 0.656, "step": 3710 }, { "epoch": 3.01, "learning_rate": 9.633108108108108e-05, "loss": 0.6787, "step": 3720 }, { "epoch": 3.01, "learning_rate": 9.631756756756756e-05, "loss": 0.8513, "step": 3730 }, { "epoch": 3.01, "learning_rate": 9.630405405405406e-05, "loss": 0.7474, "step": 3740 }, { "epoch": 3.01, "learning_rate": 9.629054054054054e-05, "loss": 0.5131, "step": 3750 }, { "epoch": 3.01, "learning_rate": 9.627702702702703e-05, "loss": 0.5464, "step": 3760 }, { "epoch": 3.01, "learning_rate": 9.626351351351351e-05, "loss": 0.6753, "step": 3770 }, { "epoch": 3.01, "learning_rate": 9.625000000000001e-05, "loss": 0.8355, "step": 3780 }, { "epoch": 3.01, "learning_rate": 9.623648648648649e-05, "loss": 0.6334, "step": 3790 }, { "epoch": 3.01, "learning_rate": 9.622297297297298e-05, "loss": 0.5399, "step": 3800 }, { "epoch": 3.01, "learning_rate": 9.620945945945947e-05, "loss": 0.7102, "step": 3810 }, { "epoch": 3.01, "learning_rate": 9.619594594594596e-05, "loss": 0.5091, "step": 3820 }, { "epoch": 3.01, "learning_rate": 9.618243243243244e-05, "loss": 0.4898, "step": 3830 }, { "epoch": 3.01, "learning_rate": 9.616891891891892e-05, "loss": 0.5353, "step": 3840 }, { "epoch": 3.01, "learning_rate": 9.61554054054054e-05, "loss": 0.3434, "step": 3850 }, { "epoch": 3.01, "learning_rate": 9.61418918918919e-05, "loss": 0.5737, "step": 3860 }, { "epoch": 3.01, "learning_rate": 9.612837837837838e-05, "loss": 1.0459, "step": 3870 }, { "epoch": 3.01, "learning_rate": 9.611486486486487e-05, "loss": 0.651, "step": 3880 }, { "epoch": 3.01, "learning_rate": 9.610135135135135e-05, "loss": 0.4436, "step": 3890 }, { "epoch": 3.01, "learning_rate": 9.608783783783785e-05, "loss": 0.5495, "step": 3900 }, { "epoch": 3.01, "learning_rate": 9.607432432432433e-05, "loss": 0.5305, "step": 3910 }, { "epoch": 3.01, "learning_rate": 9.606081081081082e-05, "loss": 0.5645, "step": 3920 }, { "epoch": 3.01, "learning_rate": 9.60472972972973e-05, "loss": 0.697, "step": 3930 }, { "epoch": 3.01, "learning_rate": 9.603378378378379e-05, "loss": 0.6943, "step": 3940 }, { "epoch": 3.01, "learning_rate": 9.602027027027027e-05, "loss": 0.4983, "step": 3950 }, { "epoch": 3.01, "learning_rate": 9.600675675675676e-05, "loss": 0.6126, "step": 3960 }, { "epoch": 3.01, "learning_rate": 9.599324324324324e-05, "loss": 0.5486, "step": 3970 }, { "epoch": 3.01, "learning_rate": 9.597972972972974e-05, "loss": 0.8222, "step": 3980 }, { "epoch": 3.01, "learning_rate": 9.596621621621622e-05, "loss": 0.8052, "step": 3990 }, { "epoch": 3.01, "learning_rate": 9.595270270270271e-05, "loss": 0.7553, "step": 4000 }, { "epoch": 3.01, "eval_loss": 0.21124105155467987, "eval_runtime": 130.2843, "eval_samples_per_second": 27.693, "eval_steps_per_second": 3.462, "eval_wer": 0.2271350696547547, "step": 4000 }, { "epoch": 3.01, "learning_rate": 9.59391891891892e-05, "loss": 1.0814, "step": 4010 }, { "epoch": 3.01, "learning_rate": 9.592567567567569e-05, "loss": 1.1397, "step": 4020 }, { "epoch": 3.01, "learning_rate": 9.591216216216217e-05, "loss": 1.048, "step": 4030 }, { "epoch": 3.01, "learning_rate": 9.589864864864865e-05, "loss": 1.1016, "step": 4040 }, { "epoch": 3.01, "learning_rate": 9.588513513513515e-05, "loss": 0.9376, "step": 4050 }, { "epoch": 3.01, "learning_rate": 9.587162162162163e-05, "loss": 0.8631, "step": 4060 }, { "epoch": 3.01, "learning_rate": 9.585810810810811e-05, "loss": 0.8159, "step": 4070 }, { "epoch": 3.01, "learning_rate": 9.584459459459459e-05, "loss": 0.816, "step": 4080 }, { "epoch": 3.01, "learning_rate": 9.583108108108108e-05, "loss": 1.024, "step": 4090 }, { "epoch": 4.0, "learning_rate": 9.581756756756756e-05, "loss": 0.966, "step": 4100 }, { "epoch": 4.0, "learning_rate": 9.580405405405406e-05, "loss": 0.7753, "step": 4110 }, { "epoch": 4.0, "learning_rate": 9.579054054054054e-05, "loss": 0.7794, "step": 4120 }, { "epoch": 4.0, "learning_rate": 9.577702702702703e-05, "loss": 0.7129, "step": 4130 }, { "epoch": 4.0, "learning_rate": 9.576351351351352e-05, "loss": 0.6968, "step": 4140 }, { "epoch": 4.0, "learning_rate": 9.575000000000001e-05, "loss": 0.7047, "step": 4150 }, { "epoch": 4.0, "learning_rate": 9.573648648648649e-05, "loss": 0.9375, "step": 4160 }, { "epoch": 4.0, "learning_rate": 9.572297297297299e-05, "loss": 0.6873, "step": 4170 }, { "epoch": 4.0, "learning_rate": 9.570945945945947e-05, "loss": 0.6741, "step": 4180 }, { "epoch": 4.0, "learning_rate": 9.569594594594595e-05, "loss": 0.6796, "step": 4190 }, { "epoch": 4.0, "learning_rate": 9.568243243243243e-05, "loss": 0.66, "step": 4200 }, { "epoch": 4.0, "learning_rate": 9.566891891891892e-05, "loss": 0.6426, "step": 4210 }, { "epoch": 4.0, "learning_rate": 9.56554054054054e-05, "loss": 0.4642, "step": 4220 }, { "epoch": 4.0, "learning_rate": 9.56418918918919e-05, "loss": 0.4183, "step": 4230 }, { "epoch": 4.0, "learning_rate": 9.562837837837838e-05, "loss": 0.4384, "step": 4240 }, { "epoch": 4.0, "learning_rate": 9.561486486486487e-05, "loss": 0.5375, "step": 4250 }, { "epoch": 4.0, "learning_rate": 9.560135135135136e-05, "loss": 1.7701, "step": 4260 }, { "epoch": 4.0, "learning_rate": 9.558783783783785e-05, "loss": 1.8313, "step": 4270 }, { "epoch": 4.0, "learning_rate": 9.557432432432433e-05, "loss": 2.768, "step": 4280 }, { "epoch": 4.0, "learning_rate": 9.556081081081083e-05, "loss": 2.6691, "step": 4290 }, { "epoch": 4.0, "learning_rate": 9.55472972972973e-05, "loss": 2.6992, "step": 4300 }, { "epoch": 4.0, "learning_rate": 9.553378378378379e-05, "loss": 2.5017, "step": 4310 }, { "epoch": 4.0, "learning_rate": 9.552027027027027e-05, "loss": 2.0609, "step": 4320 }, { "epoch": 4.0, "learning_rate": 9.550675675675676e-05, "loss": 2.0415, "step": 4330 }, { "epoch": 4.0, "learning_rate": 9.549324324324324e-05, "loss": 0.8992, "step": 4340 }, { "epoch": 4.0, "learning_rate": 9.547972972972974e-05, "loss": 0.3826, "step": 4350 }, { "epoch": 4.0, "learning_rate": 9.546621621621622e-05, "loss": 0.5578, "step": 4360 }, { "epoch": 4.0, "learning_rate": 9.545270270270271e-05, "loss": 0.4722, "step": 4370 }, { "epoch": 4.0, "learning_rate": 9.54391891891892e-05, "loss": 0.697, "step": 4380 }, { "epoch": 4.0, "learning_rate": 9.542567567567569e-05, "loss": 0.7186, "step": 4390 }, { "epoch": 4.0, "learning_rate": 9.541216216216217e-05, "loss": 0.7146, "step": 4400 }, { "epoch": 4.0, "learning_rate": 9.539864864864865e-05, "loss": 0.4081, "step": 4410 }, { "epoch": 4.0, "learning_rate": 9.538513513513513e-05, "loss": 0.4094, "step": 4420 }, { "epoch": 4.0, "learning_rate": 9.537162162162161e-05, "loss": 0.5002, "step": 4430 }, { "epoch": 4.0, "learning_rate": 9.535810810810811e-05, "loss": 0.5455, "step": 4440 }, { "epoch": 4.0, "learning_rate": 9.534459459459459e-05, "loss": 0.5295, "step": 4450 }, { "epoch": 4.0, "learning_rate": 9.533108108108108e-05, "loss": 0.4868, "step": 4460 }, { "epoch": 4.01, "learning_rate": 9.531756756756757e-05, "loss": 0.4415, "step": 4470 }, { "epoch": 4.01, "learning_rate": 9.530405405405406e-05, "loss": 0.3083, "step": 4480 }, { "epoch": 4.01, "learning_rate": 9.529054054054054e-05, "loss": 0.3284, "step": 4490 }, { "epoch": 4.01, "learning_rate": 9.527702702702704e-05, "loss": 0.4752, "step": 4500 }, { "epoch": 4.01, "eval_loss": 0.2037777453660965, "eval_runtime": 136.779, "eval_samples_per_second": 26.378, "eval_steps_per_second": 3.297, "eval_wer": 0.21921446209756326, "step": 4500 }, { "epoch": 4.01, "learning_rate": 9.526351351351352e-05, "loss": 0.333, "step": 4510 }, { "epoch": 4.01, "learning_rate": 9.525000000000001e-05, "loss": 0.455, "step": 4520 }, { "epoch": 4.01, "learning_rate": 9.523648648648649e-05, "loss": 0.5595, "step": 4530 }, { "epoch": 4.01, "learning_rate": 9.522297297297297e-05, "loss": 0.5317, "step": 4540 }, { "epoch": 4.01, "learning_rate": 9.520945945945945e-05, "loss": 0.4597, "step": 4550 }, { "epoch": 4.01, "learning_rate": 9.519594594594595e-05, "loss": 0.6914, "step": 4560 }, { "epoch": 4.01, "learning_rate": 9.518243243243243e-05, "loss": 0.6782, "step": 4570 }, { "epoch": 4.01, "learning_rate": 9.516891891891892e-05, "loss": 0.7018, "step": 4580 }, { "epoch": 4.01, "learning_rate": 9.51554054054054e-05, "loss": 0.7104, "step": 4590 }, { "epoch": 4.01, "learning_rate": 9.51418918918919e-05, "loss": 0.4397, "step": 4600 }, { "epoch": 4.01, "learning_rate": 9.512837837837838e-05, "loss": 0.8754, "step": 4610 }, { "epoch": 4.01, "learning_rate": 9.511486486486488e-05, "loss": 0.9121, "step": 4620 }, { "epoch": 4.01, "learning_rate": 9.510135135135136e-05, "loss": 0.6368, "step": 4630 }, { "epoch": 4.01, "learning_rate": 9.508783783783785e-05, "loss": 0.306, "step": 4640 }, { "epoch": 4.01, "learning_rate": 9.507432432432433e-05, "loss": 0.5111, "step": 4650 }, { "epoch": 4.01, "learning_rate": 9.506081081081081e-05, "loss": 0.4673, "step": 4660 }, { "epoch": 4.01, "learning_rate": 9.50472972972973e-05, "loss": 0.4565, "step": 4670 }, { "epoch": 4.01, "learning_rate": 9.503378378378379e-05, "loss": 0.3378, "step": 4680 }, { "epoch": 4.01, "learning_rate": 9.502027027027027e-05, "loss": 0.343, "step": 4690 }, { "epoch": 4.01, "learning_rate": 9.500675675675676e-05, "loss": 0.3447, "step": 4700 }, { "epoch": 4.01, "learning_rate": 9.499324324324325e-05, "loss": 0.647, "step": 4710 }, { "epoch": 4.01, "learning_rate": 9.497972972972974e-05, "loss": 0.718, "step": 4720 }, { "epoch": 4.01, "learning_rate": 9.496621621621622e-05, "loss": 0.677, "step": 4730 }, { "epoch": 4.01, "learning_rate": 9.495270270270272e-05, "loss": 0.5751, "step": 4740 }, { "epoch": 4.01, "learning_rate": 9.49391891891892e-05, "loss": 0.7532, "step": 4750 }, { "epoch": 4.01, "learning_rate": 9.492567567567569e-05, "loss": 0.7705, "step": 4760 }, { "epoch": 4.01, "learning_rate": 9.491216216216217e-05, "loss": 0.461, "step": 4770 }, { "epoch": 4.01, "learning_rate": 9.489864864864865e-05, "loss": 0.4818, "step": 4780 }, { "epoch": 4.01, "learning_rate": 9.488513513513513e-05, "loss": 0.5647, "step": 4790 }, { "epoch": 4.01, "learning_rate": 9.487162162162163e-05, "loss": 0.7138, "step": 4800 }, { "epoch": 4.01, "learning_rate": 9.485810810810811e-05, "loss": 0.7833, "step": 4810 }, { "epoch": 4.01, "learning_rate": 9.48445945945946e-05, "loss": 0.5336, "step": 4820 }, { "epoch": 4.01, "learning_rate": 9.483108108108109e-05, "loss": 0.558, "step": 4830 }, { "epoch": 4.01, "learning_rate": 9.481756756756757e-05, "loss": 0.446, "step": 4840 }, { "epoch": 4.01, "learning_rate": 9.480405405405406e-05, "loss": 0.4379, "step": 4850 }, { "epoch": 4.01, "learning_rate": 9.479054054054054e-05, "loss": 0.5588, "step": 4860 }, { "epoch": 4.01, "learning_rate": 9.477702702702704e-05, "loss": 0.2888, "step": 4870 }, { "epoch": 4.01, "learning_rate": 9.476351351351352e-05, "loss": 0.5464, "step": 4880 }, { "epoch": 4.01, "learning_rate": 9.475e-05, "loss": 0.7507, "step": 4890 }, { "epoch": 4.01, "learning_rate": 9.473648648648648e-05, "loss": 0.8171, "step": 4900 }, { "epoch": 4.01, "learning_rate": 9.472297297297297e-05, "loss": 0.4279, "step": 4910 }, { "epoch": 4.01, "learning_rate": 9.470945945945946e-05, "loss": 0.4815, "step": 4920 }, { "epoch": 4.01, "learning_rate": 9.469594594594595e-05, "loss": 0.5521, "step": 4930 }, { "epoch": 4.01, "learning_rate": 9.468243243243243e-05, "loss": 0.5152, "step": 4940 }, { "epoch": 4.01, "learning_rate": 9.466891891891893e-05, "loss": 0.6454, "step": 4950 }, { "epoch": 4.01, "learning_rate": 9.465540540540541e-05, "loss": 0.7156, "step": 4960 }, { "epoch": 4.01, "learning_rate": 9.46418918918919e-05, "loss": 0.4328, "step": 4970 }, { "epoch": 4.01, "learning_rate": 9.462837837837838e-05, "loss": 0.5576, "step": 4980 }, { "epoch": 4.01, "learning_rate": 9.461486486486488e-05, "loss": 0.5349, "step": 4990 }, { "epoch": 4.01, "learning_rate": 9.460135135135136e-05, "loss": 0.7205, "step": 5000 }, { "epoch": 4.01, "eval_loss": 0.18799734115600586, "eval_runtime": 133.9873, "eval_samples_per_second": 26.928, "eval_steps_per_second": 3.366, "eval_wer": 0.19671061827330755, "step": 5000 }, { "epoch": 4.01, "learning_rate": 9.458783783783784e-05, "loss": 0.721, "step": 5010 }, { "epoch": 4.01, "learning_rate": 9.457432432432432e-05, "loss": 0.7937, "step": 5020 }, { "epoch": 4.01, "learning_rate": 9.456081081081081e-05, "loss": 0.8391, "step": 5030 }, { "epoch": 4.01, "learning_rate": 9.45472972972973e-05, "loss": 1.1416, "step": 5040 }, { "epoch": 4.01, "learning_rate": 9.453378378378379e-05, "loss": 0.8937, "step": 5050 }, { "epoch": 4.01, "learning_rate": 9.452027027027027e-05, "loss": 1.1515, "step": 5060 }, { "epoch": 4.01, "learning_rate": 9.450675675675677e-05, "loss": 0.9117, "step": 5070 }, { "epoch": 4.01, "learning_rate": 9.449324324324325e-05, "loss": 0.8004, "step": 5080 }, { "epoch": 4.01, "learning_rate": 9.447972972972974e-05, "loss": 0.8111, "step": 5090 }, { "epoch": 4.01, "learning_rate": 9.446621621621622e-05, "loss": 0.8078, "step": 5100 }, { "epoch": 4.01, "learning_rate": 9.445270270270272e-05, "loss": 0.8446, "step": 5110 }, { "epoch": 5.0, "learning_rate": 9.44391891891892e-05, "loss": 0.927, "step": 5120 }, { "epoch": 5.0, "learning_rate": 9.442567567567568e-05, "loss": 0.7083, "step": 5130 }, { "epoch": 5.0, "learning_rate": 9.441216216216216e-05, "loss": 0.7111, "step": 5140 }, { "epoch": 5.0, "learning_rate": 9.439864864864866e-05, "loss": 0.6756, "step": 5150 }, { "epoch": 5.0, "learning_rate": 9.438513513513514e-05, "loss": 0.6514, "step": 5160 }, { "epoch": 5.0, "learning_rate": 9.437162162162163e-05, "loss": 0.6773, "step": 5170 }, { "epoch": 5.0, "learning_rate": 9.435810810810811e-05, "loss": 0.8792, "step": 5180 }, { "epoch": 5.0, "learning_rate": 9.43445945945946e-05, "loss": 0.6256, "step": 5190 }, { "epoch": 5.0, "learning_rate": 9.433108108108109e-05, "loss": 0.6518, "step": 5200 }, { "epoch": 5.0, "learning_rate": 9.431756756756758e-05, "loss": 0.6692, "step": 5210 }, { "epoch": 5.0, "learning_rate": 9.430405405405406e-05, "loss": 0.6297, "step": 5220 }, { "epoch": 5.0, "learning_rate": 9.429054054054054e-05, "loss": 0.64, "step": 5230 }, { "epoch": 5.0, "learning_rate": 9.427702702702702e-05, "loss": 0.4581, "step": 5240 }, { "epoch": 5.0, "learning_rate": 9.426351351351352e-05, "loss": 0.4213, "step": 5250 }, { "epoch": 5.0, "learning_rate": 9.425e-05, "loss": 0.4002, "step": 5260 }, { "epoch": 5.0, "learning_rate": 9.423648648648648e-05, "loss": 0.4157, "step": 5270 }, { "epoch": 5.0, "learning_rate": 9.422297297297298e-05, "loss": 1.5343, "step": 5280 }, { "epoch": 5.0, "learning_rate": 9.420945945945946e-05, "loss": 1.3924, "step": 5290 }, { "epoch": 5.0, "learning_rate": 9.419594594594595e-05, "loss": 2.8099, "step": 5300 }, { "epoch": 5.0, "learning_rate": 9.418243243243243e-05, "loss": 2.5756, "step": 5310 }, { "epoch": 5.0, "learning_rate": 9.416891891891893e-05, "loss": 2.6888, "step": 5320 }, { "epoch": 5.0, "learning_rate": 9.415540540540541e-05, "loss": 2.6892, "step": 5330 }, { "epoch": 5.0, "learning_rate": 9.41418918918919e-05, "loss": 1.9475, "step": 5340 }, { "epoch": 5.0, "learning_rate": 9.412837837837838e-05, "loss": 2.1921, "step": 5350 }, { "epoch": 5.0, "learning_rate": 9.411486486486487e-05, "loss": 1.1596, "step": 5360 }, { "epoch": 5.0, "learning_rate": 9.410135135135135e-05, "loss": 0.5187, "step": 5370 }, { "epoch": 5.0, "learning_rate": 9.408783783783784e-05, "loss": 0.4042, "step": 5380 }, { "epoch": 5.0, "learning_rate": 9.407432432432432e-05, "loss": 0.4968, "step": 5390 }, { "epoch": 5.0, "learning_rate": 9.406081081081082e-05, "loss": 0.5388, "step": 5400 }, { "epoch": 5.0, "learning_rate": 9.40472972972973e-05, "loss": 0.6662, "step": 5410 }, { "epoch": 5.0, "learning_rate": 9.403378378378379e-05, "loss": 0.6842, "step": 5420 }, { "epoch": 5.0, "learning_rate": 9.402027027027027e-05, "loss": 0.4571, "step": 5430 }, { "epoch": 5.0, "learning_rate": 9.400675675675677e-05, "loss": 0.3439, "step": 5440 }, { "epoch": 5.0, "learning_rate": 9.399324324324325e-05, "loss": 0.5168, "step": 5450 }, { "epoch": 5.0, "learning_rate": 9.397972972972974e-05, "loss": 0.4583, "step": 5460 }, { "epoch": 5.0, "learning_rate": 9.396621621621622e-05, "loss": 0.5647, "step": 5470 }, { "epoch": 5.0, "learning_rate": 9.39527027027027e-05, "loss": 0.4671, "step": 5480 }, { "epoch": 5.0, "learning_rate": 9.393918918918919e-05, "loss": 0.3717, "step": 5490 }, { "epoch": 5.01, "learning_rate": 9.392567567567568e-05, "loss": 0.3353, "step": 5500 }, { "epoch": 5.01, "eval_loss": 0.18369728326797485, "eval_runtime": 130.4295, "eval_samples_per_second": 27.662, "eval_steps_per_second": 3.458, "eval_wer": 0.1897218468993151, "step": 5500 }, { "epoch": 5.01, "learning_rate": 9.391216216216216e-05, "loss": 0.2347, "step": 5510 }, { "epoch": 5.01, "learning_rate": 9.389864864864866e-05, "loss": 0.428, "step": 5520 }, { "epoch": 5.01, "learning_rate": 9.388513513513514e-05, "loss": 0.4297, "step": 5530 }, { "epoch": 5.01, "learning_rate": 9.387162162162163e-05, "loss": 0.3643, "step": 5540 }, { "epoch": 5.01, "learning_rate": 9.385810810810811e-05, "loss": 0.4684, "step": 5550 }, { "epoch": 5.01, "learning_rate": 9.384459459459461e-05, "loss": 0.6639, "step": 5560 }, { "epoch": 5.01, "learning_rate": 9.383108108108109e-05, "loss": 0.4163, "step": 5570 }, { "epoch": 5.01, "learning_rate": 9.381756756756758e-05, "loss": 0.5832, "step": 5580 }, { "epoch": 5.01, "learning_rate": 9.380405405405406e-05, "loss": 0.624, "step": 5590 }, { "epoch": 5.01, "learning_rate": 9.379054054054055e-05, "loss": 0.6583, "step": 5600 }, { "epoch": 5.01, "learning_rate": 9.377702702702703e-05, "loss": 0.696, "step": 5610 }, { "epoch": 5.01, "learning_rate": 9.376351351351352e-05, "loss": 0.5506, "step": 5620 }, { "epoch": 5.01, "learning_rate": 9.375e-05, "loss": 0.6814, "step": 5630 }, { "epoch": 5.01, "learning_rate": 9.373648648648648e-05, "loss": 0.9632, "step": 5640 }, { "epoch": 5.01, "learning_rate": 9.372297297297298e-05, "loss": 0.775, "step": 5650 }, { "epoch": 5.01, "learning_rate": 9.370945945945946e-05, "loss": 0.3697, "step": 5660 }, { "epoch": 5.01, "learning_rate": 9.369594594594595e-05, "loss": 0.455, "step": 5670 }, { "epoch": 5.01, "learning_rate": 9.368243243243243e-05, "loss": 0.4261, "step": 5680 }, { "epoch": 5.01, "learning_rate": 9.366891891891893e-05, "loss": 0.3572, "step": 5690 }, { "epoch": 5.01, "learning_rate": 9.365540540540541e-05, "loss": 0.3937, "step": 5700 }, { "epoch": 5.01, "learning_rate": 9.364189189189189e-05, "loss": 0.3396, "step": 5710 }, { "epoch": 5.01, "learning_rate": 9.362837837837837e-05, "loss": 0.3113, "step": 5720 }, { "epoch": 5.01, "learning_rate": 9.361486486486487e-05, "loss": 0.3959, "step": 5730 }, { "epoch": 5.01, "learning_rate": 9.360135135135135e-05, "loss": 0.7094, "step": 5740 }, { "epoch": 5.01, "learning_rate": 9.358783783783784e-05, "loss": 0.6883, "step": 5750 }, { "epoch": 5.01, "learning_rate": 9.357432432432432e-05, "loss": 0.5271, "step": 5760 }, { "epoch": 5.01, "learning_rate": 9.356081081081082e-05, "loss": 0.6493, "step": 5770 }, { "epoch": 5.01, "learning_rate": 9.35472972972973e-05, "loss": 0.8679, "step": 5780 }, { "epoch": 5.01, "learning_rate": 9.35337837837838e-05, "loss": 0.5402, "step": 5790 }, { "epoch": 5.01, "learning_rate": 9.352027027027027e-05, "loss": 0.4243, "step": 5800 }, { "epoch": 5.01, "learning_rate": 9.350675675675677e-05, "loss": 0.4983, "step": 5810 }, { "epoch": 5.01, "learning_rate": 9.349324324324325e-05, "loss": 0.6373, "step": 5820 }, { "epoch": 5.01, "learning_rate": 9.347972972972973e-05, "loss": 0.5871, "step": 5830 }, { "epoch": 5.01, "learning_rate": 9.346621621621621e-05, "loss": 0.5397, "step": 5840 }, { "epoch": 5.01, "learning_rate": 9.34527027027027e-05, "loss": 0.539, "step": 5850 }, { "epoch": 5.01, "learning_rate": 9.343918918918919e-05, "loss": 0.5237, "step": 5860 }, { "epoch": 5.01, "learning_rate": 9.342567567567568e-05, "loss": 0.4079, "step": 5870 }, { "epoch": 5.01, "learning_rate": 9.341216216216216e-05, "loss": 0.489, "step": 5880 }, { "epoch": 5.01, "learning_rate": 9.339864864864866e-05, "loss": 0.2677, "step": 5890 }, { "epoch": 5.01, "learning_rate": 9.338513513513514e-05, "loss": 0.4115, "step": 5900 }, { "epoch": 5.01, "learning_rate": 9.337162162162163e-05, "loss": 0.5822, "step": 5910 }, { "epoch": 5.01, "learning_rate": 9.335810810810811e-05, "loss": 1.0005, "step": 5920 }, { "epoch": 5.01, "learning_rate": 9.334459459459461e-05, "loss": 0.3886, "step": 5930 }, { "epoch": 5.01, "learning_rate": 9.333108108108109e-05, "loss": 0.3868, "step": 5940 }, { "epoch": 5.01, "learning_rate": 9.331756756756757e-05, "loss": 0.5626, "step": 5950 }, { "epoch": 5.01, "learning_rate": 9.330405405405405e-05, "loss": 0.5125, "step": 5960 }, { "epoch": 5.01, "learning_rate": 9.329054054054055e-05, "loss": 0.5065, "step": 5970 }, { "epoch": 5.01, "learning_rate": 9.327702702702703e-05, "loss": 0.6939, "step": 5980 }, { "epoch": 5.01, "learning_rate": 9.326351351351352e-05, "loss": 0.5594, "step": 5990 }, { "epoch": 5.01, "learning_rate": 9.325e-05, "loss": 0.4012, "step": 6000 }, { "epoch": 5.01, "eval_loss": 0.1661776453256607, "eval_runtime": 129.0104, "eval_samples_per_second": 27.967, "eval_steps_per_second": 3.496, "eval_wer": 0.17779434375436798, "step": 6000 }, { "epoch": 5.01, "learning_rate": 9.32364864864865e-05, "loss": 0.5307, "step": 6010 }, { "epoch": 5.01, "learning_rate": 9.322297297297298e-05, "loss": 0.6021, "step": 6020 }, { "epoch": 5.01, "learning_rate": 9.320945945945947e-05, "loss": 0.6841, "step": 6030 }, { "epoch": 5.01, "learning_rate": 9.319594594594595e-05, "loss": 0.8046, "step": 6040 }, { "epoch": 5.01, "learning_rate": 9.318243243243244e-05, "loss": 0.6593, "step": 6050 }, { "epoch": 5.01, "learning_rate": 9.316891891891893e-05, "loss": 1.0739, "step": 6060 }, { "epoch": 5.01, "learning_rate": 9.315540540540541e-05, "loss": 0.8971, "step": 6070 }, { "epoch": 5.01, "learning_rate": 9.314189189189189e-05, "loss": 1.0407, "step": 6080 }, { "epoch": 5.01, "learning_rate": 9.312837837837837e-05, "loss": 0.9196, "step": 6090 }, { "epoch": 5.01, "learning_rate": 9.311486486486487e-05, "loss": 0.7806, "step": 6100 }, { "epoch": 5.01, "learning_rate": 9.310135135135135e-05, "loss": 0.7651, "step": 6110 }, { "epoch": 5.01, "learning_rate": 9.308783783783784e-05, "loss": 0.7861, "step": 6120 }, { "epoch": 5.01, "learning_rate": 9.307432432432432e-05, "loss": 0.7836, "step": 6130 }, { "epoch": 6.0, "learning_rate": 9.306081081081082e-05, "loss": 1.0025, "step": 6140 }, { "epoch": 6.0, "learning_rate": 9.30472972972973e-05, "loss": 0.7248, "step": 6150 }, { "epoch": 6.0, "learning_rate": 9.30337837837838e-05, "loss": 0.6555, "step": 6160 }, { "epoch": 6.0, "learning_rate": 9.302027027027028e-05, "loss": 0.7001, "step": 6170 }, { "epoch": 6.0, "learning_rate": 9.300675675675676e-05, "loss": 0.5637, "step": 6180 }, { "epoch": 6.0, "learning_rate": 9.299324324324324e-05, "loss": 0.6621, "step": 6190 }, { "epoch": 6.0, "learning_rate": 9.297972972972973e-05, "loss": 0.6818, "step": 6200 }, { "epoch": 6.0, "learning_rate": 9.296621621621621e-05, "loss": 0.7579, "step": 6210 }, { "epoch": 6.0, "learning_rate": 9.295270270270271e-05, "loss": 0.5709, "step": 6220 }, { "epoch": 6.0, "learning_rate": 9.293918918918919e-05, "loss": 0.6527, "step": 6230 }, { "epoch": 6.0, "learning_rate": 9.292567567567568e-05, "loss": 0.615, "step": 6240 }, { "epoch": 6.0, "learning_rate": 9.291216216216216e-05, "loss": 0.614, "step": 6250 }, { "epoch": 6.0, "learning_rate": 9.289864864864866e-05, "loss": 0.5586, "step": 6260 }, { "epoch": 6.0, "learning_rate": 9.288513513513514e-05, "loss": 0.3796, "step": 6270 }, { "epoch": 6.0, "learning_rate": 9.287162162162163e-05, "loss": 0.3974, "step": 6280 }, { "epoch": 6.0, "learning_rate": 9.285810810810812e-05, "loss": 0.386, "step": 6290 }, { "epoch": 6.0, "learning_rate": 9.28445945945946e-05, "loss": 1.0275, "step": 6300 }, { "epoch": 6.0, "learning_rate": 9.283108108108108e-05, "loss": 1.317, "step": 6310 }, { "epoch": 6.0, "learning_rate": 9.281756756756757e-05, "loss": 2.4912, "step": 6320 }, { "epoch": 6.0, "learning_rate": 9.280405405405405e-05, "loss": 2.6552, "step": 6330 }, { "epoch": 6.0, "learning_rate": 9.279054054054055e-05, "loss": 2.6056, "step": 6340 }, { "epoch": 6.0, "learning_rate": 9.277702702702703e-05, "loss": 2.6671, "step": 6350 }, { "epoch": 6.0, "learning_rate": 9.276351351351352e-05, "loss": 2.2159, "step": 6360 }, { "epoch": 6.0, "learning_rate": 9.275e-05, "loss": 2.06, "step": 6370 }, { "epoch": 6.0, "learning_rate": 9.27364864864865e-05, "loss": 1.4141, "step": 6380 }, { "epoch": 6.0, "learning_rate": 9.272297297297298e-05, "loss": 0.6748, "step": 6390 }, { "epoch": 6.0, "learning_rate": 9.270945945945947e-05, "loss": 0.3289, "step": 6400 }, { "epoch": 6.0, "learning_rate": 9.269594594594596e-05, "loss": 0.475, "step": 6410 }, { "epoch": 6.0, "learning_rate": 9.268243243243244e-05, "loss": 0.4674, "step": 6420 }, { "epoch": 6.0, "learning_rate": 9.266891891891892e-05, "loss": 0.4958, "step": 6430 }, { "epoch": 6.0, "learning_rate": 9.26554054054054e-05, "loss": 0.7582, "step": 6440 }, { "epoch": 6.0, "learning_rate": 9.26418918918919e-05, "loss": 0.4292, "step": 6450 }, { "epoch": 6.0, "learning_rate": 9.262837837837837e-05, "loss": 0.3037, "step": 6460 }, { "epoch": 6.0, "learning_rate": 9.261486486486487e-05, "loss": 0.4815, "step": 6470 }, { "epoch": 6.0, "learning_rate": 9.260135135135135e-05, "loss": 0.3701, "step": 6480 }, { "epoch": 6.0, "learning_rate": 9.258783783783784e-05, "loss": 0.5031, "step": 6490 }, { "epoch": 6.0, "learning_rate": 9.257432432432433e-05, "loss": 0.5349, "step": 6500 }, { "epoch": 6.0, "eval_loss": 0.16857638955116272, "eval_runtime": 129.3708, "eval_samples_per_second": 27.889, "eval_steps_per_second": 3.486, "eval_wer": 0.18571495131155943, "step": 6500 }, { "epoch": 6.0, "learning_rate": 9.256081081081082e-05, "loss": 0.3543, "step": 6510 }, { "epoch": 6.01, "learning_rate": 9.25472972972973e-05, "loss": 0.37, "step": 6520 }, { "epoch": 6.01, "learning_rate": 9.25337837837838e-05, "loss": 0.2592, "step": 6530 }, { "epoch": 6.01, "learning_rate": 9.252027027027028e-05, "loss": 0.3536, "step": 6540 }, { "epoch": 6.01, "learning_rate": 9.250675675675676e-05, "loss": 0.3973, "step": 6550 }, { "epoch": 6.01, "learning_rate": 9.249324324324324e-05, "loss": 0.2824, "step": 6560 }, { "epoch": 6.01, "learning_rate": 9.247972972972973e-05, "loss": 0.4212, "step": 6570 }, { "epoch": 6.01, "learning_rate": 9.246621621621621e-05, "loss": 0.5686, "step": 6580 }, { "epoch": 6.01, "learning_rate": 9.245270270270271e-05, "loss": 0.5169, "step": 6590 }, { "epoch": 6.01, "learning_rate": 9.243918918918919e-05, "loss": 0.49, "step": 6600 }, { "epoch": 6.01, "learning_rate": 9.242567567567568e-05, "loss": 0.6219, "step": 6610 }, { "epoch": 6.01, "learning_rate": 9.241216216216217e-05, "loss": 0.5781, "step": 6620 }, { "epoch": 6.01, "learning_rate": 9.239864864864866e-05, "loss": 0.6507, "step": 6630 }, { "epoch": 6.01, "learning_rate": 9.238513513513514e-05, "loss": 0.5442, "step": 6640 }, { "epoch": 6.01, "learning_rate": 9.237162162162162e-05, "loss": 0.4987, "step": 6650 }, { "epoch": 6.01, "learning_rate": 9.23581081081081e-05, "loss": 0.8995, "step": 6660 }, { "epoch": 6.01, "learning_rate": 9.23445945945946e-05, "loss": 0.8149, "step": 6670 }, { "epoch": 6.01, "learning_rate": 9.233108108108108e-05, "loss": 0.3708, "step": 6680 }, { "epoch": 6.01, "learning_rate": 9.231756756756757e-05, "loss": 0.3488, "step": 6690 }, { "epoch": 6.01, "learning_rate": 9.230405405405405e-05, "loss": 0.4607, "step": 6700 }, { "epoch": 6.01, "learning_rate": 9.229054054054055e-05, "loss": 0.3896, "step": 6710 }, { "epoch": 6.01, "learning_rate": 9.227702702702703e-05, "loss": 0.353, "step": 6720 }, { "epoch": 6.01, "learning_rate": 9.226351351351353e-05, "loss": 0.3311, "step": 6730 }, { "epoch": 6.01, "learning_rate": 9.225e-05, "loss": 0.3612, "step": 6740 }, { "epoch": 6.01, "learning_rate": 9.22364864864865e-05, "loss": 0.3267, "step": 6750 }, { "epoch": 6.01, "learning_rate": 9.222297297297298e-05, "loss": 0.6798, "step": 6760 }, { "epoch": 6.01, "learning_rate": 9.220945945945946e-05, "loss": 0.6258, "step": 6770 }, { "epoch": 6.01, "learning_rate": 9.219594594594594e-05, "loss": 0.5654, "step": 6780 }, { "epoch": 6.01, "learning_rate": 9.218243243243244e-05, "loss": 0.561, "step": 6790 }, { "epoch": 6.01, "learning_rate": 9.216891891891892e-05, "loss": 0.7948, "step": 6800 }, { "epoch": 6.01, "learning_rate": 9.215540540540541e-05, "loss": 0.5768, "step": 6810 }, { "epoch": 6.01, "learning_rate": 9.21418918918919e-05, "loss": 0.3794, "step": 6820 }, { "epoch": 6.01, "learning_rate": 9.212837837837839e-05, "loss": 0.4938, "step": 6830 }, { "epoch": 6.01, "learning_rate": 9.211486486486487e-05, "loss": 0.5871, "step": 6840 }, { "epoch": 6.01, "learning_rate": 9.210135135135135e-05, "loss": 0.6328, "step": 6850 }, { "epoch": 6.01, "learning_rate": 9.208783783783785e-05, "loss": 0.5453, "step": 6860 }, { "epoch": 6.01, "learning_rate": 9.207432432432433e-05, "loss": 0.5464, "step": 6870 }, { "epoch": 6.01, "learning_rate": 9.206081081081082e-05, "loss": 0.5354, "step": 6880 }, { "epoch": 6.01, "learning_rate": 9.20472972972973e-05, "loss": 0.4288, "step": 6890 }, { "epoch": 6.01, "learning_rate": 9.203378378378378e-05, "loss": 0.4204, "step": 6900 }, { "epoch": 6.01, "learning_rate": 9.202027027027026e-05, "loss": 0.3571, "step": 6910 }, { "epoch": 6.01, "learning_rate": 9.200675675675676e-05, "loss": 0.268, "step": 6920 }, { "epoch": 6.01, "learning_rate": 9.199324324324324e-05, "loss": 0.4752, "step": 6930 }, { "epoch": 6.01, "learning_rate": 9.197972972972974e-05, "loss": 0.9386, "step": 6940 }, { "epoch": 6.01, "learning_rate": 9.196621621621622e-05, "loss": 0.443, "step": 6950 }, { "epoch": 6.01, "learning_rate": 9.195270270270271e-05, "loss": 0.3867, "step": 6960 }, { "epoch": 6.01, "learning_rate": 9.193918918918919e-05, "loss": 0.5041, "step": 6970 }, { "epoch": 6.01, "learning_rate": 9.192567567567569e-05, "loss": 0.4385, "step": 6980 }, { "epoch": 6.01, "learning_rate": 9.191216216216217e-05, "loss": 0.468, "step": 6990 }, { "epoch": 6.01, "learning_rate": 9.189864864864866e-05, "loss": 0.5809, "step": 7000 }, { "epoch": 6.01, "eval_loss": 0.156533882021904, "eval_runtime": 127.1038, "eval_samples_per_second": 28.386, "eval_steps_per_second": 3.548, "eval_wer": 0.17681591576200903, "step": 7000 }, { "epoch": 6.01, "learning_rate": 9.188513513513514e-05, "loss": 0.6331, "step": 7010 }, { "epoch": 6.01, "learning_rate": 9.187162162162162e-05, "loss": 0.3508, "step": 7020 }, { "epoch": 6.01, "learning_rate": 9.18581081081081e-05, "loss": 0.525, "step": 7030 }, { "epoch": 6.01, "learning_rate": 9.18445945945946e-05, "loss": 0.438, "step": 7040 }, { "epoch": 6.01, "learning_rate": 9.183108108108108e-05, "loss": 0.7169, "step": 7050 }, { "epoch": 6.01, "learning_rate": 9.181756756756758e-05, "loss": 0.7156, "step": 7060 }, { "epoch": 6.01, "learning_rate": 9.180405405405406e-05, "loss": 0.5962, "step": 7070 }, { "epoch": 6.01, "learning_rate": 9.179054054054055e-05, "loss": 0.9764, "step": 7080 }, { "epoch": 6.01, "learning_rate": 9.177702702702703e-05, "loss": 0.9204, "step": 7090 }, { "epoch": 6.01, "learning_rate": 9.176351351351353e-05, "loss": 0.9245, "step": 7100 }, { "epoch": 6.01, "learning_rate": 9.175000000000001e-05, "loss": 0.9903, "step": 7110 }, { "epoch": 6.01, "learning_rate": 9.173648648648649e-05, "loss": 0.7602, "step": 7120 }, { "epoch": 6.01, "learning_rate": 9.172297297297297e-05, "loss": 0.7368, "step": 7130 }, { "epoch": 6.01, "learning_rate": 9.170945945945946e-05, "loss": 0.724, "step": 7140 }, { "epoch": 6.01, "learning_rate": 9.169594594594595e-05, "loss": 0.7057, "step": 7150 }, { "epoch": 6.01, "learning_rate": 9.168243243243244e-05, "loss": 0.9423, "step": 7160 }, { "epoch": 7.0, "learning_rate": 9.166891891891892e-05, "loss": 0.7366, "step": 7170 }, { "epoch": 7.0, "learning_rate": 9.165540540540542e-05, "loss": 0.6764, "step": 7180 }, { "epoch": 7.0, "learning_rate": 9.16418918918919e-05, "loss": 0.6898, "step": 7190 }, { "epoch": 7.0, "learning_rate": 9.162837837837839e-05, "loss": 0.5847, "step": 7200 }, { "epoch": 7.0, "learning_rate": 9.161486486486487e-05, "loss": 0.6095, "step": 7210 }, { "epoch": 7.0, "learning_rate": 9.160135135135137e-05, "loss": 0.618, "step": 7220 }, { "epoch": 7.0, "learning_rate": 9.158783783783785e-05, "loss": 0.8013, "step": 7230 }, { "epoch": 7.0, "learning_rate": 9.157432432432433e-05, "loss": 0.5843, "step": 7240 }, { "epoch": 7.0, "learning_rate": 9.156081081081081e-05, "loss": 0.6098, "step": 7250 }, { "epoch": 7.0, "learning_rate": 9.154729729729729e-05, "loss": 0.6685, "step": 7260 }, { "epoch": 7.0, "learning_rate": 9.153378378378379e-05, "loss": 0.5648, "step": 7270 }, { "epoch": 7.0, "learning_rate": 9.152027027027027e-05, "loss": 0.6081, "step": 7280 }, { "epoch": 7.0, "learning_rate": 9.150675675675676e-05, "loss": 0.4437, "step": 7290 }, { "epoch": 7.0, "learning_rate": 9.149324324324324e-05, "loss": 0.3754, "step": 7300 }, { "epoch": 7.0, "learning_rate": 9.147972972972974e-05, "loss": 0.387, "step": 7310 }, { "epoch": 7.0, "learning_rate": 9.146621621621622e-05, "loss": 0.5175, "step": 7320 }, { "epoch": 7.0, "learning_rate": 9.145270270270271e-05, "loss": 1.7111, "step": 7330 }, { "epoch": 7.0, "learning_rate": 9.143918918918919e-05, "loss": 1.8992, "step": 7340 }, { "epoch": 7.0, "learning_rate": 9.142567567567569e-05, "loss": 2.7111, "step": 7350 }, { "epoch": 7.0, "learning_rate": 9.141216216216217e-05, "loss": 2.5744, "step": 7360 }, { "epoch": 7.0, "learning_rate": 9.139864864864865e-05, "loss": 2.6575, "step": 7370 }, { "epoch": 7.0, "learning_rate": 9.138513513513513e-05, "loss": 2.3977, "step": 7380 }, { "epoch": 7.0, "learning_rate": 9.137162162162163e-05, "loss": 1.9093, "step": 7390 }, { "epoch": 7.0, "learning_rate": 9.13581081081081e-05, "loss": 1.7092, "step": 7400 }, { "epoch": 7.0, "learning_rate": 9.13445945945946e-05, "loss": 0.7965, "step": 7410 }, { "epoch": 7.0, "learning_rate": 9.133108108108108e-05, "loss": 0.2709, "step": 7420 }, { "epoch": 7.0, "learning_rate": 9.131756756756758e-05, "loss": 0.4499, "step": 7430 }, { "epoch": 7.0, "learning_rate": 9.130405405405406e-05, "loss": 0.3705, "step": 7440 }, { "epoch": 7.0, "learning_rate": 9.129054054054055e-05, "loss": 0.5024, "step": 7450 }, { "epoch": 7.0, "learning_rate": 9.127702702702703e-05, "loss": 0.6647, "step": 7460 }, { "epoch": 7.0, "learning_rate": 9.126351351351351e-05, "loss": 0.5421, "step": 7470 }, { "epoch": 7.0, "learning_rate": 9.125e-05, "loss": 0.2972, "step": 7480 }, { "epoch": 7.0, "learning_rate": 9.123648648648649e-05, "loss": 0.3713, "step": 7490 }, { "epoch": 7.0, "learning_rate": 9.122297297297297e-05, "loss": 0.3766, "step": 7500 }, { "epoch": 7.0, "eval_loss": 0.16591981053352356, "eval_runtime": 128.1932, "eval_samples_per_second": 28.145, "eval_steps_per_second": 3.518, "eval_wer": 0.17513861063225086, "step": 7500 }, { "epoch": 7.0, "learning_rate": 9.120945945945947e-05, "loss": 0.4474, "step": 7510 }, { "epoch": 7.0, "learning_rate": 9.119594594594595e-05, "loss": 0.5173, "step": 7520 }, { "epoch": 7.0, "learning_rate": 9.118243243243244e-05, "loss": 0.364, "step": 7530 }, { "epoch": 7.01, "learning_rate": 9.116891891891892e-05, "loss": 0.3366, "step": 7540 }, { "epoch": 7.01, "learning_rate": 9.115540540540542e-05, "loss": 0.266, "step": 7550 }, { "epoch": 7.01, "learning_rate": 9.11418918918919e-05, "loss": 0.2684, "step": 7560 }, { "epoch": 7.01, "learning_rate": 9.112837837837839e-05, "loss": 0.4059, "step": 7570 }, { "epoch": 7.01, "learning_rate": 9.111486486486487e-05, "loss": 0.2735, "step": 7580 }, { "epoch": 7.01, "learning_rate": 9.110135135135135e-05, "loss": 0.4216, "step": 7590 }, { "epoch": 7.01, "learning_rate": 9.108783783783784e-05, "loss": 0.4686, "step": 7600 }, { "epoch": 7.01, "learning_rate": 9.107432432432433e-05, "loss": 0.4544, "step": 7610 }, { "epoch": 7.01, "learning_rate": 9.106081081081081e-05, "loss": 0.3979, "step": 7620 }, { "epoch": 7.01, "learning_rate": 9.10472972972973e-05, "loss": 0.6087, "step": 7630 }, { "epoch": 7.01, "learning_rate": 9.103378378378379e-05, "loss": 0.5358, "step": 7640 }, { "epoch": 7.01, "learning_rate": 9.102027027027027e-05, "loss": 0.6055, "step": 7650 }, { "epoch": 7.01, "learning_rate": 9.100675675675676e-05, "loss": 0.6284, "step": 7660 }, { "epoch": 7.01, "learning_rate": 9.099324324324324e-05, "loss": 0.4266, "step": 7670 }, { "epoch": 7.01, "learning_rate": 9.097972972972974e-05, "loss": 0.8236, "step": 7680 }, { "epoch": 7.01, "learning_rate": 9.096621621621622e-05, "loss": 0.8375, "step": 7690 }, { "epoch": 7.01, "learning_rate": 9.095270270270271e-05, "loss": 0.5129, "step": 7700 }, { "epoch": 7.01, "learning_rate": 9.09391891891892e-05, "loss": 0.2489, "step": 7710 }, { "epoch": 7.01, "learning_rate": 9.092567567567568e-05, "loss": 0.43, "step": 7720 }, { "epoch": 7.01, "learning_rate": 9.091216216216216e-05, "loss": 0.3585, "step": 7730 }, { "epoch": 7.01, "learning_rate": 9.089864864864865e-05, "loss": 0.3891, "step": 7740 }, { "epoch": 7.01, "learning_rate": 9.088513513513513e-05, "loss": 0.3233, "step": 7750 }, { "epoch": 7.01, "learning_rate": 9.087162162162163e-05, "loss": 0.3257, "step": 7760 }, { "epoch": 7.01, "learning_rate": 9.085810810810811e-05, "loss": 0.3043, "step": 7770 }, { "epoch": 7.01, "learning_rate": 9.08445945945946e-05, "loss": 0.6105, "step": 7780 }, { "epoch": 7.01, "learning_rate": 9.083108108108108e-05, "loss": 0.6061, "step": 7790 }, { "epoch": 7.01, "learning_rate": 9.081756756756758e-05, "loss": 0.6158, "step": 7800 }, { "epoch": 7.01, "learning_rate": 9.080405405405406e-05, "loss": 0.5213, "step": 7810 }, { "epoch": 7.01, "learning_rate": 9.079054054054055e-05, "loss": 0.7079, "step": 7820 }, { "epoch": 7.01, "learning_rate": 9.077702702702703e-05, "loss": 0.6201, "step": 7830 }, { "epoch": 7.01, "learning_rate": 9.076351351351352e-05, "loss": 0.3997, "step": 7840 }, { "epoch": 7.01, "learning_rate": 9.075e-05, "loss": 0.3991, "step": 7850 }, { "epoch": 7.01, "learning_rate": 9.073648648648649e-05, "loss": 0.5227, "step": 7860 }, { "epoch": 7.01, "learning_rate": 9.072297297297297e-05, "loss": 0.6187, "step": 7870 }, { "epoch": 7.01, "learning_rate": 9.070945945945947e-05, "loss": 0.6969, "step": 7880 }, { "epoch": 7.01, "learning_rate": 9.069594594594595e-05, "loss": 0.4228, "step": 7890 }, { "epoch": 7.01, "learning_rate": 9.068243243243244e-05, "loss": 0.5148, "step": 7900 }, { "epoch": 7.01, "learning_rate": 9.066891891891892e-05, "loss": 0.4281, "step": 7910 }, { "epoch": 7.01, "learning_rate": 9.065540540540542e-05, "loss": 0.3914, "step": 7920 }, { "epoch": 7.01, "learning_rate": 9.06418918918919e-05, "loss": 0.4614, "step": 7930 }, { "epoch": 7.01, "learning_rate": 9.062837837837838e-05, "loss": 0.2698, "step": 7940 }, { "epoch": 7.01, "learning_rate": 9.061486486486486e-05, "loss": 0.4592, "step": 7950 }, { "epoch": 7.01, "learning_rate": 9.060135135135136e-05, "loss": 0.7057, "step": 7960 }, { "epoch": 7.01, "learning_rate": 9.058783783783784e-05, "loss": 0.6525, "step": 7970 }, { "epoch": 7.01, "learning_rate": 9.057432432432433e-05, "loss": 0.3059, "step": 7980 }, { "epoch": 7.01, "learning_rate": 9.056081081081081e-05, "loss": 0.4526, "step": 7990 }, { "epoch": 7.01, "learning_rate": 9.054729729729731e-05, "loss": 0.4776, "step": 8000 }, { "epoch": 7.01, "eval_loss": 0.16314856708049774, "eval_runtime": 128.0582, "eval_samples_per_second": 28.175, "eval_steps_per_second": 3.522, "eval_wer": 0.17006010343381633, "step": 8000 }, { "epoch": 7.01, "learning_rate": 9.053378378378379e-05, "loss": 0.4418, "step": 8010 }, { "epoch": 7.01, "learning_rate": 9.052027027027028e-05, "loss": 0.5432, "step": 8020 }, { "epoch": 7.01, "learning_rate": 9.050675675675676e-05, "loss": 0.5906, "step": 8030 }, { "epoch": 7.01, "learning_rate": 9.049324324324326e-05, "loss": 0.368, "step": 8040 }, { "epoch": 7.01, "learning_rate": 9.047972972972974e-05, "loss": 0.5017, "step": 8050 }, { "epoch": 7.01, "learning_rate": 9.046621621621622e-05, "loss": 0.4455, "step": 8060 }, { "epoch": 7.01, "learning_rate": 9.04527027027027e-05, "loss": 0.6751, "step": 8070 }, { "epoch": 7.01, "learning_rate": 9.043918918918918e-05, "loss": 0.6348, "step": 8080 }, { "epoch": 7.01, "learning_rate": 9.042567567567568e-05, "loss": 0.6844, "step": 8090 }, { "epoch": 7.01, "learning_rate": 9.041216216216216e-05, "loss": 0.8195, "step": 8100 }, { "epoch": 7.01, "learning_rate": 9.039864864864865e-05, "loss": 0.9507, "step": 8110 }, { "epoch": 7.01, "learning_rate": 9.038513513513513e-05, "loss": 0.8606, "step": 8120 }, { "epoch": 7.01, "learning_rate": 9.037162162162163e-05, "loss": 1.0475, "step": 8130 }, { "epoch": 7.01, "learning_rate": 9.035810810810811e-05, "loss": 0.7131, "step": 8140 }, { "epoch": 7.01, "learning_rate": 9.03445945945946e-05, "loss": 0.6491, "step": 8150 }, { "epoch": 7.01, "learning_rate": 9.033108108108108e-05, "loss": 0.6487, "step": 8160 }, { "epoch": 7.01, "learning_rate": 9.031756756756758e-05, "loss": 0.6855, "step": 8170 }, { "epoch": 7.01, "learning_rate": 9.030405405405406e-05, "loss": 0.7765, "step": 8180 }, { "epoch": 8.0, "learning_rate": 9.029054054054054e-05, "loss": 0.7871, "step": 8190 }, { "epoch": 8.0, "learning_rate": 9.027702702702702e-05, "loss": 0.6447, "step": 8200 }, { "epoch": 8.0, "learning_rate": 9.026351351351352e-05, "loss": 0.7081, "step": 8210 }, { "epoch": 8.0, "learning_rate": 9.025e-05, "loss": 0.6292, "step": 8220 }, { "epoch": 8.0, "learning_rate": 9.023648648648649e-05, "loss": 0.5778, "step": 8230 }, { "epoch": 8.0, "learning_rate": 9.022297297297297e-05, "loss": 0.5697, "step": 8240 }, { "epoch": 8.0, "learning_rate": 9.020945945945947e-05, "loss": 0.806, "step": 8250 }, { "epoch": 8.0, "learning_rate": 9.019594594594595e-05, "loss": 0.5505, "step": 8260 }, { "epoch": 8.0, "learning_rate": 9.018243243243244e-05, "loss": 0.6074, "step": 8270 }, { "epoch": 8.0, "learning_rate": 9.016891891891893e-05, "loss": 0.6389, "step": 8280 }, { "epoch": 8.0, "learning_rate": 9.015540540540542e-05, "loss": 0.5619, "step": 8290 }, { "epoch": 8.0, "learning_rate": 9.01418918918919e-05, "loss": 0.5696, "step": 8300 }, { "epoch": 8.0, "learning_rate": 9.012837837837838e-05, "loss": 0.4095, "step": 8310 }, { "epoch": 8.0, "learning_rate": 9.011486486486486e-05, "loss": 0.3292, "step": 8320 }, { "epoch": 8.0, "learning_rate": 9.010135135135136e-05, "loss": 0.3588, "step": 8330 }, { "epoch": 8.0, "learning_rate": 9.008783783783784e-05, "loss": 0.4196, "step": 8340 }, { "epoch": 8.0, "learning_rate": 9.007432432432433e-05, "loss": 1.4511, "step": 8350 }, { "epoch": 8.0, "learning_rate": 9.006081081081081e-05, "loss": 1.4203, "step": 8360 }, { "epoch": 8.0, "learning_rate": 9.004729729729731e-05, "loss": 2.7992, "step": 8370 }, { "epoch": 8.0, "learning_rate": 9.003378378378379e-05, "loss": 2.535, "step": 8380 }, { "epoch": 8.0, "learning_rate": 9.002027027027028e-05, "loss": 2.6926, "step": 8390 }, { "epoch": 8.0, "learning_rate": 9.000675675675677e-05, "loss": 2.5546, "step": 8400 }, { "epoch": 8.0, "learning_rate": 8.999324324324325e-05, "loss": 1.8958, "step": 8410 }, { "epoch": 8.0, "learning_rate": 8.997972972972973e-05, "loss": 1.8825, "step": 8420 }, { "epoch": 8.0, "learning_rate": 8.996621621621622e-05, "loss": 0.9495, "step": 8430 }, { "epoch": 8.0, "learning_rate": 8.99527027027027e-05, "loss": 0.3966, "step": 8440 }, { "epoch": 8.0, "learning_rate": 8.993918918918918e-05, "loss": 0.3263, "step": 8450 }, { "epoch": 8.0, "learning_rate": 8.992567567567568e-05, "loss": 0.3999, "step": 8460 }, { "epoch": 8.0, "learning_rate": 8.991216216216216e-05, "loss": 0.5159, "step": 8470 }, { "epoch": 8.0, "learning_rate": 8.989864864864865e-05, "loss": 0.5663, "step": 8480 }, { "epoch": 8.0, "learning_rate": 8.988513513513514e-05, "loss": 0.6229, "step": 8490 }, { "epoch": 8.0, "learning_rate": 8.987162162162163e-05, "loss": 0.3713, "step": 8500 }, { "epoch": 8.0, "eval_loss": 0.15108059346675873, "eval_runtime": 130.5379, "eval_samples_per_second": 27.639, "eval_steps_per_second": 3.455, "eval_wer": 0.16032241531938685, "step": 8500 }, { "epoch": 8.0, "learning_rate": 8.985810810810811e-05, "loss": 0.3112, "step": 8510 }, { "epoch": 8.0, "learning_rate": 8.98445945945946e-05, "loss": 0.4059, "step": 8520 }, { "epoch": 8.0, "learning_rate": 8.983108108108109e-05, "loss": 0.3702, "step": 8530 }, { "epoch": 8.0, "learning_rate": 8.981756756756757e-05, "loss": 0.4845, "step": 8540 }, { "epoch": 8.0, "learning_rate": 8.980405405405405e-05, "loss": 0.4184, "step": 8550 }, { "epoch": 8.01, "learning_rate": 8.979054054054054e-05, "loss": 0.3304, "step": 8560 }, { "epoch": 8.01, "learning_rate": 8.977702702702702e-05, "loss": 0.2577, "step": 8570 }, { "epoch": 8.01, "learning_rate": 8.976351351351352e-05, "loss": 0.2473, "step": 8580 }, { "epoch": 8.01, "learning_rate": 8.975e-05, "loss": 0.4024, "step": 8590 }, { "epoch": 8.01, "learning_rate": 8.97364864864865e-05, "loss": 0.3375, "step": 8600 }, { "epoch": 8.01, "learning_rate": 8.972297297297298e-05, "loss": 0.3417, "step": 8610 }, { "epoch": 8.01, "learning_rate": 8.970945945945947e-05, "loss": 0.4578, "step": 8620 }, { "epoch": 8.01, "learning_rate": 8.969594594594595e-05, "loss": 0.5298, "step": 8630 }, { "epoch": 8.01, "learning_rate": 8.968243243243245e-05, "loss": 0.3622, "step": 8640 }, { "epoch": 8.01, "learning_rate": 8.966891891891893e-05, "loss": 0.5513, "step": 8650 }, { "epoch": 8.01, "learning_rate": 8.965540540540541e-05, "loss": 0.5829, "step": 8660 }, { "epoch": 8.01, "learning_rate": 8.964189189189189e-05, "loss": 0.6169, "step": 8670 }, { "epoch": 8.01, "learning_rate": 8.962837837837838e-05, "loss": 0.5352, "step": 8680 }, { "epoch": 8.01, "learning_rate": 8.961486486486486e-05, "loss": 0.4233, "step": 8690 }, { "epoch": 8.01, "learning_rate": 8.960135135135136e-05, "loss": 0.6805, "step": 8700 }, { "epoch": 8.01, "learning_rate": 8.958783783783784e-05, "loss": 0.8605, "step": 8710 }, { "epoch": 8.01, "learning_rate": 8.957432432432433e-05, "loss": 0.6327, "step": 8720 }, { "epoch": 8.01, "learning_rate": 8.956081081081082e-05, "loss": 0.2599, "step": 8730 }, { "epoch": 8.01, "learning_rate": 8.954729729729731e-05, "loss": 0.3797, "step": 8740 }, { "epoch": 8.01, "learning_rate": 8.953378378378379e-05, "loss": 0.3841, "step": 8750 }, { "epoch": 8.01, "learning_rate": 8.952027027027029e-05, "loss": 0.3435, "step": 8760 }, { "epoch": 8.01, "learning_rate": 8.950675675675677e-05, "loss": 0.289, "step": 8770 }, { "epoch": 8.01, "learning_rate": 8.949324324324325e-05, "loss": 0.2889, "step": 8780 }, { "epoch": 8.01, "learning_rate": 8.947972972972973e-05, "loss": 0.2956, "step": 8790 }, { "epoch": 8.01, "learning_rate": 8.946621621621622e-05, "loss": 0.4411, "step": 8800 }, { "epoch": 8.01, "learning_rate": 8.94527027027027e-05, "loss": 0.6439, "step": 8810 }, { "epoch": 8.01, "learning_rate": 8.94391891891892e-05, "loss": 0.5996, "step": 8820 }, { "epoch": 8.01, "learning_rate": 8.942567567567568e-05, "loss": 0.4954, "step": 8830 }, { "epoch": 8.01, "learning_rate": 8.941216216216217e-05, "loss": 0.5921, "step": 8840 }, { "epoch": 8.01, "learning_rate": 8.939864864864866e-05, "loss": 0.7455, "step": 8850 }, { "epoch": 8.01, "learning_rate": 8.938513513513514e-05, "loss": 0.4197, "step": 8860 }, { "epoch": 8.01, "learning_rate": 8.937162162162163e-05, "loss": 0.3349, "step": 8870 }, { "epoch": 8.01, "learning_rate": 8.935810810810811e-05, "loss": 0.4636, "step": 8880 }, { "epoch": 8.01, "learning_rate": 8.934459459459459e-05, "loss": 0.5972, "step": 8890 }, { "epoch": 8.01, "learning_rate": 8.933108108108107e-05, "loss": 0.5924, "step": 8900 }, { "epoch": 8.01, "learning_rate": 8.931756756756757e-05, "loss": 0.5179, "step": 8910 }, { "epoch": 8.01, "learning_rate": 8.930405405405405e-05, "loss": 0.4728, "step": 8920 }, { "epoch": 8.01, "learning_rate": 8.929054054054054e-05, "loss": 0.469, "step": 8930 }, { "epoch": 8.01, "learning_rate": 8.927702702702703e-05, "loss": 0.3901, "step": 8940 }, { "epoch": 8.01, "learning_rate": 8.926351351351352e-05, "loss": 0.4715, "step": 8950 }, { "epoch": 8.01, "learning_rate": 8.925e-05, "loss": 0.268, "step": 8960 }, { "epoch": 8.01, "learning_rate": 8.92364864864865e-05, "loss": 0.3655, "step": 8970 }, { "epoch": 8.01, "learning_rate": 8.922297297297298e-05, "loss": 0.4697, "step": 8980 }, { "epoch": 8.01, "learning_rate": 8.920945945945947e-05, "loss": 0.9273, "step": 8990 }, { "epoch": 8.01, "learning_rate": 8.919594594594595e-05, "loss": 0.3141, "step": 9000 }, { "epoch": 8.01, "eval_loss": 0.14772309362888336, "eval_runtime": 131.7757, "eval_samples_per_second": 27.38, "eval_steps_per_second": 3.422, "eval_wer": 0.16013604808274706, "step": 9000 }, { "epoch": 8.01, "learning_rate": 8.918243243243243e-05, "loss": 0.3795, "step": 9010 }, { "epoch": 8.01, "learning_rate": 8.916891891891891e-05, "loss": 0.4197, "step": 9020 }, { "epoch": 8.01, "learning_rate": 8.915540540540541e-05, "loss": 0.4919, "step": 9030 }, { "epoch": 8.01, "learning_rate": 8.914189189189189e-05, "loss": 0.4144, "step": 9040 }, { "epoch": 8.01, "learning_rate": 8.912837837837838e-05, "loss": 0.7081, "step": 9050 }, { "epoch": 8.01, "learning_rate": 8.911486486486487e-05, "loss": 0.4371, "step": 9060 }, { "epoch": 8.01, "learning_rate": 8.910135135135136e-05, "loss": 0.3886, "step": 9070 }, { "epoch": 8.01, "learning_rate": 8.908783783783784e-05, "loss": 0.4312, "step": 9080 }, { "epoch": 8.01, "learning_rate": 8.907432432432434e-05, "loss": 0.6141, "step": 9090 }, { "epoch": 8.01, "learning_rate": 8.906081081081082e-05, "loss": 0.655, "step": 9100 }, { "epoch": 8.01, "learning_rate": 8.904729729729731e-05, "loss": 0.6754, "step": 9110 }, { "epoch": 8.01, "learning_rate": 8.903378378378379e-05, "loss": 0.6632, "step": 9120 }, { "epoch": 8.01, "learning_rate": 8.902027027027027e-05, "loss": 0.8512, "step": 9130 }, { "epoch": 8.01, "learning_rate": 8.900675675675675e-05, "loss": 0.7077, "step": 9140 }, { "epoch": 8.01, "learning_rate": 8.899324324324325e-05, "loss": 0.97, "step": 9150 }, { "epoch": 8.01, "learning_rate": 8.897972972972973e-05, "loss": 0.7902, "step": 9160 }, { "epoch": 8.01, "learning_rate": 8.896621621621622e-05, "loss": 0.6793, "step": 9170 }, { "epoch": 8.01, "learning_rate": 8.89527027027027e-05, "loss": 0.65, "step": 9180 }, { "epoch": 8.01, "learning_rate": 8.89391891891892e-05, "loss": 0.6757, "step": 9190 }, { "epoch": 8.01, "learning_rate": 8.892567567567568e-05, "loss": 0.7219, "step": 9200 }, { "epoch": 9.0, "learning_rate": 8.891216216216218e-05, "loss": 0.8007, "step": 9210 }, { "epoch": 9.0, "learning_rate": 8.889864864864866e-05, "loss": 0.6144, "step": 9220 }, { "epoch": 9.0, "learning_rate": 8.888513513513515e-05, "loss": 0.6546, "step": 9230 }, { "epoch": 9.0, "learning_rate": 8.887162162162163e-05, "loss": 0.6457, "step": 9240 }, { "epoch": 9.0, "learning_rate": 8.885810810810811e-05, "loss": 0.5036, "step": 9250 }, { "epoch": 9.0, "learning_rate": 8.88445945945946e-05, "loss": 0.5977, "step": 9260 }, { "epoch": 9.0, "learning_rate": 8.883108108108108e-05, "loss": 0.7034, "step": 9270 }, { "epoch": 9.0, "learning_rate": 8.881756756756757e-05, "loss": 0.6827, "step": 9280 }, { "epoch": 9.0, "learning_rate": 8.880405405405405e-05, "loss": 0.5306, "step": 9290 }, { "epoch": 9.0, "learning_rate": 8.879054054054055e-05, "loss": 0.5848, "step": 9300 }, { "epoch": 9.0, "learning_rate": 8.877702702702703e-05, "loss": 0.5886, "step": 9310 }, { "epoch": 9.0, "learning_rate": 8.876351351351352e-05, "loss": 0.5854, "step": 9320 }, { "epoch": 9.0, "learning_rate": 8.875e-05, "loss": 0.4596, "step": 9330 }, { "epoch": 9.0, "learning_rate": 8.87364864864865e-05, "loss": 0.3273, "step": 9340 }, { "epoch": 9.0, "learning_rate": 8.872297297297298e-05, "loss": 0.3623, "step": 9350 }, { "epoch": 9.0, "learning_rate": 8.870945945945946e-05, "loss": 0.3671, "step": 9360 }, { "epoch": 9.0, "learning_rate": 8.869594594594594e-05, "loss": 1.1399, "step": 9370 }, { "epoch": 9.0, "learning_rate": 8.868243243243243e-05, "loss": 1.0923, "step": 9380 }, { "epoch": 9.0, "learning_rate": 8.866891891891892e-05, "loss": 2.6794, "step": 9390 }, { "epoch": 9.0, "learning_rate": 8.865540540540541e-05, "loss": 2.6391, "step": 9400 }, { "epoch": 9.0, "learning_rate": 8.864189189189189e-05, "loss": 2.581, "step": 9410 }, { "epoch": 9.0, "learning_rate": 8.862837837837839e-05, "loss": 2.6697, "step": 9420 }, { "epoch": 9.0, "learning_rate": 8.861486486486487e-05, "loss": 2.0002, "step": 9430 }, { "epoch": 9.0, "learning_rate": 8.860135135135136e-05, "loss": 1.7982, "step": 9440 }, { "epoch": 9.0, "learning_rate": 8.858783783783784e-05, "loss": 1.1784, "step": 9450 }, { "epoch": 9.0, "learning_rate": 8.857432432432434e-05, "loss": 0.5654, "step": 9460 }, { "epoch": 9.0, "learning_rate": 8.856081081081082e-05, "loss": 0.2686, "step": 9470 }, { "epoch": 9.0, "learning_rate": 8.85472972972973e-05, "loss": 0.4164, "step": 9480 }, { "epoch": 9.0, "learning_rate": 8.853378378378378e-05, "loss": 0.4965, "step": 9490 }, { "epoch": 9.0, "learning_rate": 8.852027027027027e-05, "loss": 0.5318, "step": 9500 }, { "epoch": 9.0, "eval_loss": 0.1483621895313263, "eval_runtime": 129.0489, "eval_samples_per_second": 27.958, "eval_steps_per_second": 3.495, "eval_wer": 0.15734053953315008, "step": 9500 }, { "epoch": 9.0, "learning_rate": 8.850675675675676e-05, "loss": 0.6236, "step": 9510 }, { "epoch": 9.0, "learning_rate": 8.849324324324325e-05, "loss": 0.3786, "step": 9520 }, { "epoch": 9.0, "learning_rate": 8.847972972972973e-05, "loss": 0.2748, "step": 9530 }, { "epoch": 9.0, "learning_rate": 8.846621621621623e-05, "loss": 0.4879, "step": 9540 }, { "epoch": 9.0, "learning_rate": 8.845270270270271e-05, "loss": 0.3291, "step": 9550 }, { "epoch": 9.0, "learning_rate": 8.84391891891892e-05, "loss": 0.5009, "step": 9560 }, { "epoch": 9.0, "learning_rate": 8.842567567567568e-05, "loss": 0.4277, "step": 9570 }, { "epoch": 9.0, "learning_rate": 8.841216216216218e-05, "loss": 0.3344, "step": 9580 }, { "epoch": 9.01, "learning_rate": 8.839864864864866e-05, "loss": 0.2887, "step": 9590 }, { "epoch": 9.01, "learning_rate": 8.838513513513514e-05, "loss": 0.1927, "step": 9600 }, { "epoch": 9.01, "learning_rate": 8.837162162162162e-05, "loss": 0.3067, "step": 9610 }, { "epoch": 9.01, "learning_rate": 8.835810810810811e-05, "loss": 0.3576, "step": 9620 }, { "epoch": 9.01, "learning_rate": 8.83445945945946e-05, "loss": 0.2561, "step": 9630 }, { "epoch": 9.01, "learning_rate": 8.833108108108109e-05, "loss": 0.3556, "step": 9640 }, { "epoch": 9.01, "learning_rate": 8.831756756756757e-05, "loss": 0.5681, "step": 9650 }, { "epoch": 9.01, "learning_rate": 8.830405405405405e-05, "loss": 0.3932, "step": 9660 }, { "epoch": 9.01, "learning_rate": 8.829054054054055e-05, "loss": 0.4453, "step": 9670 }, { "epoch": 9.01, "learning_rate": 8.827702702702703e-05, "loss": 0.5684, "step": 9680 }, { "epoch": 9.01, "learning_rate": 8.826351351351352e-05, "loss": 0.483, "step": 9690 }, { "epoch": 9.01, "learning_rate": 8.825e-05, "loss": 0.6269, "step": 9700 }, { "epoch": 9.01, "learning_rate": 8.823648648648648e-05, "loss": 0.534, "step": 9710 }, { "epoch": 9.01, "learning_rate": 8.822297297297297e-05, "loss": 0.4883, "step": 9720 }, { "epoch": 9.01, "learning_rate": 8.820945945945946e-05, "loss": 0.9006, "step": 9730 }, { "epoch": 9.01, "learning_rate": 8.819594594594594e-05, "loss": 0.7655, "step": 9740 }, { "epoch": 9.01, "learning_rate": 8.818243243243244e-05, "loss": 0.3184, "step": 9750 }, { "epoch": 9.01, "learning_rate": 8.816891891891892e-05, "loss": 0.3218, "step": 9760 }, { "epoch": 9.01, "learning_rate": 8.815540540540541e-05, "loss": 0.3982, "step": 9770 }, { "epoch": 9.01, "learning_rate": 8.814189189189189e-05, "loss": 0.3301, "step": 9780 }, { "epoch": 9.01, "learning_rate": 8.812837837837839e-05, "loss": 0.3007, "step": 9790 }, { "epoch": 9.01, "learning_rate": 8.811486486486487e-05, "loss": 0.2697, "step": 9800 }, { "epoch": 9.01, "learning_rate": 8.810135135135136e-05, "loss": 0.2447, "step": 9810 }, { "epoch": 9.01, "learning_rate": 8.808783783783784e-05, "loss": 0.3046, "step": 9820 }, { "epoch": 9.01, "learning_rate": 8.807432432432432e-05, "loss": 0.64, "step": 9830 }, { "epoch": 9.01, "learning_rate": 8.80608108108108e-05, "loss": 0.551, "step": 9840 }, { "epoch": 9.01, "learning_rate": 8.80472972972973e-05, "loss": 0.513, "step": 9850 }, { "epoch": 9.01, "learning_rate": 8.803378378378378e-05, "loss": 0.5455, "step": 9860 }, { "epoch": 9.01, "learning_rate": 8.802027027027028e-05, "loss": 0.7625, "step": 9870 }, { "epoch": 9.01, "learning_rate": 8.800675675675676e-05, "loss": 0.4676, "step": 9880 }, { "epoch": 9.01, "learning_rate": 8.799324324324325e-05, "loss": 0.3307, "step": 9890 }, { "epoch": 9.01, "learning_rate": 8.797972972972973e-05, "loss": 0.4632, "step": 9900 }, { "epoch": 9.01, "learning_rate": 8.796621621621623e-05, "loss": 0.5792, "step": 9910 }, { "epoch": 9.01, "learning_rate": 8.795270270270271e-05, "loss": 0.5534, "step": 9920 }, { "epoch": 9.01, "learning_rate": 8.79391891891892e-05, "loss": 0.5161, "step": 9930 }, { "epoch": 9.01, "learning_rate": 8.792567567567568e-05, "loss": 0.4059, "step": 9940 }, { "epoch": 9.01, "learning_rate": 8.791216216216217e-05, "loss": 0.4525, "step": 9950 }, { "epoch": 9.01, "learning_rate": 8.789864864864865e-05, "loss": 0.342, "step": 9960 }, { "epoch": 9.01, "learning_rate": 8.788513513513514e-05, "loss": 0.3757, "step": 9970 }, { "epoch": 9.01, "learning_rate": 8.787162162162162e-05, "loss": 0.2748, "step": 9980 }, { "epoch": 9.01, "learning_rate": 8.785810810810812e-05, "loss": 0.2394, "step": 9990 }, { "epoch": 9.01, "learning_rate": 8.78445945945946e-05, "loss": 0.4544, "step": 10000 }, { "epoch": 9.01, "eval_loss": 0.14805930852890015, "eval_runtime": 132.8228, "eval_samples_per_second": 27.164, "eval_steps_per_second": 3.396, "eval_wer": 0.16022923170106695, "step": 10000 }, { "epoch": 9.01, "learning_rate": 8.783108108108109e-05, "loss": 0.9147, "step": 10010 }, { "epoch": 9.01, "learning_rate": 8.781756756756757e-05, "loss": 0.3347, "step": 10020 }, { "epoch": 9.01, "learning_rate": 8.780405405405407e-05, "loss": 0.3345, "step": 10030 }, { "epoch": 9.01, "learning_rate": 8.779054054054055e-05, "loss": 0.4779, "step": 10040 }, { "epoch": 9.01, "learning_rate": 8.777702702702704e-05, "loss": 0.4372, "step": 10050 }, { "epoch": 9.01, "learning_rate": 8.776351351351352e-05, "loss": 0.4608, "step": 10060 }, { "epoch": 9.01, "learning_rate": 8.775e-05, "loss": 0.566, "step": 10070 }, { "epoch": 9.01, "learning_rate": 8.773648648648649e-05, "loss": 0.4968, "step": 10080 }, { "epoch": 9.01, "learning_rate": 8.772297297297297e-05, "loss": 0.3001, "step": 10090 }, { "epoch": 9.01, "learning_rate": 8.770945945945946e-05, "loss": 0.4784, "step": 10100 }, { "epoch": 9.01, "learning_rate": 8.769594594594594e-05, "loss": 0.4044, "step": 10110 }, { "epoch": 9.01, "learning_rate": 8.768243243243244e-05, "loss": 0.6536, "step": 10120 }, { "epoch": 9.01, "learning_rate": 8.766891891891892e-05, "loss": 0.6574, "step": 10130 }, { "epoch": 9.01, "learning_rate": 8.765540540540541e-05, "loss": 0.5586, "step": 10140 }, { "epoch": 9.01, "learning_rate": 8.76418918918919e-05, "loss": 0.908, "step": 10150 }, { "epoch": 9.01, "learning_rate": 8.762837837837839e-05, "loss": 0.6892, "step": 10160 }, { "epoch": 9.01, "learning_rate": 8.761486486486487e-05, "loss": 0.8302, "step": 10170 }, { "epoch": 9.01, "learning_rate": 8.760135135135135e-05, "loss": 0.8844, "step": 10180 }, { "epoch": 9.01, "learning_rate": 8.758783783783783e-05, "loss": 0.6732, "step": 10190 }, { "epoch": 9.01, "learning_rate": 8.757432432432433e-05, "loss": 0.71, "step": 10200 }, { "epoch": 9.01, "learning_rate": 8.756081081081081e-05, "loss": 0.663, "step": 10210 }, { "epoch": 9.01, "learning_rate": 8.75472972972973e-05, "loss": 0.5841, "step": 10220 }, { "epoch": 9.01, "learning_rate": 8.753378378378378e-05, "loss": 0.8617, "step": 10230 }, { "epoch": 10.0, "learning_rate": 8.752027027027028e-05, "loss": 0.58, "step": 10240 }, { "epoch": 10.0, "learning_rate": 8.750675675675676e-05, "loss": 0.5821, "step": 10250 }, { "epoch": 10.0, "learning_rate": 8.749324324324325e-05, "loss": 0.6531, "step": 10260 }, { "epoch": 10.0, "learning_rate": 8.747972972972973e-05, "loss": 0.524, "step": 10270 }, { "epoch": 10.0, "learning_rate": 8.746621621621623e-05, "loss": 0.5905, "step": 10280 }, { "epoch": 10.0, "learning_rate": 8.745270270270271e-05, "loss": 0.5553, "step": 10290 }, { "epoch": 10.0, "learning_rate": 8.743918918918919e-05, "loss": 0.7304, "step": 10300 }, { "epoch": 10.0, "learning_rate": 8.742567567567567e-05, "loss": 0.5363, "step": 10310 }, { "epoch": 10.0, "learning_rate": 8.741216216216217e-05, "loss": 0.5694, "step": 10320 }, { "epoch": 10.0, "learning_rate": 8.739864864864865e-05, "loss": 0.5536, "step": 10330 }, { "epoch": 10.0, "learning_rate": 8.738513513513514e-05, "loss": 0.5548, "step": 10340 }, { "epoch": 10.0, "learning_rate": 8.737162162162162e-05, "loss": 0.5189, "step": 10350 }, { "epoch": 10.0, "learning_rate": 8.735810810810812e-05, "loss": 0.3563, "step": 10360 }, { "epoch": 10.0, "learning_rate": 8.73445945945946e-05, "loss": 0.3627, "step": 10370 }, { "epoch": 10.0, "learning_rate": 8.73310810810811e-05, "loss": 0.3587, "step": 10380 }, { "epoch": 10.0, "learning_rate": 8.731756756756757e-05, "loss": 0.604, "step": 10390 }, { "epoch": 10.0, "learning_rate": 8.730405405405407e-05, "loss": 1.4707, "step": 10400 }, { "epoch": 10.0, "learning_rate": 8.729054054054055e-05, "loss": 2.0876, "step": 10410 }, { "epoch": 10.0, "learning_rate": 8.727702702702703e-05, "loss": 2.6494, "step": 10420 }, { "epoch": 10.0, "learning_rate": 8.726351351351351e-05, "loss": 2.57, "step": 10430 }, { "epoch": 10.0, "learning_rate": 8.725e-05, "loss": 2.662, "step": 10440 }, { "epoch": 10.0, "learning_rate": 8.723648648648649e-05, "loss": 2.1461, "step": 10450 }, { "epoch": 10.0, "learning_rate": 8.722297297297297e-05, "loss": 1.9342, "step": 10460 }, { "epoch": 10.0, "learning_rate": 8.720945945945946e-05, "loss": 1.3611, "step": 10470 }, { "epoch": 10.0, "learning_rate": 8.719594594594594e-05, "loss": 0.6272, "step": 10480 }, { "epoch": 10.0, "learning_rate": 8.718243243243244e-05, "loss": 0.2696, "step": 10490 }, { "epoch": 10.0, "learning_rate": 8.716891891891892e-05, "loss": 0.3894, "step": 10500 }, { "epoch": 10.0, "eval_loss": 0.14220407605171204, "eval_runtime": 128.9897, "eval_samples_per_second": 27.971, "eval_steps_per_second": 3.496, "eval_wer": 0.15356660299119415, "step": 10500 }, { "epoch": 10.0, "learning_rate": 8.715540540540541e-05, "loss": 0.3894, "step": 10510 }, { "epoch": 10.0, "learning_rate": 8.71418918918919e-05, "loss": 0.4125, "step": 10520 }, { "epoch": 10.0, "learning_rate": 8.712837837837839e-05, "loss": 0.6259, "step": 10530 }, { "epoch": 10.0, "learning_rate": 8.711486486486487e-05, "loss": 0.4499, "step": 10540 }, { "epoch": 10.0, "learning_rate": 8.710135135135135e-05, "loss": 0.253, "step": 10550 }, { "epoch": 10.0, "learning_rate": 8.708783783783783e-05, "loss": 0.3537, "step": 10560 }, { "epoch": 10.0, "learning_rate": 8.707432432432433e-05, "loss": 0.3478, "step": 10570 }, { "epoch": 10.0, "learning_rate": 8.706081081081081e-05, "loss": 0.4401, "step": 10580 }, { "epoch": 10.0, "learning_rate": 8.70472972972973e-05, "loss": 0.4319, "step": 10590 }, { "epoch": 10.0, "learning_rate": 8.703378378378378e-05, "loss": 0.2901, "step": 10600 }, { "epoch": 10.01, "learning_rate": 8.702027027027028e-05, "loss": 0.3357, "step": 10610 }, { "epoch": 10.01, "learning_rate": 8.700675675675676e-05, "loss": 0.2009, "step": 10620 }, { "epoch": 10.01, "learning_rate": 8.699324324324325e-05, "loss": 0.2786, "step": 10630 }, { "epoch": 10.01, "learning_rate": 8.697972972972974e-05, "loss": 0.3462, "step": 10640 }, { "epoch": 10.01, "learning_rate": 8.696621621621622e-05, "loss": 0.2587, "step": 10650 }, { "epoch": 10.01, "learning_rate": 8.69527027027027e-05, "loss": 0.3664, "step": 10660 }, { "epoch": 10.01, "learning_rate": 8.693918918918919e-05, "loss": 0.4706, "step": 10670 }, { "epoch": 10.01, "learning_rate": 8.692567567567567e-05, "loss": 0.4191, "step": 10680 }, { "epoch": 10.01, "learning_rate": 8.691216216216217e-05, "loss": 0.4135, "step": 10690 }, { "epoch": 10.01, "learning_rate": 8.689864864864865e-05, "loss": 0.5606, "step": 10700 }, { "epoch": 10.01, "learning_rate": 8.688513513513514e-05, "loss": 0.4964, "step": 10710 }, { "epoch": 10.01, "learning_rate": 8.687162162162162e-05, "loss": 0.5521, "step": 10720 }, { "epoch": 10.01, "learning_rate": 8.685810810810812e-05, "loss": 0.555, "step": 10730 }, { "epoch": 10.01, "learning_rate": 8.68445945945946e-05, "loss": 0.3857, "step": 10740 }, { "epoch": 10.01, "learning_rate": 8.68310810810811e-05, "loss": 0.8524, "step": 10750 }, { "epoch": 10.01, "learning_rate": 8.681756756756758e-05, "loss": 0.7702, "step": 10760 }, { "epoch": 10.01, "learning_rate": 8.68054054054054e-05, "loss": 0.4203, "step": 10770 }, { "epoch": 10.01, "learning_rate": 8.67918918918919e-05, "loss": 0.2573, "step": 10780 }, { "epoch": 10.01, "learning_rate": 8.677837837837838e-05, "loss": 0.4256, "step": 10790 }, { "epoch": 10.01, "learning_rate": 8.676486486486488e-05, "loss": 0.3504, "step": 10800 }, { "epoch": 10.01, "learning_rate": 8.675135135135136e-05, "loss": 0.2935, "step": 10810 }, { "epoch": 10.01, "learning_rate": 8.673783783783784e-05, "loss": 0.2782, "step": 10820 }, { "epoch": 10.01, "learning_rate": 8.672432432432432e-05, "loss": 0.3023, "step": 10830 }, { "epoch": 10.01, "learning_rate": 8.671081081081081e-05, "loss": 0.2887, "step": 10840 }, { "epoch": 10.01, "learning_rate": 8.66972972972973e-05, "loss": 0.5353, "step": 10850 }, { "epoch": 10.01, "learning_rate": 8.668378378378379e-05, "loss": 0.5727, "step": 10860 }, { "epoch": 10.01, "learning_rate": 8.667027027027027e-05, "loss": 0.5168, "step": 10870 }, { "epoch": 10.01, "learning_rate": 8.665675675675677e-05, "loss": 0.46, "step": 10880 }, { "epoch": 10.01, "learning_rate": 8.664324324324325e-05, "loss": 0.6258, "step": 10890 }, { "epoch": 10.01, "learning_rate": 8.662972972972974e-05, "loss": 0.5521, "step": 10900 }, { "epoch": 10.01, "learning_rate": 8.661621621621622e-05, "loss": 0.3608, "step": 10910 }, { "epoch": 10.01, "learning_rate": 8.66027027027027e-05, "loss": 0.3907, "step": 10920 }, { "epoch": 10.01, "learning_rate": 8.658918918918918e-05, "loss": 0.495, "step": 10930 }, { "epoch": 10.01, "learning_rate": 8.657567567567568e-05, "loss": 0.5417, "step": 10940 }, { "epoch": 10.01, "learning_rate": 8.656216216216216e-05, "loss": 0.5449, "step": 10950 }, { "epoch": 10.01, "learning_rate": 8.654864864864865e-05, "loss": 0.3864, "step": 10960 }, { "epoch": 10.01, "learning_rate": 8.653513513513513e-05, "loss": 0.4404, "step": 10970 }, { "epoch": 10.01, "learning_rate": 8.652162162162163e-05, "loss": 0.3815, "step": 10980 }, { "epoch": 10.01, "learning_rate": 8.650810810810811e-05, "loss": 0.3311, "step": 10990 }, { "epoch": 10.01, "learning_rate": 8.64945945945946e-05, "loss": 0.3602, "step": 11000 }, { "epoch": 10.01, "eval_loss": 0.15774685144424438, "eval_runtime": 126.8701, "eval_samples_per_second": 28.439, "eval_steps_per_second": 3.555, "eval_wer": 0.15841215114382892, "step": 11000 }, { "epoch": 10.01, "learning_rate": 8.648108108108109e-05, "loss": 0.1977, "step": 11010 }, { "epoch": 10.01, "learning_rate": 8.646756756756758e-05, "loss": 0.4424, "step": 11020 }, { "epoch": 10.01, "learning_rate": 8.645405405405406e-05, "loss": 0.6845, "step": 11030 }, { "epoch": 10.01, "learning_rate": 8.644054054054054e-05, "loss": 0.5343, "step": 11040 }, { "epoch": 10.01, "learning_rate": 8.642702702702702e-05, "loss": 0.331, "step": 11050 }, { "epoch": 10.01, "learning_rate": 8.641351351351352e-05, "loss": 0.4239, "step": 11060 }, { "epoch": 10.01, "learning_rate": 8.64e-05, "loss": 0.4183, "step": 11070 }, { "epoch": 10.01, "learning_rate": 8.63864864864865e-05, "loss": 0.4222, "step": 11080 }, { "epoch": 10.01, "learning_rate": 8.637297297297298e-05, "loss": 0.483, "step": 11090 }, { "epoch": 10.01, "learning_rate": 8.635945945945947e-05, "loss": 0.5503, "step": 11100 }, { "epoch": 10.01, "learning_rate": 8.634594594594595e-05, "loss": 0.3235, "step": 11110 }, { "epoch": 10.01, "learning_rate": 8.633243243243245e-05, "loss": 0.4921, "step": 11120 }, { "epoch": 10.01, "learning_rate": 8.631891891891893e-05, "loss": 0.3551, "step": 11130 }, { "epoch": 10.01, "learning_rate": 8.630540540540542e-05, "loss": 0.6363, "step": 11140 }, { "epoch": 10.01, "learning_rate": 8.62918918918919e-05, "loss": 0.6509, "step": 11150 }, { "epoch": 10.01, "learning_rate": 8.627837837837838e-05, "loss": 0.5734, "step": 11160 }, { "epoch": 10.01, "learning_rate": 8.626486486486486e-05, "loss": 0.6801, "step": 11170 }, { "epoch": 10.01, "learning_rate": 8.625135135135135e-05, "loss": 0.7444, "step": 11180 }, { "epoch": 10.01, "learning_rate": 8.623783783783784e-05, "loss": 0.7083, "step": 11190 }, { "epoch": 10.01, "learning_rate": 8.622432432432432e-05, "loss": 0.8422, "step": 11200 }, { "epoch": 10.01, "learning_rate": 8.621081081081082e-05, "loss": 0.6823, "step": 11210 }, { "epoch": 10.01, "learning_rate": 8.61972972972973e-05, "loss": 0.6719, "step": 11220 }, { "epoch": 10.01, "learning_rate": 8.618378378378379e-05, "loss": 0.6482, "step": 11230 }, { "epoch": 10.01, "learning_rate": 8.617027027027027e-05, "loss": 0.649, "step": 11240 }, { "epoch": 10.01, "learning_rate": 8.615675675675677e-05, "loss": 0.8214, "step": 11250 }, { "epoch": 11.0, "learning_rate": 8.614324324324325e-05, "loss": 0.727, "step": 11260 }, { "epoch": 11.0, "learning_rate": 8.612972972972974e-05, "loss": 0.5654, "step": 11270 }, { "epoch": 11.0, "learning_rate": 8.611621621621622e-05, "loss": 0.6683, "step": 11280 }, { "epoch": 11.0, "learning_rate": 8.61027027027027e-05, "loss": 0.4947, "step": 11290 }, { "epoch": 11.0, "learning_rate": 8.608918918918919e-05, "loss": 0.5586, "step": 11300 }, { "epoch": 11.0, "learning_rate": 8.607567567567568e-05, "loss": 0.5495, "step": 11310 }, { "epoch": 11.0, "learning_rate": 8.606216216216216e-05, "loss": 0.775, "step": 11320 }, { "epoch": 11.0, "learning_rate": 8.604864864864866e-05, "loss": 0.55, "step": 11330 }, { "epoch": 11.0, "learning_rate": 8.603513513513514e-05, "loss": 0.5516, "step": 11340 }, { "epoch": 11.0, "learning_rate": 8.602162162162163e-05, "loss": 0.5761, "step": 11350 }, { "epoch": 11.0, "learning_rate": 8.600810810810811e-05, "loss": 0.5439, "step": 11360 }, { "epoch": 11.0, "learning_rate": 8.59945945945946e-05, "loss": 0.5561, "step": 11370 }, { "epoch": 11.0, "learning_rate": 8.598108108108109e-05, "loss": 0.393, "step": 11380 }, { "epoch": 11.0, "learning_rate": 8.596756756756757e-05, "loss": 0.3215, "step": 11390 }, { "epoch": 11.0, "learning_rate": 8.595405405405405e-05, "loss": 0.3437, "step": 11400 }, { "epoch": 11.0, "learning_rate": 8.594054054054054e-05, "loss": 0.3447, "step": 11410 }, { "epoch": 11.0, "learning_rate": 8.592702702702703e-05, "loss": 1.4835, "step": 11420 }, { "epoch": 11.0, "learning_rate": 8.591351351351352e-05, "loss": 1.5858, "step": 11430 }, { "epoch": 11.0, "learning_rate": 8.59e-05, "loss": 2.7224, "step": 11440 }, { "epoch": 11.0, "learning_rate": 8.58864864864865e-05, "loss": 2.5242, "step": 11450 }, { "epoch": 11.0, "learning_rate": 8.587297297297298e-05, "loss": 2.6389, "step": 11460 }, { "epoch": 11.0, "learning_rate": 8.585945945945947e-05, "loss": 2.511, "step": 11470 }, { "epoch": 11.0, "learning_rate": 8.584594594594595e-05, "loss": 1.8566, "step": 11480 }, { "epoch": 11.0, "learning_rate": 8.583243243243245e-05, "loss": 1.6062, "step": 11490 }, { "epoch": 11.0, "learning_rate": 8.581891891891893e-05, "loss": 0.9586, "step": 11500 }, { "epoch": 11.0, "eval_loss": 0.1549200713634491, "eval_runtime": 129.8347, "eval_samples_per_second": 27.789, "eval_steps_per_second": 3.474, "eval_wer": 0.17061920514373574, "step": 11500 }, { "epoch": 11.0, "learning_rate": 8.580540540540541e-05, "loss": 0.3273, "step": 11510 }, { "epoch": 11.0, "learning_rate": 8.579189189189189e-05, "loss": 0.3728, "step": 11520 }, { "epoch": 11.0, "learning_rate": 8.577837837837838e-05, "loss": 0.2986, "step": 11530 }, { "epoch": 11.0, "learning_rate": 8.576486486486487e-05, "loss": 0.4806, "step": 11540 }, { "epoch": 11.0, "learning_rate": 8.575135135135135e-05, "loss": 0.591, "step": 11550 }, { "epoch": 11.0, "learning_rate": 8.573783783783784e-05, "loss": 0.5364, "step": 11560 }, { "epoch": 11.0, "learning_rate": 8.572432432432432e-05, "loss": 0.2774, "step": 11570 }, { "epoch": 11.0, "learning_rate": 8.571081081081082e-05, "loss": 0.2895, "step": 11580 }, { "epoch": 11.0, "learning_rate": 8.56972972972973e-05, "loss": 0.3504, "step": 11590 }, { "epoch": 11.0, "learning_rate": 8.568378378378379e-05, "loss": 0.3628, "step": 11600 }, { "epoch": 11.0, "learning_rate": 8.567027027027027e-05, "loss": 0.3882, "step": 11610 }, { "epoch": 11.0, "learning_rate": 8.565675675675677e-05, "loss": 0.3413, "step": 11620 }, { "epoch": 11.01, "learning_rate": 8.564324324324325e-05, "loss": 0.2963, "step": 11630 }, { "epoch": 11.01, "learning_rate": 8.562972972972973e-05, "loss": 0.2301, "step": 11640 }, { "epoch": 11.01, "learning_rate": 8.561621621621621e-05, "loss": 0.2078, "step": 11650 }, { "epoch": 11.01, "learning_rate": 8.56027027027027e-05, "loss": 0.3146, "step": 11660 }, { "epoch": 11.01, "learning_rate": 8.558918918918919e-05, "loss": 0.2806, "step": 11670 }, { "epoch": 11.01, "learning_rate": 8.557567567567568e-05, "loss": 0.3471, "step": 11680 }, { "epoch": 11.01, "learning_rate": 8.556216216216216e-05, "loss": 0.4378, "step": 11690 }, { "epoch": 11.01, "learning_rate": 8.554864864864866e-05, "loss": 0.4528, "step": 11700 }, { "epoch": 11.01, "learning_rate": 8.553513513513514e-05, "loss": 0.329, "step": 11710 }, { "epoch": 11.01, "learning_rate": 8.552162162162163e-05, "loss": 0.5113, "step": 11720 }, { "epoch": 11.01, "learning_rate": 8.550810810810811e-05, "loss": 0.5007, "step": 11730 }, { "epoch": 11.01, "learning_rate": 8.549459459459461e-05, "loss": 0.5821, "step": 11740 }, { "epoch": 11.01, "learning_rate": 8.548108108108109e-05, "loss": 0.6051, "step": 11750 }, { "epoch": 11.01, "learning_rate": 8.546756756756757e-05, "loss": 0.3353, "step": 11760 }, { "epoch": 11.01, "learning_rate": 8.545405405405405e-05, "loss": 0.6664, "step": 11770 }, { "epoch": 11.01, "learning_rate": 8.544054054054055e-05, "loss": 0.8095, "step": 11780 }, { "epoch": 11.01, "learning_rate": 8.542702702702703e-05, "loss": 0.5796, "step": 11790 }, { "epoch": 11.01, "learning_rate": 8.541351351351352e-05, "loss": 0.2767, "step": 11800 }, { "epoch": 11.01, "learning_rate": 8.54e-05, "loss": 0.3412, "step": 11810 }, { "epoch": 11.01, "learning_rate": 8.53864864864865e-05, "loss": 0.3355, "step": 11820 }, { "epoch": 11.01, "learning_rate": 8.537297297297298e-05, "loss": 0.3, "step": 11830 }, { "epoch": 11.01, "learning_rate": 8.535945945945947e-05, "loss": 0.279, "step": 11840 }, { "epoch": 11.01, "learning_rate": 8.534594594594595e-05, "loss": 0.2578, "step": 11850 }, { "epoch": 11.01, "learning_rate": 8.533243243243243e-05, "loss": 0.2633, "step": 11860 }, { "epoch": 11.01, "learning_rate": 8.531891891891892e-05, "loss": 0.414, "step": 11870 }, { "epoch": 11.01, "learning_rate": 8.530540540540541e-05, "loss": 0.5823, "step": 11880 }, { "epoch": 11.01, "learning_rate": 8.529189189189189e-05, "loss": 0.5009, "step": 11890 }, { "epoch": 11.01, "learning_rate": 8.527837837837839e-05, "loss": 0.3944, "step": 11900 }, { "epoch": 11.01, "learning_rate": 8.526486486486487e-05, "loss": 0.5344, "step": 11910 }, { "epoch": 11.01, "learning_rate": 8.525135135135136e-05, "loss": 0.6182, "step": 11920 }, { "epoch": 11.01, "learning_rate": 8.523783783783784e-05, "loss": 0.3679, "step": 11930 }, { "epoch": 11.01, "learning_rate": 8.522432432432434e-05, "loss": 0.3538, "step": 11940 }, { "epoch": 11.01, "learning_rate": 8.521081081081082e-05, "loss": 0.3868, "step": 11950 }, { "epoch": 11.01, "learning_rate": 8.51972972972973e-05, "loss": 0.4677, "step": 11960 }, { "epoch": 11.01, "learning_rate": 8.51837837837838e-05, "loss": 0.6305, "step": 11970 }, { "epoch": 11.01, "learning_rate": 8.517027027027027e-05, "loss": 0.4483, "step": 11980 }, { "epoch": 11.01, "learning_rate": 8.515675675675676e-05, "loss": 0.3689, "step": 11990 }, { "epoch": 11.01, "learning_rate": 8.514324324324324e-05, "loss": 0.374, "step": 12000 }, { "epoch": 11.01, "eval_loss": 0.13248920440673828, "eval_runtime": 127.6133, "eval_samples_per_second": 28.273, "eval_steps_per_second": 3.534, "eval_wer": 0.14112658994548757, "step": 12000 }, { "epoch": 11.01, "learning_rate": 8.512972972972973e-05, "loss": 0.3593, "step": 12010 }, { "epoch": 11.01, "learning_rate": 8.511621621621621e-05, "loss": 0.3844, "step": 12020 }, { "epoch": 11.01, "learning_rate": 8.510270270270271e-05, "loss": 0.2149, "step": 12030 }, { "epoch": 11.01, "learning_rate": 8.508918918918919e-05, "loss": 0.3566, "step": 12040 }, { "epoch": 11.01, "learning_rate": 8.507567567567568e-05, "loss": 0.5239, "step": 12050 }, { "epoch": 11.01, "learning_rate": 8.506216216216216e-05, "loss": 0.7106, "step": 12060 }, { "epoch": 11.01, "learning_rate": 8.504864864864866e-05, "loss": 0.3102, "step": 12070 }, { "epoch": 11.01, "learning_rate": 8.503513513513514e-05, "loss": 0.3492, "step": 12080 }, { "epoch": 11.01, "learning_rate": 8.502162162162163e-05, "loss": 0.4011, "step": 12090 }, { "epoch": 11.01, "learning_rate": 8.500810810810811e-05, "loss": 0.3727, "step": 12100 }, { "epoch": 11.01, "learning_rate": 8.49945945945946e-05, "loss": 0.3993, "step": 12110 }, { "epoch": 11.01, "learning_rate": 8.498108108108108e-05, "loss": 0.578, "step": 12120 }, { "epoch": 11.01, "learning_rate": 8.496756756756757e-05, "loss": 0.3893, "step": 12130 }, { "epoch": 11.01, "learning_rate": 8.495405405405405e-05, "loss": 0.4201, "step": 12140 }, { "epoch": 11.01, "learning_rate": 8.494054054054055e-05, "loss": 0.3877, "step": 12150 }, { "epoch": 11.01, "learning_rate": 8.492702702702703e-05, "loss": 0.5615, "step": 12160 }, { "epoch": 11.01, "learning_rate": 8.491351351351352e-05, "loss": 0.5164, "step": 12170 }, { "epoch": 11.01, "learning_rate": 8.49e-05, "loss": 0.6348, "step": 12180 }, { "epoch": 11.01, "learning_rate": 8.48864864864865e-05, "loss": 0.5311, "step": 12190 }, { "epoch": 11.01, "learning_rate": 8.487297297297298e-05, "loss": 0.8295, "step": 12200 }, { "epoch": 11.01, "learning_rate": 8.485945945945947e-05, "loss": 0.7266, "step": 12210 }, { "epoch": 11.01, "learning_rate": 8.484594594594595e-05, "loss": 0.8789, "step": 12220 }, { "epoch": 11.01, "learning_rate": 8.483243243243244e-05, "loss": 0.627, "step": 12230 }, { "epoch": 11.01, "learning_rate": 8.481891891891892e-05, "loss": 0.6374, "step": 12240 }, { "epoch": 11.01, "learning_rate": 8.480540540540541e-05, "loss": 0.5451, "step": 12250 }, { "epoch": 11.01, "learning_rate": 8.479189189189189e-05, "loss": 0.6223, "step": 12260 }, { "epoch": 11.01, "learning_rate": 8.477837837837839e-05, "loss": 0.67, "step": 12270 }, { "epoch": 12.0, "learning_rate": 8.476486486486487e-05, "loss": 0.7311, "step": 12280 }, { "epoch": 12.0, "learning_rate": 8.475135135135136e-05, "loss": 0.6776, "step": 12290 }, { "epoch": 12.0, "learning_rate": 8.473783783783784e-05, "loss": 0.556, "step": 12300 }, { "epoch": 12.0, "learning_rate": 8.472432432432434e-05, "loss": 0.57, "step": 12310 }, { "epoch": 12.0, "learning_rate": 8.471081081081082e-05, "loss": 0.4894, "step": 12320 }, { "epoch": 12.0, "learning_rate": 8.46972972972973e-05, "loss": 0.5514, "step": 12330 }, { "epoch": 12.0, "learning_rate": 8.468378378378378e-05, "loss": 0.6691, "step": 12340 }, { "epoch": 12.0, "learning_rate": 8.467027027027026e-05, "loss": 0.6045, "step": 12350 }, { "epoch": 12.0, "learning_rate": 8.465675675675676e-05, "loss": 0.4968, "step": 12360 }, { "epoch": 12.0, "learning_rate": 8.464324324324324e-05, "loss": 0.5696, "step": 12370 }, { "epoch": 12.0, "learning_rate": 8.462972972972973e-05, "loss": 0.5434, "step": 12380 }, { "epoch": 12.0, "learning_rate": 8.461621621621621e-05, "loss": 0.5655, "step": 12390 }, { "epoch": 12.0, "learning_rate": 8.460270270270271e-05, "loss": 0.386, "step": 12400 }, { "epoch": 12.0, "learning_rate": 8.458918918918919e-05, "loss": 0.3631, "step": 12410 }, { "epoch": 12.0, "learning_rate": 8.457567567567568e-05, "loss": 0.3533, "step": 12420 }, { "epoch": 12.0, "learning_rate": 8.456216216216216e-05, "loss": 0.335, "step": 12430 }, { "epoch": 12.0, "learning_rate": 8.454864864864866e-05, "loss": 1.1957, "step": 12440 }, { "epoch": 12.0, "learning_rate": 8.453513513513514e-05, "loss": 1.1425, "step": 12450 }, { "epoch": 12.0, "learning_rate": 8.452162162162162e-05, "loss": 2.7549, "step": 12460 }, { "epoch": 12.0, "learning_rate": 8.45081081081081e-05, "loss": 2.5992, "step": 12470 }, { "epoch": 12.0, "learning_rate": 8.44945945945946e-05, "loss": 2.5674, "step": 12480 }, { "epoch": 12.0, "learning_rate": 8.448108108108108e-05, "loss": 2.6225, "step": 12490 }, { "epoch": 12.0, "learning_rate": 8.446756756756757e-05, "loss": 1.8557, "step": 12500 }, { "epoch": 12.0, "eval_loss": 0.16791687905788422, "eval_runtime": 129.6767, "eval_samples_per_second": 27.823, "eval_steps_per_second": 3.478, "eval_wer": 0.1748124679681312, "step": 12500 }, { "epoch": 12.0, "learning_rate": 8.445405405405405e-05, "loss": 1.6904, "step": 12510 }, { "epoch": 12.0, "learning_rate": 8.444054054054055e-05, "loss": 1.1763, "step": 12520 }, { "epoch": 12.0, "learning_rate": 8.442702702702703e-05, "loss": 0.4174, "step": 12530 }, { "epoch": 12.0, "learning_rate": 8.441351351351352e-05, "loss": 0.2392, "step": 12540 }, { "epoch": 12.0, "learning_rate": 8.44e-05, "loss": 0.4256, "step": 12550 }, { "epoch": 12.0, "learning_rate": 8.43864864864865e-05, "loss": 0.43, "step": 12560 }, { "epoch": 12.0, "learning_rate": 8.437297297297298e-05, "loss": 0.5161, "step": 12570 }, { "epoch": 12.0, "learning_rate": 8.435945945945946e-05, "loss": 0.527, "step": 12580 }, { "epoch": 12.0, "learning_rate": 8.434594594594594e-05, "loss": 0.3934, "step": 12590 }, { "epoch": 12.0, "learning_rate": 8.433243243243244e-05, "loss": 0.2744, "step": 12600 }, { "epoch": 12.0, "learning_rate": 8.431891891891892e-05, "loss": 0.4178, "step": 12610 }, { "epoch": 12.0, "learning_rate": 8.430540540540541e-05, "loss": 0.2753, "step": 12620 }, { "epoch": 12.0, "learning_rate": 8.42918918918919e-05, "loss": 0.4094, "step": 12630 }, { "epoch": 12.0, "learning_rate": 8.427837837837839e-05, "loss": 0.3459, "step": 12640 }, { "epoch": 12.0, "learning_rate": 8.426486486486487e-05, "loss": 0.2902, "step": 12650 }, { "epoch": 12.01, "learning_rate": 8.425135135135136e-05, "loss": 0.267, "step": 12660 }, { "epoch": 12.01, "learning_rate": 8.423783783783785e-05, "loss": 0.1914, "step": 12670 }, { "epoch": 12.01, "learning_rate": 8.422432432432433e-05, "loss": 0.3135, "step": 12680 }, { "epoch": 12.01, "learning_rate": 8.421081081081081e-05, "loss": 0.301, "step": 12690 }, { "epoch": 12.01, "learning_rate": 8.41972972972973e-05, "loss": 0.2472, "step": 12700 }, { "epoch": 12.01, "learning_rate": 8.418378378378378e-05, "loss": 0.3546, "step": 12710 }, { "epoch": 12.01, "learning_rate": 8.417027027027028e-05, "loss": 0.4838, "step": 12720 }, { "epoch": 12.01, "learning_rate": 8.415675675675676e-05, "loss": 0.3124, "step": 12730 }, { "epoch": 12.01, "learning_rate": 8.414324324324325e-05, "loss": 0.4315, "step": 12740 }, { "epoch": 12.01, "learning_rate": 8.412972972972973e-05, "loss": 0.477, "step": 12750 }, { "epoch": 12.01, "learning_rate": 8.411621621621622e-05, "loss": 0.4698, "step": 12760 }, { "epoch": 12.01, "learning_rate": 8.410270270270271e-05, "loss": 0.6201, "step": 12770 }, { "epoch": 12.01, "learning_rate": 8.408918918918919e-05, "loss": 0.4315, "step": 12780 }, { "epoch": 12.01, "learning_rate": 8.407567567567569e-05, "loss": 0.4749, "step": 12790 }, { "epoch": 12.01, "learning_rate": 8.406351351351352e-05, "loss": 0.7995, "step": 12800 }, { "epoch": 12.01, "learning_rate": 8.405000000000001e-05, "loss": 0.6737, "step": 12810 }, { "epoch": 12.01, "learning_rate": 8.403648648648649e-05, "loss": 0.263, "step": 12820 }, { "epoch": 12.01, "learning_rate": 8.402297297297299e-05, "loss": 0.3259, "step": 12830 }, { "epoch": 12.01, "learning_rate": 8.400945945945947e-05, "loss": 0.348, "step": 12840 }, { "epoch": 12.01, "learning_rate": 8.399594594594595e-05, "loss": 0.3175, "step": 12850 }, { "epoch": 12.01, "learning_rate": 8.398243243243243e-05, "loss": 0.2759, "step": 12860 }, { "epoch": 12.01, "learning_rate": 8.396891891891892e-05, "loss": 0.2349, "step": 12870 }, { "epoch": 12.01, "learning_rate": 8.39554054054054e-05, "loss": 0.2495, "step": 12880 }, { "epoch": 12.01, "learning_rate": 8.39418918918919e-05, "loss": 0.3043, "step": 12890 }, { "epoch": 12.01, "learning_rate": 8.392837837837838e-05, "loss": 0.6314, "step": 12900 }, { "epoch": 12.01, "learning_rate": 8.391486486486487e-05, "loss": 0.4796, "step": 12910 }, { "epoch": 12.01, "learning_rate": 8.390135135135136e-05, "loss": 0.4284, "step": 12920 }, { "epoch": 12.01, "learning_rate": 8.388783783783785e-05, "loss": 0.4799, "step": 12930 }, { "epoch": 12.01, "learning_rate": 8.387432432432433e-05, "loss": 0.6782, "step": 12940 }, { "epoch": 12.01, "learning_rate": 8.386081081081083e-05, "loss": 0.3249, "step": 12950 }, { "epoch": 12.01, "learning_rate": 8.384729729729731e-05, "loss": 0.299, "step": 12960 }, { "epoch": 12.01, "learning_rate": 8.383378378378379e-05, "loss": 0.364, "step": 12970 }, { "epoch": 12.01, "learning_rate": 8.382027027027027e-05, "loss": 0.498, "step": 12980 }, { "epoch": 12.01, "learning_rate": 8.380675675675676e-05, "loss": 0.5047, "step": 12990 }, { "epoch": 12.01, "learning_rate": 8.379324324324324e-05, "loss": 0.4378, "step": 13000 }, { "epoch": 12.01, "eval_loss": 0.1289682686328888, "eval_runtime": 131.4903, "eval_samples_per_second": 27.439, "eval_steps_per_second": 3.43, "eval_wer": 0.14010157014396868, "step": 13000 }, { "epoch": 12.01, "learning_rate": 8.377972972972974e-05, "loss": 0.3863, "step": 13010 }, { "epoch": 12.01, "learning_rate": 8.376621621621622e-05, "loss": 0.4007, "step": 13020 }, { "epoch": 12.01, "learning_rate": 8.375270270270271e-05, "loss": 0.3403, "step": 13030 }, { "epoch": 12.01, "learning_rate": 8.37391891891892e-05, "loss": 0.3913, "step": 13040 }, { "epoch": 12.01, "learning_rate": 8.372567567567568e-05, "loss": 0.2527, "step": 13050 }, { "epoch": 12.01, "learning_rate": 8.371216216216217e-05, "loss": 0.2977, "step": 13060 }, { "epoch": 12.01, "learning_rate": 8.369864864864865e-05, "loss": 0.4161, "step": 13070 }, { "epoch": 12.01, "learning_rate": 8.368513513513513e-05, "loss": 0.9056, "step": 13080 }, { "epoch": 12.01, "learning_rate": 8.367162162162161e-05, "loss": 0.2732, "step": 13090 }, { "epoch": 12.01, "learning_rate": 8.365810810810811e-05, "loss": 0.3031, "step": 13100 }, { "epoch": 12.01, "learning_rate": 8.364459459459459e-05, "loss": 0.3943, "step": 13110 }, { "epoch": 12.01, "learning_rate": 8.363108108108108e-05, "loss": 0.4438, "step": 13120 }, { "epoch": 12.01, "learning_rate": 8.361756756756757e-05, "loss": 0.4192, "step": 13130 }, { "epoch": 12.01, "learning_rate": 8.360405405405406e-05, "loss": 0.5285, "step": 13140 }, { "epoch": 12.01, "learning_rate": 8.359054054054054e-05, "loss": 0.4485, "step": 13150 }, { "epoch": 12.01, "learning_rate": 8.357702702702704e-05, "loss": 0.3022, "step": 13160 }, { "epoch": 12.01, "learning_rate": 8.356351351351352e-05, "loss": 0.4524, "step": 13170 }, { "epoch": 12.01, "learning_rate": 8.355135135135136e-05, "loss": 0.4154, "step": 13180 }, { "epoch": 12.01, "learning_rate": 8.353783783783784e-05, "loss": 0.5359, "step": 13190 }, { "epoch": 12.01, "learning_rate": 8.352432432432434e-05, "loss": 0.6473, "step": 13200 }, { "epoch": 12.01, "learning_rate": 8.351081081081082e-05, "loss": 0.5285, "step": 13210 }, { "epoch": 12.01, "learning_rate": 8.349729729729731e-05, "loss": 0.8111, "step": 13220 }, { "epoch": 12.01, "learning_rate": 8.348378378378379e-05, "loss": 0.6777, "step": 13230 }, { "epoch": 12.01, "learning_rate": 8.347027027027027e-05, "loss": 0.9788, "step": 13240 }, { "epoch": 12.01, "learning_rate": 8.345675675675676e-05, "loss": 0.7222, "step": 13250 }, { "epoch": 12.01, "learning_rate": 8.344324324324325e-05, "loss": 0.5677, "step": 13260 }, { "epoch": 12.01, "learning_rate": 8.342972972972973e-05, "loss": 0.6035, "step": 13270 }, { "epoch": 12.01, "learning_rate": 8.341621621621623e-05, "loss": 0.5285, "step": 13280 }, { "epoch": 12.01, "learning_rate": 8.34027027027027e-05, "loss": 0.5237, "step": 13290 }, { "epoch": 13.0, "learning_rate": 8.33891891891892e-05, "loss": 0.8589, "step": 13300 }, { "epoch": 13.0, "learning_rate": 8.337567567567568e-05, "loss": 0.5366, "step": 13310 }, { "epoch": 13.0, "learning_rate": 8.336216216216216e-05, "loss": 0.6143, "step": 13320 }, { "epoch": 13.0, "learning_rate": 8.334864864864866e-05, "loss": 0.605, "step": 13330 }, { "epoch": 13.0, "learning_rate": 8.333513513513514e-05, "loss": 0.4915, "step": 13340 }, { "epoch": 13.0, "learning_rate": 8.332162162162162e-05, "loss": 0.5377, "step": 13350 }, { "epoch": 13.0, "learning_rate": 8.33081081081081e-05, "loss": 0.5965, "step": 13360 }, { "epoch": 13.0, "learning_rate": 8.32945945945946e-05, "loss": 0.6886, "step": 13370 }, { "epoch": 13.0, "learning_rate": 8.328108108108108e-05, "loss": 0.5019, "step": 13380 }, { "epoch": 13.0, "learning_rate": 8.326756756756757e-05, "loss": 0.5415, "step": 13390 }, { "epoch": 13.0, "learning_rate": 8.325405405405405e-05, "loss": 0.5761, "step": 13400 }, { "epoch": 13.0, "learning_rate": 8.324054054054055e-05, "loss": 0.5251, "step": 13410 }, { "epoch": 13.0, "learning_rate": 8.322702702702703e-05, "loss": 0.4906, "step": 13420 }, { "epoch": 13.0, "learning_rate": 8.321351351351352e-05, "loss": 0.3237, "step": 13430 }, { "epoch": 13.0, "learning_rate": 8.32e-05, "loss": 0.3481, "step": 13440 }, { "epoch": 13.0, "learning_rate": 8.31864864864865e-05, "loss": 0.3594, "step": 13450 }, { "epoch": 13.0, "learning_rate": 8.317297297297298e-05, "loss": 0.7631, "step": 13460 }, { "epoch": 13.0, "learning_rate": 8.315945945945946e-05, "loss": 1.2481, "step": 13470 }, { "epoch": 13.0, "learning_rate": 8.314594594594594e-05, "loss": 2.2333, "step": 13480 }, { "epoch": 13.0, "learning_rate": 8.313243243243244e-05, "loss": 2.5947, "step": 13490 }, { "epoch": 13.0, "learning_rate": 8.311891891891892e-05, "loss": 2.5375, "step": 13500 }, { "epoch": 13.0, "eval_loss": 0.16997256875038147, "eval_runtime": 142.279, "eval_samples_per_second": 25.359, "eval_steps_per_second": 3.17, "eval_wer": 0.15421888831943345, "step": 13500 }, { "epoch": 13.0, "learning_rate": 8.310540540540541e-05, "loss": 2.6469, "step": 13510 }, { "epoch": 13.0, "learning_rate": 8.309189189189189e-05, "loss": 2.0909, "step": 13520 }, { "epoch": 13.0, "learning_rate": 8.307837837837839e-05, "loss": 1.8349, "step": 13530 }, { "epoch": 13.0, "learning_rate": 8.306486486486487e-05, "loss": 1.21, "step": 13540 }, { "epoch": 13.0, "learning_rate": 8.305135135135136e-05, "loss": 0.6403, "step": 13550 }, { "epoch": 13.0, "learning_rate": 8.303783783783784e-05, "loss": 0.2229, "step": 13560 }, { "epoch": 13.0, "learning_rate": 8.302432432432434e-05, "loss": 0.3648, "step": 13570 }, { "epoch": 13.0, "learning_rate": 8.301081081081082e-05, "loss": 0.3631, "step": 13580 }, { "epoch": 13.0, "learning_rate": 8.29972972972973e-05, "loss": 0.4425, "step": 13590 }, { "epoch": 13.0, "learning_rate": 8.298378378378378e-05, "loss": 0.6097, "step": 13600 }, { "epoch": 13.0, "learning_rate": 8.297027027027028e-05, "loss": 0.4457, "step": 13610 }, { "epoch": 13.0, "learning_rate": 8.295675675675676e-05, "loss": 0.2239, "step": 13620 }, { "epoch": 13.0, "learning_rate": 8.294324324324325e-05, "loss": 0.3417, "step": 13630 }, { "epoch": 13.0, "learning_rate": 8.292972972972973e-05, "loss": 0.3421, "step": 13640 }, { "epoch": 13.0, "learning_rate": 8.291621621621623e-05, "loss": 0.4022, "step": 13650 }, { "epoch": 13.0, "learning_rate": 8.290270270270271e-05, "loss": 0.4256, "step": 13660 }, { "epoch": 13.0, "learning_rate": 8.28891891891892e-05, "loss": 0.2684, "step": 13670 }, { "epoch": 13.01, "learning_rate": 8.287567567567568e-05, "loss": 0.2973, "step": 13680 }, { "epoch": 13.01, "learning_rate": 8.286216216216218e-05, "loss": 0.2091, "step": 13690 }, { "epoch": 13.01, "learning_rate": 8.284864864864866e-05, "loss": 0.2666, "step": 13700 }, { "epoch": 13.01, "learning_rate": 8.283513513513514e-05, "loss": 0.376, "step": 13710 }, { "epoch": 13.01, "learning_rate": 8.282162162162162e-05, "loss": 0.1928, "step": 13720 }, { "epoch": 13.01, "learning_rate": 8.28081081081081e-05, "loss": 0.3196, "step": 13730 }, { "epoch": 13.01, "learning_rate": 8.27945945945946e-05, "loss": 0.548, "step": 13740 }, { "epoch": 13.01, "learning_rate": 8.278108108108108e-05, "loss": 0.3735, "step": 13750 }, { "epoch": 13.01, "learning_rate": 8.276756756756757e-05, "loss": 0.358, "step": 13760 }, { "epoch": 13.01, "learning_rate": 8.275405405405405e-05, "loss": 0.4964, "step": 13770 }, { "epoch": 13.01, "learning_rate": 8.274054054054055e-05, "loss": 0.4477, "step": 13780 }, { "epoch": 13.01, "learning_rate": 8.272702702702703e-05, "loss": 0.5881, "step": 13790 }, { "epoch": 13.01, "learning_rate": 8.271351351351352e-05, "loss": 0.5055, "step": 13800 }, { "epoch": 13.01, "learning_rate": 8.27e-05, "loss": 0.3873, "step": 13810 }, { "epoch": 13.01, "learning_rate": 8.268648648648649e-05, "loss": 0.7574, "step": 13820 }, { "epoch": 13.01, "learning_rate": 8.267297297297297e-05, "loss": 0.7266, "step": 13830 }, { "epoch": 13.01, "learning_rate": 8.265945945945946e-05, "loss": 0.3791, "step": 13840 }, { "epoch": 13.01, "learning_rate": 8.264594594594594e-05, "loss": 0.2891, "step": 13850 }, { "epoch": 13.01, "learning_rate": 8.263243243243244e-05, "loss": 0.3272, "step": 13860 }, { "epoch": 13.01, "learning_rate": 8.261891891891892e-05, "loss": 0.3131, "step": 13870 }, { "epoch": 13.01, "learning_rate": 8.260540540540541e-05, "loss": 0.2872, "step": 13880 }, { "epoch": 13.01, "learning_rate": 8.25918918918919e-05, "loss": 0.2631, "step": 13890 }, { "epoch": 13.01, "learning_rate": 8.257837837837839e-05, "loss": 0.2586, "step": 13900 }, { "epoch": 13.01, "learning_rate": 8.256486486486487e-05, "loss": 0.2659, "step": 13910 }, { "epoch": 13.01, "learning_rate": 8.255135135135136e-05, "loss": 0.5447, "step": 13920 }, { "epoch": 13.01, "learning_rate": 8.253783783783784e-05, "loss": 0.5141, "step": 13930 }, { "epoch": 13.01, "learning_rate": 8.252432432432433e-05, "loss": 0.5425, "step": 13940 }, { "epoch": 13.01, "learning_rate": 8.25108108108108e-05, "loss": 0.4169, "step": 13950 }, { "epoch": 13.01, "learning_rate": 8.24972972972973e-05, "loss": 0.5987, "step": 13960 }, { "epoch": 13.01, "learning_rate": 8.248378378378378e-05, "loss": 0.5119, "step": 13970 }, { "epoch": 13.01, "learning_rate": 8.247027027027028e-05, "loss": 0.3413, "step": 13980 }, { "epoch": 13.01, "learning_rate": 8.245675675675676e-05, "loss": 0.3748, "step": 13990 }, { "epoch": 13.01, "learning_rate": 8.244324324324325e-05, "loss": 0.4259, "step": 14000 }, { "epoch": 13.01, "eval_loss": 0.12877584993839264, "eval_runtime": 130.7012, "eval_samples_per_second": 27.605, "eval_steps_per_second": 3.451, "eval_wer": 0.1386106322508503, "step": 14000 }, { "epoch": 13.01, "learning_rate": 8.242972972972973e-05, "loss": 0.5691, "step": 14010 }, { "epoch": 13.01, "learning_rate": 8.241621621621623e-05, "loss": 0.4424, "step": 14020 }, { "epoch": 13.01, "learning_rate": 8.240270270270271e-05, "loss": 0.402, "step": 14030 }, { "epoch": 13.01, "learning_rate": 8.23891891891892e-05, "loss": 0.4127, "step": 14040 }, { "epoch": 13.01, "learning_rate": 8.237567567567568e-05, "loss": 0.3816, "step": 14050 }, { "epoch": 13.01, "learning_rate": 8.236216216216217e-05, "loss": 0.3469, "step": 14060 }, { "epoch": 13.01, "learning_rate": 8.234864864864865e-05, "loss": 0.2893, "step": 14070 }, { "epoch": 13.01, "learning_rate": 8.233513513513514e-05, "loss": 0.2368, "step": 14080 }, { "epoch": 13.01, "learning_rate": 8.232162162162162e-05, "loss": 0.4, "step": 14090 }, { "epoch": 13.01, "learning_rate": 8.230810810810812e-05, "loss": 0.7373, "step": 14100 }, { "epoch": 13.01, "learning_rate": 8.22945945945946e-05, "loss": 0.4357, "step": 14110 }, { "epoch": 13.01, "learning_rate": 8.228108108108108e-05, "loss": 0.2791, "step": 14120 }, { "epoch": 13.01, "learning_rate": 8.226756756756757e-05, "loss": 0.3814, "step": 14130 }, { "epoch": 13.01, "learning_rate": 8.225405405405405e-05, "loss": 0.3684, "step": 14140 }, { "epoch": 13.01, "learning_rate": 8.224054054054055e-05, "loss": 0.3793, "step": 14150 }, { "epoch": 13.01, "learning_rate": 8.222702702702703e-05, "loss": 0.5088, "step": 14160 }, { "epoch": 13.01, "learning_rate": 8.221351351351352e-05, "loss": 0.6018, "step": 14170 }, { "epoch": 13.01, "learning_rate": 8.22e-05, "loss": 0.3017, "step": 14180 }, { "epoch": 13.01, "learning_rate": 8.218648648648649e-05, "loss": 0.4029, "step": 14190 }, { "epoch": 13.01, "learning_rate": 8.217297297297297e-05, "loss": 0.3363, "step": 14200 }, { "epoch": 13.01, "learning_rate": 8.215945945945946e-05, "loss": 0.5602, "step": 14210 }, { "epoch": 13.01, "learning_rate": 8.214594594594594e-05, "loss": 0.5997, "step": 14220 }, { "epoch": 13.01, "learning_rate": 8.213243243243244e-05, "loss": 0.5302, "step": 14230 }, { "epoch": 13.01, "learning_rate": 8.211891891891892e-05, "loss": 0.6367, "step": 14240 }, { "epoch": 13.01, "learning_rate": 8.210540540540541e-05, "loss": 0.7905, "step": 14250 }, { "epoch": 13.01, "learning_rate": 8.20918918918919e-05, "loss": 0.6489, "step": 14260 }, { "epoch": 13.01, "learning_rate": 8.207837837837839e-05, "loss": 0.8359, "step": 14270 }, { "epoch": 13.01, "learning_rate": 8.206486486486487e-05, "loss": 0.6174, "step": 14280 }, { "epoch": 13.01, "learning_rate": 8.205135135135135e-05, "loss": 0.5723, "step": 14290 }, { "epoch": 13.01, "learning_rate": 8.203783783783783e-05, "loss": 0.5144, "step": 14300 }, { "epoch": 13.01, "learning_rate": 8.202432432432433e-05, "loss": 0.5097, "step": 14310 }, { "epoch": 13.01, "learning_rate": 8.201081081081081e-05, "loss": 0.7489, "step": 14320 }, { "epoch": 14.0, "learning_rate": 8.19972972972973e-05, "loss": 0.6341, "step": 14330 }, { "epoch": 14.0, "learning_rate": 8.198378378378378e-05, "loss": 0.5345, "step": 14340 }, { "epoch": 14.0, "learning_rate": 8.197027027027028e-05, "loss": 0.5954, "step": 14350 }, { "epoch": 14.0, "learning_rate": 8.195675675675676e-05, "loss": 0.4701, "step": 14360 }, { "epoch": 14.0, "learning_rate": 8.194324324324325e-05, "loss": 0.5009, "step": 14370 }, { "epoch": 14.0, "learning_rate": 8.192972972972973e-05, "loss": 0.4924, "step": 14380 }, { "epoch": 14.0, "learning_rate": 8.191621621621623e-05, "loss": 0.7628, "step": 14390 }, { "epoch": 14.0, "learning_rate": 8.190270270270271e-05, "loss": 0.4891, "step": 14400 }, { "epoch": 14.0, "learning_rate": 8.188918918918919e-05, "loss": 0.5527, "step": 14410 }, { "epoch": 14.0, "learning_rate": 8.187567567567567e-05, "loss": 0.5384, "step": 14420 }, { "epoch": 14.0, "learning_rate": 8.186216216216217e-05, "loss": 0.4888, "step": 14430 }, { "epoch": 14.0, "learning_rate": 8.184864864864865e-05, "loss": 0.4789, "step": 14440 }, { "epoch": 14.0, "learning_rate": 8.183513513513514e-05, "loss": 0.3753, "step": 14450 }, { "epoch": 14.0, "learning_rate": 8.182162162162162e-05, "loss": 0.3179, "step": 14460 }, { "epoch": 14.0, "learning_rate": 8.180810810810812e-05, "loss": 0.3079, "step": 14470 }, { "epoch": 14.0, "learning_rate": 8.17945945945946e-05, "loss": 0.3935, "step": 14480 }, { "epoch": 14.0, "learning_rate": 8.17810810810811e-05, "loss": 1.4521, "step": 14490 }, { "epoch": 14.0, "learning_rate": 8.176756756756757e-05, "loss": 1.6057, "step": 14500 }, { "epoch": 14.0, "eval_loss": 0.1433689296245575, "eval_runtime": 128.9602, "eval_samples_per_second": 27.978, "eval_steps_per_second": 3.497, "eval_wer": 0.1476028514187206, "step": 14500 }, { "epoch": 14.0, "learning_rate": 8.175405405405407e-05, "loss": 2.671, "step": 14510 }, { "epoch": 14.0, "learning_rate": 8.174054054054055e-05, "loss": 2.5001, "step": 14520 }, { "epoch": 14.0, "learning_rate": 8.172702702702703e-05, "loss": 2.6332, "step": 14530 }, { "epoch": 14.0, "learning_rate": 8.171351351351351e-05, "loss": 2.3225, "step": 14540 }, { "epoch": 14.0, "learning_rate": 8.17e-05, "loss": 1.7506, "step": 14550 }, { "epoch": 14.0, "learning_rate": 8.168648648648649e-05, "loss": 1.501, "step": 14560 }, { "epoch": 14.0, "learning_rate": 8.167297297297297e-05, "loss": 0.725, "step": 14570 }, { "epoch": 14.0, "learning_rate": 8.165945945945946e-05, "loss": 0.261, "step": 14580 }, { "epoch": 14.0, "learning_rate": 8.164594594594594e-05, "loss": 0.3251, "step": 14590 }, { "epoch": 14.0, "learning_rate": 8.163243243243244e-05, "loss": 0.2859, "step": 14600 }, { "epoch": 14.0, "learning_rate": 8.161891891891892e-05, "loss": 0.4387, "step": 14610 }, { "epoch": 14.0, "learning_rate": 8.160540540540542e-05, "loss": 0.5359, "step": 14620 }, { "epoch": 14.0, "learning_rate": 8.15918918918919e-05, "loss": 0.4683, "step": 14630 }, { "epoch": 14.0, "learning_rate": 8.157837837837839e-05, "loss": 0.2511, "step": 14640 }, { "epoch": 14.0, "learning_rate": 8.156486486486487e-05, "loss": 0.2601, "step": 14650 }, { "epoch": 14.0, "learning_rate": 8.155135135135135e-05, "loss": 0.3415, "step": 14660 }, { "epoch": 14.0, "learning_rate": 8.153783783783783e-05, "loss": 0.3462, "step": 14670 }, { "epoch": 14.0, "learning_rate": 8.152432432432433e-05, "loss": 0.4335, "step": 14680 }, { "epoch": 14.0, "learning_rate": 8.151081081081081e-05, "loss": 0.3096, "step": 14690 }, { "epoch": 14.01, "learning_rate": 8.14972972972973e-05, "loss": 0.2502, "step": 14700 }, { "epoch": 14.01, "learning_rate": 8.148378378378379e-05, "loss": 0.1906, "step": 14710 }, { "epoch": 14.01, "learning_rate": 8.147027027027028e-05, "loss": 0.1912, "step": 14720 }, { "epoch": 14.01, "learning_rate": 8.145675675675676e-05, "loss": 0.346, "step": 14730 }, { "epoch": 14.01, "learning_rate": 8.144324324324326e-05, "loss": 0.2487, "step": 14740 }, { "epoch": 14.01, "learning_rate": 8.142972972972974e-05, "loss": 0.3115, "step": 14750 }, { "epoch": 14.01, "learning_rate": 8.141621621621622e-05, "loss": 0.3731, "step": 14760 }, { "epoch": 14.01, "learning_rate": 8.14027027027027e-05, "loss": 0.3794, "step": 14770 }, { "epoch": 14.01, "learning_rate": 8.138918918918919e-05, "loss": 0.3413, "step": 14780 }, { "epoch": 14.01, "learning_rate": 8.137567567567567e-05, "loss": 0.4551, "step": 14790 }, { "epoch": 14.01, "learning_rate": 8.136216216216217e-05, "loss": 0.4473, "step": 14800 }, { "epoch": 14.01, "learning_rate": 8.134864864864865e-05, "loss": 0.4964, "step": 14810 }, { "epoch": 14.01, "learning_rate": 8.133513513513514e-05, "loss": 0.5514, "step": 14820 }, { "epoch": 14.01, "learning_rate": 8.132162162162163e-05, "loss": 0.2965, "step": 14830 }, { "epoch": 14.01, "learning_rate": 8.130810810810812e-05, "loss": 0.7011, "step": 14840 }, { "epoch": 14.01, "learning_rate": 8.12945945945946e-05, "loss": 0.6325, "step": 14850 }, { "epoch": 14.01, "learning_rate": 8.12810810810811e-05, "loss": 0.4523, "step": 14860 }, { "epoch": 14.01, "learning_rate": 8.126756756756758e-05, "loss": 0.1901, "step": 14870 }, { "epoch": 14.01, "learning_rate": 8.125405405405406e-05, "loss": 0.3182, "step": 14880 }, { "epoch": 14.01, "learning_rate": 8.124054054054054e-05, "loss": 0.2841, "step": 14890 }, { "epoch": 14.01, "learning_rate": 8.122702702702703e-05, "loss": 0.2555, "step": 14900 }, { "epoch": 14.01, "learning_rate": 8.121351351351351e-05, "loss": 0.2511, "step": 14910 }, { "epoch": 14.01, "learning_rate": 8.120000000000001e-05, "loss": 0.2527, "step": 14920 }, { "epoch": 14.01, "learning_rate": 8.118648648648649e-05, "loss": 0.2447, "step": 14930 }, { "epoch": 14.01, "learning_rate": 8.117297297297297e-05, "loss": 0.4574, "step": 14940 }, { "epoch": 14.01, "learning_rate": 8.115945945945947e-05, "loss": 0.521, "step": 14950 }, { "epoch": 14.01, "learning_rate": 8.114594594594595e-05, "loss": 0.4584, "step": 14960 }, { "epoch": 14.01, "learning_rate": 8.113243243243244e-05, "loss": 0.3934, "step": 14970 }, { "epoch": 14.01, "learning_rate": 8.111891891891892e-05, "loss": 0.6151, "step": 14980 }, { "epoch": 14.01, "learning_rate": 8.110540540540542e-05, "loss": 0.5915, "step": 14990 }, { "epoch": 14.01, "learning_rate": 8.10918918918919e-05, "loss": 0.3242, "step": 15000 }, { "epoch": 14.01, "eval_loss": 0.12805943191051483, "eval_runtime": 129.6116, "eval_samples_per_second": 27.837, "eval_steps_per_second": 3.48, "eval_wer": 0.13506965475469412, "step": 15000 }, { "epoch": 14.01, "learning_rate": 8.107837837837838e-05, "loss": 0.3075, "step": 15010 }, { "epoch": 14.01, "learning_rate": 8.106486486486486e-05, "loss": 0.4028, "step": 15020 }, { "epoch": 14.01, "learning_rate": 8.10527027027027e-05, "loss": 0.5666, "step": 15030 }, { "epoch": 14.01, "learning_rate": 8.103918918918918e-05, "loss": 0.5136, "step": 15040 }, { "epoch": 14.01, "learning_rate": 8.102567567567568e-05, "loss": 0.4072, "step": 15050 }, { "epoch": 14.01, "learning_rate": 8.101216216216216e-05, "loss": 0.4121, "step": 15060 }, { "epoch": 14.01, "learning_rate": 8.099864864864865e-05, "loss": 0.3191, "step": 15070 }, { "epoch": 14.01, "learning_rate": 8.098513513513514e-05, "loss": 0.3291, "step": 15080 }, { "epoch": 14.01, "learning_rate": 8.097162162162163e-05, "loss": 0.3986, "step": 15090 }, { "epoch": 14.01, "learning_rate": 8.095810810810811e-05, "loss": 0.2199, "step": 15100 }, { "epoch": 14.01, "learning_rate": 8.09445945945946e-05, "loss": 0.4096, "step": 15110 }, { "epoch": 14.01, "learning_rate": 8.093108108108109e-05, "loss": 0.5139, "step": 15120 }, { "epoch": 14.01, "learning_rate": 8.091756756756758e-05, "loss": 0.5446, "step": 15130 }, { "epoch": 14.01, "learning_rate": 8.090405405405406e-05, "loss": 0.2385, "step": 15140 }, { "epoch": 14.01, "learning_rate": 8.089054054054054e-05, "loss": 0.3299, "step": 15150 }, { "epoch": 14.01, "learning_rate": 8.087702702702702e-05, "loss": 0.3698, "step": 15160 }, { "epoch": 14.01, "learning_rate": 8.086351351351352e-05, "loss": 0.4283, "step": 15170 }, { "epoch": 14.01, "learning_rate": 8.085e-05, "loss": 0.4394, "step": 15180 }, { "epoch": 14.01, "learning_rate": 8.08364864864865e-05, "loss": 0.5857, "step": 15190 }, { "epoch": 14.01, "learning_rate": 8.082297297297298e-05, "loss": 0.3064, "step": 15200 }, { "epoch": 14.01, "learning_rate": 8.080945945945946e-05, "loss": 0.3648, "step": 15210 }, { "epoch": 14.01, "learning_rate": 8.079594594594595e-05, "loss": 0.3846, "step": 15220 }, { "epoch": 14.01, "learning_rate": 8.078243243243243e-05, "loss": 0.5648, "step": 15230 }, { "epoch": 14.01, "learning_rate": 8.076891891891893e-05, "loss": 0.6005, "step": 15240 }, { "epoch": 14.01, "learning_rate": 8.075540540540541e-05, "loss": 0.576, "step": 15250 }, { "epoch": 14.01, "learning_rate": 8.07418918918919e-05, "loss": 0.58, "step": 15260 }, { "epoch": 14.01, "learning_rate": 8.072837837837838e-05, "loss": 0.8161, "step": 15270 }, { "epoch": 14.01, "learning_rate": 8.071486486486486e-05, "loss": 0.6281, "step": 15280 }, { "epoch": 14.01, "learning_rate": 8.070135135135135e-05, "loss": 0.8454, "step": 15290 }, { "epoch": 14.01, "learning_rate": 8.068783783783784e-05, "loss": 0.6404, "step": 15300 }, { "epoch": 14.01, "learning_rate": 8.067432432432432e-05, "loss": 0.5874, "step": 15310 }, { "epoch": 14.01, "learning_rate": 8.066081081081082e-05, "loss": 0.5725, "step": 15320 }, { "epoch": 14.01, "learning_rate": 8.06472972972973e-05, "loss": 0.5481, "step": 15330 }, { "epoch": 14.01, "learning_rate": 8.063378378378379e-05, "loss": 0.6455, "step": 15340 }, { "epoch": 15.0, "learning_rate": 8.062027027027027e-05, "loss": 0.6629, "step": 15350 }, { "epoch": 15.0, "learning_rate": 8.060675675675677e-05, "loss": 0.5534, "step": 15360 }, { "epoch": 15.0, "learning_rate": 8.059324324324325e-05, "loss": 0.5634, "step": 15370 }, { "epoch": 15.0, "learning_rate": 8.057972972972974e-05, "loss": 0.5042, "step": 15380 }, { "epoch": 15.0, "learning_rate": 8.056621621621622e-05, "loss": 0.4968, "step": 15390 }, { "epoch": 15.0, "learning_rate": 8.05527027027027e-05, "loss": 0.5293, "step": 15400 }, { "epoch": 15.0, "learning_rate": 8.053918918918919e-05, "loss": 0.7052, "step": 15410 }, { "epoch": 15.0, "learning_rate": 8.052567567567568e-05, "loss": 0.5122, "step": 15420 }, { "epoch": 15.0, "learning_rate": 8.051216216216216e-05, "loss": 0.4782, "step": 15430 }, { "epoch": 15.0, "learning_rate": 8.049864864864866e-05, "loss": 0.5617, "step": 15440 }, { "epoch": 15.0, "learning_rate": 8.048513513513514e-05, "loss": 0.5014, "step": 15450 }, { "epoch": 15.0, "learning_rate": 8.047162162162163e-05, "loss": 0.5491, "step": 15460 }, { "epoch": 15.0, "learning_rate": 8.045810810810811e-05, "loss": 0.3763, "step": 15470 }, { "epoch": 15.0, "learning_rate": 8.044459459459461e-05, "loss": 0.3459, "step": 15480 }, { "epoch": 15.0, "learning_rate": 8.043108108108109e-05, "loss": 0.3232, "step": 15490 }, { "epoch": 15.0, "learning_rate": 8.041756756756757e-05, "loss": 0.3671, "step": 15500 }, { "epoch": 15.0, "eval_loss": 0.15460152924060822, "eval_runtime": 130.7683, "eval_samples_per_second": 27.591, "eval_steps_per_second": 3.449, "eval_wer": 0.158318967525509, "step": 15500 }, { "epoch": 15.0, "learning_rate": 8.040405405405405e-05, "loss": 1.1833, "step": 15510 }, { "epoch": 15.0, "learning_rate": 8.039054054054054e-05, "loss": 1.169, "step": 15520 }, { "epoch": 15.0, "learning_rate": 8.037702702702703e-05, "loss": 2.7122, "step": 15530 }, { "epoch": 15.0, "learning_rate": 8.036351351351352e-05, "loss": 2.4789, "step": 15540 }, { "epoch": 15.0, "learning_rate": 8.035e-05, "loss": 2.672, "step": 15550 }, { "epoch": 15.0, "learning_rate": 8.03364864864865e-05, "loss": 2.6436, "step": 15560 }, { "epoch": 15.0, "learning_rate": 8.032297297297298e-05, "loss": 1.647, "step": 15570 }, { "epoch": 15.0, "learning_rate": 8.030945945945947e-05, "loss": 1.7633, "step": 15580 }, { "epoch": 15.0, "learning_rate": 8.029594594594595e-05, "loss": 0.9401, "step": 15590 }, { "epoch": 15.0, "learning_rate": 8.028243243243245e-05, "loss": 0.3546, "step": 15600 }, { "epoch": 15.0, "learning_rate": 8.026891891891893e-05, "loss": 0.2507, "step": 15610 }, { "epoch": 15.0, "learning_rate": 8.025540540540541e-05, "loss": 0.3338, "step": 15620 }, { "epoch": 15.0, "learning_rate": 8.024189189189189e-05, "loss": 0.4008, "step": 15630 }, { "epoch": 15.0, "learning_rate": 8.022837837837837e-05, "loss": 0.4553, "step": 15640 }, { "epoch": 15.0, "learning_rate": 8.021486486486487e-05, "loss": 0.4942, "step": 15650 }, { "epoch": 15.0, "learning_rate": 8.020135135135135e-05, "loss": 0.3217, "step": 15660 }, { "epoch": 15.0, "learning_rate": 8.018783783783784e-05, "loss": 0.232, "step": 15670 }, { "epoch": 15.0, "learning_rate": 8.017432432432432e-05, "loss": 0.3808, "step": 15680 }, { "epoch": 15.0, "learning_rate": 8.016081081081082e-05, "loss": 0.3173, "step": 15690 }, { "epoch": 15.0, "learning_rate": 8.01472972972973e-05, "loss": 0.4102, "step": 15700 }, { "epoch": 15.0, "learning_rate": 8.013378378378379e-05, "loss": 0.3882, "step": 15710 }, { "epoch": 15.01, "learning_rate": 8.012027027027027e-05, "loss": 0.2733, "step": 15720 }, { "epoch": 15.01, "learning_rate": 8.010675675675677e-05, "loss": 0.2237, "step": 15730 }, { "epoch": 15.01, "learning_rate": 8.009324324324325e-05, "loss": 0.1819, "step": 15740 }, { "epoch": 15.01, "learning_rate": 8.007972972972973e-05, "loss": 0.2728, "step": 15750 }, { "epoch": 15.01, "learning_rate": 8.006621621621621e-05, "loss": 0.3077, "step": 15760 }, { "epoch": 15.01, "learning_rate": 8.00527027027027e-05, "loss": 0.3603, "step": 15770 }, { "epoch": 15.01, "learning_rate": 8.003918918918919e-05, "loss": 0.3424, "step": 15780 }, { "epoch": 15.01, "learning_rate": 8.002567567567568e-05, "loss": 0.4165, "step": 15790 }, { "epoch": 15.01, "learning_rate": 8.001216216216216e-05, "loss": 0.303, "step": 15800 }, { "epoch": 15.01, "learning_rate": 7.999864864864866e-05, "loss": 0.4243, "step": 15810 }, { "epoch": 15.01, "learning_rate": 7.998513513513514e-05, "loss": 0.4912, "step": 15820 }, { "epoch": 15.01, "learning_rate": 7.997162162162163e-05, "loss": 0.4991, "step": 15830 }, { "epoch": 15.01, "learning_rate": 7.995810810810811e-05, "loss": 0.4823, "step": 15840 }, { "epoch": 15.01, "learning_rate": 7.99445945945946e-05, "loss": 0.3835, "step": 15850 }, { "epoch": 15.01, "learning_rate": 7.993108108108109e-05, "loss": 0.4958, "step": 15860 }, { "epoch": 15.01, "learning_rate": 7.991756756756757e-05, "loss": 0.7868, "step": 15870 }, { "epoch": 15.01, "learning_rate": 7.990405405405405e-05, "loss": 0.6092, "step": 15880 }, { "epoch": 15.01, "learning_rate": 7.989054054054055e-05, "loss": 0.247, "step": 15890 }, { "epoch": 15.01, "learning_rate": 7.987702702702703e-05, "loss": 0.3259, "step": 15900 }, { "epoch": 15.01, "learning_rate": 7.986351351351352e-05, "loss": 0.2574, "step": 15910 }, { "epoch": 15.01, "learning_rate": 7.985e-05, "loss": 0.2661, "step": 15920 }, { "epoch": 15.01, "learning_rate": 7.98364864864865e-05, "loss": 0.2452, "step": 15930 }, { "epoch": 15.01, "learning_rate": 7.982297297297298e-05, "loss": 0.2309, "step": 15940 }, { "epoch": 15.01, "learning_rate": 7.980945945945947e-05, "loss": 0.2486, "step": 15950 }, { "epoch": 15.01, "learning_rate": 7.979594594594595e-05, "loss": 0.344, "step": 15960 }, { "epoch": 15.01, "learning_rate": 7.978243243243244e-05, "loss": 0.5708, "step": 15970 }, { "epoch": 15.01, "learning_rate": 7.976891891891892e-05, "loss": 0.4729, "step": 15980 }, { "epoch": 15.01, "learning_rate": 7.975540540540541e-05, "loss": 0.3825, "step": 15990 }, { "epoch": 15.01, "learning_rate": 7.974189189189189e-05, "loss": 0.4807, "step": 16000 }, { "epoch": 15.01, "eval_loss": 0.1240745559334755, "eval_runtime": 129.6187, "eval_samples_per_second": 27.835, "eval_steps_per_second": 3.479, "eval_wer": 0.13441736942645482, "step": 16000 }, { "epoch": 15.01, "learning_rate": 7.972837837837839e-05, "loss": 0.6695, "step": 16010 }, { "epoch": 15.01, "learning_rate": 7.971486486486487e-05, "loss": 0.3353, "step": 16020 }, { "epoch": 15.01, "learning_rate": 7.970135135135135e-05, "loss": 0.2649, "step": 16030 }, { "epoch": 15.01, "learning_rate": 7.968783783783784e-05, "loss": 0.4043, "step": 16040 }, { "epoch": 15.01, "learning_rate": 7.967432432432432e-05, "loss": 0.505, "step": 16050 }, { "epoch": 15.01, "learning_rate": 7.966081081081082e-05, "loss": 0.4693, "step": 16060 }, { "epoch": 15.01, "learning_rate": 7.96472972972973e-05, "loss": 0.4367, "step": 16070 }, { "epoch": 15.01, "learning_rate": 7.96337837837838e-05, "loss": 0.402, "step": 16080 }, { "epoch": 15.01, "learning_rate": 7.962027027027028e-05, "loss": 0.3804, "step": 16090 }, { "epoch": 15.01, "learning_rate": 7.960675675675676e-05, "loss": 0.3068, "step": 16100 }, { "epoch": 15.01, "learning_rate": 7.959324324324324e-05, "loss": 0.4079, "step": 16110 }, { "epoch": 15.01, "learning_rate": 7.957972972972973e-05, "loss": 0.2305, "step": 16120 }, { "epoch": 15.01, "learning_rate": 7.956621621621621e-05, "loss": 0.287, "step": 16130 }, { "epoch": 15.01, "learning_rate": 7.955270270270271e-05, "loss": 0.4427, "step": 16140 }, { "epoch": 15.01, "learning_rate": 7.953918918918919e-05, "loss": 0.7631, "step": 16150 }, { "epoch": 15.01, "learning_rate": 7.952567567567568e-05, "loss": 0.2665, "step": 16160 }, { "epoch": 15.01, "learning_rate": 7.951216216216216e-05, "loss": 0.3035, "step": 16170 }, { "epoch": 15.01, "learning_rate": 7.949864864864866e-05, "loss": 0.3758, "step": 16180 }, { "epoch": 15.01, "learning_rate": 7.948513513513514e-05, "loss": 0.3474, "step": 16190 }, { "epoch": 15.01, "learning_rate": 7.947162162162163e-05, "loss": 0.3693, "step": 16200 }, { "epoch": 15.01, "learning_rate": 7.945810810810812e-05, "loss": 0.4554, "step": 16210 }, { "epoch": 15.01, "learning_rate": 7.94445945945946e-05, "loss": 0.4415, "step": 16220 }, { "epoch": 15.01, "learning_rate": 7.943108108108108e-05, "loss": 0.298, "step": 16230 }, { "epoch": 15.01, "learning_rate": 7.941756756756757e-05, "loss": 0.4008, "step": 16240 }, { "epoch": 15.01, "learning_rate": 7.940405405405405e-05, "loss": 0.5038, "step": 16250 }, { "epoch": 15.01, "learning_rate": 7.939054054054055e-05, "loss": 0.4584, "step": 16260 }, { "epoch": 15.01, "learning_rate": 7.937702702702703e-05, "loss": 0.5274, "step": 16270 }, { "epoch": 15.01, "learning_rate": 7.936351351351352e-05, "loss": 0.5089, "step": 16280 }, { "epoch": 15.01, "learning_rate": 7.935e-05, "loss": 0.7511, "step": 16290 }, { "epoch": 15.01, "learning_rate": 7.93364864864865e-05, "loss": 0.5638, "step": 16300 }, { "epoch": 15.01, "learning_rate": 7.932297297297298e-05, "loss": 0.7934, "step": 16310 }, { "epoch": 15.01, "learning_rate": 7.930945945945946e-05, "loss": 0.6758, "step": 16320 }, { "epoch": 15.01, "learning_rate": 7.929594594594594e-05, "loss": 0.5177, "step": 16330 }, { "epoch": 15.01, "learning_rate": 7.928243243243244e-05, "loss": 0.4837, "step": 16340 }, { "epoch": 15.01, "learning_rate": 7.926891891891892e-05, "loss": 0.5213, "step": 16350 }, { "epoch": 15.01, "learning_rate": 7.925540540540541e-05, "loss": 0.5502, "step": 16360 }, { "epoch": 16.0, "learning_rate": 7.924189189189189e-05, "loss": 0.6568, "step": 16370 }, { "epoch": 16.0, "learning_rate": 7.922837837837839e-05, "loss": 0.5301, "step": 16380 }, { "epoch": 16.0, "learning_rate": 7.921486486486487e-05, "loss": 0.5211, "step": 16390 }, { "epoch": 16.0, "learning_rate": 7.920135135135136e-05, "loss": 0.5462, "step": 16400 }, { "epoch": 16.0, "learning_rate": 7.918783783783784e-05, "loss": 0.4601, "step": 16410 }, { "epoch": 16.0, "learning_rate": 7.917432432432433e-05, "loss": 0.522, "step": 16420 }, { "epoch": 16.0, "learning_rate": 7.916081081081082e-05, "loss": 0.593, "step": 16430 }, { "epoch": 16.0, "learning_rate": 7.91472972972973e-05, "loss": 0.6311, "step": 16440 }, { "epoch": 16.0, "learning_rate": 7.913378378378378e-05, "loss": 0.501, "step": 16450 }, { "epoch": 16.0, "learning_rate": 7.912027027027026e-05, "loss": 0.5547, "step": 16460 }, { "epoch": 16.0, "learning_rate": 7.910675675675676e-05, "loss": 0.5181, "step": 16470 }, { "epoch": 16.0, "learning_rate": 7.909324324324324e-05, "loss": 0.4838, "step": 16480 }, { "epoch": 16.0, "learning_rate": 7.907972972972973e-05, "loss": 0.4438, "step": 16490 }, { "epoch": 16.0, "learning_rate": 7.906621621621621e-05, "loss": 0.3233, "step": 16500 }, { "epoch": 16.0, "eval_loss": 0.1575058251619339, "eval_runtime": 133.2387, "eval_samples_per_second": 27.079, "eval_steps_per_second": 3.385, "eval_wer": 0.16041559893770674, "step": 16500 }, { "epoch": 16.0, "learning_rate": 7.905270270270271e-05, "loss": 0.3342, "step": 16510 }, { "epoch": 16.0, "learning_rate": 7.903918918918919e-05, "loss": 0.3087, "step": 16520 }, { "epoch": 16.0, "learning_rate": 7.902567567567568e-05, "loss": 0.8746, "step": 16530 }, { "epoch": 16.0, "learning_rate": 7.901216216216217e-05, "loss": 1.0915, "step": 16540 }, { "epoch": 16.0, "learning_rate": 7.899864864864866e-05, "loss": 2.4031, "step": 16550 }, { "epoch": 16.0, "learning_rate": 7.898513513513514e-05, "loss": 2.578, "step": 16560 }, { "epoch": 16.0, "learning_rate": 7.897162162162162e-05, "loss": 2.5281, "step": 16570 }, { "epoch": 16.0, "learning_rate": 7.89581081081081e-05, "loss": 2.6187, "step": 16580 }, { "epoch": 16.0, "learning_rate": 7.89445945945946e-05, "loss": 1.9944, "step": 16590 }, { "epoch": 16.0, "learning_rate": 7.893108108108108e-05, "loss": 1.7631, "step": 16600 }, { "epoch": 16.0, "learning_rate": 7.891756756756757e-05, "loss": 1.0247, "step": 16610 }, { "epoch": 16.0, "learning_rate": 7.890405405405405e-05, "loss": 0.4983, "step": 16620 }, { "epoch": 16.0, "learning_rate": 7.889054054054055e-05, "loss": 0.1962, "step": 16630 }, { "epoch": 16.0, "learning_rate": 7.887702702702703e-05, "loss": 0.344, "step": 16640 }, { "epoch": 16.0, "learning_rate": 7.886351351351352e-05, "loss": 0.3637, "step": 16650 }, { "epoch": 16.0, "learning_rate": 7.885e-05, "loss": 0.3745, "step": 16660 }, { "epoch": 16.0, "learning_rate": 7.88364864864865e-05, "loss": 0.5849, "step": 16670 }, { "epoch": 16.0, "learning_rate": 7.882297297297298e-05, "loss": 0.3322, "step": 16680 }, { "epoch": 16.0, "learning_rate": 7.880945945945946e-05, "loss": 0.2152, "step": 16690 }, { "epoch": 16.0, "learning_rate": 7.879594594594594e-05, "loss": 0.3465, "step": 16700 }, { "epoch": 16.0, "learning_rate": 7.878243243243244e-05, "loss": 0.2604, "step": 16710 }, { "epoch": 16.0, "learning_rate": 7.876891891891892e-05, "loss": 0.3972, "step": 16720 }, { "epoch": 16.0, "learning_rate": 7.875540540540541e-05, "loss": 0.3428, "step": 16730 }, { "epoch": 16.0, "learning_rate": 7.87418918918919e-05, "loss": 0.2522, "step": 16740 }, { "epoch": 16.01, "learning_rate": 7.872837837837839e-05, "loss": 0.3086, "step": 16750 }, { "epoch": 16.01, "learning_rate": 7.871486486486487e-05, "loss": 0.164, "step": 16760 }, { "epoch": 16.01, "learning_rate": 7.870135135135136e-05, "loss": 0.265, "step": 16770 }, { "epoch": 16.01, "learning_rate": 7.868783783783785e-05, "loss": 0.2949, "step": 16780 }, { "epoch": 16.01, "learning_rate": 7.867432432432433e-05, "loss": 0.2148, "step": 16790 }, { "epoch": 16.01, "learning_rate": 7.866081081081081e-05, "loss": 0.3078, "step": 16800 }, { "epoch": 16.01, "learning_rate": 7.86472972972973e-05, "loss": 0.4156, "step": 16810 }, { "epoch": 16.01, "learning_rate": 7.863378378378378e-05, "loss": 0.3088, "step": 16820 }, { "epoch": 16.01, "learning_rate": 7.862027027027026e-05, "loss": 0.3847, "step": 16830 }, { "epoch": 16.01, "learning_rate": 7.860675675675676e-05, "loss": 0.4949, "step": 16840 }, { "epoch": 16.01, "learning_rate": 7.859324324324324e-05, "loss": 0.4344, "step": 16850 }, { "epoch": 16.01, "learning_rate": 7.857972972972973e-05, "loss": 0.5611, "step": 16860 }, { "epoch": 16.01, "learning_rate": 7.856621621621622e-05, "loss": 0.4489, "step": 16870 }, { "epoch": 16.01, "learning_rate": 7.855270270270271e-05, "loss": 0.4117, "step": 16880 }, { "epoch": 16.01, "learning_rate": 7.853918918918919e-05, "loss": 0.7927, "step": 16890 }, { "epoch": 16.01, "learning_rate": 7.852567567567569e-05, "loss": 0.6944, "step": 16900 }, { "epoch": 16.01, "learning_rate": 7.851216216216217e-05, "loss": 0.303, "step": 16910 }, { "epoch": 16.01, "learning_rate": 7.849864864864865e-05, "loss": 0.2339, "step": 16920 }, { "epoch": 16.01, "learning_rate": 7.848513513513513e-05, "loss": 0.3128, "step": 16930 }, { "epoch": 16.01, "learning_rate": 7.847162162162162e-05, "loss": 0.2514, "step": 16940 }, { "epoch": 16.01, "learning_rate": 7.84581081081081e-05, "loss": 0.2335, "step": 16950 }, { "epoch": 16.01, "learning_rate": 7.84445945945946e-05, "loss": 0.2514, "step": 16960 }, { "epoch": 16.01, "learning_rate": 7.843108108108108e-05, "loss": 0.2545, "step": 16970 }, { "epoch": 16.01, "learning_rate": 7.841756756756757e-05, "loss": 0.2766, "step": 16980 }, { "epoch": 16.01, "learning_rate": 7.840405405405406e-05, "loss": 0.5465, "step": 16990 }, { "epoch": 16.01, "learning_rate": 7.839054054054055e-05, "loss": 0.4601, "step": 17000 }, { "epoch": 16.01, "eval_loss": 0.13551324605941772, "eval_runtime": 130.7771, "eval_samples_per_second": 27.589, "eval_steps_per_second": 3.449, "eval_wer": 0.14252434422028606, "step": 17000 }, { "epoch": 16.01, "learning_rate": 7.837702702702703e-05, "loss": 0.4131, "step": 17010 }, { "epoch": 16.01, "learning_rate": 7.836351351351353e-05, "loss": 0.4443, "step": 17020 }, { "epoch": 16.01, "learning_rate": 7.835000000000001e-05, "loss": 0.5621, "step": 17030 }, { "epoch": 16.01, "learning_rate": 7.833648648648649e-05, "loss": 0.4102, "step": 17040 }, { "epoch": 16.01, "learning_rate": 7.832297297297297e-05, "loss": 0.2675, "step": 17050 }, { "epoch": 16.01, "learning_rate": 7.830945945945946e-05, "loss": 0.3307, "step": 17060 }, { "epoch": 16.01, "learning_rate": 7.829594594594594e-05, "loss": 0.4319, "step": 17070 }, { "epoch": 16.01, "learning_rate": 7.828243243243244e-05, "loss": 0.4431, "step": 17080 }, { "epoch": 16.01, "learning_rate": 7.826891891891892e-05, "loss": 0.3902, "step": 17090 }, { "epoch": 16.01, "learning_rate": 7.825540540540541e-05, "loss": 0.3627, "step": 17100 }, { "epoch": 16.01, "learning_rate": 7.82418918918919e-05, "loss": 0.3981, "step": 17110 }, { "epoch": 16.01, "learning_rate": 7.822837837837839e-05, "loss": 0.3234, "step": 17120 }, { "epoch": 16.01, "learning_rate": 7.821486486486487e-05, "loss": 0.3112, "step": 17130 }, { "epoch": 16.01, "learning_rate": 7.820135135135137e-05, "loss": 0.2303, "step": 17140 }, { "epoch": 16.01, "learning_rate": 7.818783783783785e-05, "loss": 0.1838, "step": 17150 }, { "epoch": 16.01, "learning_rate": 7.817432432432433e-05, "loss": 0.3827, "step": 17160 }, { "epoch": 16.01, "learning_rate": 7.816081081081081e-05, "loss": 0.7938, "step": 17170 }, { "epoch": 16.01, "learning_rate": 7.81472972972973e-05, "loss": 0.3636, "step": 17180 }, { "epoch": 16.01, "learning_rate": 7.813378378378378e-05, "loss": 0.2819, "step": 17190 }, { "epoch": 16.01, "learning_rate": 7.812027027027028e-05, "loss": 0.365, "step": 17200 }, { "epoch": 16.01, "learning_rate": 7.810675675675676e-05, "loss": 0.3112, "step": 17210 }, { "epoch": 16.01, "learning_rate": 7.809324324324324e-05, "loss": 0.3728, "step": 17220 }, { "epoch": 16.01, "learning_rate": 7.807972972972974e-05, "loss": 0.4685, "step": 17230 }, { "epoch": 16.01, "learning_rate": 7.806621621621622e-05, "loss": 0.4407, "step": 17240 }, { "epoch": 16.01, "learning_rate": 7.805270270270271e-05, "loss": 0.2793, "step": 17250 }, { "epoch": 16.01, "learning_rate": 7.803918918918919e-05, "loss": 0.3899, "step": 17260 }, { "epoch": 16.01, "learning_rate": 7.802567567567567e-05, "loss": 0.3733, "step": 17270 }, { "epoch": 16.01, "learning_rate": 7.801216216216215e-05, "loss": 0.6168, "step": 17280 }, { "epoch": 16.01, "learning_rate": 7.799864864864865e-05, "loss": 0.5629, "step": 17290 }, { "epoch": 16.01, "learning_rate": 7.798513513513513e-05, "loss": 0.4894, "step": 17300 }, { "epoch": 16.01, "learning_rate": 7.797162162162163e-05, "loss": 0.6873, "step": 17310 }, { "epoch": 16.01, "learning_rate": 7.79581081081081e-05, "loss": 0.6353, "step": 17320 }, { "epoch": 16.01, "learning_rate": 7.79445945945946e-05, "loss": 0.5931, "step": 17330 }, { "epoch": 16.01, "learning_rate": 7.793108108108108e-05, "loss": 0.7208, "step": 17340 }, { "epoch": 16.01, "learning_rate": 7.791756756756758e-05, "loss": 0.531, "step": 17350 }, { "epoch": 16.01, "learning_rate": 7.790405405405406e-05, "loss": 0.6041, "step": 17360 }, { "epoch": 16.01, "learning_rate": 7.789054054054055e-05, "loss": 0.5736, "step": 17370 }, { "epoch": 16.01, "learning_rate": 7.787702702702703e-05, "loss": 0.5476, "step": 17380 }, { "epoch": 16.01, "learning_rate": 7.786351351351351e-05, "loss": 0.7599, "step": 17390 }, { "epoch": 17.0, "learning_rate": 7.785e-05, "loss": 0.5896, "step": 17400 }, { "epoch": 17.0, "learning_rate": 7.783648648648649e-05, "loss": 0.5472, "step": 17410 }, { "epoch": 17.0, "learning_rate": 7.782297297297297e-05, "loss": 0.5624, "step": 17420 }, { "epoch": 17.0, "learning_rate": 7.780945945945947e-05, "loss": 0.4651, "step": 17430 }, { "epoch": 17.0, "learning_rate": 7.779594594594595e-05, "loss": 0.501, "step": 17440 }, { "epoch": 17.0, "learning_rate": 7.778243243243244e-05, "loss": 0.4712, "step": 17450 }, { "epoch": 17.0, "learning_rate": 7.776891891891892e-05, "loss": 0.7017, "step": 17460 }, { "epoch": 17.0, "learning_rate": 7.775540540540542e-05, "loss": 0.4803, "step": 17470 }, { "epoch": 17.0, "learning_rate": 7.77418918918919e-05, "loss": 0.5302, "step": 17480 }, { "epoch": 17.0, "learning_rate": 7.772837837837839e-05, "loss": 0.5389, "step": 17490 }, { "epoch": 17.0, "learning_rate": 7.771486486486487e-05, "loss": 0.4699, "step": 17500 }, { "epoch": 17.0, "eval_loss": 0.14289720356464386, "eval_runtime": 130.2341, "eval_samples_per_second": 27.704, "eval_steps_per_second": 3.463, "eval_wer": 0.1471369333271211, "step": 17500 }, { "epoch": 17.0, "learning_rate": 7.770135135135135e-05, "loss": 0.4756, "step": 17510 }, { "epoch": 17.0, "learning_rate": 7.768783783783784e-05, "loss": 0.3455, "step": 17520 }, { "epoch": 17.0, "learning_rate": 7.767432432432433e-05, "loss": 0.3009, "step": 17530 }, { "epoch": 17.0, "learning_rate": 7.766081081081081e-05, "loss": 0.3375, "step": 17540 }, { "epoch": 17.0, "learning_rate": 7.76472972972973e-05, "loss": 0.4251, "step": 17550 }, { "epoch": 17.0, "learning_rate": 7.763378378378379e-05, "loss": 1.476, "step": 17560 }, { "epoch": 17.0, "learning_rate": 7.762027027027028e-05, "loss": 1.7802, "step": 17570 }, { "epoch": 17.0, "learning_rate": 7.760675675675676e-05, "loss": 2.6503, "step": 17580 }, { "epoch": 17.0, "learning_rate": 7.759324324324326e-05, "loss": 2.4926, "step": 17590 }, { "epoch": 17.0, "learning_rate": 7.757972972972974e-05, "loss": 2.6115, "step": 17600 }, { "epoch": 17.0, "learning_rate": 7.756621621621623e-05, "loss": 2.1764, "step": 17610 }, { "epoch": 17.0, "learning_rate": 7.755270270270271e-05, "loss": 1.6546, "step": 17620 }, { "epoch": 17.0, "learning_rate": 7.75391891891892e-05, "loss": 1.2824, "step": 17630 }, { "epoch": 17.0, "learning_rate": 7.752567567567568e-05, "loss": 0.6734, "step": 17640 }, { "epoch": 17.0, "learning_rate": 7.751216216216216e-05, "loss": 0.1884, "step": 17650 }, { "epoch": 17.0, "learning_rate": 7.749864864864865e-05, "loss": 0.3785, "step": 17660 }, { "epoch": 17.0, "learning_rate": 7.748513513513513e-05, "loss": 0.2736, "step": 17670 }, { "epoch": 17.0, "learning_rate": 7.747162162162163e-05, "loss": 0.4262, "step": 17680 }, { "epoch": 17.0, "learning_rate": 7.745810810810811e-05, "loss": 0.5528, "step": 17690 }, { "epoch": 17.0, "learning_rate": 7.74445945945946e-05, "loss": 0.4257, "step": 17700 }, { "epoch": 17.0, "learning_rate": 7.743108108108108e-05, "loss": 0.2285, "step": 17710 }, { "epoch": 17.0, "learning_rate": 7.741756756756758e-05, "loss": 0.3112, "step": 17720 }, { "epoch": 17.0, "learning_rate": 7.740405405405406e-05, "loss": 0.2759, "step": 17730 }, { "epoch": 17.0, "learning_rate": 7.739054054054054e-05, "loss": 0.2776, "step": 17740 }, { "epoch": 17.0, "learning_rate": 7.737702702702702e-05, "loss": 0.4162, "step": 17750 }, { "epoch": 17.0, "learning_rate": 7.736351351351352e-05, "loss": 0.2953, "step": 17760 }, { "epoch": 17.01, "learning_rate": 7.735e-05, "loss": 0.2607, "step": 17770 }, { "epoch": 17.01, "learning_rate": 7.733648648648649e-05, "loss": 0.1951, "step": 17780 }, { "epoch": 17.01, "learning_rate": 7.732297297297297e-05, "loss": 0.1989, "step": 17790 }, { "epoch": 17.01, "learning_rate": 7.730945945945947e-05, "loss": 0.2768, "step": 17800 }, { "epoch": 17.01, "learning_rate": 7.729594594594595e-05, "loss": 0.2, "step": 17810 }, { "epoch": 17.01, "learning_rate": 7.728243243243244e-05, "loss": 0.2828, "step": 17820 }, { "epoch": 17.01, "learning_rate": 7.726891891891892e-05, "loss": 0.386, "step": 17830 }, { "epoch": 17.01, "learning_rate": 7.725540540540542e-05, "loss": 0.411, "step": 17840 }, { "epoch": 17.01, "learning_rate": 7.72418918918919e-05, "loss": 0.3566, "step": 17850 }, { "epoch": 17.01, "learning_rate": 7.722837837837838e-05, "loss": 0.4277, "step": 17860 }, { "epoch": 17.01, "learning_rate": 7.721486486486486e-05, "loss": 0.4475, "step": 17870 }, { "epoch": 17.01, "learning_rate": 7.720135135135136e-05, "loss": 0.5039, "step": 17880 }, { "epoch": 17.01, "learning_rate": 7.718783783783784e-05, "loss": 0.5249, "step": 17890 }, { "epoch": 17.01, "learning_rate": 7.717432432432433e-05, "loss": 0.3265, "step": 17900 }, { "epoch": 17.01, "learning_rate": 7.716081081081081e-05, "loss": 0.5893, "step": 17910 }, { "epoch": 17.01, "learning_rate": 7.71472972972973e-05, "loss": 0.6742, "step": 17920 }, { "epoch": 17.01, "learning_rate": 7.713378378378379e-05, "loss": 0.427, "step": 17930 }, { "epoch": 17.01, "learning_rate": 7.712027027027028e-05, "loss": 0.1811, "step": 17940 }, { "epoch": 17.01, "learning_rate": 7.710675675675676e-05, "loss": 0.3855, "step": 17950 }, { "epoch": 17.01, "learning_rate": 7.709324324324326e-05, "loss": 0.28, "step": 17960 }, { "epoch": 17.01, "learning_rate": 7.707972972972974e-05, "loss": 0.2744, "step": 17970 }, { "epoch": 17.01, "learning_rate": 7.706621621621622e-05, "loss": 0.2714, "step": 17980 }, { "epoch": 17.01, "learning_rate": 7.70527027027027e-05, "loss": 0.2422, "step": 17990 }, { "epoch": 17.01, "learning_rate": 7.70391891891892e-05, "loss": 0.2277, "step": 18000 }, { "epoch": 17.01, "eval_loss": 0.1268441528081894, "eval_runtime": 127.9517, "eval_samples_per_second": 28.198, "eval_steps_per_second": 3.525, "eval_wer": 0.1329730233424964, "step": 18000 }, { "epoch": 17.01, "learning_rate": 7.702567567567568e-05, "loss": 0.4365, "step": 18010 }, { "epoch": 17.01, "learning_rate": 7.701216216216217e-05, "loss": 0.4802, "step": 18020 }, { "epoch": 17.01, "learning_rate": 7.699864864864865e-05, "loss": 0.4504, "step": 18030 }, { "epoch": 17.01, "learning_rate": 7.698513513513513e-05, "loss": 0.4038, "step": 18040 }, { "epoch": 17.01, "learning_rate": 7.697162162162163e-05, "loss": 0.5162, "step": 18050 }, { "epoch": 17.01, "learning_rate": 7.695810810810811e-05, "loss": 0.4978, "step": 18060 }, { "epoch": 17.01, "learning_rate": 7.69445945945946e-05, "loss": 0.307, "step": 18070 }, { "epoch": 17.01, "learning_rate": 7.693108108108108e-05, "loss": 0.2959, "step": 18080 }, { "epoch": 17.01, "learning_rate": 7.691756756756757e-05, "loss": 0.3857, "step": 18090 }, { "epoch": 17.01, "learning_rate": 7.690405405405405e-05, "loss": 0.5023, "step": 18100 }, { "epoch": 17.01, "learning_rate": 7.689054054054054e-05, "loss": 0.4852, "step": 18110 }, { "epoch": 17.01, "learning_rate": 7.687702702702702e-05, "loss": 0.3204, "step": 18120 }, { "epoch": 17.01, "learning_rate": 7.686351351351352e-05, "loss": 0.3898, "step": 18130 }, { "epoch": 17.01, "learning_rate": 7.685e-05, "loss": 0.3163, "step": 18140 }, { "epoch": 17.01, "learning_rate": 7.683648648648649e-05, "loss": 0.2995, "step": 18150 }, { "epoch": 17.01, "learning_rate": 7.682297297297297e-05, "loss": 0.3289, "step": 18160 }, { "epoch": 17.01, "learning_rate": 7.680945945945947e-05, "loss": 0.1953, "step": 18170 }, { "epoch": 17.01, "learning_rate": 7.679594594594595e-05, "loss": 0.3633, "step": 18180 }, { "epoch": 17.01, "learning_rate": 7.678243243243244e-05, "loss": 0.5665, "step": 18190 }, { "epoch": 17.01, "learning_rate": 7.676891891891892e-05, "loss": 0.5019, "step": 18200 }, { "epoch": 17.01, "learning_rate": 7.67554054054054e-05, "loss": 0.2567, "step": 18210 }, { "epoch": 17.01, "learning_rate": 7.674189189189189e-05, "loss": 0.288, "step": 18220 }, { "epoch": 17.01, "learning_rate": 7.672837837837838e-05, "loss": 0.3649, "step": 18230 }, { "epoch": 17.01, "learning_rate": 7.671486486486486e-05, "loss": 0.3576, "step": 18240 }, { "epoch": 17.01, "learning_rate": 7.670135135135136e-05, "loss": 0.4297, "step": 18250 }, { "epoch": 17.01, "learning_rate": 7.668783783783784e-05, "loss": 0.4873, "step": 18260 }, { "epoch": 17.01, "learning_rate": 7.667432432432433e-05, "loss": 0.3248, "step": 18270 }, { "epoch": 17.01, "learning_rate": 7.666081081081081e-05, "loss": 0.3613, "step": 18280 }, { "epoch": 17.01, "learning_rate": 7.664729729729731e-05, "loss": 0.3452, "step": 18290 }, { "epoch": 17.01, "learning_rate": 7.663378378378379e-05, "loss": 0.517, "step": 18300 }, { "epoch": 17.01, "learning_rate": 7.662027027027028e-05, "loss": 0.557, "step": 18310 }, { "epoch": 17.01, "learning_rate": 7.660675675675676e-05, "loss": 0.5541, "step": 18320 }, { "epoch": 17.01, "learning_rate": 7.659324324324325e-05, "loss": 0.4852, "step": 18330 }, { "epoch": 17.01, "learning_rate": 7.657972972972973e-05, "loss": 0.7001, "step": 18340 }, { "epoch": 17.01, "learning_rate": 7.656621621621622e-05, "loss": 0.6317, "step": 18350 }, { "epoch": 17.01, "learning_rate": 7.65527027027027e-05, "loss": 0.778, "step": 18360 }, { "epoch": 17.01, "learning_rate": 7.65391891891892e-05, "loss": 0.544, "step": 18370 }, { "epoch": 17.01, "learning_rate": 7.652567567567568e-05, "loss": 0.5194, "step": 18380 }, { "epoch": 17.01, "learning_rate": 7.651216216216217e-05, "loss": 0.4859, "step": 18390 }, { "epoch": 17.01, "learning_rate": 7.649864864864865e-05, "loss": 0.4833, "step": 18400 }, { "epoch": 17.01, "learning_rate": 7.648513513513515e-05, "loss": 0.6181, "step": 18410 }, { "epoch": 18.0, "learning_rate": 7.647162162162163e-05, "loss": 0.5963, "step": 18420 }, { "epoch": 18.0, "learning_rate": 7.645810810810811e-05, "loss": 0.5302, "step": 18430 }, { "epoch": 18.0, "learning_rate": 7.64445945945946e-05, "loss": 0.5749, "step": 18440 }, { "epoch": 18.0, "learning_rate": 7.643108108108109e-05, "loss": 0.4641, "step": 18450 }, { "epoch": 18.0, "learning_rate": 7.641756756756757e-05, "loss": 0.487, "step": 18460 }, { "epoch": 18.0, "learning_rate": 7.640405405405405e-05, "loss": 0.5102, "step": 18470 }, { "epoch": 18.0, "learning_rate": 7.639054054054054e-05, "loss": 0.7349, "step": 18480 }, { "epoch": 18.0, "learning_rate": 7.637702702702702e-05, "loss": 0.4991, "step": 18490 }, { "epoch": 18.0, "learning_rate": 7.636351351351352e-05, "loss": 0.4472, "step": 18500 }, { "epoch": 18.0, "eval_loss": 0.13492043316364288, "eval_runtime": 129.8001, "eval_samples_per_second": 27.797, "eval_steps_per_second": 3.475, "eval_wer": 0.1383310813958906, "step": 18500 }, { "epoch": 18.0, "learning_rate": 7.635e-05, "loss": 0.509, "step": 18510 }, { "epoch": 18.0, "learning_rate": 7.63364864864865e-05, "loss": 0.4876, "step": 18520 }, { "epoch": 18.0, "learning_rate": 7.632297297297297e-05, "loss": 0.494, "step": 18530 }, { "epoch": 18.0, "learning_rate": 7.630945945945947e-05, "loss": 0.3385, "step": 18540 }, { "epoch": 18.0, "learning_rate": 7.629594594594595e-05, "loss": 0.2942, "step": 18550 }, { "epoch": 18.0, "learning_rate": 7.628243243243243e-05, "loss": 0.3326, "step": 18560 }, { "epoch": 18.0, "learning_rate": 7.626891891891891e-05, "loss": 0.3162, "step": 18570 }, { "epoch": 18.0, "learning_rate": 7.625540540540541e-05, "loss": 1.2909, "step": 18580 }, { "epoch": 18.0, "learning_rate": 7.624189189189189e-05, "loss": 1.3133, "step": 18590 }, { "epoch": 18.0, "learning_rate": 7.622837837837838e-05, "loss": 2.6373, "step": 18600 }, { "epoch": 18.0, "learning_rate": 7.621486486486486e-05, "loss": 2.4631, "step": 18610 }, { "epoch": 18.0, "learning_rate": 7.620135135135136e-05, "loss": 2.6128, "step": 18620 }, { "epoch": 18.0, "learning_rate": 7.618783783783784e-05, "loss": 2.5176, "step": 18630 }, { "epoch": 18.0, "learning_rate": 7.617432432432433e-05, "loss": 1.6144, "step": 18640 }, { "epoch": 18.0, "learning_rate": 7.616081081081081e-05, "loss": 1.6019, "step": 18650 }, { "epoch": 18.0, "learning_rate": 7.614729729729731e-05, "loss": 0.8426, "step": 18660 }, { "epoch": 18.0, "learning_rate": 7.613378378378379e-05, "loss": 0.2981, "step": 18670 }, { "epoch": 18.0, "learning_rate": 7.612027027027027e-05, "loss": 0.2928, "step": 18680 }, { "epoch": 18.0, "learning_rate": 7.610675675675675e-05, "loss": 0.2893, "step": 18690 }, { "epoch": 18.0, "learning_rate": 7.609324324324325e-05, "loss": 0.3979, "step": 18700 }, { "epoch": 18.0, "learning_rate": 7.607972972972973e-05, "loss": 0.4791, "step": 18710 }, { "epoch": 18.0, "learning_rate": 7.606621621621622e-05, "loss": 0.538, "step": 18720 }, { "epoch": 18.0, "learning_rate": 7.60527027027027e-05, "loss": 0.2737, "step": 18730 }, { "epoch": 18.0, "learning_rate": 7.60391891891892e-05, "loss": 0.238, "step": 18740 }, { "epoch": 18.0, "learning_rate": 7.602567567567568e-05, "loss": 0.3895, "step": 18750 }, { "epoch": 18.0, "learning_rate": 7.601216216216217e-05, "loss": 0.2977, "step": 18760 }, { "epoch": 18.0, "learning_rate": 7.599864864864865e-05, "loss": 0.3879, "step": 18770 }, { "epoch": 18.0, "learning_rate": 7.598513513513515e-05, "loss": 0.3052, "step": 18780 }, { "epoch": 18.01, "learning_rate": 7.597162162162163e-05, "loss": 0.2748, "step": 18790 }, { "epoch": 18.01, "learning_rate": 7.595810810810811e-05, "loss": 0.2206, "step": 18800 }, { "epoch": 18.01, "learning_rate": 7.594459459459459e-05, "loss": 0.2093, "step": 18810 }, { "epoch": 18.01, "learning_rate": 7.593108108108109e-05, "loss": 0.282, "step": 18820 }, { "epoch": 18.01, "learning_rate": 7.591756756756757e-05, "loss": 0.2314, "step": 18830 }, { "epoch": 18.01, "learning_rate": 7.590405405405405e-05, "loss": 0.2494, "step": 18840 }, { "epoch": 18.01, "learning_rate": 7.589054054054054e-05, "loss": 0.3164, "step": 18850 }, { "epoch": 18.01, "learning_rate": 7.587702702702702e-05, "loss": 0.4196, "step": 18860 }, { "epoch": 18.01, "learning_rate": 7.586351351351352e-05, "loss": 0.3123, "step": 18870 }, { "epoch": 18.01, "learning_rate": 7.585e-05, "loss": 0.4595, "step": 18880 }, { "epoch": 18.01, "learning_rate": 7.58364864864865e-05, "loss": 0.4233, "step": 18890 }, { "epoch": 18.01, "learning_rate": 7.582297297297298e-05, "loss": 0.4777, "step": 18900 }, { "epoch": 18.01, "learning_rate": 7.580945945945947e-05, "loss": 0.4486, "step": 18910 }, { "epoch": 18.01, "learning_rate": 7.579594594594595e-05, "loss": 0.3358, "step": 18920 }, { "epoch": 18.01, "learning_rate": 7.578243243243243e-05, "loss": 0.4984, "step": 18930 }, { "epoch": 18.01, "learning_rate": 7.576891891891891e-05, "loss": 0.6726, "step": 18940 }, { "epoch": 18.01, "learning_rate": 7.575540540540541e-05, "loss": 0.542, "step": 18950 }, { "epoch": 18.01, "learning_rate": 7.574189189189189e-05, "loss": 0.2174, "step": 18960 }, { "epoch": 18.01, "learning_rate": 7.572837837837838e-05, "loss": 0.2753, "step": 18970 }, { "epoch": 18.01, "learning_rate": 7.571486486486487e-05, "loss": 0.2989, "step": 18980 }, { "epoch": 18.01, "learning_rate": 7.570135135135136e-05, "loss": 0.2531, "step": 18990 }, { "epoch": 18.01, "learning_rate": 7.568783783783784e-05, "loss": 0.2611, "step": 19000 }, { "epoch": 18.01, "eval_loss": 0.12401454150676727, "eval_runtime": 128.6611, "eval_samples_per_second": 28.043, "eval_steps_per_second": 3.505, "eval_wer": 0.12854680147230116, "step": 19000 }, { "epoch": 18.01, "learning_rate": 7.567432432432434e-05, "loss": 0.2305, "step": 19010 }, { "epoch": 18.01, "learning_rate": 7.566081081081082e-05, "loss": 0.2309, "step": 19020 }, { "epoch": 18.01, "learning_rate": 7.56472972972973e-05, "loss": 0.3396, "step": 19030 }, { "epoch": 18.01, "learning_rate": 7.563378378378378e-05, "loss": 0.5302, "step": 19040 }, { "epoch": 18.01, "learning_rate": 7.562027027027027e-05, "loss": 0.4675, "step": 19050 }, { "epoch": 18.01, "learning_rate": 7.560675675675675e-05, "loss": 0.3014, "step": 19060 }, { "epoch": 18.01, "learning_rate": 7.559324324324325e-05, "loss": 0.4737, "step": 19070 }, { "epoch": 18.01, "learning_rate": 7.557972972972973e-05, "loss": 0.5653, "step": 19080 }, { "epoch": 18.01, "learning_rate": 7.556621621621622e-05, "loss": 0.3169, "step": 19090 }, { "epoch": 18.01, "learning_rate": 7.55527027027027e-05, "loss": 0.2601, "step": 19100 }, { "epoch": 18.01, "learning_rate": 7.55391891891892e-05, "loss": 0.3747, "step": 19110 }, { "epoch": 18.01, "learning_rate": 7.552567567567568e-05, "loss": 0.4457, "step": 19120 }, { "epoch": 18.01, "learning_rate": 7.551216216216218e-05, "loss": 0.4672, "step": 19130 }, { "epoch": 18.01, "learning_rate": 7.549864864864866e-05, "loss": 0.4156, "step": 19140 }, { "epoch": 18.01, "learning_rate": 7.548513513513514e-05, "loss": 0.3392, "step": 19150 }, { "epoch": 18.01, "learning_rate": 7.547162162162162e-05, "loss": 0.362, "step": 19160 }, { "epoch": 18.01, "learning_rate": 7.545810810810811e-05, "loss": 0.2983, "step": 19170 }, { "epoch": 18.01, "learning_rate": 7.54445945945946e-05, "loss": 0.3484, "step": 19180 }, { "epoch": 18.01, "learning_rate": 7.543108108108109e-05, "loss": 0.1829, "step": 19190 }, { "epoch": 18.01, "learning_rate": 7.541756756756757e-05, "loss": 0.2829, "step": 19200 }, { "epoch": 18.01, "learning_rate": 7.540405405405406e-05, "loss": 0.4345, "step": 19210 }, { "epoch": 18.01, "learning_rate": 7.539054054054055e-05, "loss": 0.7288, "step": 19220 }, { "epoch": 18.01, "learning_rate": 7.537702702702703e-05, "loss": 0.2809, "step": 19230 }, { "epoch": 18.01, "learning_rate": 7.536351351351352e-05, "loss": 0.2593, "step": 19240 }, { "epoch": 18.01, "learning_rate": 7.535e-05, "loss": 0.3349, "step": 19250 }, { "epoch": 18.01, "learning_rate": 7.53364864864865e-05, "loss": 0.387, "step": 19260 }, { "epoch": 18.01, "learning_rate": 7.532297297297298e-05, "loss": 0.3308, "step": 19270 }, { "epoch": 18.01, "learning_rate": 7.530945945945946e-05, "loss": 0.5337, "step": 19280 }, { "epoch": 18.01, "learning_rate": 7.529594594594594e-05, "loss": 0.3509, "step": 19290 }, { "epoch": 18.01, "learning_rate": 7.528243243243243e-05, "loss": 0.3379, "step": 19300 }, { "epoch": 18.01, "learning_rate": 7.526891891891892e-05, "loss": 0.3643, "step": 19310 }, { "epoch": 18.01, "learning_rate": 7.525540540540541e-05, "loss": 0.4566, "step": 19320 }, { "epoch": 18.01, "learning_rate": 7.524189189189189e-05, "loss": 0.4993, "step": 19330 }, { "epoch": 18.01, "learning_rate": 7.522837837837839e-05, "loss": 0.5514, "step": 19340 }, { "epoch": 18.01, "learning_rate": 7.521486486486487e-05, "loss": 0.4835, "step": 19350 }, { "epoch": 18.01, "learning_rate": 7.520135135135136e-05, "loss": 0.7703, "step": 19360 }, { "epoch": 18.01, "learning_rate": 7.518783783783784e-05, "loss": 0.6487, "step": 19370 }, { "epoch": 18.01, "learning_rate": 7.517432432432434e-05, "loss": 0.7236, "step": 19380 }, { "epoch": 18.01, "learning_rate": 7.516081081081082e-05, "loss": 0.5741, "step": 19390 }, { "epoch": 18.01, "learning_rate": 7.51472972972973e-05, "loss": 0.4986, "step": 19400 }, { "epoch": 18.01, "learning_rate": 7.513378378378378e-05, "loss": 0.5082, "step": 19410 }, { "epoch": 18.01, "learning_rate": 7.512027027027027e-05, "loss": 0.5468, "step": 19420 }, { "epoch": 18.01, "learning_rate": 7.510675675675676e-05, "loss": 0.5325, "step": 19430 }, { "epoch": 19.0, "learning_rate": 7.509324324324325e-05, "loss": 0.6897, "step": 19440 }, { "epoch": 19.0, "learning_rate": 7.507972972972973e-05, "loss": 0.5308, "step": 19450 }, { "epoch": 19.0, "learning_rate": 7.506621621621623e-05, "loss": 0.5734, "step": 19460 }, { "epoch": 19.0, "learning_rate": 7.50527027027027e-05, "loss": 0.5251, "step": 19470 }, { "epoch": 19.0, "learning_rate": 7.50391891891892e-05, "loss": 0.4579, "step": 19480 }, { "epoch": 19.0, "learning_rate": 7.502567567567568e-05, "loss": 0.4969, "step": 19490 }, { "epoch": 19.0, "learning_rate": 7.501216216216216e-05, "loss": 0.5479, "step": 19500 }, { "epoch": 19.0, "eval_loss": 0.1393987089395523, "eval_runtime": 129.1648, "eval_samples_per_second": 27.933, "eval_steps_per_second": 3.492, "eval_wer": 0.14476075105996367, "step": 19500 }, { "epoch": 19.0, "learning_rate": 7.499864864864864e-05, "loss": 0.6081, "step": 19510 }, { "epoch": 19.0, "learning_rate": 7.498513513513514e-05, "loss": 0.4454, "step": 19520 }, { "epoch": 19.0, "learning_rate": 7.497162162162162e-05, "loss": 0.5435, "step": 19530 }, { "epoch": 19.0, "learning_rate": 7.495810810810811e-05, "loss": 0.4908, "step": 19540 }, { "epoch": 19.0, "learning_rate": 7.49445945945946e-05, "loss": 0.4902, "step": 19550 }, { "epoch": 19.0, "learning_rate": 7.493108108108109e-05, "loss": 0.3445, "step": 19560 }, { "epoch": 19.0, "learning_rate": 7.491756756756757e-05, "loss": 0.2916, "step": 19570 }, { "epoch": 19.0, "learning_rate": 7.490405405405407e-05, "loss": 0.3001, "step": 19580 }, { "epoch": 19.0, "learning_rate": 7.489054054054055e-05, "loss": 0.3103, "step": 19590 }, { "epoch": 19.0, "learning_rate": 7.487702702702704e-05, "loss": 0.9982, "step": 19600 }, { "epoch": 19.0, "learning_rate": 7.486351351351352e-05, "loss": 0.9466, "step": 19610 }, { "epoch": 19.0, "learning_rate": 7.485e-05, "loss": 2.5676, "step": 19620 }, { "epoch": 19.0, "learning_rate": 7.483648648648648e-05, "loss": 2.5595, "step": 19630 }, { "epoch": 19.0, "learning_rate": 7.482297297297297e-05, "loss": 2.4945, "step": 19640 }, { "epoch": 19.0, "learning_rate": 7.480945945945946e-05, "loss": 2.5984, "step": 19650 }, { "epoch": 19.0, "learning_rate": 7.479594594594594e-05, "loss": 1.7561, "step": 19660 }, { "epoch": 19.0, "learning_rate": 7.478243243243244e-05, "loss": 1.5891, "step": 19670 }, { "epoch": 19.0, "learning_rate": 7.476891891891892e-05, "loss": 0.9733, "step": 19680 }, { "epoch": 19.0, "learning_rate": 7.475540540540541e-05, "loss": 0.442, "step": 19690 }, { "epoch": 19.0, "learning_rate": 7.474189189189189e-05, "loss": 0.1787, "step": 19700 }, { "epoch": 19.0, "learning_rate": 7.472837837837839e-05, "loss": 0.3395, "step": 19710 }, { "epoch": 19.0, "learning_rate": 7.471486486486487e-05, "loss": 0.3805, "step": 19720 }, { "epoch": 19.0, "learning_rate": 7.470135135135136e-05, "loss": 0.448, "step": 19730 }, { "epoch": 19.0, "learning_rate": 7.468783783783784e-05, "loss": 0.4977, "step": 19740 }, { "epoch": 19.0, "learning_rate": 7.467432432432432e-05, "loss": 0.2898, "step": 19750 }, { "epoch": 19.0, "learning_rate": 7.46608108108108e-05, "loss": 0.1868, "step": 19760 }, { "epoch": 19.0, "learning_rate": 7.46472972972973e-05, "loss": 0.3616, "step": 19770 }, { "epoch": 19.0, "learning_rate": 7.463378378378378e-05, "loss": 0.2104, "step": 19780 }, { "epoch": 19.0, "learning_rate": 7.462027027027028e-05, "loss": 0.3756, "step": 19790 }, { "epoch": 19.0, "learning_rate": 7.460675675675676e-05, "loss": 0.3116, "step": 19800 }, { "epoch": 19.0, "learning_rate": 7.459324324324325e-05, "loss": 0.2656, "step": 19810 }, { "epoch": 19.01, "learning_rate": 7.457972972972973e-05, "loss": 0.2425, "step": 19820 }, { "epoch": 19.01, "learning_rate": 7.456621621621623e-05, "loss": 0.1414, "step": 19830 }, { "epoch": 19.01, "learning_rate": 7.455270270270271e-05, "loss": 0.2967, "step": 19840 }, { "epoch": 19.01, "learning_rate": 7.45391891891892e-05, "loss": 0.2877, "step": 19850 }, { "epoch": 19.01, "learning_rate": 7.452567567567568e-05, "loss": 0.2051, "step": 19860 }, { "epoch": 19.01, "learning_rate": 7.451216216216216e-05, "loss": 0.2523, "step": 19870 }, { "epoch": 19.01, "learning_rate": 7.449864864864865e-05, "loss": 0.419, "step": 19880 }, { "epoch": 19.01, "learning_rate": 7.448513513513514e-05, "loss": 0.3508, "step": 19890 }, { "epoch": 19.01, "learning_rate": 7.447162162162162e-05, "loss": 0.349, "step": 19900 }, { "epoch": 19.01, "learning_rate": 7.445810810810812e-05, "loss": 0.4537, "step": 19910 }, { "epoch": 19.01, "learning_rate": 7.44445945945946e-05, "loss": 0.3706, "step": 19920 }, { "epoch": 19.01, "learning_rate": 7.443108108108109e-05, "loss": 0.5275, "step": 19930 }, { "epoch": 19.01, "learning_rate": 7.441756756756757e-05, "loss": 0.3779, "step": 19940 }, { "epoch": 19.01, "learning_rate": 7.440405405405407e-05, "loss": 0.3721, "step": 19950 }, { "epoch": 19.01, "learning_rate": 7.439054054054055e-05, "loss": 0.7378, "step": 19960 }, { "epoch": 19.01, "learning_rate": 7.437702702702703e-05, "loss": 0.6086, "step": 19970 }, { "epoch": 19.01, "learning_rate": 7.436351351351351e-05, "loss": 0.2475, "step": 19980 }, { "epoch": 19.01, "learning_rate": 7.435e-05, "loss": 0.242, "step": 19990 }, { "epoch": 19.01, "learning_rate": 7.433648648648649e-05, "loss": 0.301, "step": 20000 }, { "epoch": 19.01, "eval_loss": 0.12247521430253983, "eval_runtime": 128.4783, "eval_samples_per_second": 28.083, "eval_steps_per_second": 3.51, "eval_wer": 0.12542515025858453, "step": 20000 } ], "max_steps": 75000, "num_train_epochs": 9223372036854775807, "total_flos": 1.3193673854990254e+20, "trial_name": null, "trial_params": null }