diff --git "a/trainer_state.json" "b/trainer_state.json" --- "a/trainer_state.json" +++ "b/trainer_state.json" @@ -1,2635 +1,26125 @@ { - "best_metric": 0.5104931592941284, - "best_model_checkpoint": "ai-light-dance_singing3_ft_wav2vec2-large-xlsr-53-v2/checkpoint-1872", - "epoch": 49.996539792387544, - "global_step": 3600, + "best_metric": 0.4760190546512604, + "best_model_checkpoint": "ai-light-dance_singing3_ft_wav2vec2-large-xlsr-53-v2/checkpoint-7416", + "epoch": 499.9965397923875, + "global_step": 36000, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.14, - "learning_rate": 1.0000000000000002e-06, - "loss": 0.6213, + "learning_rate": 4.0000000000000003e-07, + "loss": 0.522, "step": 10 }, { "epoch": 0.28, - "learning_rate": 1.9000000000000002e-06, - "loss": 0.639, + "learning_rate": 8.000000000000001e-07, + "loss": 0.5382, "step": 20 }, { "epoch": 0.42, - "learning_rate": 2.9e-06, - "loss": 0.6243, + "learning_rate": 1.1600000000000001e-06, + "loss": 0.5121, "step": 30 }, { "epoch": 0.55, - "learning_rate": 3.900000000000001e-06, - "loss": 0.6178, + "learning_rate": 1.56e-06, + "loss": 0.5194, "step": 40 }, { "epoch": 0.69, - "learning_rate": 4.9000000000000005e-06, - "loss": 0.5815, + "learning_rate": 1.9600000000000003e-06, + "loss": 0.5153, "step": 50 }, { "epoch": 0.83, - "learning_rate": 4.9887323943661975e-06, - "loss": 0.5894, + "learning_rate": 2.3600000000000003e-06, + "loss": 0.5172, "step": 60 }, { "epoch": 0.97, - "learning_rate": 4.974647887323944e-06, - "loss": 0.6154, + "learning_rate": 2.7600000000000003e-06, + "loss": 0.5306, "step": 70 }, { "epoch": 1.0, - "eval_loss": 0.526593804359436, - "eval_runtime": 128.5544, - "eval_samples_per_second": 4.138, - "eval_steps_per_second": 0.521, - "eval_wer": 0.2550620299543614, + "eval_loss": 0.5237026810646057, + "eval_runtime": 125.6242, + "eval_samples_per_second": 4.235, + "eval_steps_per_second": 0.533, + "eval_wer": 0.2540978337725783, "step": 72 }, { "epoch": 1.11, - "learning_rate": 4.96056338028169e-06, - "loss": 0.6172, + "learning_rate": 3.1600000000000002e-06, + "loss": 0.5346, "step": 80 }, { "epoch": 1.25, - "learning_rate": 4.946478873239437e-06, - "loss": 0.6082, + "learning_rate": 3.5600000000000002e-06, + "loss": 0.527, "step": 90 }, { "epoch": 1.39, - "learning_rate": 4.932394366197184e-06, - "loss": 0.5951, + "learning_rate": 3.96e-06, + "loss": 0.5134, "step": 100 }, { "epoch": 1.53, - "learning_rate": 4.91830985915493e-06, - "loss": 0.6139, + "learning_rate": 4.360000000000001e-06, + "loss": 0.5272, "step": 110 }, { "epoch": 1.66, - "learning_rate": 4.904225352112677e-06, - "loss": 0.5957, + "learning_rate": 4.76e-06, + "loss": 0.5219, "step": 120 }, { "epoch": 1.8, - "learning_rate": 4.890140845070423e-06, - "loss": 0.6248, + "learning_rate": 5.1600000000000006e-06, + "loss": 0.547, "step": 130 }, { "epoch": 1.94, - "learning_rate": 4.876056338028169e-06, - "loss": 0.5958, + "learning_rate": 5.560000000000001e-06, + "loss": 0.5218, "step": 140 }, { "epoch": 2.0, - "eval_loss": 0.5272348523139954, - "eval_runtime": 129.1192, - "eval_samples_per_second": 4.12, - "eval_steps_per_second": 0.519, - "eval_wer": 0.2585974159542328, + "eval_loss": 0.5389940738677979, + "eval_runtime": 125.5064, + "eval_samples_per_second": 4.239, + "eval_steps_per_second": 0.534, + "eval_wer": 0.26361123609950504, "step": 144 }, { "epoch": 2.08, - "learning_rate": 4.861971830985916e-06, - "loss": 0.6125, + "learning_rate": 5.9600000000000005e-06, + "loss": 0.5389, "step": 150 }, { "epoch": 2.22, - "learning_rate": 4.847887323943662e-06, - "loss": 0.6002, + "learning_rate": 6.360000000000001e-06, + "loss": 0.5246, "step": 160 }, { "epoch": 2.36, - "learning_rate": 4.833802816901409e-06, - "loss": 0.5946, + "learning_rate": 6.760000000000001e-06, + "loss": 0.5348, "step": 170 }, { "epoch": 2.5, - "learning_rate": 4.819718309859156e-06, - "loss": 0.586, + "learning_rate": 7.16e-06, + "loss": 0.5225, "step": 180 }, { "epoch": 2.64, - "learning_rate": 4.805633802816902e-06, - "loss": 0.5792, + "learning_rate": 7.5600000000000005e-06, + "loss": 0.5137, "step": 190 }, { "epoch": 2.78, - "learning_rate": 4.7915492957746485e-06, - "loss": 0.5761, + "learning_rate": 7.960000000000002e-06, + "loss": 0.5378, "step": 200 }, { "epoch": 2.91, - "learning_rate": 4.777464788732395e-06, - "loss": 0.5825, + "learning_rate": 8.36e-06, + "loss": 0.521, "step": 210 }, { "epoch": 3.0, - "eval_loss": 0.5249173641204834, - "eval_runtime": 127.7312, - "eval_samples_per_second": 4.165, - "eval_steps_per_second": 0.525, - "eval_wer": 0.25866169569968506, + "eval_loss": 0.5434454679489136, + "eval_runtime": 125.9155, + "eval_samples_per_second": 4.225, + "eval_steps_per_second": 0.532, + "eval_wer": 0.2615542842450344, "step": 216 }, { "epoch": 3.06, - "learning_rate": 4.763380281690141e-06, - "loss": 0.5987, + "learning_rate": 8.76e-06, + "loss": 0.5338, "step": 220 }, { "epoch": 3.19, - "learning_rate": 4.749295774647888e-06, - "loss": 0.5777, + "learning_rate": 9.16e-06, + "loss": 0.5217, "step": 230 }, { "epoch": 3.33, - "learning_rate": 4.735211267605635e-06, - "loss": 0.61, + "learning_rate": 9.56e-06, + "loss": 0.5455, "step": 240 }, { "epoch": 3.47, - "learning_rate": 4.721126760563381e-06, - "loss": 0.5833, + "learning_rate": 9.960000000000001e-06, + "loss": 0.5247, "step": 250 }, { "epoch": 3.61, - "learning_rate": 4.707042253521127e-06, - "loss": 0.5848, + "learning_rate": 1.036e-05, + "loss": 0.5325, "step": 260 }, { "epoch": 3.75, - "learning_rate": 4.692957746478873e-06, - "loss": 0.5808, + "learning_rate": 1.0760000000000002e-05, + "loss": 0.5356, "step": 270 }, { "epoch": 3.89, - "learning_rate": 4.6788732394366195e-06, - "loss": 0.5717, + "learning_rate": 1.1160000000000002e-05, + "loss": 0.525, "step": 280 }, { "epoch": 4.0, - "eval_loss": 0.5236164927482605, - "eval_runtime": 127.5564, - "eval_samples_per_second": 4.171, - "eval_steps_per_second": 0.525, - "eval_wer": 0.2570547020633798, + "eval_loss": 0.5434799790382385, + "eval_runtime": 126.1498, + "eval_samples_per_second": 4.217, + "eval_steps_per_second": 0.531, + "eval_wer": 0.2616185639904866, "step": 288 }, { "epoch": 4.03, - "learning_rate": 4.664788732394367e-06, - "loss": 0.6055, + "learning_rate": 1.156e-05, + "loss": 0.5554, "step": 290 }, { "epoch": 4.17, - "learning_rate": 4.650704225352113e-06, - "loss": 0.5704, + "learning_rate": 1.196e-05, + "loss": 0.5343, "step": 300 }, { "epoch": 4.3, - "learning_rate": 4.6366197183098594e-06, - "loss": 0.5835, + "learning_rate": 1.236e-05, + "loss": 0.53, "step": 310 }, { "epoch": 4.44, - "learning_rate": 4.622535211267606e-06, - "loss": 0.5677, + "learning_rate": 1.2760000000000001e-05, + "loss": 0.5606, "step": 320 }, { "epoch": 4.58, - "learning_rate": 4.608450704225352e-06, - "loss": 0.5799, + "learning_rate": 1.3160000000000001e-05, + "loss": 0.5644, "step": 330 }, { "epoch": 4.72, - "learning_rate": 4.5943661971830986e-06, - "loss": 0.576, + "learning_rate": 1.3560000000000002e-05, + "loss": 0.5555, "step": 340 }, { "epoch": 4.86, - "learning_rate": 4.580281690140845e-06, - "loss": 0.5975, + "learning_rate": 1.396e-05, + "loss": 0.5526, "step": 350 }, { "epoch": 5.0, - "learning_rate": 4.566197183098592e-06, - "loss": 0.5831, + "learning_rate": 1.4360000000000001e-05, + "loss": 0.5519, "step": 360 }, { "epoch": 5.0, - "eval_loss": 0.5202789306640625, - "eval_runtime": 129.1161, - "eval_samples_per_second": 4.12, - "eval_steps_per_second": 0.519, - "eval_wer": 0.25898309442694606, + "eval_loss": 0.5476202964782715, + "eval_runtime": 127.1416, + "eval_samples_per_second": 4.184, + "eval_steps_per_second": 0.527, + "eval_wer": 0.269782091662917, "step": 360 }, { "epoch": 5.14, - "learning_rate": 4.5521126760563385e-06, - "loss": 0.58, + "learning_rate": 1.4760000000000001e-05, + "loss": 0.5547, "step": 370 }, { "epoch": 5.28, - "learning_rate": 4.538028169014085e-06, - "loss": 0.5869, + "learning_rate": 1.516e-05, + "loss": 0.5652, "step": 380 }, { "epoch": 5.42, - "learning_rate": 4.523943661971831e-06, - "loss": 0.5603, + "learning_rate": 1.556e-05, + "loss": 0.5459, "step": 390 }, { "epoch": 5.55, - "learning_rate": 4.509859154929578e-06, - "loss": 0.5657, + "learning_rate": 1.5960000000000003e-05, + "loss": 0.5331, "step": 400 }, { "epoch": 5.69, - "learning_rate": 4.495774647887324e-06, - "loss": 0.5846, + "learning_rate": 1.636e-05, + "loss": 0.5525, "step": 410 }, { "epoch": 5.83, - "learning_rate": 4.48169014084507e-06, - "loss": 0.5951, + "learning_rate": 1.6760000000000002e-05, + "loss": 0.5566, "step": 420 }, { "epoch": 5.97, - "learning_rate": 4.467605633802818e-06, - "loss": 0.5652, + "learning_rate": 1.7160000000000002e-05, + "loss": 0.5521, "step": 430 }, { "epoch": 6.0, - "eval_loss": 0.5126761198043823, - "eval_runtime": 126.6507, - "eval_samples_per_second": 4.201, - "eval_steps_per_second": 0.529, - "eval_wer": 0.2575046602815453, + "eval_loss": 0.5425682663917542, + "eval_runtime": 125.628, + "eval_samples_per_second": 4.235, + "eval_steps_per_second": 0.533, + "eval_wer": 0.27813845857170405, "step": 432 }, { "epoch": 6.11, - "learning_rate": 4.453521126760564e-06, - "loss": 0.5965, + "learning_rate": 1.756e-05, + "loss": 0.5759, "step": 440 }, { "epoch": 6.25, - "learning_rate": 4.43943661971831e-06, - "loss": 0.5641, + "learning_rate": 1.796e-05, + "loss": 0.5361, "step": 450 }, { "epoch": 6.39, - "learning_rate": 4.425352112676057e-06, - "loss": 0.5547, + "learning_rate": 1.8360000000000004e-05, + "loss": 0.5339, "step": 460 }, { "epoch": 6.53, - "learning_rate": 4.411267605633803e-06, - "loss": 0.5849, + "learning_rate": 1.876e-05, + "loss": 0.5618, "step": 470 }, { "epoch": 6.66, - "learning_rate": 4.3971830985915495e-06, - "loss": 0.5665, + "learning_rate": 1.916e-05, + "loss": 0.548, "step": 480 }, { "epoch": 6.8, - "learning_rate": 4.383098591549296e-06, - "loss": 0.5666, + "learning_rate": 1.9560000000000002e-05, + "loss": 0.5482, "step": 490 }, { "epoch": 6.94, - "learning_rate": 4.369014084507043e-06, - "loss": 0.5665, + "learning_rate": 1.9960000000000002e-05, + "loss": 0.5345, "step": 500 }, { "epoch": 7.0, - "eval_loss": 0.5228902101516724, - "eval_runtime": 126.6048, - "eval_samples_per_second": 4.202, - "eval_steps_per_second": 0.529, - "eval_wer": 0.25866169569968506, + "eval_loss": 0.550900399684906, + "eval_runtime": 125.972, + "eval_samples_per_second": 4.223, + "eval_steps_per_second": 0.532, + "eval_wer": 0.27228900173555315, "step": 504 }, { "epoch": 7.08, - "learning_rate": 4.3549295774647895e-06, - "loss": 0.5989, + "learning_rate": 2.036e-05, + "loss": 0.5896, "step": 510 }, { "epoch": 7.22, - "learning_rate": 4.340845070422536e-06, - "loss": 0.5625, + "learning_rate": 2.076e-05, + "loss": 0.5467, "step": 520 }, { "epoch": 7.36, - "learning_rate": 4.326760563380282e-06, - "loss": 0.5827, + "learning_rate": 2.1160000000000004e-05, + "loss": 0.5625, "step": 530 }, { "epoch": 7.5, - "learning_rate": 4.312676056338029e-06, - "loss": 0.5864, + "learning_rate": 2.1560000000000004e-05, + "loss": 0.5562, "step": 540 }, { "epoch": 7.64, - "learning_rate": 4.298591549295775e-06, - "loss": 0.5555, + "learning_rate": 2.1960000000000003e-05, + "loss": 0.5282, "step": 550 }, { "epoch": 7.78, - "learning_rate": 4.284507042253521e-06, - "loss": 0.5606, + "learning_rate": 2.2360000000000003e-05, + "loss": 0.5616, "step": 560 }, { "epoch": 7.91, - "learning_rate": 4.270422535211268e-06, - "loss": 0.5625, + "learning_rate": 2.276e-05, + "loss": 0.5505, "step": 570 }, { "epoch": 8.0, - "eval_loss": 0.5248023867607117, - "eval_runtime": 127.7741, - "eval_samples_per_second": 4.164, - "eval_steps_per_second": 0.524, - "eval_wer": 0.25474063122710033, + "eval_loss": 0.5417599678039551, + "eval_runtime": 125.5651, + "eval_samples_per_second": 4.237, + "eval_steps_per_second": 0.534, + "eval_wer": 0.2686893359902295, "step": 576 }, { "epoch": 8.06, - "learning_rate": 4.256338028169014e-06, - "loss": 0.5798, + "learning_rate": 2.3160000000000002e-05, + "loss": 0.5659, "step": 580 }, { "epoch": 8.19, - "learning_rate": 4.2422535211267605e-06, - "loss": 0.5645, + "learning_rate": 2.356e-05, + "loss": 0.547, "step": 590 }, { "epoch": 8.33, - "learning_rate": 4.228169014084507e-06, - "loss": 0.5717, + "learning_rate": 2.396e-05, + "loss": 0.5481, "step": 600 }, { "epoch": 8.47, - "learning_rate": 4.214084507042254e-06, - "loss": 0.5617, + "learning_rate": 2.436e-05, + "loss": 0.5509, "step": 610 }, { "epoch": 8.61, - "learning_rate": 4.2000000000000004e-06, - "loss": 0.564, + "learning_rate": 2.4760000000000003e-05, + "loss": 0.5596, "step": 620 }, { "epoch": 8.75, - "learning_rate": 4.185915492957747e-06, - "loss": 0.5758, + "learning_rate": 2.5160000000000003e-05, + "loss": 0.5582, "step": 630 }, { "epoch": 8.89, - "learning_rate": 4.171830985915493e-06, - "loss": 0.5661, + "learning_rate": 2.5560000000000003e-05, + "loss": 0.5457, "step": 640 }, { "epoch": 9.0, - "eval_loss": 0.5213830471038818, - "eval_runtime": 127.0111, - "eval_samples_per_second": 4.189, - "eval_steps_per_second": 0.528, - "eval_wer": 0.25576910715433565, + "eval_loss": 0.52699875831604, + "eval_runtime": 126.6817, + "eval_samples_per_second": 4.2, + "eval_steps_per_second": 0.529, + "eval_wer": 0.2650253904994536, "step": 648 }, { "epoch": 9.03, - "learning_rate": 4.1577464788732396e-06, - "loss": 0.6023, + "learning_rate": 2.5960000000000002e-05, + "loss": 0.577, "step": 650 }, { "epoch": 9.17, - "learning_rate": 4.143661971830986e-06, - "loss": 0.5642, + "learning_rate": 2.6360000000000002e-05, + "loss": 0.5584, "step": 660 }, { "epoch": 9.3, - "learning_rate": 4.129577464788732e-06, - "loss": 0.5741, + "learning_rate": 2.6760000000000005e-05, + "loss": 0.5667, "step": 670 }, { "epoch": 9.44, - "learning_rate": 4.1154929577464795e-06, - "loss": 0.5746, + "learning_rate": 2.7160000000000004e-05, + "loss": 0.5583, "step": 680 }, { "epoch": 9.58, - "learning_rate": 4.101408450704226e-06, - "loss": 0.5749, + "learning_rate": 2.756e-05, + "loss": 0.5663, "step": 690 }, { "epoch": 9.72, - "learning_rate": 4.087323943661972e-06, - "loss": 0.5623, + "learning_rate": 2.796e-05, + "loss": 0.5551, "step": 700 }, { "epoch": 9.86, - "learning_rate": 4.073239436619719e-06, - "loss": 0.5628, + "learning_rate": 2.836e-05, + "loss": 0.5564, "step": 710 }, { "epoch": 10.0, - "learning_rate": 4.059154929577465e-06, - "loss": 0.5583, + "learning_rate": 2.8760000000000002e-05, + "loss": 0.5733, "step": 720 }, { "epoch": 10.0, - "eval_loss": 0.5196737051010132, - "eval_runtime": 128.0441, - "eval_samples_per_second": 4.155, - "eval_steps_per_second": 0.523, - "eval_wer": 0.2582117374815196, + "eval_loss": 0.5815369486808777, + "eval_runtime": 125.0916, + "eval_samples_per_second": 4.253, + "eval_steps_per_second": 0.536, + "eval_wer": 0.2787812560262261, "step": 720 }, { "epoch": 10.14, - "learning_rate": 4.045070422535211e-06, - "loss": 0.5656, + "learning_rate": 2.9160000000000002e-05, + "loss": 0.5675, "step": 730 }, { "epoch": 10.28, - "learning_rate": 4.030985915492958e-06, - "loss": 0.5687, + "learning_rate": 2.956e-05, + "loss": 0.6122, "step": 740 }, { "epoch": 10.42, - "learning_rate": 4.016901408450705e-06, - "loss": 0.5569, + "learning_rate": 2.996e-05, + "loss": 0.6002, "step": 750 }, { "epoch": 10.55, - "learning_rate": 4.002816901408451e-06, - "loss": 0.5771, + "learning_rate": 3.0360000000000004e-05, + "loss": 0.5954, "step": 760 }, { "epoch": 10.69, - "learning_rate": 3.988732394366198e-06, - "loss": 0.568, + "learning_rate": 3.0760000000000004e-05, + "loss": 0.5676, "step": 770 }, { "epoch": 10.83, - "learning_rate": 3.974647887323944e-06, - "loss": 0.5699, + "learning_rate": 3.1160000000000007e-05, + "loss": 0.5556, "step": 780 }, { "epoch": 10.97, - "learning_rate": 3.9605633802816905e-06, - "loss": 0.5605, + "learning_rate": 3.156e-05, + "loss": 0.554, "step": 790 }, { "epoch": 11.0, - "eval_loss": 0.5212803483009338, - "eval_runtime": 127.3424, - "eval_samples_per_second": 4.178, - "eval_steps_per_second": 0.526, - "eval_wer": 0.26110432602686895, + "eval_loss": 0.5523175597190857, + "eval_runtime": 125.5875, + "eval_samples_per_second": 4.236, + "eval_steps_per_second": 0.533, + "eval_wer": 0.2777527800989908, "step": 792 }, { "epoch": 11.11, - "learning_rate": 3.946478873239437e-06, - "loss": 0.5823, + "learning_rate": 3.1960000000000006e-05, + "loss": 0.5909, "step": 800 }, { "epoch": 11.25, - "learning_rate": 3.932394366197183e-06, - "loss": 0.5739, + "learning_rate": 3.236e-05, + "loss": 0.5588, "step": 810 }, { "epoch": 11.39, - "learning_rate": 3.9183098591549305e-06, - "loss": 0.5539, + "learning_rate": 3.276e-05, + "loss": 0.5456, "step": 820 }, { "epoch": 11.53, - "learning_rate": 3.904225352112677e-06, - "loss": 0.5672, + "learning_rate": 3.316e-05, + "loss": 0.5619, "step": 830 }, { "epoch": 11.66, - "learning_rate": 3.890140845070423e-06, - "loss": 0.557, + "learning_rate": 3.3560000000000004e-05, + "loss": 0.5599, "step": 840 }, { "epoch": 11.8, - "learning_rate": 3.87605633802817e-06, - "loss": 0.5711, + "learning_rate": 3.396e-05, + "loss": 0.5651, "step": 850 }, { "epoch": 11.94, - "learning_rate": 3.861971830985915e-06, - "loss": 0.5784, + "learning_rate": 3.436e-05, + "loss": 0.5662, "step": 860 }, { "epoch": 12.0, - "eval_loss": 0.5327615141868591, - "eval_runtime": 128.9244, - "eval_samples_per_second": 4.126, - "eval_steps_per_second": 0.52, - "eval_wer": 0.258340296972424, + "eval_loss": 0.5460386872291565, + "eval_runtime": 126.6313, + "eval_samples_per_second": 4.201, + "eval_steps_per_second": 0.529, + "eval_wer": 0.28289515973516743, "step": 864 }, { "epoch": 12.08, - "learning_rate": 3.847887323943662e-06, - "loss": 0.5593, + "learning_rate": 3.4760000000000006e-05, + "loss": 0.5906, "step": 870 }, { "epoch": 12.22, - "learning_rate": 3.833802816901409e-06, - "loss": 0.5503, + "learning_rate": 3.516e-05, + "loss": 0.5417, "step": 880 }, { "epoch": 12.36, - "learning_rate": 3.819718309859155e-06, - "loss": 0.57, + "learning_rate": 3.5560000000000005e-05, + "loss": 0.5651, "step": 890 }, { "epoch": 12.5, - "learning_rate": 3.8056338028169015e-06, - "loss": 0.556, + "learning_rate": 3.596e-05, + "loss": 0.5836, "step": 900 }, { "epoch": 12.64, - "learning_rate": 3.791549295774648e-06, - "loss": 0.5469, + "learning_rate": 3.6360000000000004e-05, + "loss": 0.5584, "step": 910 }, { "epoch": 12.78, - "learning_rate": 3.7774647887323947e-06, - "loss": 0.5575, + "learning_rate": 3.676000000000001e-05, + "loss": 0.5924, "step": 920 }, { "epoch": 12.91, - "learning_rate": 3.763380281690141e-06, - "loss": 0.5636, + "learning_rate": 3.716e-05, + "loss": 0.5974, "step": 930 }, { "epoch": 13.0, - "eval_loss": 0.5246398448944092, - "eval_runtime": 127.8438, - "eval_samples_per_second": 4.161, - "eval_steps_per_second": 0.524, - "eval_wer": 0.2585974159542328, + "eval_loss": 0.530403196811676, + "eval_runtime": 125.2246, + "eval_samples_per_second": 4.248, + "eval_steps_per_second": 0.535, + "eval_wer": 0.27582438773542456, "step": 936 }, { "epoch": 13.06, - "learning_rate": 3.7492957746478874e-06, - "loss": 0.5818, + "learning_rate": 3.756e-05, + "loss": 0.5949, "step": 940 }, { "epoch": 13.19, - "learning_rate": 3.7352112676056342e-06, - "loss": 0.5387, + "learning_rate": 3.796e-05, + "loss": 0.5384, "step": 950 }, { "epoch": 13.33, - "learning_rate": 3.7211267605633806e-06, - "loss": 0.5792, + "learning_rate": 3.836e-05, + "loss": 0.5802, "step": 960 }, { "epoch": 13.47, - "learning_rate": 3.707042253521127e-06, - "loss": 0.5543, + "learning_rate": 3.876e-05, + "loss": 0.5582, "step": 970 }, { "epoch": 13.61, - "learning_rate": 3.6929577464788733e-06, - "loss": 0.5429, + "learning_rate": 3.9160000000000005e-05, + "loss": 0.5795, "step": 980 }, { "epoch": 13.75, - "learning_rate": 3.67887323943662e-06, - "loss": 0.5571, + "learning_rate": 3.956e-05, + "loss": 0.5929, "step": 990 }, { "epoch": 13.89, - "learning_rate": 3.6647887323943665e-06, - "loss": 0.5581, + "learning_rate": 3.9960000000000004e-05, + "loss": 0.5751, "step": 1000 }, { "epoch": 14.0, - "eval_loss": 0.522983968257904, - "eval_runtime": 128.2074, - "eval_samples_per_second": 4.15, - "eval_steps_per_second": 0.523, - "eval_wer": 0.25461207173619593, + "eval_loss": 0.5404934883117676, + "eval_runtime": 125.2731, + "eval_samples_per_second": 4.247, + "eval_steps_per_second": 0.535, + "eval_wer": 0.2887446165713184, "step": 1008 }, { "epoch": 14.03, - "learning_rate": 3.650704225352113e-06, - "loss": 0.5776, + "learning_rate": 3.998971428571429e-05, + "loss": 0.6034, "step": 1010 }, { "epoch": 14.17, - "learning_rate": 3.6366197183098597e-06, - "loss": 0.5523, + "learning_rate": 3.9978285714285715e-05, + "loss": 0.5729, "step": 1020 }, { "epoch": 14.3, - "learning_rate": 3.622535211267606e-06, - "loss": 0.5603, + "learning_rate": 3.996685714285715e-05, + "loss": 0.5732, "step": 1030 }, { "epoch": 14.44, - "learning_rate": 3.6084507042253524e-06, - "loss": 0.5341, + "learning_rate": 3.9955428571428576e-05, + "loss": 0.5619, "step": 1040 }, { "epoch": 14.58, - "learning_rate": 3.594366197183099e-06, - "loss": 0.5589, + "learning_rate": 3.9944e-05, + "loss": 0.6105, "step": 1050 }, { "epoch": 14.72, - "learning_rate": 3.5802816901408456e-06, - "loss": 0.5508, + "learning_rate": 3.993257142857143e-05, + "loss": 0.5662, "step": 1060 }, { "epoch": 14.86, - "learning_rate": 3.566197183098592e-06, - "loss": 0.5483, + "learning_rate": 3.9921142857142856e-05, + "loss": 0.5576, "step": 1070 }, { "epoch": 15.0, - "learning_rate": 3.5521126760563384e-06, - "loss": 0.567, + "learning_rate": 3.990971428571429e-05, + "loss": 0.5803, "step": 1080 }, { "epoch": 15.0, - "eval_loss": 0.5205003619194031, - "eval_runtime": 128.349, - "eval_samples_per_second": 4.145, - "eval_steps_per_second": 0.522, - "eval_wer": 0.2571832615542842, + "eval_loss": 0.5455237030982971, + "eval_runtime": 126.2717, + "eval_samples_per_second": 4.213, + "eval_steps_per_second": 0.531, + "eval_wer": 0.28025969017162694, "step": 1080 }, { "epoch": 15.14, - "learning_rate": 3.538028169014085e-06, - "loss": 0.5702, + "learning_rate": 3.9898285714285716e-05, + "loss": 0.585, "step": 1090 }, { "epoch": 15.28, - "learning_rate": 3.5239436619718315e-06, - "loss": 0.5812, + "learning_rate": 3.988685714285715e-05, + "loss": 0.5987, "step": 1100 }, { "epoch": 15.42, - "learning_rate": 3.509859154929578e-06, - "loss": 0.5577, + "learning_rate": 3.9875428571428576e-05, + "loss": 0.5676, "step": 1110 }, { "epoch": 15.55, - "learning_rate": 3.4957746478873243e-06, - "loss": 0.5728, + "learning_rate": 3.9864e-05, + "loss": 0.5855, "step": 1120 }, { "epoch": 15.69, - "learning_rate": 3.481690140845071e-06, - "loss": 0.5317, + "learning_rate": 3.985257142857143e-05, + "loss": 0.5576, "step": 1130 }, { "epoch": 15.83, - "learning_rate": 3.4676056338028175e-06, - "loss": 0.5601, + "learning_rate": 3.984114285714286e-05, + "loss": 0.6111, "step": 1140 }, { "epoch": 15.97, - "learning_rate": 3.4535211267605634e-06, - "loss": 0.5586, + "learning_rate": 3.982971428571429e-05, + "loss": 0.5633, "step": 1150 }, { "epoch": 16.0, - "eval_loss": 0.5258896946907043, - "eval_runtime": 126.5534, - "eval_samples_per_second": 4.204, - "eval_steps_per_second": 0.529, - "eval_wer": 0.25564054766343125, + "eval_loss": 0.5420528054237366, + "eval_runtime": 125.1934, + "eval_samples_per_second": 4.249, + "eval_steps_per_second": 0.535, + "eval_wer": 0.2890660152985794, "step": 1152 }, { "epoch": 16.11, - "learning_rate": 3.4394366197183098e-06, - "loss": 0.5722, + "learning_rate": 3.981828571428572e-05, + "loss": 0.5838, "step": 1160 }, { "epoch": 16.25, - "learning_rate": 3.4253521126760566e-06, - "loss": 0.5569, + "learning_rate": 3.9806857142857144e-05, + "loss": 0.5626, "step": 1170 }, { "epoch": 16.39, - "learning_rate": 3.411267605633803e-06, - "loss": 0.5507, + "learning_rate": 3.979542857142857e-05, + "loss": 0.5572, "step": 1180 }, { "epoch": 16.53, - "learning_rate": 3.3971830985915493e-06, - "loss": 0.57, + "learning_rate": 3.9784000000000004e-05, + "loss": 0.6007, "step": 1190 }, { "epoch": 16.66, - "learning_rate": 3.3830985915492957e-06, - "loss": 0.557, + "learning_rate": 3.977257142857143e-05, + "loss": 0.609, "step": 1200 }, { "epoch": 16.8, - "learning_rate": 3.3690140845070425e-06, - "loss": 0.5366, + "learning_rate": 3.9761142857142864e-05, + "loss": 0.5655, "step": 1210 }, { "epoch": 16.94, - "learning_rate": 3.354929577464789e-06, - "loss": 0.5358, + "learning_rate": 3.974971428571429e-05, + "loss": 0.5674, "step": 1220 }, { "epoch": 17.0, - "eval_loss": 0.5334306359291077, - "eval_runtime": 128.1209, - "eval_samples_per_second": 4.152, - "eval_steps_per_second": 0.523, - "eval_wer": 0.26046152857234683, + "eval_loss": 0.5444985032081604, + "eval_runtime": 125.5509, + "eval_samples_per_second": 4.237, + "eval_steps_per_second": 0.534, + "eval_wer": 0.2857877482805168, "step": 1224 }, { "epoch": 17.08, - "learning_rate": 3.3408450704225353e-06, - "loss": 0.5884, + "learning_rate": 3.973828571428572e-05, + "loss": 0.6199, "step": 1230 }, { "epoch": 17.22, - "learning_rate": 3.326760563380282e-06, - "loss": 0.5394, + "learning_rate": 3.9726857142857144e-05, + "loss": 0.5498, "step": 1240 }, { "epoch": 17.36, - "learning_rate": 3.3126760563380284e-06, - "loss": 0.5633, + "learning_rate": 3.971542857142857e-05, + "loss": 0.5731, "step": 1250 }, { "epoch": 17.5, - "learning_rate": 3.298591549295775e-06, - "loss": 0.5456, + "learning_rate": 3.9704000000000005e-05, + "loss": 0.5763, "step": 1260 }, { "epoch": 17.64, - "learning_rate": 3.284507042253521e-06, - "loss": 0.5509, + "learning_rate": 3.969257142857143e-05, + "loss": 0.5589, "step": 1270 }, { "epoch": 17.78, - "learning_rate": 3.270422535211268e-06, - "loss": 0.5746, + "learning_rate": 3.9681142857142865e-05, + "loss": 0.5825, "step": 1280 }, { "epoch": 17.91, - "learning_rate": 3.2563380281690144e-06, - "loss": 0.5526, + "learning_rate": 3.966971428571429e-05, + "loss": 0.5543, "step": 1290 }, { "epoch": 18.0, - "eval_loss": 0.5180938839912415, - "eval_runtime": 127.6299, - "eval_samples_per_second": 4.168, - "eval_steps_per_second": 0.525, - "eval_wer": 0.25557626791797905, + "eval_loss": 0.5229591727256775, + "eval_runtime": 125.3879, + "eval_samples_per_second": 4.243, + "eval_steps_per_second": 0.534, + "eval_wer": 0.2799382914443659, "step": 1296 }, { "epoch": 18.06, - "learning_rate": 3.2422535211267607e-06, - "loss": 0.5768, + "learning_rate": 3.965828571428572e-05, + "loss": 0.579, "step": 1300 }, { "epoch": 18.19, - "learning_rate": 3.2281690140845075e-06, - "loss": 0.5491, + "learning_rate": 3.9646857142857145e-05, + "loss": 0.5574, "step": 1310 }, { "epoch": 18.33, - "learning_rate": 3.214084507042254e-06, - "loss": 0.5738, + "learning_rate": 3.963542857142857e-05, + "loss": 0.5827, "step": 1320 }, { "epoch": 18.47, - "learning_rate": 3.2000000000000003e-06, - "loss": 0.5564, + "learning_rate": 3.9624000000000006e-05, + "loss": 0.5681, "step": 1330 }, { "epoch": 18.61, - "learning_rate": 3.1859154929577467e-06, - "loss": 0.5605, + "learning_rate": 3.961257142857143e-05, + "loss": 0.5944, "step": 1340 }, { "epoch": 18.75, - "learning_rate": 3.1718309859154935e-06, - "loss": 0.5443, + "learning_rate": 3.9601142857142866e-05, + "loss": 0.5508, "step": 1350 }, { "epoch": 18.89, - "learning_rate": 3.15774647887324e-06, - "loss": 0.5483, + "learning_rate": 3.9589714285714286e-05, + "loss": 0.5618, "step": 1360 }, { "epoch": 19.0, - "eval_loss": 0.5131182074546814, - "eval_runtime": 127.3437, - "eval_samples_per_second": 4.178, - "eval_steps_per_second": 0.526, - "eval_wer": 0.2562190653725011, + "eval_loss": 0.5207758545875549, + "eval_runtime": 125.4899, + "eval_samples_per_second": 4.239, + "eval_steps_per_second": 0.534, + "eval_wer": 0.26200424246319987, "step": 1368 }, { "epoch": 19.03, - "learning_rate": 3.143661971830986e-06, - "loss": 0.5656, + "learning_rate": 3.957828571428571e-05, + "loss": 0.5672, "step": 1370 }, { "epoch": 19.17, - "learning_rate": 3.129577464788733e-06, - "loss": 0.5534, + "learning_rate": 3.9566857142857146e-05, + "loss": 0.5527, "step": 1380 }, { "epoch": 19.3, - "learning_rate": 3.1154929577464794e-06, - "loss": 0.5568, + "learning_rate": 3.955542857142857e-05, + "loss": 0.5724, "step": 1390 }, { "epoch": 19.44, - "learning_rate": 3.1014084507042258e-06, - "loss": 0.5492, + "learning_rate": 3.9544000000000006e-05, + "loss": 0.5638, "step": 1400 }, { "epoch": 19.58, - "learning_rate": 3.087323943661972e-06, - "loss": 0.5537, + "learning_rate": 3.953257142857143e-05, + "loss": 0.5769, "step": 1410 }, { "epoch": 19.72, - "learning_rate": 3.073239436619719e-06, - "loss": 0.5541, + "learning_rate": 3.952114285714286e-05, + "loss": 0.5713, "step": 1420 }, { "epoch": 19.86, - "learning_rate": 3.0591549295774653e-06, - "loss": 0.5536, + "learning_rate": 3.9509714285714287e-05, + "loss": 0.5727, "step": 1430 }, { "epoch": 20.0, - "learning_rate": 3.0450704225352117e-06, - "loss": 0.5487, + "learning_rate": 3.949828571428571e-05, + "loss": 0.5551, "step": 1440 }, { "epoch": 20.0, - "eval_loss": 0.5178970098495483, - "eval_runtime": 128.7396, - "eval_samples_per_second": 4.132, - "eval_steps_per_second": 0.52, - "eval_wer": 0.2560905058815967, + "eval_loss": 0.5313947200775146, + "eval_runtime": 126.2412, + "eval_samples_per_second": 4.214, + "eval_steps_per_second": 0.531, + "eval_wer": 0.2624542006813653, "step": 1440 }, { "epoch": 20.14, - "learning_rate": 3.0309859154929576e-06, - "loss": 0.551, + "learning_rate": 3.948685714285715e-05, + "loss": 0.5573, "step": 1450 }, { "epoch": 20.28, - "learning_rate": 3.0169014084507044e-06, - "loss": 0.554, + "learning_rate": 3.9475428571428574e-05, + "loss": 0.558, "step": 1460 }, { "epoch": 20.42, - "learning_rate": 3.002816901408451e-06, - "loss": 0.5524, + "learning_rate": 3.946400000000001e-05, + "loss": 0.5566, "step": 1470 }, { "epoch": 20.55, - "learning_rate": 2.988732394366197e-06, - "loss": 0.5676, + "learning_rate": 3.9452571428571434e-05, + "loss": 0.5618, "step": 1480 }, { "epoch": 20.69, - "learning_rate": 2.9746478873239436e-06, - "loss": 0.5488, + "learning_rate": 3.944114285714286e-05, + "loss": 0.5527, "step": 1490 }, { "epoch": 20.83, - "learning_rate": 2.9605633802816903e-06, - "loss": 0.5691, + "learning_rate": 3.942971428571429e-05, + "loss": 0.5768, "step": 1500 }, { "epoch": 20.97, - "learning_rate": 2.9464788732394367e-06, - "loss": 0.5489, + "learning_rate": 3.9418285714285714e-05, + "loss": 0.5582, "step": 1510 }, { "epoch": 21.0, - "eval_loss": 0.525915265083313, - "eval_runtime": 128.1257, - "eval_samples_per_second": 4.152, - "eval_steps_per_second": 0.523, - "eval_wer": 0.2596258918814682, + "eval_loss": 0.5191528797149658, + "eval_runtime": 126.7101, + "eval_samples_per_second": 4.199, + "eval_steps_per_second": 0.529, + "eval_wer": 0.2834093976987851, "step": 1512 }, { "epoch": 21.11, - "learning_rate": 2.932394366197183e-06, - "loss": 0.5522, + "learning_rate": 3.940685714285715e-05, + "loss": 0.557, "step": 1520 }, { "epoch": 21.25, - "learning_rate": 2.91830985915493e-06, - "loss": 0.5544, + "learning_rate": 3.9395428571428574e-05, + "loss": 0.5718, "step": 1530 }, { "epoch": 21.39, - "learning_rate": 2.9042253521126763e-06, - "loss": 0.5715, + "learning_rate": 3.938400000000001e-05, + "loss": 0.5601, "step": 1540 }, { "epoch": 21.53, - "learning_rate": 2.8901408450704226e-06, - "loss": 0.5547, + "learning_rate": 3.937257142857143e-05, + "loss": 0.5652, "step": 1550 }, { "epoch": 21.66, - "learning_rate": 2.876056338028169e-06, - "loss": 0.5256, + "learning_rate": 3.936114285714286e-05, + "loss": 0.5391, "step": 1560 }, { "epoch": 21.8, - "learning_rate": 2.861971830985916e-06, - "loss": 0.5507, + "learning_rate": 3.934971428571429e-05, + "loss": 0.5489, "step": 1570 }, { "epoch": 21.94, - "learning_rate": 2.847887323943662e-06, - "loss": 0.5582, + "learning_rate": 3.9338285714285715e-05, + "loss": 0.5639, "step": 1580 }, { "epoch": 22.0, - "eval_loss": 0.5199052691459656, - "eval_runtime": 128.2296, - "eval_samples_per_second": 4.149, - "eval_steps_per_second": 0.523, - "eval_wer": 0.2550620299543614, + "eval_loss": 0.4979424774646759, + "eval_runtime": 125.7457, + "eval_samples_per_second": 4.231, + "eval_steps_per_second": 0.533, + "eval_wer": 0.26238992093591307, "step": 1584 }, { "epoch": 22.08, - "learning_rate": 2.8338028169014086e-06, - "loss": 0.5706, + "learning_rate": 3.932685714285715e-05, + "loss": 0.5929, "step": 1590 }, { "epoch": 22.22, - "learning_rate": 2.8197183098591554e-06, - "loss": 0.5487, + "learning_rate": 3.9315428571428575e-05, + "loss": 0.5565, "step": 1600 }, { "epoch": 22.36, - "learning_rate": 2.8056338028169017e-06, - "loss": 0.5494, + "learning_rate": 3.9304e-05, + "loss": 0.5615, "step": 1610 }, { "epoch": 22.5, - "learning_rate": 2.791549295774648e-06, - "loss": 0.5536, + "learning_rate": 3.929257142857143e-05, + "loss": 0.5687, "step": 1620 }, { "epoch": 22.64, - "learning_rate": 2.7774647887323945e-06, - "loss": 0.5469, + "learning_rate": 3.928114285714286e-05, + "loss": 0.5548, "step": 1630 }, { "epoch": 22.78, - "learning_rate": 2.7633802816901413e-06, - "loss": 0.556, + "learning_rate": 3.926971428571429e-05, + "loss": 0.5597, "step": 1640 }, { "epoch": 22.91, - "learning_rate": 2.7492957746478877e-06, - "loss": 0.5351, + "learning_rate": 3.9258285714285716e-05, + "loss": 0.5473, "step": 1650 }, { "epoch": 23.0, - "eval_loss": 0.5282993316650391, - "eval_runtime": 129.7167, - "eval_samples_per_second": 4.101, - "eval_steps_per_second": 0.517, - "eval_wer": 0.25345503631805616, + "eval_loss": 0.508553683757782, + "eval_runtime": 125.7835, + "eval_samples_per_second": 4.229, + "eval_steps_per_second": 0.533, + "eval_wer": 0.2535193160635084, "step": 1656 }, { "epoch": 23.06, - "learning_rate": 2.735211267605634e-06, - "loss": 0.5505, + "learning_rate": 3.924685714285715e-05, + "loss": 0.5575, "step": 1660 }, { "epoch": 23.19, - "learning_rate": 2.721126760563381e-06, - "loss": 0.5448, + "learning_rate": 3.9235428571428576e-05, + "loss": 0.5539, "step": 1670 }, { "epoch": 23.33, - "learning_rate": 2.7070422535211272e-06, - "loss": 0.5539, + "learning_rate": 3.9224e-05, + "loss": 0.5597, "step": 1680 }, { "epoch": 23.47, - "learning_rate": 2.6929577464788736e-06, - "loss": 0.5401, + "learning_rate": 3.921257142857143e-05, + "loss": 0.5453, "step": 1690 }, { "epoch": 23.61, - "learning_rate": 2.67887323943662e-06, - "loss": 0.5626, + "learning_rate": 3.920114285714286e-05, + "loss": 0.5558, "step": 1700 }, { "epoch": 23.75, - "learning_rate": 2.6647887323943668e-06, - "loss": 0.5588, + "learning_rate": 3.918971428571429e-05, + "loss": 0.5542, "step": 1710 }, { "epoch": 23.89, - "learning_rate": 2.650704225352113e-06, - "loss": 0.5572, + "learning_rate": 3.9178285714285716e-05, + "loss": 0.5442, "step": 1720 }, { "epoch": 24.0, - "eval_loss": 0.5120282173156738, - "eval_runtime": 127.888, - "eval_samples_per_second": 4.16, - "eval_steps_per_second": 0.524, - "eval_wer": 0.25326219708169956, + "eval_loss": 0.5139951109886169, + "eval_runtime": 126.1164, + "eval_samples_per_second": 4.218, + "eval_steps_per_second": 0.531, + "eval_wer": 0.2627755994086263, "step": 1728 }, { "epoch": 24.03, - "learning_rate": 2.6366197183098595e-06, - "loss": 0.5649, + "learning_rate": 3.916685714285715e-05, + "loss": 0.5557, "step": 1730 }, { "epoch": 24.17, - "learning_rate": 2.6225352112676055e-06, - "loss": 0.5481, + "learning_rate": 3.915542857142857e-05, + "loss": 0.547, "step": 1740 }, { "epoch": 24.3, - "learning_rate": 2.6084507042253523e-06, - "loss": 0.5478, + "learning_rate": 3.9144e-05, + "loss": 0.5488, "step": 1750 }, { "epoch": 24.44, - "learning_rate": 2.5943661971830986e-06, - "loss": 0.5404, + "learning_rate": 3.913371428571429e-05, + "loss": 0.5434, "step": 1760 }, { "epoch": 24.58, - "learning_rate": 2.580281690140845e-06, - "loss": 0.5593, + "learning_rate": 3.9122285714285716e-05, + "loss": 0.5622, "step": 1770 }, { "epoch": 24.72, - "learning_rate": 2.5661971830985914e-06, - "loss": 0.5302, + "learning_rate": 3.911085714285715e-05, + "loss": 0.5449, "step": 1780 }, { "epoch": 24.86, - "learning_rate": 2.552112676056338e-06, - "loss": 0.5557, + "learning_rate": 3.9099428571428576e-05, + "loss": 0.5628, "step": 1790 }, { "epoch": 25.0, - "learning_rate": 2.5380281690140846e-06, - "loss": 0.5467, + "learning_rate": 3.9088e-05, + "loss": 0.5348, "step": 1800 }, { "epoch": 25.0, - "eval_loss": 0.5175544619560242, - "eval_runtime": 129.516, - "eval_samples_per_second": 4.108, - "eval_steps_per_second": 0.517, - "eval_wer": 0.25782605900880634, + "eval_loss": 0.5193970203399658, + "eval_runtime": 126.1264, + "eval_samples_per_second": 4.218, + "eval_steps_per_second": 0.531, + "eval_wer": 0.2673394613357331, "step": 1800 }, { "epoch": 25.14, - "learning_rate": 2.523943661971831e-06, - "loss": 0.5543, + "learning_rate": 3.907657142857143e-05, + "loss": 0.5589, "step": 1810 }, { "epoch": 25.28, - "learning_rate": 2.5098591549295777e-06, - "loss": 0.55, + "learning_rate": 3.9065142857142856e-05, + "loss": 0.56, "step": 1820 }, { "epoch": 25.42, - "learning_rate": 2.495774647887324e-06, - "loss": 0.5348, + "learning_rate": 3.905371428571429e-05, + "loss": 0.5418, "step": 1830 }, { "epoch": 25.55, - "learning_rate": 2.4816901408450705e-06, - "loss": 0.5401, + "learning_rate": 3.9042285714285716e-05, + "loss": 0.5345, "step": 1840 }, { "epoch": 25.69, - "learning_rate": 2.467605633802817e-06, - "loss": 0.5341, + "learning_rate": 3.903085714285715e-05, + "loss": 0.5516, "step": 1850 }, { "epoch": 25.83, - "learning_rate": 2.4535211267605637e-06, - "loss": 0.552, + "learning_rate": 3.9019428571428577e-05, + "loss": 0.5562, "step": 1860 }, { "epoch": 25.97, - "learning_rate": 2.43943661971831e-06, - "loss": 0.5424, + "learning_rate": 3.9008e-05, + "loss": 0.5298, "step": 1870 }, { "epoch": 26.0, - "eval_loss": 0.5104931592941284, - "eval_runtime": 127.2359, - "eval_samples_per_second": 4.181, - "eval_steps_per_second": 0.527, - "eval_wer": 0.2551905894452658, + "eval_loss": 0.5027355551719666, + "eval_runtime": 125.2833, + "eval_samples_per_second": 4.246, + "eval_steps_per_second": 0.535, + "eval_wer": 0.25448351224529153, "step": 1872 }, { "epoch": 26.11, - "learning_rate": 2.4253521126760564e-06, - "loss": 0.5556, + "learning_rate": 3.899657142857143e-05, + "loss": 0.5738, "step": 1880 }, { "epoch": 26.25, - "learning_rate": 2.4112676056338032e-06, - "loss": 0.546, + "learning_rate": 3.898514285714286e-05, + "loss": 0.5604, "step": 1890 }, { "epoch": 26.39, - "learning_rate": 2.3971830985915496e-06, - "loss": 0.5392, + "learning_rate": 3.897371428571429e-05, + "loss": 0.5387, "step": 1900 }, { "epoch": 26.53, - "learning_rate": 2.383098591549296e-06, - "loss": 0.5465, + "learning_rate": 3.896228571428572e-05, + "loss": 0.5606, "step": 1910 }, { "epoch": 26.66, - "learning_rate": 2.3690140845070423e-06, - "loss": 0.5393, + "learning_rate": 3.895085714285715e-05, + "loss": 0.5327, "step": 1920 }, { "epoch": 26.8, - "learning_rate": 2.354929577464789e-06, - "loss": 0.5469, + "learning_rate": 3.893942857142858e-05, + "loss": 0.5669, "step": 1930 }, { "epoch": 26.94, - "learning_rate": 2.3408450704225355e-06, - "loss": 0.5344, + "learning_rate": 3.8928000000000004e-05, + "loss": 0.5423, "step": 1940 }, { "epoch": 27.0, - "eval_loss": 0.5212472677230835, - "eval_runtime": 128.0249, - "eval_samples_per_second": 4.155, - "eval_steps_per_second": 0.523, - "eval_wer": 0.2540978337725783, + "eval_loss": 0.5178112387657166, + "eval_runtime": 126.1454, + "eval_samples_per_second": 4.217, + "eval_steps_per_second": 0.531, + "eval_wer": 0.2551263096998136, "step": 1944 }, { "epoch": 27.08, - "learning_rate": 2.326760563380282e-06, - "loss": 0.5647, + "learning_rate": 3.891657142857143e-05, + "loss": 0.5571, "step": 1950 }, { "epoch": 27.22, - "learning_rate": 2.3126760563380287e-06, - "loss": 0.5383, + "learning_rate": 3.890514285714286e-05, + "loss": 0.5358, "step": 1960 }, { "epoch": 27.36, - "learning_rate": 2.2985915492957746e-06, - "loss": 0.5333, + "learning_rate": 3.889371428571429e-05, + "loss": 0.5477, "step": 1970 }, { "epoch": 27.5, - "learning_rate": 2.284507042253521e-06, - "loss": 0.5551, + "learning_rate": 3.888228571428572e-05, + "loss": 0.5439, "step": 1980 }, { "epoch": 27.64, - "learning_rate": 2.270422535211268e-06, - "loss": 0.5477, + "learning_rate": 3.887085714285715e-05, + "loss": 0.5372, "step": 1990 }, { "epoch": 27.78, - "learning_rate": 2.256338028169014e-06, - "loss": 0.5594, + "learning_rate": 3.885942857142857e-05, + "loss": 0.5644, "step": 2000 }, { "epoch": 27.91, - "learning_rate": 2.2422535211267606e-06, - "loss": 0.5444, + "learning_rate": 3.8848e-05, + "loss": 0.547, "step": 2010 }, { "epoch": 28.0, - "eval_loss": 0.5154798626899719, - "eval_runtime": 128.0303, - "eval_samples_per_second": 4.155, - "eval_steps_per_second": 0.523, - "eval_wer": 0.25557626791797905, + "eval_loss": 0.5477745532989502, + "eval_runtime": 126.7098, + "eval_samples_per_second": 4.199, + "eval_steps_per_second": 0.529, + "eval_wer": 0.28283087998971523, "step": 2016 }, { "epoch": 28.06, - "learning_rate": 2.2281690140845074e-06, - "loss": 0.569, + "learning_rate": 3.883657142857143e-05, + "loss": 0.5555, "step": 2020 }, { "epoch": 28.19, - "learning_rate": 2.2140845070422537e-06, - "loss": 0.5493, + "learning_rate": 3.882514285714286e-05, + "loss": 0.527, "step": 2030 }, { "epoch": 28.33, - "learning_rate": 2.2e-06, - "loss": 0.5485, + "learning_rate": 3.881371428571429e-05, + "loss": 0.5578, "step": 2040 }, { "epoch": 28.47, - "learning_rate": 2.1859154929577465e-06, - "loss": 0.5367, + "learning_rate": 3.880228571428572e-05, + "loss": 0.5281, "step": 2050 }, { "epoch": 28.61, - "learning_rate": 2.1718309859154933e-06, - "loss": 0.5487, + "learning_rate": 3.8790857142857145e-05, + "loss": 0.5591, "step": 2060 }, { "epoch": 28.75, - "learning_rate": 2.1577464788732397e-06, - "loss": 0.5487, + "learning_rate": 3.877942857142857e-05, + "loss": 0.557, "step": 2070 }, { "epoch": 28.89, - "learning_rate": 2.143661971830986e-06, - "loss": 0.5276, + "learning_rate": 3.8768e-05, + "loss": 0.5327, "step": 2080 }, { "epoch": 29.0, - "eval_loss": 0.523108959197998, - "eval_runtime": 128.0146, - "eval_samples_per_second": 4.156, - "eval_steps_per_second": 0.523, - "eval_wer": 0.2551263096998136, + "eval_loss": 0.5265487432479858, + "eval_runtime": 126.5684, + "eval_samples_per_second": 4.203, + "eval_steps_per_second": 0.529, + "eval_wer": 0.26573246769942793, "step": 2088 }, { "epoch": 29.03, - "learning_rate": 2.129577464788733e-06, - "loss": 0.546, + "learning_rate": 3.875657142857143e-05, + "loss": 0.5521, "step": 2090 }, { "epoch": 29.17, - "learning_rate": 2.115492957746479e-06, - "loss": 0.5308, + "learning_rate": 3.874514285714286e-05, + "loss": 0.5307, "step": 2100 }, { "epoch": 29.3, - "learning_rate": 2.1014084507042256e-06, - "loss": 0.5303, + "learning_rate": 3.873371428571429e-05, + "loss": 0.5375, "step": 2110 }, { "epoch": 29.44, - "learning_rate": 2.087323943661972e-06, - "loss": 0.5453, + "learning_rate": 3.872228571428572e-05, + "loss": 0.5372, "step": 2120 }, { "epoch": 29.58, - "learning_rate": 2.0732394366197183e-06, - "loss": 0.5396, + "learning_rate": 3.8710857142857146e-05, + "loss": 0.5599, "step": 2130 }, { "epoch": 29.72, - "learning_rate": 2.0591549295774647e-06, - "loss": 0.5352, + "learning_rate": 3.869942857142857e-05, + "loss": 0.5611, "step": 2140 }, { "epoch": 29.86, - "learning_rate": 2.0450704225352115e-06, - "loss": 0.54, + "learning_rate": 3.8688e-05, + "loss": 0.548, "step": 2150 }, { "epoch": 30.0, - "learning_rate": 2.030985915492958e-06, - "loss": 0.5501, + "learning_rate": 3.867657142857143e-05, + "loss": 0.5495, "step": 2160 }, { "epoch": 30.0, - "eval_loss": 0.5224459171295166, - "eval_runtime": 128.6755, - "eval_samples_per_second": 4.134, - "eval_steps_per_second": 0.521, - "eval_wer": 0.25570482740888345, + "eval_loss": 0.521438717842102, + "eval_runtime": 126.4073, + "eval_samples_per_second": 4.209, + "eval_steps_per_second": 0.53, + "eval_wer": 0.2630327183904352, "step": 2160 }, { "epoch": 30.14, - "learning_rate": 2.0169014084507043e-06, - "loss": 0.554, + "learning_rate": 3.866514285714286e-05, + "loss": 0.5586, "step": 2170 }, { "epoch": 30.28, - "learning_rate": 2.002816901408451e-06, - "loss": 0.555, + "learning_rate": 3.8653714285714287e-05, + "loss": 0.5655, "step": 2180 }, { "epoch": 30.42, - "learning_rate": 1.9887323943661974e-06, - "loss": 0.5414, + "learning_rate": 3.864228571428571e-05, + "loss": 0.5253, "step": 2190 }, { "epoch": 30.55, - "learning_rate": 1.974647887323944e-06, - "loss": 0.5469, + "learning_rate": 3.863085714285715e-05, + "loss": 0.5316, "step": 2200 }, { "epoch": 30.69, - "learning_rate": 1.96056338028169e-06, - "loss": 0.5356, + "learning_rate": 3.8619428571428574e-05, + "loss": 0.5386, "step": 2210 }, { "epoch": 30.83, - "learning_rate": 1.946478873239437e-06, - "loss": 0.5483, + "learning_rate": 3.8608e-05, + "loss": 0.5546, "step": 2220 }, { "epoch": 30.97, - "learning_rate": 1.9323943661971834e-06, - "loss": 0.5335, + "learning_rate": 3.8596571428571434e-05, + "loss": 0.5272, "step": 2230 }, { "epoch": 31.0, - "eval_loss": 0.5278783440589905, - "eval_runtime": 128.5943, - "eval_samples_per_second": 4.137, - "eval_steps_per_second": 0.521, - "eval_wer": 0.2549977502089092, + "eval_loss": 0.5094417333602905, + "eval_runtime": 126.1741, + "eval_samples_per_second": 4.216, + "eval_steps_per_second": 0.531, + "eval_wer": 0.26457543228128816, "step": 2232 }, { "epoch": 31.11, - "learning_rate": 1.9183098591549297e-06, - "loss": 0.5579, + "learning_rate": 3.858514285714286e-05, + "loss": 0.5574, "step": 2240 }, { "epoch": 31.25, - "learning_rate": 1.9042253521126763e-06, - "loss": 0.5416, + "learning_rate": 3.857371428571429e-05, + "loss": 0.5369, "step": 2250 }, { "epoch": 31.39, - "learning_rate": 1.8901408450704225e-06, - "loss": 0.5325, + "learning_rate": 3.8562285714285714e-05, + "loss": 0.5338, "step": 2260 }, { "epoch": 31.53, - "learning_rate": 1.876056338028169e-06, - "loss": 0.5376, + "learning_rate": 3.855085714285715e-05, + "loss": 0.5424, "step": 2270 }, { "epoch": 31.66, - "learning_rate": 1.8619718309859157e-06, - "loss": 0.5382, + "learning_rate": 3.8539428571428574e-05, + "loss": 0.5488, "step": 2280 }, { "epoch": 31.8, - "learning_rate": 1.847887323943662e-06, - "loss": 0.5517, + "learning_rate": 3.8528e-05, + "loss": 0.5743, "step": 2290 }, { "epoch": 31.94, - "learning_rate": 1.8338028169014086e-06, - "loss": 0.5315, + "learning_rate": 3.8516571428571435e-05, + "loss": 0.5378, "step": 2300 }, { "epoch": 32.0, - "eval_loss": 0.515052855014801, - "eval_runtime": 128.5881, - "eval_samples_per_second": 4.137, - "eval_steps_per_second": 0.521, - "eval_wer": 0.25448351224529153, + "eval_loss": 0.5152480006217957, + "eval_runtime": 125.8818, + "eval_samples_per_second": 4.226, + "eval_steps_per_second": 0.532, + "eval_wer": 0.261747123481391, "step": 2304 }, { "epoch": 32.08, - "learning_rate": 1.819718309859155e-06, - "loss": 0.5712, + "learning_rate": 3.850514285714286e-05, + "loss": 0.5729, "step": 2310 }, { "epoch": 32.22, - "learning_rate": 1.8056338028169016e-06, - "loss": 0.5349, + "learning_rate": 3.849371428571429e-05, + "loss": 0.5366, "step": 2320 }, { "epoch": 32.36, - "learning_rate": 1.791549295774648e-06, - "loss": 0.5408, + "learning_rate": 3.8482285714285715e-05, + "loss": 0.5523, "step": 2330 }, { "epoch": 32.5, - "learning_rate": 1.7774647887323945e-06, - "loss": 0.5405, + "learning_rate": 3.847085714285715e-05, + "loss": 0.5379, "step": 2340 }, { "epoch": 32.64, - "learning_rate": 1.7633802816901411e-06, - "loss": 0.5309, + "learning_rate": 3.8459428571428575e-05, + "loss": 0.5225, "step": 2350 }, { "epoch": 32.78, - "learning_rate": 1.7492957746478875e-06, - "loss": 0.5463, + "learning_rate": 3.844800000000001e-05, + "loss": 0.5341, "step": 2360 }, { "epoch": 32.91, - "learning_rate": 1.735211267605634e-06, - "loss": 0.5344, + "learning_rate": 3.843657142857143e-05, + "loss": 0.5255, "step": 2370 }, { "epoch": 33.0, - "eval_loss": 0.5204472541809082, - "eval_runtime": 129.9429, - "eval_samples_per_second": 4.094, - "eval_steps_per_second": 0.516, - "eval_wer": 0.2528122388635341, + "eval_loss": 0.5067561864852905, + "eval_runtime": 126.4534, + "eval_samples_per_second": 4.207, + "eval_steps_per_second": 0.53, + "eval_wer": 0.26354695635405284, "step": 2376 }, { "epoch": 33.06, - "learning_rate": 1.7211267605633805e-06, - "loss": 0.5626, + "learning_rate": 3.8425142857142855e-05, + "loss": 0.5689, "step": 2380 }, { "epoch": 33.19, - "learning_rate": 1.707042253521127e-06, - "loss": 0.5423, + "learning_rate": 3.841371428571429e-05, + "loss": 0.5534, "step": 2390 }, { "epoch": 33.33, - "learning_rate": 1.6929577464788734e-06, - "loss": 0.5505, + "learning_rate": 3.8402285714285716e-05, + "loss": 0.544, "step": 2400 }, { "epoch": 33.47, - "learning_rate": 1.6788732394366198e-06, - "loss": 0.5354, + "learning_rate": 3.839085714285715e-05, + "loss": 0.5317, "step": 2410 }, { "epoch": 33.61, - "learning_rate": 1.6647887323943662e-06, - "loss": 0.5366, + "learning_rate": 3.8379428571428576e-05, + "loss": 0.5588, "step": 2420 }, { "epoch": 33.75, - "learning_rate": 1.6507042253521128e-06, - "loss": 0.5445, + "learning_rate": 3.8368e-05, + "loss": 0.5236, "step": 2430 }, { "epoch": 33.89, - "learning_rate": 1.6366197183098591e-06, - "loss": 0.5249, + "learning_rate": 3.835657142857143e-05, + "loss": 0.5218, "step": 2440 }, { "epoch": 34.0, - "eval_loss": 0.515282154083252, - "eval_runtime": 128.9615, - "eval_samples_per_second": 4.125, - "eval_steps_per_second": 0.52, - "eval_wer": 0.2542906730089349, + "eval_loss": 0.5435338020324707, + "eval_runtime": 126.3416, + "eval_samples_per_second": 4.211, + "eval_steps_per_second": 0.53, + "eval_wer": 0.2614900044995822, "step": 2448 }, { "epoch": 34.03, - "learning_rate": 1.6225352112676057e-06, - "loss": 0.5576, + "learning_rate": 3.8345142857142856e-05, + "loss": 0.5821, "step": 2450 }, { "epoch": 34.17, - "learning_rate": 1.6084507042253523e-06, - "loss": 0.5375, + "learning_rate": 3.833371428571429e-05, + "loss": 0.5302, "step": 2460 }, { "epoch": 34.3, - "learning_rate": 1.5943661971830987e-06, - "loss": 0.5439, + "learning_rate": 3.8322285714285716e-05, + "loss": 0.5415, "step": 2470 }, { "epoch": 34.44, - "learning_rate": 1.5802816901408453e-06, - "loss": 0.5376, + "learning_rate": 3.831085714285715e-05, + "loss": 0.5406, "step": 2480 }, { "epoch": 34.58, - "learning_rate": 1.5661971830985917e-06, - "loss": 0.5327, + "learning_rate": 3.829942857142858e-05, + "loss": 0.5397, "step": 2490 }, { "epoch": 34.72, - "learning_rate": 1.5521126760563382e-06, - "loss": 0.5283, + "learning_rate": 3.8288000000000003e-05, + "loss": 0.5444, "step": 2500 }, { "epoch": 34.86, - "learning_rate": 1.5380281690140846e-06, - "loss": 0.5375, + "learning_rate": 3.827657142857143e-05, + "loss": 0.5423, "step": 2510 }, { "epoch": 35.0, - "learning_rate": 1.5239436619718312e-06, - "loss": 0.5478, + "learning_rate": 3.826514285714286e-05, + "loss": 0.5326, "step": 2520 }, { "epoch": 35.0, - "eval_loss": 0.5154463648796082, - "eval_runtime": 129.3389, - "eval_samples_per_second": 4.113, - "eval_steps_per_second": 0.518, - "eval_wer": 0.2543549527543871, + "eval_loss": 0.5107089281082153, + "eval_runtime": 126.0509, + "eval_samples_per_second": 4.221, + "eval_steps_per_second": 0.532, + "eval_wer": 0.2609114867905123, "step": 2520 }, { "epoch": 35.14, - "learning_rate": 1.5098591549295778e-06, - "loss": 0.526, + "learning_rate": 3.825371428571429e-05, + "loss": 0.5566, "step": 2530 }, { "epoch": 35.28, - "learning_rate": 1.4957746478873242e-06, - "loss": 0.5461, + "learning_rate": 3.824228571428572e-05, + "loss": 0.5768, "step": 2540 }, { "epoch": 35.42, - "learning_rate": 1.4816901408450707e-06, - "loss": 0.5357, + "learning_rate": 3.823085714285715e-05, + "loss": 0.5359, "step": 2550 }, { "epoch": 35.55, - "learning_rate": 1.467605633802817e-06, - "loss": 0.5379, + "learning_rate": 3.821942857142857e-05, + "loss": 0.5527, "step": 2560 }, { "epoch": 35.69, - "learning_rate": 1.4535211267605635e-06, - "loss": 0.5354, + "learning_rate": 3.8208000000000004e-05, + "loss": 0.5484, "step": 2570 }, { "epoch": 35.83, - "learning_rate": 1.4394366197183099e-06, - "loss": 0.5374, + "learning_rate": 3.819657142857143e-05, + "loss": 0.5585, "step": 2580 }, { "epoch": 35.97, - "learning_rate": 1.4253521126760565e-06, - "loss": 0.5346, + "learning_rate": 3.818514285714286e-05, + "loss": 0.5345, "step": 2590 }, { "epoch": 36.0, - "eval_loss": 0.5122731924057007, - "eval_runtime": 127.7459, - "eval_samples_per_second": 4.165, - "eval_steps_per_second": 0.524, - "eval_wer": 0.25339075657260396, + "eval_loss": 0.5491129159927368, + "eval_runtime": 126.4262, + "eval_samples_per_second": 4.208, + "eval_steps_per_second": 0.53, + "eval_wer": 0.2761457864626856, "step": 2592 }, { "epoch": 36.11, - "learning_rate": 1.4112676056338028e-06, - "loss": 0.5522, + "learning_rate": 3.817371428571429e-05, + "loss": 0.559, "step": 2600 }, { "epoch": 36.25, - "learning_rate": 1.3971830985915494e-06, - "loss": 0.5397, + "learning_rate": 3.816228571428572e-05, + "loss": 0.5338, "step": 2610 }, { "epoch": 36.39, - "learning_rate": 1.3830985915492958e-06, - "loss": 0.519, + "learning_rate": 3.8150857142857145e-05, + "loss": 0.5292, "step": 2620 }, { "epoch": 36.53, - "learning_rate": 1.3690140845070424e-06, - "loss": 0.5558, + "learning_rate": 3.813942857142857e-05, + "loss": 0.5576, "step": 2630 }, { "epoch": 36.66, - "learning_rate": 1.354929577464789e-06, - "loss": 0.5407, + "learning_rate": 3.8128000000000005e-05, + "loss": 0.5352, "step": 2640 }, { "epoch": 36.8, - "learning_rate": 1.3408450704225353e-06, - "loss": 0.533, + "learning_rate": 3.811657142857143e-05, + "loss": 0.5307, "step": 2650 }, { "epoch": 36.94, - "learning_rate": 1.326760563380282e-06, - "loss": 0.5436, + "learning_rate": 3.810514285714286e-05, + "loss": 0.5323, "step": 2660 }, { "epoch": 37.0, - "eval_loss": 0.5210054516792297, - "eval_runtime": 129.2771, - "eval_samples_per_second": 4.115, - "eval_steps_per_second": 0.518, - "eval_wer": 0.25654046409976217, + "eval_loss": 0.5177223086357117, + "eval_runtime": 126.9526, + "eval_samples_per_second": 4.191, + "eval_steps_per_second": 0.528, + "eval_wer": 0.27479591180818924, "step": 2664 }, { "epoch": 37.08, - "learning_rate": 1.3126760563380283e-06, - "loss": 0.564, + "learning_rate": 3.809371428571429e-05, + "loss": 0.5417, "step": 2670 }, { "epoch": 37.22, - "learning_rate": 1.298591549295775e-06, - "loss": 0.5498, + "learning_rate": 3.808228571428572e-05, + "loss": 0.5301, "step": 2680 }, { "epoch": 37.36, - "learning_rate": 1.2845070422535213e-06, - "loss": 0.5368, + "learning_rate": 3.8070857142857145e-05, + "loss": 0.5387, "step": 2690 }, { "epoch": 37.5, - "learning_rate": 1.2704225352112676e-06, - "loss": 0.5166, + "learning_rate": 3.805942857142857e-05, + "loss": 0.5218, "step": 2700 }, { "epoch": 37.64, - "learning_rate": 1.256338028169014e-06, - "loss": 0.5314, + "learning_rate": 3.8048000000000006e-05, + "loss": 0.508, "step": 2710 }, { "epoch": 37.78, - "learning_rate": 1.2422535211267606e-06, - "loss": 0.5411, + "learning_rate": 3.803657142857143e-05, + "loss": 0.5372, "step": 2720 }, { "epoch": 37.91, - "learning_rate": 1.2281690140845072e-06, - "loss": 0.5299, + "learning_rate": 3.802514285714286e-05, + "loss": 0.5068, "step": 2730 }, { "epoch": 38.0, - "eval_loss": 0.5182300806045532, - "eval_runtime": 129.021, - "eval_samples_per_second": 4.123, - "eval_steps_per_second": 0.519, - "eval_wer": 0.253712155299865, + "eval_loss": 0.5005291104316711, + "eval_runtime": 127.1967, + "eval_samples_per_second": 4.182, + "eval_steps_per_second": 0.527, + "eval_wer": 0.2576974995179019, "step": 2736 }, { "epoch": 38.06, - "learning_rate": 1.2140845070422536e-06, - "loss": 0.5536, + "learning_rate": 3.801371428571429e-05, + "loss": 0.5453, "step": 2740 }, { "epoch": 38.19, - "learning_rate": 1.2000000000000002e-06, - "loss": 0.5458, + "learning_rate": 3.800228571428571e-05, + "loss": 0.5197, "step": 2750 }, { "epoch": 38.33, - "learning_rate": 1.1859154929577465e-06, - "loss": 0.5247, + "learning_rate": 3.7990857142857146e-05, + "loss": 0.5116, "step": 2760 }, { "epoch": 38.47, - "learning_rate": 1.1718309859154931e-06, - "loss": 0.5405, + "learning_rate": 3.797942857142857e-05, + "loss": 0.534, "step": 2770 }, { "epoch": 38.61, - "learning_rate": 1.1577464788732395e-06, - "loss": 0.547, + "learning_rate": 3.7968000000000006e-05, + "loss": 0.5331, "step": 2780 }, { "epoch": 38.75, - "learning_rate": 1.143661971830986e-06, - "loss": 0.5321, + "learning_rate": 3.795657142857143e-05, + "loss": 0.5257, "step": 2790 }, { "epoch": 38.89, - "learning_rate": 1.1295774647887325e-06, - "loss": 0.5248, + "learning_rate": 3.794514285714286e-05, + "loss": 0.5238, "step": 2800 }, { "epoch": 39.0, - "eval_loss": 0.5239952206611633, - "eval_runtime": 129.8341, - "eval_samples_per_second": 4.098, - "eval_steps_per_second": 0.516, - "eval_wer": 0.2528765186089863, + "eval_loss": 0.4947085976600647, + "eval_runtime": 126.2304, + "eval_samples_per_second": 4.215, + "eval_steps_per_second": 0.531, + "eval_wer": 0.24689850228193097, "step": 2808 }, { "epoch": 39.03, - "learning_rate": 1.115492957746479e-06, - "loss": 0.5514, + "learning_rate": 3.793371428571429e-05, + "loss": 0.5501, "step": 2810 }, { "epoch": 39.17, - "learning_rate": 1.1014084507042254e-06, - "loss": 0.5394, + "learning_rate": 3.7922285714285713e-05, + "loss": 0.5189, "step": 2820 }, { "epoch": 39.3, - "learning_rate": 1.0873239436619718e-06, - "loss": 0.5387, + "learning_rate": 3.791085714285715e-05, + "loss": 0.5116, "step": 2830 }, { "epoch": 39.44, - "learning_rate": 1.0732394366197184e-06, - "loss": 0.513, + "learning_rate": 3.7899428571428574e-05, + "loss": 0.5014, "step": 2840 }, { "epoch": 39.58, - "learning_rate": 1.059154929577465e-06, - "loss": 0.5425, + "learning_rate": 3.788800000000001e-05, + "loss": 0.5312, "step": 2850 }, { "epoch": 39.72, - "learning_rate": 1.0450704225352113e-06, - "loss": 0.5397, + "learning_rate": 3.7876571428571434e-05, + "loss": 0.5283, "step": 2860 }, { "epoch": 39.86, - "learning_rate": 1.030985915492958e-06, - "loss": 0.5407, + "learning_rate": 3.786514285714286e-05, + "loss": 0.5157, "step": 2870 }, { "epoch": 40.0, - "learning_rate": 1.0169014084507043e-06, - "loss": 0.5295, + "learning_rate": 3.785371428571429e-05, + "loss": 0.548, "step": 2880 }, { "epoch": 40.0, - "eval_loss": 0.5250394940376282, - "eval_runtime": 128.5995, - "eval_samples_per_second": 4.137, - "eval_steps_per_second": 0.521, - "eval_wer": 0.2562833451179533, + "eval_loss": 0.503398597240448, + "eval_runtime": 125.9549, + "eval_samples_per_second": 4.224, + "eval_steps_per_second": 0.532, + "eval_wer": 0.2570547020633798, "step": 2880 }, { "epoch": 40.14, - "learning_rate": 1.0028169014084507e-06, - "loss": 0.5626, + "learning_rate": 3.7842285714285714e-05, + "loss": 0.5398, "step": 2890 }, { "epoch": 40.28, - "learning_rate": 9.887323943661973e-07, - "loss": 0.5362, + "learning_rate": 3.783085714285715e-05, + "loss": 0.518, "step": 2900 }, { "epoch": 40.42, - "learning_rate": 9.746478873239436e-07, - "loss": 0.5354, + "learning_rate": 3.7819428571428574e-05, + "loss": 0.5167, "step": 2910 }, { "epoch": 40.55, - "learning_rate": 9.605633802816902e-07, - "loss": 0.5444, + "learning_rate": 3.780800000000001e-05, + "loss": 0.5301, "step": 2920 }, { "epoch": 40.69, - "learning_rate": 9.464788732394367e-07, - "loss": 0.5232, + "learning_rate": 3.7796571428571435e-05, + "loss": 0.5143, "step": 2930 }, { "epoch": 40.83, - "learning_rate": 9.323943661971832e-07, - "loss": 0.5378, + "learning_rate": 3.778514285714286e-05, + "loss": 0.5414, "step": 2940 }, { "epoch": 40.97, - "learning_rate": 9.183098591549297e-07, - "loss": 0.5343, + "learning_rate": 3.777371428571429e-05, + "loss": 0.5301, "step": 2950 }, { "epoch": 41.0, - "eval_loss": 0.5179165601730347, - "eval_runtime": 129.1365, - "eval_samples_per_second": 4.12, - "eval_steps_per_second": 0.519, - "eval_wer": 0.2536478755544128, + "eval_loss": 0.5064073204994202, + "eval_runtime": 126.5243, + "eval_samples_per_second": 4.205, + "eval_steps_per_second": 0.53, + "eval_wer": 0.25075528700906347, "step": 2952 }, { "epoch": 41.11, - "learning_rate": 9.04225352112676e-07, - "loss": 0.5501, + "learning_rate": 3.7762285714285715e-05, + "loss": 0.5575, "step": 2960 }, { "epoch": 41.25, - "learning_rate": 8.901408450704225e-07, - "loss": 0.5334, + "learning_rate": 3.775085714285715e-05, + "loss": 0.5367, "step": 2970 }, { "epoch": 41.39, - "learning_rate": 8.76056338028169e-07, - "loss": 0.5379, + "learning_rate": 3.7739428571428575e-05, + "loss": 0.5342, "step": 2980 }, { "epoch": 41.53, - "learning_rate": 8.619718309859156e-07, - "loss": 0.54, + "learning_rate": 3.7728e-05, + "loss": 0.5337, "step": 2990 }, { "epoch": 41.66, - "learning_rate": 8.478873239436621e-07, - "loss": 0.5446, + "learning_rate": 3.771657142857143e-05, + "loss": 0.5495, "step": 3000 }, { "epoch": 41.8, - "learning_rate": 8.338028169014086e-07, - "loss": 0.5478, + "learning_rate": 3.770514285714286e-05, + "loss": 0.5376, "step": 3010 }, { "epoch": 41.94, - "learning_rate": 8.19718309859155e-07, - "loss": 0.5255, + "learning_rate": 3.769371428571429e-05, + "loss": 0.5082, "step": 3020 }, { "epoch": 42.0, - "eval_loss": 0.5213496685028076, - "eval_runtime": 130.2226, - "eval_samples_per_second": 4.085, - "eval_steps_per_second": 0.515, - "eval_wer": 0.2560262261361445, + "eval_loss": 0.5106186270713806, + "eval_runtime": 126.5158, + "eval_samples_per_second": 4.205, + "eval_steps_per_second": 0.53, + "eval_wer": 0.2569904223179276, "step": 3024 }, { "epoch": 42.08, - "learning_rate": 8.056338028169015e-07, - "loss": 0.5457, + "learning_rate": 3.7682285714285716e-05, + "loss": 0.5485, "step": 3030 }, { "epoch": 42.22, - "learning_rate": 7.915492957746479e-07, - "loss": 0.5311, + "learning_rate": 3.767085714285715e-05, + "loss": 0.5156, "step": 3040 }, { "epoch": 42.36, - "learning_rate": 7.774647887323944e-07, - "loss": 0.5355, + "learning_rate": 3.7659428571428576e-05, + "loss": 0.5435, "step": 3050 }, { "epoch": 42.5, - "learning_rate": 7.633802816901409e-07, - "loss": 0.5426, + "learning_rate": 3.7648e-05, + "loss": 0.5337, "step": 3060 }, { "epoch": 42.64, - "learning_rate": 7.492957746478873e-07, - "loss": 0.5349, + "learning_rate": 3.763657142857143e-05, + "loss": 0.5327, "step": 3070 }, { "epoch": 42.78, - "learning_rate": 7.352112676056339e-07, - "loss": 0.5379, + "learning_rate": 3.762514285714286e-05, + "loss": 0.5371, "step": 3080 }, { "epoch": 42.91, - "learning_rate": 7.211267605633804e-07, - "loss": 0.525, + "learning_rate": 3.761371428571429e-05, + "loss": 0.5206, "step": 3090 }, { "epoch": 43.0, - "eval_loss": 0.522071123123169, - "eval_runtime": 128.4426, - "eval_samples_per_second": 4.142, - "eval_steps_per_second": 0.522, - "eval_wer": 0.2553191489361702, + "eval_loss": 0.5208801627159119, + "eval_runtime": 126.2182, + "eval_samples_per_second": 4.215, + "eval_steps_per_second": 0.531, + "eval_wer": 0.250305328790898, "step": 3096 }, { "epoch": 43.06, - "learning_rate": 7.070422535211269e-07, - "loss": 0.5591, + "learning_rate": 3.7602285714285717e-05, + "loss": 0.5611, "step": 3100 }, { "epoch": 43.19, - "learning_rate": 6.929577464788733e-07, - "loss": 0.5328, + "learning_rate": 3.759085714285715e-05, + "loss": 0.5434, "step": 3110 }, { "epoch": 43.33, - "learning_rate": 6.788732394366197e-07, - "loss": 0.5427, + "learning_rate": 3.757942857142857e-05, + "loss": 0.5476, "step": 3120 }, { "epoch": 43.47, - "learning_rate": 6.647887323943662e-07, - "loss": 0.5322, + "learning_rate": 3.7568000000000004e-05, + "loss": 0.5376, "step": 3130 }, { "epoch": 43.61, - "learning_rate": 6.507042253521127e-07, - "loss": 0.5293, + "learning_rate": 3.755657142857143e-05, + "loss": 0.5375, "step": 3140 }, { "epoch": 43.75, - "learning_rate": 6.366197183098592e-07, - "loss": 0.5299, + "learning_rate": 3.7545142857142864e-05, + "loss": 0.5181, "step": 3150 }, { "epoch": 43.89, - "learning_rate": 6.225352112676057e-07, - "loss": 0.5345, + "learning_rate": 3.753371428571429e-05, + "loss": 0.5174, "step": 3160 }, { "epoch": 44.0, - "eval_loss": 0.5230171084403992, - "eval_runtime": 129.6367, - "eval_samples_per_second": 4.104, - "eval_steps_per_second": 0.517, - "eval_wer": 0.25306935784534296, + "eval_loss": 0.5150790214538574, + "eval_runtime": 126.4932, + "eval_samples_per_second": 4.206, + "eval_steps_per_second": 0.53, + "eval_wer": 0.24259175933663302, "step": 3168 }, { "epoch": 44.03, - "learning_rate": 6.084507042253521e-07, - "loss": 0.5468, + "learning_rate": 3.752228571428572e-05, + "loss": 0.5456, "step": 3170 }, { "epoch": 44.17, - "learning_rate": 5.943661971830986e-07, - "loss": 0.5317, + "learning_rate": 3.7510857142857144e-05, + "loss": 0.5191, "step": 3180 }, { "epoch": 44.3, - "learning_rate": 5.802816901408451e-07, - "loss": 0.5357, + "learning_rate": 3.749942857142857e-05, + "loss": 0.5328, "step": 3190 }, { "epoch": 44.44, - "learning_rate": 5.661971830985916e-07, - "loss": 0.5407, + "learning_rate": 3.7488000000000004e-05, + "loss": 0.5301, "step": 3200 }, { "epoch": 44.58, - "learning_rate": 5.521126760563381e-07, - "loss": 0.5388, + "learning_rate": 3.747657142857143e-05, + "loss": 0.5283, "step": 3210 }, { "epoch": 44.72, - "learning_rate": 5.380281690140846e-07, - "loss": 0.5096, + "learning_rate": 3.7465142857142865e-05, + "loss": 0.4951, "step": 3220 }, { "epoch": 44.86, - "learning_rate": 5.23943661971831e-07, - "loss": 0.5349, + "learning_rate": 3.745371428571429e-05, + "loss": 0.5281, "step": 3230 }, { "epoch": 45.0, - "learning_rate": 5.098591549295775e-07, - "loss": 0.5485, + "learning_rate": 3.744228571428572e-05, + "loss": 0.5281, "step": 3240 }, { "epoch": 45.0, - "eval_loss": 0.52115797996521, - "eval_runtime": 128.2514, - "eval_samples_per_second": 4.148, - "eval_steps_per_second": 0.522, - "eval_wer": 0.253712155299865, + "eval_loss": 0.5101660490036011, + "eval_runtime": 126.5347, + "eval_samples_per_second": 4.204, + "eval_steps_per_second": 0.529, + "eval_wer": 0.23963489104583147, "step": 3240 }, { "epoch": 45.14, - "learning_rate": 4.95774647887324e-07, - "loss": 0.536, + "learning_rate": 3.7430857142857145e-05, + "loss": 0.5226, "step": 3250 }, { "epoch": 45.28, - "learning_rate": 4.816901408450705e-07, - "loss": 0.5245, + "learning_rate": 3.741942857142857e-05, + "loss": 0.524, "step": 3260 }, { "epoch": 45.42, - "learning_rate": 4.6760563380281696e-07, - "loss": 0.5197, + "learning_rate": 3.7408000000000005e-05, + "loss": 0.5102, "step": 3270 }, { "epoch": 45.55, - "learning_rate": 4.535211267605634e-07, - "loss": 0.5556, + "learning_rate": 3.739657142857143e-05, + "loss": 0.5185, "step": 3280 }, { "epoch": 45.69, - "learning_rate": 4.3943661971830987e-07, - "loss": 0.5254, + "learning_rate": 3.7385142857142865e-05, + "loss": 0.5062, "step": 3290 }, { "epoch": 45.83, - "learning_rate": 4.253521126760564e-07, - "loss": 0.5375, + "learning_rate": 3.737371428571429e-05, + "loss": 0.5303, "step": 3300 }, { "epoch": 45.97, - "learning_rate": 4.1126760563380283e-07, - "loss": 0.5471, + "learning_rate": 3.736228571428571e-05, + "loss": 0.5204, "step": 3310 }, { "epoch": 46.0, - "eval_loss": 0.5214569568634033, - "eval_runtime": 128.944, - "eval_samples_per_second": 4.126, - "eval_steps_per_second": 0.52, - "eval_wer": 0.25319791733624736, + "eval_loss": 0.5097768902778625, + "eval_runtime": 127.439, + "eval_samples_per_second": 4.175, + "eval_steps_per_second": 0.526, + "eval_wer": 0.2465771035546699, "step": 3312 }, { "epoch": 46.11, - "learning_rate": 3.971830985915493e-07, - "loss": 0.5549, + "learning_rate": 3.7350857142857146e-05, + "loss": 0.5366, "step": 3320 }, { "epoch": 46.25, - "learning_rate": 3.830985915492958e-07, - "loss": 0.5379, + "learning_rate": 3.733942857142857e-05, + "loss": 0.5188, "step": 3330 }, { "epoch": 46.39, - "learning_rate": 3.690140845070423e-07, - "loss": 0.521, + "learning_rate": 3.7328000000000006e-05, + "loss": 0.5203, "step": 3340 }, { "epoch": 46.53, - "learning_rate": 3.5492957746478875e-07, - "loss": 0.5369, + "learning_rate": 3.731657142857143e-05, + "loss": 0.5128, "step": 3350 }, { "epoch": 46.66, - "learning_rate": 3.4084507042253523e-07, - "loss": 0.5292, + "learning_rate": 3.730514285714286e-05, + "loss": 0.5065, "step": 3360 }, { "epoch": 46.8, - "learning_rate": 3.267605633802817e-07, - "loss": 0.5373, + "learning_rate": 3.7293714285714286e-05, + "loss": 0.5214, "step": 3370 }, { "epoch": 46.94, - "learning_rate": 3.126760563380282e-07, - "loss": 0.5375, + "learning_rate": 3.728228571428571e-05, + "loss": 0.5064, "step": 3380 }, { "epoch": 47.0, - "eval_loss": 0.5215560793876648, - "eval_runtime": 128.748, - "eval_samples_per_second": 4.132, - "eval_steps_per_second": 0.52, - "eval_wer": 0.2543549527543871, + "eval_loss": 0.5148393511772156, + "eval_runtime": 127.9513, + "eval_samples_per_second": 4.158, + "eval_steps_per_second": 0.524, + "eval_wer": 0.24837693642733175, "step": 3384 }, { "epoch": 47.08, - "learning_rate": 2.985915492957747e-07, - "loss": 0.5496, + "learning_rate": 3.7270857142857146e-05, + "loss": 0.5263, "step": 3390 }, { "epoch": 47.22, - "learning_rate": 2.8450704225352116e-07, - "loss": 0.5405, + "learning_rate": 3.725942857142857e-05, + "loss": 0.5031, "step": 3400 }, { "epoch": 47.36, - "learning_rate": 2.7042253521126764e-07, - "loss": 0.5353, + "learning_rate": 3.7248000000000007e-05, + "loss": 0.5043, "step": 3410 }, { "epoch": 47.5, - "learning_rate": 2.563380281690141e-07, - "loss": 0.5449, + "learning_rate": 3.723657142857143e-05, + "loss": 0.5047, "step": 3420 }, { "epoch": 47.64, - "learning_rate": 2.422535211267606e-07, - "loss": 0.5415, + "learning_rate": 3.722514285714286e-05, + "loss": 0.4999, "step": 3430 }, { "epoch": 47.78, - "learning_rate": 2.2816901408450706e-07, - "loss": 0.5322, + "learning_rate": 3.721371428571429e-05, + "loss": 0.5159, "step": 3440 }, { "epoch": 47.91, - "learning_rate": 2.1408450704225354e-07, - "loss": 0.5229, + "learning_rate": 3.7202285714285714e-05, + "loss": 0.5014, "step": 3450 }, { "epoch": 48.0, - "eval_loss": 0.5208937525749207, - "eval_runtime": 128.6533, - "eval_samples_per_second": 4.135, - "eval_steps_per_second": 0.521, - "eval_wer": 0.2551263096998136, + "eval_loss": 0.5260804891586304, + "eval_runtime": 127.2758, + "eval_samples_per_second": 4.18, + "eval_steps_per_second": 0.526, + "eval_wer": 0.2479912579546185, "step": 3456 }, { "epoch": 48.06, - "learning_rate": 2.0000000000000002e-07, - "loss": 0.5553, + "learning_rate": 3.719085714285715e-05, + "loss": 0.5386, "step": 3460 }, { "epoch": 48.19, - "learning_rate": 1.8591549295774647e-07, - "loss": 0.5291, + "learning_rate": 3.7179428571428574e-05, + "loss": 0.5085, "step": 3470 }, { "epoch": 48.33, - "learning_rate": 1.7183098591549298e-07, - "loss": 0.5476, + "learning_rate": 3.716800000000001e-05, + "loss": 0.5237, "step": 3480 }, { "epoch": 48.47, - "learning_rate": 1.5774647887323943e-07, - "loss": 0.5228, + "learning_rate": 3.7156571428571434e-05, + "loss": 0.5033, "step": 3490 }, { "epoch": 48.61, - "learning_rate": 1.4366197183098591e-07, - "loss": 0.5252, + "learning_rate": 3.714514285714286e-05, + "loss": 0.5235, "step": 3500 }, { "epoch": 48.75, - "learning_rate": 1.295774647887324e-07, - "loss": 0.5434, + "learning_rate": 3.713371428571429e-05, + "loss": 0.5445, "step": 3510 }, { "epoch": 48.89, - "learning_rate": 1.1549295774647888e-07, - "loss": 0.5218, + "learning_rate": 3.7122285714285714e-05, + "loss": 0.5363, "step": 3520 }, { "epoch": 49.0, - "eval_loss": 0.5215969085693359, - "eval_runtime": 129.6533, - "eval_samples_per_second": 4.103, - "eval_steps_per_second": 0.517, - "eval_wer": 0.2536478755544128, + "eval_loss": 0.49922609329223633, + "eval_runtime": 127.0007, + "eval_samples_per_second": 4.189, + "eval_steps_per_second": 0.528, + "eval_wer": 0.2517837629362988, "step": 3528 }, { "epoch": 49.03, - "learning_rate": 1.0281690140845071e-07, - "loss": 0.5535, + "learning_rate": 3.711085714285715e-05, + "loss": 0.5449, "step": 3530 }, { "epoch": 49.17, - "learning_rate": 8.873239436619719e-08, - "loss": 0.529, + "learning_rate": 3.7099428571428575e-05, + "loss": 0.5164, "step": 3540 }, { "epoch": 49.3, - "learning_rate": 7.464788732394367e-08, - "loss": 0.5316, + "learning_rate": 3.7088e-05, + "loss": 0.5243, "step": 3550 }, { "epoch": 49.44, - "learning_rate": 6.056338028169015e-08, - "loss": 0.5191, + "learning_rate": 3.707657142857143e-05, + "loss": 0.5033, "step": 3560 }, { "epoch": 49.58, - "learning_rate": 4.647887323943662e-08, - "loss": 0.5505, + "learning_rate": 3.706514285714286e-05, + "loss": 0.5197, "step": 3570 }, { "epoch": 49.72, - "learning_rate": 3.23943661971831e-08, - "loss": 0.5328, + "learning_rate": 3.705371428571429e-05, + "loss": 0.5211, "step": 3580 }, { "epoch": 49.86, - "learning_rate": 1.830985915492958e-08, - "loss": 0.5271, + "learning_rate": 3.704228571428572e-05, + "loss": 0.5094, "step": 3590 }, { "epoch": 50.0, - "learning_rate": 4.225352112676057e-09, - "loss": 0.5292, + "learning_rate": 3.703085714285715e-05, + "loss": 0.5048, "step": 3600 }, { "epoch": 50.0, - "eval_loss": 0.5207646489143372, - "eval_runtime": 128.939, - "eval_samples_per_second": 4.126, - "eval_steps_per_second": 0.52, - "eval_wer": 0.25448351224529153, + "eval_loss": 0.5168222784996033, + "eval_runtime": 126.7305, + "eval_samples_per_second": 4.198, + "eval_steps_per_second": 0.529, + "eval_wer": 0.25107668573632447, "step": 3600 }, { - "epoch": 50.0, - "step": 3600, - "total_flos": 1.3601359172236221e+20, - "train_loss": 0.5537465457121531, - "train_runtime": 95750.0723, - "train_samples_per_second": 2.411, + "epoch": 50.14, + "learning_rate": 3.7020571428571434e-05, + "loss": 0.5159, + "step": 3610 + }, + { + "epoch": 50.28, + "learning_rate": 3.700914285714286e-05, + "loss": 0.4974, + "step": 3620 + }, + { + "epoch": 50.42, + "learning_rate": 3.699771428571429e-05, + "loss": 0.5034, + "step": 3630 + }, + { + "epoch": 50.55, + "learning_rate": 3.6986285714285714e-05, + "loss": 0.5091, + "step": 3640 + }, + { + "epoch": 50.69, + "learning_rate": 3.697485714285715e-05, + "loss": 0.5009, + "step": 3650 + }, + { + "epoch": 50.83, + "learning_rate": 3.6963428571428575e-05, + "loss": 0.5132, + "step": 3660 + }, + { + "epoch": 50.97, + "learning_rate": 3.6952e-05, + "loss": 0.5168, + "step": 3670 + }, + { + "epoch": 51.0, + "eval_loss": 0.5151329040527344, + "eval_runtime": 126.3015, + "eval_samples_per_second": 4.212, + "eval_steps_per_second": 0.53, + "eval_wer": 0.24503438966381694, + "step": 3672 + }, + { + "epoch": 51.11, + "learning_rate": 3.6940571428571435e-05, + "loss": 0.5321, + "step": 3680 + }, + { + "epoch": 51.25, + "learning_rate": 3.692914285714286e-05, + "loss": 0.516, + "step": 3690 + }, + { + "epoch": 51.39, + "learning_rate": 3.691771428571429e-05, + "loss": 0.5108, + "step": 3700 + }, + { + "epoch": 51.53, + "learning_rate": 3.6906285714285715e-05, + "loss": 0.5258, + "step": 3710 + }, + { + "epoch": 51.66, + "learning_rate": 3.689485714285715e-05, + "loss": 0.5001, + "step": 3720 + }, + { + "epoch": 51.8, + "learning_rate": 3.6883428571428575e-05, + "loss": 0.4999, + "step": 3730 + }, + { + "epoch": 51.94, + "learning_rate": 3.6872e-05, + "loss": 0.5167, + "step": 3740 + }, + { + "epoch": 52.0, + "eval_loss": 0.5150521397590637, + "eval_runtime": 126.1801, + "eval_samples_per_second": 4.216, + "eval_steps_per_second": 0.531, + "eval_wer": 0.24265603908208525, + "step": 3744 + }, + { + "epoch": 52.08, + "learning_rate": 3.6860571428571436e-05, + "loss": 0.5261, + "step": 3750 + }, + { + "epoch": 52.22, + "learning_rate": 3.6849142857142856e-05, + "loss": 0.5159, + "step": 3760 + }, + { + "epoch": 52.36, + "learning_rate": 3.683771428571429e-05, + "loss": 0.5199, + "step": 3770 + }, + { + "epoch": 52.5, + "learning_rate": 3.6826285714285716e-05, + "loss": 0.507, + "step": 3780 + }, + { + "epoch": 52.64, + "learning_rate": 3.681485714285715e-05, + "loss": 0.4992, + "step": 3790 + }, + { + "epoch": 52.78, + "learning_rate": 3.6803428571428576e-05, + "loss": 0.5194, + "step": 3800 + }, + { + "epoch": 52.91, + "learning_rate": 3.6792e-05, + "loss": 0.5106, + "step": 3810 + }, + { + "epoch": 53.0, + "eval_loss": 0.5151193737983704, + "eval_runtime": 126.2191, + "eval_samples_per_second": 4.215, + "eval_steps_per_second": 0.531, + "eval_wer": 0.23629234428231663, + "step": 3816 + }, + { + "epoch": 53.06, + "learning_rate": 3.678057142857143e-05, + "loss": 0.5237, + "step": 3820 + }, + { + "epoch": 53.19, + "learning_rate": 3.6769142857142856e-05, + "loss": 0.5112, + "step": 3830 + }, + { + "epoch": 53.33, + "learning_rate": 3.675771428571429e-05, + "loss": 0.5202, + "step": 3840 + }, + { + "epoch": 53.47, + "learning_rate": 3.6746285714285717e-05, + "loss": 0.5086, + "step": 3850 + }, + { + "epoch": 53.61, + "learning_rate": 3.673485714285715e-05, + "loss": 0.5063, + "step": 3860 + }, + { + "epoch": 53.75, + "learning_rate": 3.672342857142858e-05, + "loss": 0.5061, + "step": 3870 + }, + { + "epoch": 53.89, + "learning_rate": 3.6712000000000004e-05, + "loss": 0.4905, + "step": 3880 + }, + { + "epoch": 54.0, + "eval_loss": 0.5064216256141663, + "eval_runtime": 126.8837, + "eval_samples_per_second": 4.193, + "eval_steps_per_second": 0.528, + "eval_wer": 0.2598187311178248, + "step": 3888 + }, + { + "epoch": 54.03, + "learning_rate": 3.670057142857143e-05, + "loss": 0.5377, + "step": 3890 + }, + { + "epoch": 54.17, + "learning_rate": 3.668914285714286e-05, + "loss": 0.4957, + "step": 3900 + }, + { + "epoch": 54.3, + "learning_rate": 3.667771428571429e-05, + "loss": 0.5143, + "step": 3910 + }, + { + "epoch": 54.44, + "learning_rate": 3.666628571428572e-05, + "loss": 0.4976, + "step": 3920 + }, + { + "epoch": 54.58, + "learning_rate": 3.665485714285715e-05, + "loss": 0.5083, + "step": 3930 + }, + { + "epoch": 54.72, + "learning_rate": 3.664342857142858e-05, + "loss": 0.5017, + "step": 3940 + }, + { + "epoch": 54.86, + "learning_rate": 3.6632e-05, + "loss": 0.5087, + "step": 3950 + }, + { + "epoch": 55.0, + "learning_rate": 3.662057142857143e-05, + "loss": 0.5048, + "step": 3960 + }, + { + "epoch": 55.0, + "eval_loss": 0.47900819778442383, + "eval_runtime": 126.4061, + "eval_samples_per_second": 4.209, + "eval_steps_per_second": 0.53, + "eval_wer": 0.24336311628205953, + "step": 3960 + }, + { + "epoch": 55.14, + "learning_rate": 3.660914285714286e-05, + "loss": 0.4927, + "step": 3970 + }, + { + "epoch": 55.28, + "learning_rate": 3.659771428571429e-05, + "loss": 0.5082, + "step": 3980 + }, + { + "epoch": 55.42, + "learning_rate": 3.658628571428572e-05, + "loss": 0.5044, + "step": 3990 + }, + { + "epoch": 55.55, + "learning_rate": 3.6574857142857145e-05, + "loss": 0.4976, + "step": 4000 + }, + { + "epoch": 55.69, + "learning_rate": 3.656342857142857e-05, + "loss": 0.5041, + "step": 4010 + }, + { + "epoch": 55.83, + "learning_rate": 3.6552e-05, + "loss": 0.5126, + "step": 4020 + }, + { + "epoch": 55.97, + "learning_rate": 3.654057142857143e-05, + "loss": 0.5197, + "step": 4030 + }, + { + "epoch": 56.0, + "eval_loss": 0.5163145065307617, + "eval_runtime": 126.4091, + "eval_samples_per_second": 4.209, + "eval_steps_per_second": 0.53, + "eval_wer": 0.25101240599087227, + "step": 4032 + }, + { + "epoch": 56.11, + "learning_rate": 3.652914285714286e-05, + "loss": 0.4997, + "step": 4040 + }, + { + "epoch": 56.25, + "learning_rate": 3.651771428571429e-05, + "loss": 0.5047, + "step": 4050 + }, + { + "epoch": 56.39, + "learning_rate": 3.650628571428572e-05, + "loss": 0.4951, + "step": 4060 + }, + { + "epoch": 56.53, + "learning_rate": 3.6494857142857146e-05, + "loss": 0.5151, + "step": 4070 + }, + { + "epoch": 56.66, + "learning_rate": 3.648342857142857e-05, + "loss": 0.4921, + "step": 4080 + }, + { + "epoch": 56.8, + "learning_rate": 3.6472000000000006e-05, + "loss": 0.5158, + "step": 4090 + }, + { + "epoch": 56.94, + "learning_rate": 3.646057142857143e-05, + "loss": 0.5167, + "step": 4100 + }, + { + "epoch": 57.0, + "eval_loss": 0.5512666702270508, + "eval_runtime": 126.0221, + "eval_samples_per_second": 4.221, + "eval_steps_per_second": 0.532, + "eval_wer": 0.2513338047181333, + "step": 4104 + }, + { + "epoch": 57.08, + "learning_rate": 3.644914285714286e-05, + "loss": 0.5271, + "step": 4110 + }, + { + "epoch": 57.22, + "learning_rate": 3.643771428571429e-05, + "loss": 0.5089, + "step": 4120 + }, + { + "epoch": 57.36, + "learning_rate": 3.642628571428572e-05, + "loss": 0.5059, + "step": 4130 + }, + { + "epoch": 57.5, + "learning_rate": 3.6414857142857146e-05, + "loss": 0.5025, + "step": 4140 + }, + { + "epoch": 57.64, + "learning_rate": 3.640342857142857e-05, + "loss": 0.4938, + "step": 4150 + }, + { + "epoch": 57.78, + "learning_rate": 3.639200000000001e-05, + "loss": 0.5066, + "step": 4160 + }, + { + "epoch": 57.91, + "learning_rate": 3.6380571428571433e-05, + "loss": 0.4881, + "step": 4170 + }, + { + "epoch": 58.0, + "eval_loss": 0.5513039231300354, + "eval_runtime": 126.7483, + "eval_samples_per_second": 4.197, + "eval_steps_per_second": 0.529, + "eval_wer": 0.250305328790898, + "step": 4176 + }, + { + "epoch": 58.06, + "learning_rate": 3.636914285714286e-05, + "loss": 0.53, + "step": 4180 + }, + { + "epoch": 58.19, + "learning_rate": 3.635771428571429e-05, + "loss": 0.5054, + "step": 4190 + }, + { + "epoch": 58.33, + "learning_rate": 3.6346285714285714e-05, + "loss": 0.5133, + "step": 4200 + }, + { + "epoch": 58.47, + "learning_rate": 3.633485714285715e-05, + "loss": 0.5058, + "step": 4210 + }, + { + "epoch": 58.61, + "learning_rate": 3.6323428571428574e-05, + "loss": 0.5022, + "step": 4220 + }, + { + "epoch": 58.75, + "learning_rate": 3.631200000000001e-05, + "loss": 0.5251, + "step": 4230 + }, + { + "epoch": 58.89, + "learning_rate": 3.6300571428571434e-05, + "loss": 0.5064, + "step": 4240 + }, + { + "epoch": 59.0, + "eval_loss": 0.4960590898990631, + "eval_runtime": 126.6334, + "eval_samples_per_second": 4.201, + "eval_steps_per_second": 0.529, + "eval_wer": 0.24432731246384265, + "step": 4248 + }, + { + "epoch": 59.03, + "learning_rate": 3.628914285714286e-05, + "loss": 0.5172, + "step": 4250 + }, + { + "epoch": 59.17, + "learning_rate": 3.627771428571429e-05, + "loss": 0.4799, + "step": 4260 + }, + { + "epoch": 59.3, + "learning_rate": 3.6266285714285714e-05, + "loss": 0.5008, + "step": 4270 + }, + { + "epoch": 59.44, + "learning_rate": 3.625485714285715e-05, + "loss": 0.5117, + "step": 4280 + }, + { + "epoch": 59.58, + "learning_rate": 3.6243428571428575e-05, + "loss": 0.5219, + "step": 4290 + }, + { + "epoch": 59.72, + "learning_rate": 3.623200000000001e-05, + "loss": 0.5056, + "step": 4300 + }, + { + "epoch": 59.86, + "learning_rate": 3.6220571428571435e-05, + "loss": 0.4722, + "step": 4310 + }, + { + "epoch": 60.0, + "learning_rate": 3.6209142857142855e-05, + "loss": 0.498, + "step": 4320 + }, + { + "epoch": 60.0, + "eval_loss": 0.5065157413482666, + "eval_runtime": 126.3827, + "eval_samples_per_second": 4.209, + "eval_steps_per_second": 0.53, + "eval_wer": 0.24239892010027642, + "step": 4320 + }, + { + "epoch": 60.14, + "learning_rate": 3.619771428571429e-05, + "loss": 0.5047, + "step": 4330 + }, + { + "epoch": 60.28, + "learning_rate": 3.6186285714285715e-05, + "loss": 0.4955, + "step": 4340 + }, + { + "epoch": 60.42, + "learning_rate": 3.617485714285715e-05, + "loss": 0.4973, + "step": 4350 + }, + { + "epoch": 60.55, + "learning_rate": 3.6163428571428575e-05, + "loss": 0.4918, + "step": 4360 + }, + { + "epoch": 60.69, + "learning_rate": 3.6152e-05, + "loss": 0.4985, + "step": 4370 + }, + { + "epoch": 60.83, + "learning_rate": 3.614057142857143e-05, + "loss": 0.4986, + "step": 4380 + }, + { + "epoch": 60.97, + "learning_rate": 3.6129142857142856e-05, + "loss": 0.4935, + "step": 4390 + }, + { + "epoch": 61.0, + "eval_loss": 0.5017430782318115, + "eval_runtime": 127.0172, + "eval_samples_per_second": 4.188, + "eval_steps_per_second": 0.527, + "eval_wer": 0.2515266439544899, + "step": 4392 + }, + { + "epoch": 61.11, + "learning_rate": 3.611771428571429e-05, + "loss": 0.5215, + "step": 4400 + }, + { + "epoch": 61.25, + "learning_rate": 3.6106285714285716e-05, + "loss": 0.5085, + "step": 4410 + }, + { + "epoch": 61.39, + "learning_rate": 3.609485714285715e-05, + "loss": 0.4893, + "step": 4420 + }, + { + "epoch": 61.53, + "learning_rate": 3.6083428571428576e-05, + "loss": 0.4798, + "step": 4430 + }, + { + "epoch": 61.66, + "learning_rate": 3.6072e-05, + "loss": 0.4679, + "step": 4440 + }, + { + "epoch": 61.8, + "learning_rate": 3.606057142857143e-05, + "loss": 0.5045, + "step": 4450 + }, + { + "epoch": 61.94, + "learning_rate": 3.6049142857142856e-05, + "loss": 0.4979, + "step": 4460 + }, + { + "epoch": 62.0, + "eval_loss": 0.4908694624900818, + "eval_runtime": 126.2259, + "eval_samples_per_second": 4.215, + "eval_steps_per_second": 0.531, + "eval_wer": 0.2377064986822652, + "step": 4464 + }, + { + "epoch": 62.08, + "learning_rate": 3.603771428571429e-05, + "loss": 0.5234, + "step": 4470 + }, + { + "epoch": 62.22, + "learning_rate": 3.602628571428572e-05, + "loss": 0.5053, + "step": 4480 + }, + { + "epoch": 62.36, + "learning_rate": 3.601485714285715e-05, + "loss": 0.5064, + "step": 4490 + }, + { + "epoch": 62.5, + "learning_rate": 3.600342857142858e-05, + "loss": 0.4974, + "step": 4500 + }, + { + "epoch": 62.64, + "learning_rate": 3.5992000000000004e-05, + "loss": 0.4835, + "step": 4510 + }, + { + "epoch": 62.78, + "learning_rate": 3.598057142857143e-05, + "loss": 0.5007, + "step": 4520 + }, + { + "epoch": 62.91, + "learning_rate": 3.596914285714286e-05, + "loss": 0.4867, + "step": 4530 + }, + { + "epoch": 63.0, + "eval_loss": 0.5188583731651306, + "eval_runtime": 126.578, + "eval_samples_per_second": 4.203, + "eval_steps_per_second": 0.529, + "eval_wer": 0.2393134923185704, + "step": 4536 + }, + { + "epoch": 63.06, + "learning_rate": 3.595771428571429e-05, + "loss": 0.5076, + "step": 4540 + }, + { + "epoch": 63.19, + "learning_rate": 3.594628571428572e-05, + "loss": 0.4969, + "step": 4550 + }, + { + "epoch": 63.33, + "learning_rate": 3.5934857142857144e-05, + "loss": 0.5029, + "step": 4560 + }, + { + "epoch": 63.47, + "learning_rate": 3.592342857142857e-05, + "loss": 0.4919, + "step": 4570 + }, + { + "epoch": 63.61, + "learning_rate": 3.5912000000000004e-05, + "loss": 0.4844, + "step": 4580 + }, + { + "epoch": 63.75, + "learning_rate": 3.590057142857143e-05, + "loss": 0.486, + "step": 4590 + }, + { + "epoch": 63.89, + "learning_rate": 3.588914285714286e-05, + "loss": 0.4804, + "step": 4600 + }, + { + "epoch": 64.0, + "eval_loss": 0.554358184337616, + "eval_runtime": 126.3581, + "eval_samples_per_second": 4.21, + "eval_steps_per_second": 0.53, + "eval_wer": 0.24606286559105225, + "step": 4608 + }, + { + "epoch": 64.03, + "learning_rate": 3.587771428571429e-05, + "loss": 0.5121, + "step": 4610 + }, + { + "epoch": 64.17, + "learning_rate": 3.586628571428572e-05, + "loss": 0.5081, + "step": 4620 + }, + { + "epoch": 64.3, + "learning_rate": 3.5854857142857145e-05, + "loss": 0.504, + "step": 4630 + }, + { + "epoch": 64.44, + "learning_rate": 3.584342857142857e-05, + "loss": 0.4815, + "step": 4640 + }, + { + "epoch": 64.58, + "learning_rate": 3.5832000000000005e-05, + "loss": 0.5042, + "step": 4650 + }, + { + "epoch": 64.72, + "learning_rate": 3.582057142857143e-05, + "loss": 0.4816, + "step": 4660 + }, + { + "epoch": 64.86, + "learning_rate": 3.580914285714286e-05, + "loss": 0.4955, + "step": 4670 + }, + { + "epoch": 65.0, + "learning_rate": 3.579771428571429e-05, + "loss": 0.4893, + "step": 4680 + }, + { + "epoch": 65.0, + "eval_loss": 0.5091788172721863, + "eval_runtime": 126.9715, + "eval_samples_per_second": 4.19, + "eval_steps_per_second": 0.528, + "eval_wer": 0.23841357588223952, + "step": 4680 + }, + { + "epoch": 65.14, + "learning_rate": 3.578628571428572e-05, + "loss": 0.5113, + "step": 4690 + }, + { + "epoch": 65.28, + "learning_rate": 3.5774857142857146e-05, + "loss": 0.5095, + "step": 4700 + }, + { + "epoch": 65.42, + "learning_rate": 3.576342857142857e-05, + "loss": 0.4809, + "step": 4710 + }, + { + "epoch": 65.55, + "learning_rate": 3.5752000000000006e-05, + "loss": 0.4829, + "step": 4720 + }, + { + "epoch": 65.69, + "learning_rate": 3.574057142857143e-05, + "loss": 0.4904, + "step": 4730 + }, + { + "epoch": 65.83, + "learning_rate": 3.572914285714286e-05, + "loss": 0.5061, + "step": 4740 + }, + { + "epoch": 65.97, + "learning_rate": 3.5717714285714286e-05, + "loss": 0.472, + "step": 4750 + }, + { + "epoch": 66.0, + "eval_loss": 0.5024771094322205, + "eval_runtime": 126.7045, + "eval_samples_per_second": 4.199, + "eval_steps_per_second": 0.529, + "eval_wer": 0.2422060808639198, + "step": 4752 + }, + { + "epoch": 66.11, + "learning_rate": 3.570628571428571e-05, + "loss": 0.5205, + "step": 4760 + }, + { + "epoch": 66.25, + "learning_rate": 3.5694857142857146e-05, + "loss": 0.5117, + "step": 4770 + }, + { + "epoch": 66.39, + "learning_rate": 3.568342857142857e-05, + "loss": 0.4942, + "step": 4780 + }, + { + "epoch": 66.53, + "learning_rate": 3.567200000000001e-05, + "loss": 0.4919, + "step": 4790 + }, + { + "epoch": 66.66, + "learning_rate": 3.5660571428571434e-05, + "loss": 0.487, + "step": 4800 + }, + { + "epoch": 66.8, + "learning_rate": 3.564914285714286e-05, + "loss": 0.4857, + "step": 4810 + }, + { + "epoch": 66.94, + "learning_rate": 3.563771428571429e-05, + "loss": 0.4829, + "step": 4820 + }, + { + "epoch": 67.0, + "eval_loss": 0.4762025475502014, + "eval_runtime": 126.1692, + "eval_samples_per_second": 4.217, + "eval_steps_per_second": 0.531, + "eval_wer": 0.23699942148229092, + "step": 4824 + }, + { + "epoch": 67.08, + "learning_rate": 3.5626285714285714e-05, + "loss": 0.4934, + "step": 4830 + }, + { + "epoch": 67.22, + "learning_rate": 3.561485714285715e-05, + "loss": 0.4918, + "step": 4840 + }, + { + "epoch": 67.36, + "learning_rate": 3.5603428571428574e-05, + "loss": 0.4703, + "step": 4850 + }, + { + "epoch": 67.5, + "learning_rate": 3.559200000000001e-05, + "loss": 0.4893, + "step": 4860 + }, + { + "epoch": 67.64, + "learning_rate": 3.5580571428571434e-05, + "loss": 0.5176, + "step": 4870 + }, + { + "epoch": 67.78, + "learning_rate": 3.556914285714286e-05, + "loss": 0.5218, + "step": 4880 + }, + { + "epoch": 67.91, + "learning_rate": 3.555771428571429e-05, + "loss": 0.5035, + "step": 4890 + }, + { + "epoch": 68.0, + "eval_loss": 0.5178850293159485, + "eval_runtime": 126.4705, + "eval_samples_per_second": 4.207, + "eval_steps_per_second": 0.53, + "eval_wer": 0.2515266439544899, + "step": 4896 + }, + { + "epoch": 68.06, + "learning_rate": 3.5546285714285715e-05, + "loss": 0.5279, + "step": 4900 + }, + { + "epoch": 68.19, + "learning_rate": 3.553485714285715e-05, + "loss": 0.5018, + "step": 4910 + }, + { + "epoch": 68.33, + "learning_rate": 3.5523428571428575e-05, + "loss": 0.5043, + "step": 4920 + }, + { + "epoch": 68.47, + "learning_rate": 3.5512e-05, + "loss": 0.5007, + "step": 4930 + }, + { + "epoch": 68.61, + "learning_rate": 3.550057142857143e-05, + "loss": 0.4953, + "step": 4940 + }, + { + "epoch": 68.75, + "learning_rate": 3.548914285714286e-05, + "loss": 0.4898, + "step": 4950 + }, + { + "epoch": 68.89, + "learning_rate": 3.547771428571429e-05, + "loss": 0.4976, + "step": 4960 + }, + { + "epoch": 69.0, + "eval_loss": 0.49693354964256287, + "eval_runtime": 126.6145, + "eval_samples_per_second": 4.202, + "eval_steps_per_second": 0.529, + "eval_wer": 0.2399562897730925, + "step": 4968 + }, + { + "epoch": 69.03, + "learning_rate": 3.5466285714285715e-05, + "loss": 0.5068, + "step": 4970 + }, + { + "epoch": 69.17, + "learning_rate": 3.545485714285715e-05, + "loss": 0.5022, + "step": 4980 + }, + { + "epoch": 69.3, + "learning_rate": 3.5443428571428576e-05, + "loss": 0.5046, + "step": 4990 + }, + { + "epoch": 69.44, + "learning_rate": 3.5432e-05, + "loss": 0.4941, + "step": 5000 + }, + { + "epoch": 69.58, + "learning_rate": 3.542057142857143e-05, + "loss": 0.495, + "step": 5010 + }, + { + "epoch": 69.72, + "learning_rate": 3.540914285714286e-05, + "loss": 0.4929, + "step": 5020 + }, + { + "epoch": 69.86, + "learning_rate": 3.539771428571429e-05, + "loss": 0.4921, + "step": 5030 + }, + { + "epoch": 70.0, + "learning_rate": 3.5386285714285716e-05, + "loss": 0.5168, + "step": 5040 + }, + { + "epoch": 70.0, + "eval_loss": 0.516396701335907, + "eval_runtime": 126.7251, + "eval_samples_per_second": 4.198, + "eval_steps_per_second": 0.529, + "eval_wer": 0.2542263932634827, + "step": 5040 + }, + { + "epoch": 70.14, + "learning_rate": 3.537485714285715e-05, + "loss": 0.5108, + "step": 5050 + }, + { + "epoch": 70.28, + "learning_rate": 3.5363428571428576e-05, + "loss": 0.5141, + "step": 5060 + }, + { + "epoch": 70.42, + "learning_rate": 3.5352e-05, + "loss": 0.513, + "step": 5070 + }, + { + "epoch": 70.55, + "learning_rate": 3.534057142857143e-05, + "loss": 0.5034, + "step": 5080 + }, + { + "epoch": 70.69, + "learning_rate": 3.532914285714286e-05, + "loss": 0.5036, + "step": 5090 + }, + { + "epoch": 70.83, + "learning_rate": 3.531771428571429e-05, + "loss": 0.522, + "step": 5100 + }, + { + "epoch": 70.97, + "learning_rate": 3.530628571428572e-05, + "loss": 0.5024, + "step": 5110 + }, + { + "epoch": 71.0, + "eval_loss": 0.48929738998413086, + "eval_runtime": 126.6202, + "eval_samples_per_second": 4.202, + "eval_steps_per_second": 0.529, + "eval_wer": 0.24612714533650445, + "step": 5112 + }, + { + "epoch": 71.11, + "learning_rate": 3.5294857142857144e-05, + "loss": 0.5095, + "step": 5120 + }, + { + "epoch": 71.25, + "learning_rate": 3.528342857142857e-05, + "loss": 0.4804, + "step": 5130 + }, + { + "epoch": 71.39, + "learning_rate": 3.5272000000000004e-05, + "loss": 0.4908, + "step": 5140 + }, + { + "epoch": 71.53, + "learning_rate": 3.526057142857143e-05, + "loss": 0.5071, + "step": 5150 + }, + { + "epoch": 71.66, + "learning_rate": 3.5249142857142864e-05, + "loss": 0.5175, + "step": 5160 + }, + { + "epoch": 71.8, + "learning_rate": 3.523771428571429e-05, + "loss": 0.5078, + "step": 5170 + }, + { + "epoch": 71.94, + "learning_rate": 3.522628571428572e-05, + "loss": 0.5031, + "step": 5180 + }, + { + "epoch": 72.0, + "eval_loss": 0.4890044927597046, + "eval_runtime": 127.1756, + "eval_samples_per_second": 4.183, + "eval_steps_per_second": 0.527, + "eval_wer": 0.25673330333611877, + "step": 5184 + }, + { + "epoch": 72.08, + "learning_rate": 3.5214857142857144e-05, + "loss": 0.5279, + "step": 5190 + }, + { + "epoch": 72.22, + "learning_rate": 3.520342857142857e-05, + "loss": 0.5101, + "step": 5200 + }, + { + "epoch": 72.36, + "learning_rate": 3.5192000000000005e-05, + "loss": 0.4849, + "step": 5210 + }, + { + "epoch": 72.5, + "learning_rate": 3.518057142857143e-05, + "loss": 0.4984, + "step": 5220 + }, + { + "epoch": 72.64, + "learning_rate": 3.5169142857142865e-05, + "loss": 0.4945, + "step": 5230 + }, + { + "epoch": 72.78, + "learning_rate": 3.515771428571429e-05, + "loss": 0.4937, + "step": 5240 + }, + { + "epoch": 72.91, + "learning_rate": 3.514628571428572e-05, + "loss": 0.486, + "step": 5250 + }, + { + "epoch": 73.0, + "eval_loss": 0.5191527009010315, + "eval_runtime": 126.9635, + "eval_samples_per_second": 4.19, + "eval_steps_per_second": 0.528, + "eval_wer": 0.2454843478819824, + "step": 5256 + }, + { + "epoch": 73.06, + "learning_rate": 3.5134857142857145e-05, + "loss": 0.5119, + "step": 5260 + }, + { + "epoch": 73.19, + "learning_rate": 3.512342857142857e-05, + "loss": 0.4958, + "step": 5270 + }, + { + "epoch": 73.33, + "learning_rate": 3.5112000000000005e-05, + "loss": 0.5054, + "step": 5280 + }, + { + "epoch": 73.47, + "learning_rate": 3.510057142857143e-05, + "loss": 0.4935, + "step": 5290 + }, + { + "epoch": 73.61, + "learning_rate": 3.508914285714286e-05, + "loss": 0.4953, + "step": 5300 + }, + { + "epoch": 73.75, + "learning_rate": 3.5077714285714286e-05, + "loss": 0.4906, + "step": 5310 + }, + { + "epoch": 73.89, + "learning_rate": 3.506628571428572e-05, + "loss": 0.4733, + "step": 5320 + }, + { + "epoch": 74.0, + "eval_loss": 0.5048214793205261, + "eval_runtime": 126.6746, + "eval_samples_per_second": 4.2, + "eval_steps_per_second": 0.529, + "eval_wer": 0.23789933791862183, + "step": 5328 + }, + { + "epoch": 74.03, + "learning_rate": 3.5054857142857146e-05, + "loss": 0.5087, + "step": 5330 + }, + { + "epoch": 74.17, + "learning_rate": 3.504342857142857e-05, + "loss": 0.4732, + "step": 5340 + }, + { + "epoch": 74.3, + "learning_rate": 3.5032000000000006e-05, + "loss": 0.4999, + "step": 5350 + }, + { + "epoch": 74.44, + "learning_rate": 3.502057142857143e-05, + "loss": 0.4813, + "step": 5360 + }, + { + "epoch": 74.58, + "learning_rate": 3.500914285714286e-05, + "loss": 0.4902, + "step": 5370 + }, + { + "epoch": 74.72, + "learning_rate": 3.4997714285714286e-05, + "loss": 0.4867, + "step": 5380 + }, + { + "epoch": 74.86, + "learning_rate": 3.498628571428572e-05, + "loss": 0.4917, + "step": 5390 + }, + { + "epoch": 75.0, + "learning_rate": 3.497485714285715e-05, + "loss": 0.482, + "step": 5400 + }, + { + "epoch": 75.0, + "eval_loss": 0.4869886636734009, + "eval_runtime": 126.5678, + "eval_samples_per_second": 4.203, + "eval_steps_per_second": 0.529, + "eval_wer": 0.23462107090055923, + "step": 5400 + }, + { + "epoch": 75.14, + "learning_rate": 3.496342857142857e-05, + "loss": 0.502, + "step": 5410 + }, + { + "epoch": 75.28, + "learning_rate": 3.495200000000001e-05, + "loss": 0.4839, + "step": 5420 + }, + { + "epoch": 75.42, + "learning_rate": 3.4940571428571434e-05, + "loss": 0.4892, + "step": 5430 + }, + { + "epoch": 75.55, + "learning_rate": 3.492914285714286e-05, + "loss": 0.4881, + "step": 5440 + }, + { + "epoch": 75.69, + "learning_rate": 3.491771428571429e-05, + "loss": 0.4803, + "step": 5450 + }, + { + "epoch": 75.83, + "learning_rate": 3.490628571428572e-05, + "loss": 0.48, + "step": 5460 + }, + { + "epoch": 75.97, + "learning_rate": 3.489485714285715e-05, + "loss": 0.4763, + "step": 5470 + }, + { + "epoch": 76.0, + "eval_loss": 0.5020842552185059, + "eval_runtime": 127.118, + "eval_samples_per_second": 4.185, + "eval_steps_per_second": 0.527, + "eval_wer": 0.232692678536993, + "step": 5472 + }, + { + "epoch": 76.11, + "learning_rate": 3.4883428571428574e-05, + "loss": 0.4767, + "step": 5480 + }, + { + "epoch": 76.25, + "learning_rate": 3.4872e-05, + "loss": 0.486, + "step": 5490 + }, + { + "epoch": 76.39, + "learning_rate": 3.486057142857143e-05, + "loss": 0.4816, + "step": 5500 + }, + { + "epoch": 76.53, + "learning_rate": 3.484914285714286e-05, + "loss": 0.4778, + "step": 5510 + }, + { + "epoch": 76.66, + "learning_rate": 3.483771428571429e-05, + "loss": 0.4821, + "step": 5520 + }, + { + "epoch": 76.8, + "learning_rate": 3.482628571428572e-05, + "loss": 0.4754, + "step": 5530 + }, + { + "epoch": 76.94, + "learning_rate": 3.481485714285715e-05, + "loss": 0.4814, + "step": 5540 + }, + { + "epoch": 77.0, + "eval_loss": 0.5127823948860168, + "eval_runtime": 126.7108, + "eval_samples_per_second": 4.199, + "eval_steps_per_second": 0.529, + "eval_wer": 0.23680658224593432, + "step": 5544 + }, + { + "epoch": 77.08, + "learning_rate": 3.4803428571428575e-05, + "loss": 0.489, + "step": 5550 + }, + { + "epoch": 77.22, + "learning_rate": 3.4792e-05, + "loss": 0.4738, + "step": 5560 + }, + { + "epoch": 77.36, + "learning_rate": 3.478057142857143e-05, + "loss": 0.4854, + "step": 5570 + }, + { + "epoch": 77.5, + "learning_rate": 3.476914285714286e-05, + "loss": 0.4914, + "step": 5580 + }, + { + "epoch": 77.64, + "learning_rate": 3.475771428571429e-05, + "loss": 0.4699, + "step": 5590 + }, + { + "epoch": 77.78, + "learning_rate": 3.474628571428572e-05, + "loss": 0.5074, + "step": 5600 + }, + { + "epoch": 77.91, + "learning_rate": 3.4736e-05, + "loss": 0.4731, + "step": 5610 + }, + { + "epoch": 78.0, + "eval_loss": 0.5221678018569946, + "eval_runtime": 126.9338, + "eval_samples_per_second": 4.191, + "eval_steps_per_second": 0.528, + "eval_wer": 0.23455679115510703, + "step": 5616 + }, + { + "epoch": 78.06, + "learning_rate": 3.4724571428571434e-05, + "loss": 0.491, + "step": 5620 + }, + { + "epoch": 78.19, + "learning_rate": 3.471314285714286e-05, + "loss": 0.4669, + "step": 5630 + }, + { + "epoch": 78.33, + "learning_rate": 3.470171428571429e-05, + "loss": 0.4838, + "step": 5640 + }, + { + "epoch": 78.47, + "learning_rate": 3.4690285714285715e-05, + "loss": 0.4694, + "step": 5650 + }, + { + "epoch": 78.61, + "learning_rate": 3.467885714285715e-05, + "loss": 0.4756, + "step": 5660 + }, + { + "epoch": 78.75, + "learning_rate": 3.4667428571428575e-05, + "loss": 0.4909, + "step": 5670 + }, + { + "epoch": 78.89, + "learning_rate": 3.4656e-05, + "loss": 0.4769, + "step": 5680 + }, + { + "epoch": 79.0, + "eval_loss": 0.4936656057834625, + "eval_runtime": 126.5632, + "eval_samples_per_second": 4.203, + "eval_steps_per_second": 0.529, + "eval_wer": 0.22915729253712155, + "step": 5688 + }, + { + "epoch": 79.03, + "learning_rate": 3.4644571428571435e-05, + "loss": 0.4818, + "step": 5690 + }, + { + "epoch": 79.17, + "learning_rate": 3.463314285714286e-05, + "loss": 0.4764, + "step": 5700 + }, + { + "epoch": 79.3, + "learning_rate": 3.462171428571429e-05, + "loss": 0.4867, + "step": 5710 + }, + { + "epoch": 79.44, + "learning_rate": 3.4610285714285715e-05, + "loss": 0.4759, + "step": 5720 + }, + { + "epoch": 79.58, + "learning_rate": 3.459885714285715e-05, + "loss": 0.4802, + "step": 5730 + }, + { + "epoch": 79.72, + "learning_rate": 3.4587428571428576e-05, + "loss": 0.4772, + "step": 5740 + }, + { + "epoch": 79.86, + "learning_rate": 3.4576e-05, + "loss": 0.4781, + "step": 5750 + }, + { + "epoch": 80.0, + "learning_rate": 3.456457142857143e-05, + "loss": 0.4751, + "step": 5760 + }, + { + "epoch": 80.0, + "eval_loss": 0.49694111943244934, + "eval_runtime": 126.6725, + "eval_samples_per_second": 4.2, + "eval_steps_per_second": 0.529, + "eval_wer": 0.23796361766407406, + "step": 5760 + }, + { + "epoch": 80.14, + "learning_rate": 3.4553142857142856e-05, + "loss": 0.4742, + "step": 5770 + }, + { + "epoch": 80.28, + "learning_rate": 3.454171428571429e-05, + "loss": 0.4716, + "step": 5780 + }, + { + "epoch": 80.42, + "learning_rate": 3.4530285714285716e-05, + "loss": 0.4667, + "step": 5790 + }, + { + "epoch": 80.55, + "learning_rate": 3.451885714285715e-05, + "loss": 0.4646, + "step": 5800 + }, + { + "epoch": 80.69, + "learning_rate": 3.4507428571428576e-05, + "loss": 0.4626, + "step": 5810 + }, + { + "epoch": 80.83, + "learning_rate": 3.449714285714286e-05, + "loss": 0.4792, + "step": 5820 + }, + { + "epoch": 80.97, + "learning_rate": 3.448571428571429e-05, + "loss": 0.4792, + "step": 5830 + }, + { + "epoch": 81.0, + "eval_loss": 0.4837154448032379, + "eval_runtime": 127.7186, + "eval_samples_per_second": 4.165, + "eval_steps_per_second": 0.525, + "eval_wer": 0.23468535064601145, + "step": 5832 + }, + { + "epoch": 81.11, + "learning_rate": 3.4474285714285715e-05, + "loss": 0.4801, + "step": 5840 + }, + { + "epoch": 81.25, + "learning_rate": 3.446285714285714e-05, + "loss": 0.4808, + "step": 5850 + }, + { + "epoch": 81.39, + "learning_rate": 3.4451428571428576e-05, + "loss": 0.4651, + "step": 5860 + }, + { + "epoch": 81.53, + "learning_rate": 3.444e-05, + "loss": 0.4771, + "step": 5870 + }, + { + "epoch": 81.66, + "learning_rate": 3.4428571428571436e-05, + "loss": 0.478, + "step": 5880 + }, + { + "epoch": 81.8, + "learning_rate": 3.441714285714286e-05, + "loss": 0.4802, + "step": 5890 + }, + { + "epoch": 81.94, + "learning_rate": 3.440571428571429e-05, + "loss": 0.467, + "step": 5900 + }, + { + "epoch": 82.0, + "eval_loss": 0.5006660223007202, + "eval_runtime": 126.9056, + "eval_samples_per_second": 4.192, + "eval_steps_per_second": 0.528, + "eval_wer": 0.24047052773671015, + "step": 5904 + }, + { + "epoch": 82.08, + "learning_rate": 3.4394285714285716e-05, + "loss": 0.4874, + "step": 5910 + }, + { + "epoch": 82.22, + "learning_rate": 3.438285714285714e-05, + "loss": 0.4795, + "step": 5920 + }, + { + "epoch": 82.36, + "learning_rate": 3.4371428571428576e-05, + "loss": 0.4541, + "step": 5930 + }, + { + "epoch": 82.5, + "learning_rate": 3.436e-05, + "loss": 0.486, + "step": 5940 + }, + { + "epoch": 82.64, + "learning_rate": 3.4348571428571437e-05, + "loss": 0.4761, + "step": 5950 + }, + { + "epoch": 82.78, + "learning_rate": 3.433714285714286e-05, + "loss": 0.4761, + "step": 5960 + }, + { + "epoch": 82.91, + "learning_rate": 3.432571428571428e-05, + "loss": 0.4682, + "step": 5970 + }, + { + "epoch": 83.0, + "eval_loss": 0.5114097595214844, + "eval_runtime": 126.8507, + "eval_samples_per_second": 4.194, + "eval_steps_per_second": 0.528, + "eval_wer": 0.23719226071864755, + "step": 5976 + }, + { + "epoch": 83.06, + "learning_rate": 3.431428571428572e-05, + "loss": 0.4722, + "step": 5980 + }, + { + "epoch": 83.19, + "learning_rate": 3.4302857142857144e-05, + "loss": 0.4778, + "step": 5990 + }, + { + "epoch": 83.33, + "learning_rate": 3.429142857142858e-05, + "loss": 0.4716, + "step": 6000 + }, + { + "epoch": 83.47, + "learning_rate": 3.4280000000000004e-05, + "loss": 0.4798, + "step": 6010 + }, + { + "epoch": 83.61, + "learning_rate": 3.426857142857143e-05, + "loss": 0.4629, + "step": 6020 + }, + { + "epoch": 83.75, + "learning_rate": 3.425714285714286e-05, + "loss": 0.4618, + "step": 6030 + }, + { + "epoch": 83.89, + "learning_rate": 3.4245714285714284e-05, + "loss": 0.4672, + "step": 6040 + }, + { + "epoch": 84.0, + "eval_loss": 0.4994150698184967, + "eval_runtime": 127.7789, + "eval_samples_per_second": 4.163, + "eval_steps_per_second": 0.524, + "eval_wer": 0.24522722890017357, + "step": 6048 + }, + { + "epoch": 84.03, + "learning_rate": 3.423428571428572e-05, + "loss": 0.4826, + "step": 6050 + }, + { + "epoch": 84.17, + "learning_rate": 3.4222857142857144e-05, + "loss": 0.465, + "step": 6060 + }, + { + "epoch": 84.3, + "learning_rate": 3.421142857142858e-05, + "loss": 0.4801, + "step": 6070 + }, + { + "epoch": 84.44, + "learning_rate": 3.4200000000000005e-05, + "loss": 0.4826, + "step": 6080 + }, + { + "epoch": 84.58, + "learning_rate": 3.418857142857143e-05, + "loss": 0.4702, + "step": 6090 + }, + { + "epoch": 84.72, + "learning_rate": 3.417714285714286e-05, + "loss": 0.456, + "step": 6100 + }, + { + "epoch": 84.86, + "learning_rate": 3.4165714285714285e-05, + "loss": 0.4709, + "step": 6110 + }, + { + "epoch": 85.0, + "learning_rate": 3.415428571428572e-05, + "loss": 0.4701, + "step": 6120 + }, + { + "epoch": 85.0, + "eval_loss": 0.4967518746852875, + "eval_runtime": 127.2344, + "eval_samples_per_second": 4.181, + "eval_steps_per_second": 0.527, + "eval_wer": 0.23976345053673587, + "step": 6120 + }, + { + "epoch": 85.14, + "learning_rate": 3.4142857142857145e-05, + "loss": 0.4705, + "step": 6130 + }, + { + "epoch": 85.28, + "learning_rate": 3.413142857142858e-05, + "loss": 0.4704, + "step": 6140 + }, + { + "epoch": 85.42, + "learning_rate": 3.4120000000000005e-05, + "loss": 0.4939, + "step": 6150 + }, + { + "epoch": 85.55, + "learning_rate": 3.410857142857143e-05, + "loss": 0.4704, + "step": 6160 + }, + { + "epoch": 85.69, + "learning_rate": 3.409714285714286e-05, + "loss": 0.471, + "step": 6170 + }, + { + "epoch": 85.83, + "learning_rate": 3.4085714285714286e-05, + "loss": 0.4718, + "step": 6180 + }, + { + "epoch": 85.97, + "learning_rate": 3.407428571428572e-05, + "loss": 0.4678, + "step": 6190 + }, + { + "epoch": 86.0, + "eval_loss": 0.49197760224342346, + "eval_runtime": 127.2978, + "eval_samples_per_second": 4.179, + "eval_steps_per_second": 0.526, + "eval_wer": 0.23474963039146365, + "step": 6192 + }, + { + "epoch": 86.11, + "learning_rate": 3.4062857142857146e-05, + "loss": 0.4744, + "step": 6200 + }, + { + "epoch": 86.25, + "learning_rate": 3.405142857142857e-05, + "loss": 0.4709, + "step": 6210 + }, + { + "epoch": 86.39, + "learning_rate": 3.404e-05, + "loss": 0.4615, + "step": 6220 + }, + { + "epoch": 86.53, + "learning_rate": 3.402857142857143e-05, + "loss": 0.4638, + "step": 6230 + }, + { + "epoch": 86.66, + "learning_rate": 3.401714285714286e-05, + "loss": 0.4627, + "step": 6240 + }, + { + "epoch": 86.8, + "learning_rate": 3.4005714285714286e-05, + "loss": 0.471, + "step": 6250 + }, + { + "epoch": 86.94, + "learning_rate": 3.399428571428572e-05, + "loss": 0.472, + "step": 6260 + }, + { + "epoch": 87.0, + "eval_loss": 0.48062899708747864, + "eval_runtime": 127.5542, + "eval_samples_per_second": 4.171, + "eval_steps_per_second": 0.525, + "eval_wer": 0.22999292922800027, + "step": 6264 + }, + { + "epoch": 87.08, + "learning_rate": 3.398285714285715e-05, + "loss": 0.4763, + "step": 6270 + }, + { + "epoch": 87.22, + "learning_rate": 3.397142857142857e-05, + "loss": 0.4686, + "step": 6280 + }, + { + "epoch": 87.36, + "learning_rate": 3.396e-05, + "loss": 0.457, + "step": 6290 + }, + { + "epoch": 87.5, + "learning_rate": 3.3948571428571434e-05, + "loss": 0.4672, + "step": 6300 + }, + { + "epoch": 87.64, + "learning_rate": 3.393714285714286e-05, + "loss": 0.4593, + "step": 6310 + }, + { + "epoch": 87.78, + "learning_rate": 3.3925714285714294e-05, + "loss": 0.4588, + "step": 6320 + }, + { + "epoch": 87.91, + "learning_rate": 3.391428571428572e-05, + "loss": 0.4787, + "step": 6330 + }, + { + "epoch": 88.0, + "eval_loss": 0.4793696105480194, + "eval_runtime": 127.1856, + "eval_samples_per_second": 4.183, + "eval_steps_per_second": 0.527, + "eval_wer": 0.2319213215915665, + "step": 6336 + }, + { + "epoch": 88.06, + "learning_rate": 3.390285714285715e-05, + "loss": 0.4864, + "step": 6340 + }, + { + "epoch": 88.19, + "learning_rate": 3.3891428571428574e-05, + "loss": 0.4668, + "step": 6350 + }, + { + "epoch": 88.33, + "learning_rate": 3.388e-05, + "loss": 0.4718, + "step": 6360 + }, + { + "epoch": 88.47, + "learning_rate": 3.3868571428571434e-05, + "loss": 0.4602, + "step": 6370 + }, + { + "epoch": 88.61, + "learning_rate": 3.385714285714286e-05, + "loss": 0.46, + "step": 6380 + }, + { + "epoch": 88.75, + "learning_rate": 3.384571428571429e-05, + "loss": 0.4802, + "step": 6390 + }, + { + "epoch": 88.89, + "learning_rate": 3.3834285714285715e-05, + "loss": 0.474, + "step": 6400 + }, + { + "epoch": 89.0, + "eval_loss": 0.4934304654598236, + "eval_runtime": 126.8396, + "eval_samples_per_second": 4.194, + "eval_steps_per_second": 0.528, + "eval_wer": 0.23166420260975767, + "step": 6408 + }, + { + "epoch": 89.03, + "learning_rate": 3.382285714285714e-05, + "loss": 0.484, + "step": 6410 + }, + { + "epoch": 89.17, + "learning_rate": 3.3811428571428575e-05, + "loss": 0.4686, + "step": 6420 + }, + { + "epoch": 89.3, + "learning_rate": 3.38e-05, + "loss": 0.4695, + "step": 6430 + }, + { + "epoch": 89.44, + "learning_rate": 3.3788571428571435e-05, + "loss": 0.4729, + "step": 6440 + }, + { + "epoch": 89.58, + "learning_rate": 3.377714285714286e-05, + "loss": 0.4716, + "step": 6450 + }, + { + "epoch": 89.72, + "learning_rate": 3.376571428571429e-05, + "loss": 0.4854, + "step": 6460 + }, + { + "epoch": 89.86, + "learning_rate": 3.3754285714285715e-05, + "loss": 0.4777, + "step": 6470 + }, + { + "epoch": 90.0, + "learning_rate": 3.374285714285714e-05, + "loss": 0.4838, + "step": 6480 + }, + { + "epoch": 90.0, + "eval_loss": 0.5315157771110535, + "eval_runtime": 127.1462, + "eval_samples_per_second": 4.184, + "eval_steps_per_second": 0.527, + "eval_wer": 0.23642090377322106, + "step": 6480 + }, + { + "epoch": 90.14, + "learning_rate": 3.3731428571428576e-05, + "loss": 0.4862, + "step": 6490 + }, + { + "epoch": 90.28, + "learning_rate": 3.372e-05, + "loss": 0.4818, + "step": 6500 + }, + { + "epoch": 90.42, + "learning_rate": 3.3708571428571436e-05, + "loss": 0.4768, + "step": 6510 + }, + { + "epoch": 90.55, + "learning_rate": 3.369714285714286e-05, + "loss": 0.4771, + "step": 6520 + }, + { + "epoch": 90.69, + "learning_rate": 3.368571428571429e-05, + "loss": 0.4649, + "step": 6530 + }, + { + "epoch": 90.83, + "learning_rate": 3.3674285714285716e-05, + "loss": 0.4728, + "step": 6540 + }, + { + "epoch": 90.97, + "learning_rate": 3.366285714285714e-05, + "loss": 0.4802, + "step": 6550 + }, + { + "epoch": 91.0, + "eval_loss": 0.5070334076881409, + "eval_runtime": 127.7259, + "eval_samples_per_second": 4.165, + "eval_steps_per_second": 0.525, + "eval_wer": 0.234235392427846, + "step": 6552 + }, + { + "epoch": 91.11, + "learning_rate": 3.3651428571428576e-05, + "loss": 0.4889, + "step": 6560 + }, + { + "epoch": 91.25, + "learning_rate": 3.364e-05, + "loss": 0.4698, + "step": 6570 + }, + { + "epoch": 91.39, + "learning_rate": 3.362857142857143e-05, + "loss": 0.4577, + "step": 6580 + }, + { + "epoch": 91.53, + "learning_rate": 3.361714285714286e-05, + "loss": 0.4589, + "step": 6590 + }, + { + "epoch": 91.66, + "learning_rate": 3.360571428571429e-05, + "loss": 0.4581, + "step": 6600 + }, + { + "epoch": 91.8, + "learning_rate": 3.359428571428572e-05, + "loss": 0.4642, + "step": 6610 + }, + { + "epoch": 91.94, + "learning_rate": 3.3582857142857144e-05, + "loss": 0.4656, + "step": 6620 + }, + { + "epoch": 92.0, + "eval_loss": 0.5284181833267212, + "eval_runtime": 126.8514, + "eval_samples_per_second": 4.194, + "eval_steps_per_second": 0.528, + "eval_wer": 0.23410683293694157, + "step": 6624 + }, + { + "epoch": 92.08, + "learning_rate": 3.357142857142858e-05, + "loss": 0.4804, + "step": 6630 + }, + { + "epoch": 92.22, + "learning_rate": 3.3560000000000004e-05, + "loss": 0.4675, + "step": 6640 + }, + { + "epoch": 92.36, + "learning_rate": 3.354857142857143e-05, + "loss": 0.4684, + "step": 6650 + }, + { + "epoch": 92.5, + "learning_rate": 3.353714285714286e-05, + "loss": 0.4679, + "step": 6660 + }, + { + "epoch": 92.64, + "learning_rate": 3.352571428571429e-05, + "loss": 0.4633, + "step": 6670 + }, + { + "epoch": 92.78, + "learning_rate": 3.351428571428572e-05, + "loss": 0.4813, + "step": 6680 + }, + { + "epoch": 92.91, + "learning_rate": 3.3502857142857144e-05, + "loss": 0.4684, + "step": 6690 + }, + { + "epoch": 93.0, + "eval_loss": 0.5020865797996521, + "eval_runtime": 126.8852, + "eval_samples_per_second": 4.193, + "eval_steps_per_second": 0.528, + "eval_wer": 0.24021340875490133, + "step": 6696 + }, + { + "epoch": 93.06, + "learning_rate": 3.349142857142858e-05, + "loss": 0.5045, + "step": 6700 + }, + { + "epoch": 93.19, + "learning_rate": 3.3480000000000005e-05, + "loss": 0.4553, + "step": 6710 + }, + { + "epoch": 93.33, + "learning_rate": 3.346857142857143e-05, + "loss": 0.4601, + "step": 6720 + }, + { + "epoch": 93.47, + "learning_rate": 3.345714285714286e-05, + "loss": 0.466, + "step": 6730 + }, + { + "epoch": 93.61, + "learning_rate": 3.344571428571429e-05, + "loss": 0.4659, + "step": 6740 + }, + { + "epoch": 93.75, + "learning_rate": 3.343428571428572e-05, + "loss": 0.472, + "step": 6750 + }, + { + "epoch": 93.89, + "learning_rate": 3.3422857142857145e-05, + "loss": 0.4524, + "step": 6760 + }, + { + "epoch": 94.0, + "eval_loss": 0.4932425916194916, + "eval_runtime": 128.6113, + "eval_samples_per_second": 4.136, + "eval_steps_per_second": 0.521, + "eval_wer": 0.23687086199138652, + "step": 6768 + }, + { + "epoch": 94.03, + "learning_rate": 3.341142857142857e-05, + "loss": 0.4761, + "step": 6770 + }, + { + "epoch": 94.17, + "learning_rate": 3.34e-05, + "loss": 0.4563, + "step": 6780 + }, + { + "epoch": 94.3, + "learning_rate": 3.338857142857143e-05, + "loss": 0.4562, + "step": 6790 + }, + { + "epoch": 94.44, + "learning_rate": 3.337714285714286e-05, + "loss": 0.4564, + "step": 6800 + }, + { + "epoch": 94.58, + "learning_rate": 3.336571428571429e-05, + "loss": 0.4706, + "step": 6810 + }, + { + "epoch": 94.72, + "learning_rate": 3.335428571428572e-05, + "loss": 0.4856, + "step": 6820 + }, + { + "epoch": 94.86, + "learning_rate": 3.3342857142857146e-05, + "loss": 0.4761, + "step": 6830 + }, + { + "epoch": 95.0, + "learning_rate": 3.333142857142857e-05, + "loss": 0.4652, + "step": 6840 + }, + { + "epoch": 95.0, + "eval_loss": 0.500057578086853, + "eval_runtime": 128.3052, + "eval_samples_per_second": 4.146, + "eval_steps_per_second": 0.522, + "eval_wer": 0.22600758500996337, + "step": 6840 + }, + { + "epoch": 95.14, + "learning_rate": 3.332e-05, + "loss": 0.4533, + "step": 6850 + }, + { + "epoch": 95.28, + "learning_rate": 3.330857142857143e-05, + "loss": 0.4729, + "step": 6860 + }, + { + "epoch": 95.42, + "learning_rate": 3.329714285714286e-05, + "loss": 0.4648, + "step": 6870 + }, + { + "epoch": 95.55, + "learning_rate": 3.328571428571429e-05, + "loss": 0.4633, + "step": 6880 + }, + { + "epoch": 95.69, + "learning_rate": 3.327428571428572e-05, + "loss": 0.4587, + "step": 6890 + }, + { + "epoch": 95.83, + "learning_rate": 3.326285714285715e-05, + "loss": 0.4668, + "step": 6900 + }, + { + "epoch": 95.97, + "learning_rate": 3.3251428571428573e-05, + "loss": 0.4618, + "step": 6910 + }, + { + "epoch": 96.0, + "eval_loss": 0.4992883503437042, + "eval_runtime": 127.8206, + "eval_samples_per_second": 4.162, + "eval_steps_per_second": 0.524, + "eval_wer": 0.2367423025004821, + "step": 6912 + }, + { + "epoch": 96.11, + "learning_rate": 3.324e-05, + "loss": 0.4646, + "step": 6920 + }, + { + "epoch": 96.25, + "learning_rate": 3.3228571428571434e-05, + "loss": 0.456, + "step": 6930 + }, + { + "epoch": 96.39, + "learning_rate": 3.321714285714286e-05, + "loss": 0.4425, + "step": 6940 + }, + { + "epoch": 96.53, + "learning_rate": 3.320571428571429e-05, + "loss": 0.4674, + "step": 6950 + }, + { + "epoch": 96.66, + "learning_rate": 3.3194285714285714e-05, + "loss": 0.4568, + "step": 6960 + }, + { + "epoch": 96.8, + "learning_rate": 3.318285714285715e-05, + "loss": 0.4674, + "step": 6970 + }, + { + "epoch": 96.94, + "learning_rate": 3.3171428571428574e-05, + "loss": 0.4662, + "step": 6980 + }, + { + "epoch": 97.0, + "eval_loss": 0.5127889513969421, + "eval_runtime": 128.0439, + "eval_samples_per_second": 4.155, + "eval_steps_per_second": 0.523, + "eval_wer": 0.22587902551905895, + "step": 6984 + }, + { + "epoch": 97.08, + "learning_rate": 3.316e-05, + "loss": 0.4612, + "step": 6990 + }, + { + "epoch": 97.22, + "learning_rate": 3.3148571428571435e-05, + "loss": 0.4561, + "step": 7000 + }, + { + "epoch": 97.36, + "learning_rate": 3.313714285714286e-05, + "loss": 0.462, + "step": 7010 + }, + { + "epoch": 97.5, + "learning_rate": 3.312571428571429e-05, + "loss": 0.4545, + "step": 7020 + }, + { + "epoch": 97.64, + "learning_rate": 3.3114285714285715e-05, + "loss": 0.4424, + "step": 7030 + }, + { + "epoch": 97.78, + "learning_rate": 3.310285714285715e-05, + "loss": 0.4661, + "step": 7040 + }, + { + "epoch": 97.91, + "learning_rate": 3.3091428571428575e-05, + "loss": 0.4824, + "step": 7050 + }, + { + "epoch": 98.0, + "eval_loss": 0.5148744583129883, + "eval_runtime": 127.0725, + "eval_samples_per_second": 4.187, + "eval_steps_per_second": 0.527, + "eval_wer": 0.23847785562769172, + "step": 7056 + }, + { + "epoch": 98.06, + "learning_rate": 3.308e-05, + "loss": 0.4786, + "step": 7060 + }, + { + "epoch": 98.19, + "learning_rate": 3.3068571428571435e-05, + "loss": 0.4523, + "step": 7070 + }, + { + "epoch": 98.33, + "learning_rate": 3.305714285714286e-05, + "loss": 0.4563, + "step": 7080 + }, + { + "epoch": 98.47, + "learning_rate": 3.304571428571429e-05, + "loss": 0.471, + "step": 7090 + }, + { + "epoch": 98.61, + "learning_rate": 3.3034285714285716e-05, + "loss": 0.4563, + "step": 7100 + }, + { + "epoch": 98.75, + "learning_rate": 3.302285714285715e-05, + "loss": 0.4599, + "step": 7110 + }, + { + "epoch": 98.89, + "learning_rate": 3.3011428571428576e-05, + "loss": 0.4562, + "step": 7120 + }, + { + "epoch": 99.0, + "eval_loss": 0.5179585218429565, + "eval_runtime": 126.6626, + "eval_samples_per_second": 4.2, + "eval_steps_per_second": 0.529, + "eval_wer": 0.23346403548241948, + "step": 7128 + }, + { + "epoch": 99.03, + "learning_rate": 3.3e-05, + "loss": 0.4797, + "step": 7130 + }, + { + "epoch": 99.17, + "learning_rate": 3.298857142857143e-05, + "loss": 0.451, + "step": 7140 + }, + { + "epoch": 99.3, + "learning_rate": 3.2977142857142856e-05, + "loss": 0.4443, + "step": 7150 + }, + { + "epoch": 99.44, + "learning_rate": 3.296571428571429e-05, + "loss": 0.4659, + "step": 7160 + }, + { + "epoch": 99.58, + "learning_rate": 3.2954285714285716e-05, + "loss": 0.4606, + "step": 7170 + }, + { + "epoch": 99.72, + "learning_rate": 3.294285714285715e-05, + "loss": 0.4501, + "step": 7180 + }, + { + "epoch": 99.86, + "learning_rate": 3.2931428571428577e-05, + "loss": 0.439, + "step": 7190 + }, + { + "epoch": 100.0, + "learning_rate": 3.292e-05, + "loss": 0.4487, + "step": 7200 + }, + { + "epoch": 100.0, + "eval_loss": 0.5029368996620178, + "eval_runtime": 126.9366, + "eval_samples_per_second": 4.191, + "eval_steps_per_second": 0.528, + "eval_wer": 0.2280002571189818, + "step": 7200 + }, + { + "epoch": 100.14, + "learning_rate": 3.290857142857143e-05, + "loss": 0.4551, + "step": 7210 + }, + { + "epoch": 100.28, + "learning_rate": 3.289714285714286e-05, + "loss": 0.455, + "step": 7220 + }, + { + "epoch": 100.42, + "learning_rate": 3.288571428571429e-05, + "loss": 0.4434, + "step": 7230 + }, + { + "epoch": 100.55, + "learning_rate": 3.287428571428572e-05, + "loss": 0.4512, + "step": 7240 + }, + { + "epoch": 100.69, + "learning_rate": 3.286285714285715e-05, + "loss": 0.4551, + "step": 7250 + }, + { + "epoch": 100.83, + "learning_rate": 3.285142857142858e-05, + "loss": 0.4498, + "step": 7260 + }, + { + "epoch": 100.97, + "learning_rate": 3.2840000000000004e-05, + "loss": 0.451, + "step": 7270 + }, + { + "epoch": 101.0, + "eval_loss": 0.4906499683856964, + "eval_runtime": 127.0075, + "eval_samples_per_second": 4.189, + "eval_steps_per_second": 0.528, + "eval_wer": 0.2269717811917465, + "step": 7272 + }, + { + "epoch": 101.11, + "learning_rate": 3.282857142857143e-05, + "loss": 0.4673, + "step": 7280 + }, + { + "epoch": 101.25, + "learning_rate": 3.281714285714286e-05, + "loss": 0.4594, + "step": 7290 + }, + { + "epoch": 101.39, + "learning_rate": 3.280571428571429e-05, + "loss": 0.4555, + "step": 7300 + }, + { + "epoch": 101.53, + "learning_rate": 3.279428571428572e-05, + "loss": 0.4855, + "step": 7310 + }, + { + "epoch": 101.66, + "learning_rate": 3.2782857142857145e-05, + "loss": 0.4618, + "step": 7320 + }, + { + "epoch": 101.8, + "learning_rate": 3.277142857142857e-05, + "loss": 0.4702, + "step": 7330 + }, + { + "epoch": 101.94, + "learning_rate": 3.276e-05, + "loss": 0.4581, + "step": 7340 + }, + { + "epoch": 102.0, + "eval_loss": 0.5254329442977905, + "eval_runtime": 126.7287, + "eval_samples_per_second": 4.198, + "eval_steps_per_second": 0.529, + "eval_wer": 0.22748601915536415, + "step": 7344 + }, + { + "epoch": 102.08, + "learning_rate": 3.274857142857143e-05, + "loss": 0.4693, + "step": 7350 + }, + { + "epoch": 102.22, + "learning_rate": 3.273714285714286e-05, + "loss": 0.4633, + "step": 7360 + }, + { + "epoch": 102.36, + "learning_rate": 3.272571428571429e-05, + "loss": 0.4423, + "step": 7370 + }, + { + "epoch": 102.5, + "learning_rate": 3.271428571428572e-05, + "loss": 0.4626, + "step": 7380 + }, + { + "epoch": 102.64, + "learning_rate": 3.2702857142857145e-05, + "loss": 0.4477, + "step": 7390 + }, + { + "epoch": 102.78, + "learning_rate": 3.269142857142857e-05, + "loss": 0.4509, + "step": 7400 + }, + { + "epoch": 102.91, + "learning_rate": 3.268e-05, + "loss": 0.4582, + "step": 7410 + }, + { + "epoch": 103.0, + "eval_loss": 0.4760190546512604, + "eval_runtime": 126.8679, + "eval_samples_per_second": 4.193, + "eval_steps_per_second": 0.528, + "eval_wer": 0.22928585202802598, + "step": 7416 + }, + { + "epoch": 103.06, + "learning_rate": 3.266857142857143e-05, + "loss": 0.4741, + "step": 7420 + }, + { + "epoch": 103.19, + "learning_rate": 3.265714285714286e-05, + "loss": 0.4582, + "step": 7430 + }, + { + "epoch": 103.33, + "learning_rate": 3.264571428571429e-05, + "loss": 0.4373, + "step": 7440 + }, + { + "epoch": 103.47, + "learning_rate": 3.263428571428572e-05, + "loss": 0.4593, + "step": 7450 + }, + { + "epoch": 103.61, + "learning_rate": 3.2622857142857146e-05, + "loss": 0.4644, + "step": 7460 + }, + { + "epoch": 103.75, + "learning_rate": 3.261142857142857e-05, + "loss": 0.4585, + "step": 7470 + }, + { + "epoch": 103.89, + "learning_rate": 3.26e-05, + "loss": 0.4515, + "step": 7480 + }, + { + "epoch": 104.0, + "eval_loss": 0.4804626405239105, + "eval_runtime": 126.9851, + "eval_samples_per_second": 4.189, + "eval_steps_per_second": 0.528, + "eval_wer": 0.22427203188275374, + "step": 7488 + }, + { + "epoch": 104.03, + "learning_rate": 3.258857142857143e-05, + "loss": 0.479, + "step": 7490 + }, + { + "epoch": 104.17, + "learning_rate": 3.257714285714286e-05, + "loss": 0.4589, + "step": 7500 + }, + { + "epoch": 104.3, + "learning_rate": 3.2565714285714287e-05, + "loss": 0.4559, + "step": 7510 + }, + { + "epoch": 104.44, + "learning_rate": 3.255428571428571e-05, + "loss": 0.4599, + "step": 7520 + }, + { + "epoch": 104.58, + "learning_rate": 3.254285714285715e-05, + "loss": 0.4502, + "step": 7530 + }, + { + "epoch": 104.72, + "learning_rate": 3.2531428571428574e-05, + "loss": 0.4576, + "step": 7540 + }, + { + "epoch": 104.86, + "learning_rate": 3.252e-05, + "loss": 0.4541, + "step": 7550 + }, + { + "epoch": 105.0, + "learning_rate": 3.2508571428571434e-05, + "loss": 0.4543, + "step": 7560 + }, + { + "epoch": 105.0, + "eval_loss": 0.48694542050361633, + "eval_runtime": 126.7334, + "eval_samples_per_second": 4.198, + "eval_steps_per_second": 0.529, + "eval_wer": 0.23314263675515845, + "step": 7560 + }, + { + "epoch": 105.14, + "learning_rate": 3.249714285714286e-05, + "loss": 0.4552, + "step": 7570 + }, + { + "epoch": 105.28, + "learning_rate": 3.248571428571429e-05, + "loss": 0.4573, + "step": 7580 + }, + { + "epoch": 105.42, + "learning_rate": 3.2474285714285714e-05, + "loss": 0.4517, + "step": 7590 + }, + { + "epoch": 105.55, + "learning_rate": 3.246285714285715e-05, + "loss": 0.4587, + "step": 7600 + }, + { + "epoch": 105.69, + "learning_rate": 3.2451428571428574e-05, + "loss": 0.4451, + "step": 7610 + }, + { + "epoch": 105.83, + "learning_rate": 3.244000000000001e-05, + "loss": 0.4557, + "step": 7620 + }, + { + "epoch": 105.97, + "learning_rate": 3.2428571428571435e-05, + "loss": 0.4546, + "step": 7630 + }, + { + "epoch": 106.0, + "eval_loss": 0.5053684711456299, + "eval_runtime": 127.3504, + "eval_samples_per_second": 4.177, + "eval_steps_per_second": 0.526, + "eval_wer": 0.22774313813717298, + "step": 7632 + }, + { + "epoch": 106.11, + "learning_rate": 3.241714285714286e-05, + "loss": 0.4462, + "step": 7640 + }, + { + "epoch": 106.25, + "learning_rate": 3.240571428571429e-05, + "loss": 0.4594, + "step": 7650 + }, + { + "epoch": 106.39, + "learning_rate": 3.2394285714285715e-05, + "loss": 0.4375, + "step": 7660 + }, + { + "epoch": 106.53, + "learning_rate": 3.238285714285715e-05, + "loss": 0.4527, + "step": 7670 + }, + { + "epoch": 106.66, + "learning_rate": 3.2371428571428575e-05, + "loss": 0.4583, + "step": 7680 + }, + { + "epoch": 106.8, + "learning_rate": 3.236e-05, + "loss": 0.458, + "step": 7690 + }, + { + "epoch": 106.94, + "learning_rate": 3.234857142857143e-05, + "loss": 0.4449, + "step": 7700 + }, + { + "epoch": 107.0, + "eval_loss": 0.5338627099990845, + "eval_runtime": 127.4923, + "eval_samples_per_second": 4.173, + "eval_steps_per_second": 0.526, + "eval_wer": 0.22671466220993766, + "step": 7704 + }, + { + "epoch": 107.08, + "learning_rate": 3.2337142857142855e-05, + "loss": 0.4692, + "step": 7710 + }, + { + "epoch": 107.22, + "learning_rate": 3.232571428571429e-05, + "loss": 0.4626, + "step": 7720 + }, + { + "epoch": 107.36, + "learning_rate": 3.2314285714285716e-05, + "loss": 0.441, + "step": 7730 + }, + { + "epoch": 107.5, + "learning_rate": 3.230285714285715e-05, + "loss": 0.4541, + "step": 7740 + }, + { + "epoch": 107.64, + "learning_rate": 3.2291428571428576e-05, + "loss": 0.4541, + "step": 7750 + }, + { + "epoch": 107.78, + "learning_rate": 3.228e-05, + "loss": 0.4561, + "step": 7760 + }, + { + "epoch": 107.91, + "learning_rate": 3.226857142857143e-05, + "loss": 0.4561, + "step": 7770 + }, + { + "epoch": 108.0, + "eval_loss": 0.5065799951553345, + "eval_runtime": 127.7419, + "eval_samples_per_second": 4.165, + "eval_steps_per_second": 0.524, + "eval_wer": 0.2287073343189561, + "step": 7776 + }, + { + "epoch": 108.06, + "learning_rate": 3.2257142857142856e-05, + "loss": 0.4688, + "step": 7780 + }, + { + "epoch": 108.19, + "learning_rate": 3.224571428571429e-05, + "loss": 0.4532, + "step": 7790 + }, + { + "epoch": 108.33, + "learning_rate": 3.2234285714285716e-05, + "loss": 0.4498, + "step": 7800 + }, + { + "epoch": 108.47, + "learning_rate": 3.222285714285715e-05, + "loss": 0.4532, + "step": 7810 + }, + { + "epoch": 108.61, + "learning_rate": 3.221142857142858e-05, + "loss": 0.4441, + "step": 7820 + }, + { + "epoch": 108.75, + "learning_rate": 3.2200000000000003e-05, + "loss": 0.4495, + "step": 7830 + }, + { + "epoch": 108.89, + "learning_rate": 3.218857142857143e-05, + "loss": 0.4335, + "step": 7840 + }, + { + "epoch": 109.0, + "eval_loss": 0.5241791009902954, + "eval_runtime": 128.6203, + "eval_samples_per_second": 4.136, + "eval_steps_per_second": 0.521, + "eval_wer": 0.2310214051552356, + "step": 7848 + }, + { + "epoch": 109.03, + "learning_rate": 3.217714285714286e-05, + "loss": 0.4635, + "step": 7850 + }, + { + "epoch": 109.17, + "learning_rate": 3.216571428571429e-05, + "loss": 0.4455, + "step": 7860 + }, + { + "epoch": 109.3, + "learning_rate": 3.215428571428572e-05, + "loss": 0.4591, + "step": 7870 + }, + { + "epoch": 109.44, + "learning_rate": 3.2142857142857144e-05, + "loss": 0.4538, + "step": 7880 + }, + { + "epoch": 109.58, + "learning_rate": 3.213142857142857e-05, + "loss": 0.4526, + "step": 7890 + }, + { + "epoch": 109.72, + "learning_rate": 3.2120000000000004e-05, + "loss": 0.471, + "step": 7900 + }, + { + "epoch": 109.86, + "learning_rate": 3.210857142857143e-05, + "loss": 0.4568, + "step": 7910 + }, + { + "epoch": 110.0, + "learning_rate": 3.209714285714286e-05, + "loss": 0.4796, + "step": 7920 + }, + { + "epoch": 110.0, + "eval_loss": 0.5436424016952515, + "eval_runtime": 130.7764, + "eval_samples_per_second": 4.068, + "eval_steps_per_second": 0.512, + "eval_wer": 0.24464871119110368, + "step": 7920 + }, + { + "epoch": 110.14, + "learning_rate": 3.208571428571429e-05, + "loss": 0.4582, + "step": 7930 + }, + { + "epoch": 110.28, + "learning_rate": 3.207428571428572e-05, + "loss": 0.4583, + "step": 7940 + }, + { + "epoch": 110.42, + "learning_rate": 3.2062857142857145e-05, + "loss": 0.4638, + "step": 7950 + }, + { + "epoch": 110.55, + "learning_rate": 3.205142857142857e-05, + "loss": 0.4596, + "step": 7960 + }, + { + "epoch": 110.69, + "learning_rate": 3.2040000000000005e-05, + "loss": 0.4533, + "step": 7970 + }, + { + "epoch": 110.83, + "learning_rate": 3.202857142857143e-05, + "loss": 0.4492, + "step": 7980 + }, + { + "epoch": 110.97, + "learning_rate": 3.201714285714286e-05, + "loss": 0.4598, + "step": 7990 + }, + { + "epoch": 111.0, + "eval_loss": 0.48683521151542664, + "eval_runtime": 127.9159, + "eval_samples_per_second": 4.159, + "eval_steps_per_second": 0.524, + "eval_wer": 0.22440059137365817, + "step": 7992 + }, + { + "epoch": 111.11, + "learning_rate": 3.200571428571429e-05, + "loss": 0.4703, + "step": 8000 + }, + { + "epoch": 111.25, + "learning_rate": 3.199428571428572e-05, + "loss": 0.4533, + "step": 8010 + }, + { + "epoch": 111.39, + "learning_rate": 3.1982857142857145e-05, + "loss": 0.4475, + "step": 8020 + }, + { + "epoch": 111.53, + "learning_rate": 3.197142857142857e-05, + "loss": 0.447, + "step": 8030 + }, + { + "epoch": 111.66, + "learning_rate": 3.1960000000000006e-05, + "loss": 0.457, + "step": 8040 + }, + { + "epoch": 111.8, + "learning_rate": 3.194857142857143e-05, + "loss": 0.463, + "step": 8050 + }, + { + "epoch": 111.94, + "learning_rate": 3.193714285714286e-05, + "loss": 0.4586, + "step": 8060 + }, + { + "epoch": 112.0, + "eval_loss": 0.5303194522857666, + "eval_runtime": 127.0804, + "eval_samples_per_second": 4.186, + "eval_steps_per_second": 0.527, + "eval_wer": 0.2366780227550299, + "step": 8064 + }, + { + "epoch": 112.08, + "learning_rate": 3.1925714285714286e-05, + "loss": 0.4705, + "step": 8070 + }, + { + "epoch": 112.22, + "learning_rate": 3.191428571428571e-05, + "loss": 0.4476, + "step": 8080 + }, + { + "epoch": 112.36, + "learning_rate": 3.1902857142857146e-05, + "loss": 0.454, + "step": 8090 + }, + { + "epoch": 112.5, + "learning_rate": 3.189142857142857e-05, + "loss": 0.4656, + "step": 8100 + }, + { + "epoch": 112.64, + "learning_rate": 3.1880000000000006e-05, + "loss": 0.4543, + "step": 8110 + }, + { + "epoch": 112.78, + "learning_rate": 3.186857142857143e-05, + "loss": 0.4494, + "step": 8120 + }, + { + "epoch": 112.91, + "learning_rate": 3.185714285714286e-05, + "loss": 0.4551, + "step": 8130 + }, + { + "epoch": 113.0, + "eval_loss": 0.5224958062171936, + "eval_runtime": 126.7319, + "eval_samples_per_second": 4.198, + "eval_steps_per_second": 0.529, + "eval_wer": 0.22613614450086778, + "step": 8136 + }, + { + "epoch": 113.06, + "learning_rate": 3.184571428571429e-05, + "loss": 0.4594, + "step": 8140 + }, + { + "epoch": 113.19, + "learning_rate": 3.1834285714285713e-05, + "loss": 0.4422, + "step": 8150 + }, + { + "epoch": 113.33, + "learning_rate": 3.182285714285715e-05, + "loss": 0.4448, + "step": 8160 + }, + { + "epoch": 113.47, + "learning_rate": 3.1811428571428574e-05, + "loss": 0.4457, + "step": 8170 + }, + { + "epoch": 113.61, + "learning_rate": 3.180000000000001e-05, + "loss": 0.44, + "step": 8180 + }, + { + "epoch": 113.75, + "learning_rate": 3.1788571428571434e-05, + "loss": 0.4466, + "step": 8190 + }, + { + "epoch": 113.89, + "learning_rate": 3.177714285714286e-05, + "loss": 0.443, + "step": 8200 + }, + { + "epoch": 114.0, + "eval_loss": 0.5137814283370972, + "eval_runtime": 127.3506, + "eval_samples_per_second": 4.177, + "eval_steps_per_second": 0.526, + "eval_wer": 0.2375779391913608, + "step": 8208 + }, + { + "epoch": 114.03, + "learning_rate": 3.176571428571429e-05, + "loss": 0.4876, + "step": 8210 + }, + { + "epoch": 114.17, + "learning_rate": 3.1754285714285714e-05, + "loss": 0.451, + "step": 8220 + }, + { + "epoch": 114.3, + "learning_rate": 3.174285714285715e-05, + "loss": 0.4516, + "step": 8230 + }, + { + "epoch": 114.44, + "learning_rate": 3.1731428571428574e-05, + "loss": 0.4729, + "step": 8240 + }, + { + "epoch": 114.58, + "learning_rate": 3.172e-05, + "loss": 0.4518, + "step": 8250 + }, + { + "epoch": 114.72, + "learning_rate": 3.170857142857143e-05, + "loss": 0.4539, + "step": 8260 + }, + { + "epoch": 114.86, + "learning_rate": 3.169714285714286e-05, + "loss": 0.4494, + "step": 8270 + }, + { + "epoch": 115.0, + "learning_rate": 3.168571428571429e-05, + "loss": 0.4735, + "step": 8280 + }, + { + "epoch": 115.0, + "eval_loss": 0.5186481475830078, + "eval_runtime": 127.4886, + "eval_samples_per_second": 4.173, + "eval_steps_per_second": 0.526, + "eval_wer": 0.23474963039146365, + "step": 8280 + }, + { + "epoch": 115.14, + "learning_rate": 3.1674285714285715e-05, + "loss": 0.4646, + "step": 8290 + }, + { + "epoch": 115.28, + "learning_rate": 3.166285714285715e-05, + "loss": 0.4725, + "step": 8300 + }, + { + "epoch": 115.42, + "learning_rate": 3.1651428571428575e-05, + "loss": 0.4592, + "step": 8310 + }, + { + "epoch": 115.55, + "learning_rate": 3.164e-05, + "loss": 0.4649, + "step": 8320 + }, + { + "epoch": 115.69, + "learning_rate": 3.162857142857143e-05, + "loss": 0.4572, + "step": 8330 + }, + { + "epoch": 115.83, + "learning_rate": 3.161714285714286e-05, + "loss": 0.4624, + "step": 8340 + }, + { + "epoch": 115.97, + "learning_rate": 3.160571428571429e-05, + "loss": 0.4645, + "step": 8350 + }, + { + "epoch": 116.0, + "eval_loss": 0.5066367387771606, + "eval_runtime": 126.9917, + "eval_samples_per_second": 4.189, + "eval_steps_per_second": 0.528, + "eval_wer": 0.23288551777334962, + "step": 8352 + }, + { + "epoch": 116.11, + "learning_rate": 3.1594285714285716e-05, + "loss": 0.4698, + "step": 8360 + }, + { + "epoch": 116.25, + "learning_rate": 3.158285714285715e-05, + "loss": 0.4484, + "step": 8370 + }, + { + "epoch": 116.39, + "learning_rate": 3.1571428571428576e-05, + "loss": 0.4523, + "step": 8380 + }, + { + "epoch": 116.53, + "learning_rate": 3.156e-05, + "loss": 0.4551, + "step": 8390 + }, + { + "epoch": 116.66, + "learning_rate": 3.154857142857143e-05, + "loss": 0.4524, + "step": 8400 + }, + { + "epoch": 116.8, + "learning_rate": 3.153714285714286e-05, + "loss": 0.4426, + "step": 8410 + }, + { + "epoch": 116.94, + "learning_rate": 3.152571428571429e-05, + "loss": 0.4515, + "step": 8420 + }, + { + "epoch": 117.0, + "eval_loss": 0.5190147757530212, + "eval_runtime": 126.8196, + "eval_samples_per_second": 4.195, + "eval_steps_per_second": 0.528, + "eval_wer": 0.23166420260975767, + "step": 8424 + }, + { + "epoch": 117.08, + "learning_rate": 3.1514285714285717e-05, + "loss": 0.4593, + "step": 8430 + }, + { + "epoch": 117.22, + "learning_rate": 3.150285714285714e-05, + "loss": 0.4578, + "step": 8440 + }, + { + "epoch": 117.36, + "learning_rate": 3.149142857142857e-05, + "loss": 0.4559, + "step": 8450 + }, + { + "epoch": 117.5, + "learning_rate": 3.1480000000000004e-05, + "loss": 0.4504, + "step": 8460 + }, + { + "epoch": 117.64, + "learning_rate": 3.146857142857143e-05, + "loss": 0.441, + "step": 8470 + }, + { + "epoch": 117.78, + "learning_rate": 3.1457142857142864e-05, + "loss": 0.453, + "step": 8480 + }, + { + "epoch": 117.91, + "learning_rate": 3.144571428571429e-05, + "loss": 0.4376, + "step": 8490 + }, + { + "epoch": 118.0, + "eval_loss": 0.550697386264801, + "eval_runtime": 126.9179, + "eval_samples_per_second": 4.192, + "eval_steps_per_second": 0.528, + "eval_wer": 0.2325641190460886, + "step": 8496 + }, + { + "epoch": 118.06, + "learning_rate": 3.143428571428572e-05, + "loss": 0.4512, + "step": 8500 + }, + { + "epoch": 118.19, + "learning_rate": 3.1422857142857144e-05, + "loss": 0.4573, + "step": 8510 + }, + { + "epoch": 118.33, + "learning_rate": 3.141142857142857e-05, + "loss": 0.4405, + "step": 8520 + }, + { + "epoch": 118.47, + "learning_rate": 3.1400000000000004e-05, + "loss": 0.4405, + "step": 8530 + }, + { + "epoch": 118.61, + "learning_rate": 3.138857142857143e-05, + "loss": 0.4349, + "step": 8540 + }, + { + "epoch": 118.75, + "learning_rate": 3.1377142857142865e-05, + "loss": 0.4397, + "step": 8550 + }, + { + "epoch": 118.89, + "learning_rate": 3.136571428571429e-05, + "loss": 0.4364, + "step": 8560 + }, + { + "epoch": 119.0, + "eval_loss": 0.49354130029678345, + "eval_runtime": 126.9677, + "eval_samples_per_second": 4.19, + "eval_steps_per_second": 0.528, + "eval_wer": 0.22742173940991195, + "step": 8568 + }, + { + "epoch": 119.03, + "learning_rate": 3.135428571428572e-05, + "loss": 0.4614, + "step": 8570 + }, + { + "epoch": 119.17, + "learning_rate": 3.1342857142857145e-05, + "loss": 0.4338, + "step": 8580 + }, + { + "epoch": 119.3, + "learning_rate": 3.133142857142857e-05, + "loss": 0.4399, + "step": 8590 + }, + { + "epoch": 119.44, + "learning_rate": 3.1320000000000005e-05, + "loss": 0.4437, + "step": 8600 + }, + { + "epoch": 119.58, + "learning_rate": 3.130857142857143e-05, + "loss": 0.453, + "step": 8610 + }, + { + "epoch": 119.72, + "learning_rate": 3.129714285714286e-05, + "loss": 0.4529, + "step": 8620 + }, + { + "epoch": 119.86, + "learning_rate": 3.1285714285714285e-05, + "loss": 0.4554, + "step": 8630 + }, + { + "epoch": 120.0, + "learning_rate": 3.127428571428571e-05, + "loss": 0.4441, + "step": 8640 + }, + { + "epoch": 120.0, + "eval_loss": 0.5050033926963806, + "eval_runtime": 127.3447, + "eval_samples_per_second": 4.178, + "eval_steps_per_second": 0.526, + "eval_wer": 0.2224079192646397, + "step": 8640 + }, + { + "epoch": 120.14, + "learning_rate": 3.1262857142857146e-05, + "loss": 0.4485, + "step": 8650 + }, + { + "epoch": 120.28, + "learning_rate": 3.125142857142857e-05, + "loss": 0.4454, + "step": 8660 + }, + { + "epoch": 120.42, + "learning_rate": 3.1240000000000006e-05, + "loss": 0.4319, + "step": 8670 + }, + { + "epoch": 120.55, + "learning_rate": 3.122857142857143e-05, + "loss": 0.4453, + "step": 8680 + }, + { + "epoch": 120.69, + "learning_rate": 3.121714285714286e-05, + "loss": 0.4387, + "step": 8690 + }, + { + "epoch": 120.83, + "learning_rate": 3.1205714285714286e-05, + "loss": 0.4436, + "step": 8700 + }, + { + "epoch": 120.97, + "learning_rate": 3.119428571428571e-05, + "loss": 0.4583, + "step": 8710 + }, + { + "epoch": 121.0, + "eval_loss": 0.5257618427276611, + "eval_runtime": 127.0648, + "eval_samples_per_second": 4.187, + "eval_steps_per_second": 0.527, + "eval_wer": 0.23314263675515845, + "step": 8712 + }, + { + "epoch": 121.11, + "learning_rate": 3.1182857142857146e-05, + "loss": 0.4621, + "step": 8720 + }, + { + "epoch": 121.25, + "learning_rate": 3.117142857142857e-05, + "loss": 0.4502, + "step": 8730 + }, + { + "epoch": 121.39, + "learning_rate": 3.1160000000000007e-05, + "loss": 0.445, + "step": 8740 + }, + { + "epoch": 121.53, + "learning_rate": 3.114857142857143e-05, + "loss": 0.462, + "step": 8750 + }, + { + "epoch": 121.66, + "learning_rate": 3.113714285714286e-05, + "loss": 0.4498, + "step": 8760 + }, + { + "epoch": 121.8, + "learning_rate": 3.112571428571429e-05, + "loss": 0.4499, + "step": 8770 + }, + { + "epoch": 121.94, + "learning_rate": 3.1114285714285714e-05, + "loss": 0.4525, + "step": 8780 + }, + { + "epoch": 122.0, + "eval_loss": 0.5263261198997498, + "eval_runtime": 127.2524, + "eval_samples_per_second": 4.181, + "eval_steps_per_second": 0.527, + "eval_wer": 0.2296715305007392, + "step": 8784 + }, + { + "epoch": 122.08, + "learning_rate": 3.110285714285715e-05, + "loss": 0.4488, + "step": 8790 + }, + { + "epoch": 122.22, + "learning_rate": 3.1091428571428574e-05, + "loss": 0.449, + "step": 8800 + }, + { + "epoch": 122.36, + "learning_rate": 3.108e-05, + "loss": 0.4336, + "step": 8810 + }, + { + "epoch": 122.5, + "learning_rate": 3.106857142857143e-05, + "loss": 0.4403, + "step": 8820 + }, + { + "epoch": 122.64, + "learning_rate": 3.105714285714286e-05, + "loss": 0.4554, + "step": 8830 + }, + { + "epoch": 122.78, + "learning_rate": 3.104571428571429e-05, + "loss": 0.4511, + "step": 8840 + }, + { + "epoch": 122.91, + "learning_rate": 3.103428571428572e-05, + "loss": 0.4448, + "step": 8850 + }, + { + "epoch": 123.0, + "eval_loss": 0.5362554788589478, + "eval_runtime": 126.9397, + "eval_samples_per_second": 4.191, + "eval_steps_per_second": 0.528, + "eval_wer": 0.2229864369737096, + "step": 8856 + }, + { + "epoch": 123.06, + "learning_rate": 3.102285714285715e-05, + "loss": 0.4553, + "step": 8860 + }, + { + "epoch": 123.19, + "learning_rate": 3.1011428571428575e-05, + "loss": 0.4502, + "step": 8870 + }, + { + "epoch": 123.33, + "learning_rate": 3.1e-05, + "loss": 0.4525, + "step": 8880 + }, + { + "epoch": 123.47, + "learning_rate": 3.098857142857143e-05, + "loss": 0.4499, + "step": 8890 + }, + { + "epoch": 123.61, + "learning_rate": 3.097714285714286e-05, + "loss": 0.46, + "step": 8900 + }, + { + "epoch": 123.75, + "learning_rate": 3.096571428571429e-05, + "loss": 0.4556, + "step": 8910 + }, + { + "epoch": 123.89, + "learning_rate": 3.095428571428572e-05, + "loss": 0.4598, + "step": 8920 + }, + { + "epoch": 124.0, + "eval_loss": 0.5361588597297668, + "eval_runtime": 127.2634, + "eval_samples_per_second": 4.18, + "eval_steps_per_second": 0.526, + "eval_wer": 0.23905637333676158, + "step": 8928 + }, + { + "epoch": 124.03, + "learning_rate": 3.094285714285715e-05, + "loss": 0.473, + "step": 8930 + }, + { + "epoch": 124.17, + "learning_rate": 3.0931428571428575e-05, + "loss": 0.4693, + "step": 8940 + }, + { + "epoch": 124.3, + "learning_rate": 3.092e-05, + "loss": 0.4675, + "step": 8950 + }, + { + "epoch": 124.44, + "learning_rate": 3.090857142857143e-05, + "loss": 0.4557, + "step": 8960 + }, + { + "epoch": 124.58, + "learning_rate": 3.089714285714286e-05, + "loss": 0.4653, + "step": 8970 + }, + { + "epoch": 124.72, + "learning_rate": 3.088571428571429e-05, + "loss": 0.4484, + "step": 8980 + }, + { + "epoch": 124.86, + "learning_rate": 3.0874285714285716e-05, + "loss": 0.446, + "step": 8990 + }, + { + "epoch": 125.0, + "learning_rate": 3.086285714285714e-05, + "loss": 0.4447, + "step": 9000 + }, + { + "epoch": 125.0, + "eval_loss": 0.5188495516777039, + "eval_runtime": 126.7943, + "eval_samples_per_second": 4.196, + "eval_steps_per_second": 0.528, + "eval_wer": 0.22459343061001477, + "step": 9000 + }, + { + "epoch": 125.14, + "learning_rate": 3.085142857142857e-05, + "loss": 0.4488, + "step": 9010 + }, + { + "epoch": 125.28, + "learning_rate": 3.084e-05, + "loss": 0.4434, + "step": 9020 + }, + { + "epoch": 125.42, + "learning_rate": 3.082857142857143e-05, + "loss": 0.4499, + "step": 9030 + }, + { + "epoch": 125.55, + "learning_rate": 3.081714285714286e-05, + "loss": 0.445, + "step": 9040 + }, + { + "epoch": 125.69, + "learning_rate": 3.080571428571429e-05, + "loss": 0.4528, + "step": 9050 + }, + { + "epoch": 125.83, + "learning_rate": 3.079428571428572e-05, + "loss": 0.4573, + "step": 9060 + }, + { + "epoch": 125.97, + "learning_rate": 3.078285714285714e-05, + "loss": 0.4604, + "step": 9070 + }, + { + "epoch": 126.0, + "eval_loss": 0.5183969140052795, + "eval_runtime": 127.9613, + "eval_samples_per_second": 4.158, + "eval_steps_per_second": 0.524, + "eval_wer": 0.23185704184611428, + "step": 9072 + }, + { + "epoch": 126.11, + "learning_rate": 3.077142857142857e-05, + "loss": 0.4803, + "step": 9080 + }, + { + "epoch": 126.25, + "learning_rate": 3.0760000000000004e-05, + "loss": 0.4647, + "step": 9090 + }, + { + "epoch": 126.39, + "learning_rate": 3.074857142857143e-05, + "loss": 0.4403, + "step": 9100 + }, + { + "epoch": 126.53, + "learning_rate": 3.0737142857142864e-05, + "loss": 0.4736, + "step": 9110 + }, + { + "epoch": 126.66, + "learning_rate": 3.072571428571429e-05, + "loss": 0.4697, + "step": 9120 + }, + { + "epoch": 126.8, + "learning_rate": 3.071428571428572e-05, + "loss": 0.4836, + "step": 9130 + }, + { + "epoch": 126.94, + "learning_rate": 3.0702857142857144e-05, + "loss": 0.4582, + "step": 9140 + }, + { + "epoch": 127.0, + "eval_loss": 0.5066961646080017, + "eval_runtime": 127.0768, + "eval_samples_per_second": 4.186, + "eval_steps_per_second": 0.527, + "eval_wer": 0.2335283152278717, + "step": 9144 + }, + { + "epoch": 127.08, + "learning_rate": 3.069142857142857e-05, + "loss": 0.4556, + "step": 9150 + }, + { + "epoch": 127.22, + "learning_rate": 3.0680000000000004e-05, + "loss": 0.444, + "step": 9160 + }, + { + "epoch": 127.36, + "learning_rate": 3.066857142857143e-05, + "loss": 0.4418, + "step": 9170 + }, + { + "epoch": 127.5, + "learning_rate": 3.065714285714286e-05, + "loss": 0.4407, + "step": 9180 + }, + { + "epoch": 127.64, + "learning_rate": 3.0645714285714285e-05, + "loss": 0.4363, + "step": 9190 + }, + { + "epoch": 127.78, + "learning_rate": 3.063428571428572e-05, + "loss": 0.4471, + "step": 9200 + }, + { + "epoch": 127.91, + "learning_rate": 3.0622857142857145e-05, + "loss": 0.439, + "step": 9210 + }, + { + "epoch": 128.0, + "eval_loss": 0.5583868026733398, + "eval_runtime": 127.7205, + "eval_samples_per_second": 4.165, + "eval_steps_per_second": 0.525, + "eval_wer": 0.2359066658096034, + "step": 9216 + }, + { + "epoch": 128.06, + "learning_rate": 3.061142857142857e-05, + "loss": 0.4641, + "step": 9220 + }, + { + "epoch": 128.19, + "learning_rate": 3.0600000000000005e-05, + "loss": 0.4432, + "step": 9230 + }, + { + "epoch": 128.33, + "learning_rate": 3.058857142857143e-05, + "loss": 0.4523, + "step": 9240 + }, + { + "epoch": 128.47, + "learning_rate": 3.057714285714286e-05, + "loss": 0.449, + "step": 9250 + }, + { + "epoch": 128.61, + "learning_rate": 3.0565714285714285e-05, + "loss": 0.437, + "step": 9260 + }, + { + "epoch": 128.75, + "learning_rate": 3.055428571428572e-05, + "loss": 0.4308, + "step": 9270 + }, + { + "epoch": 128.89, + "learning_rate": 3.0542857142857146e-05, + "loss": 0.4396, + "step": 9280 + }, + { + "epoch": 129.0, + "eval_loss": 0.5287209153175354, + "eval_runtime": 126.9423, + "eval_samples_per_second": 4.191, + "eval_steps_per_second": 0.528, + "eval_wer": 0.23378543420968054, + "step": 9288 + }, + { + "epoch": 129.03, + "learning_rate": 3.053142857142857e-05, + "loss": 0.4602, + "step": 9290 + }, + { + "epoch": 129.17, + "learning_rate": 3.0520000000000006e-05, + "loss": 0.433, + "step": 9300 + }, + { + "epoch": 129.3, + "learning_rate": 3.050857142857143e-05, + "loss": 0.4433, + "step": 9310 + }, + { + "epoch": 129.44, + "learning_rate": 3.049714285714286e-05, + "loss": 0.4207, + "step": 9320 + }, + { + "epoch": 129.58, + "learning_rate": 3.0485714285714286e-05, + "loss": 0.451, + "step": 9330 + }, + { + "epoch": 129.72, + "learning_rate": 3.047428571428572e-05, + "loss": 0.4592, + "step": 9340 + }, + { + "epoch": 129.86, + "learning_rate": 3.0462857142857146e-05, + "loss": 0.4451, + "step": 9350 + }, + { + "epoch": 130.0, + "learning_rate": 3.0451428571428573e-05, + "loss": 0.4461, + "step": 9360 + }, + { + "epoch": 130.0, + "eval_loss": 0.5332010388374329, + "eval_runtime": 127.1595, + "eval_samples_per_second": 4.184, + "eval_steps_per_second": 0.527, + "eval_wer": 0.23217844057337533, + "step": 9360 + }, + { + "epoch": 130.14, + "learning_rate": 3.0440000000000003e-05, + "loss": 0.4535, + "step": 9370 + }, + { + "epoch": 130.28, + "learning_rate": 3.042857142857143e-05, + "loss": 0.4494, + "step": 9380 + }, + { + "epoch": 130.42, + "learning_rate": 3.041714285714286e-05, + "loss": 0.4298, + "step": 9390 + }, + { + "epoch": 130.55, + "learning_rate": 3.0405714285714287e-05, + "loss": 0.433, + "step": 9400 + }, + { + "epoch": 130.69, + "learning_rate": 3.0394285714285717e-05, + "loss": 0.442, + "step": 9410 + }, + { + "epoch": 130.83, + "learning_rate": 3.0382857142857144e-05, + "loss": 0.4452, + "step": 9420 + }, + { + "epoch": 130.97, + "learning_rate": 3.037142857142857e-05, + "loss": 0.4654, + "step": 9430 + }, + { + "epoch": 131.0, + "eval_loss": 0.49537086486816406, + "eval_runtime": 128.5196, + "eval_samples_per_second": 4.139, + "eval_steps_per_second": 0.521, + "eval_wer": 0.229607250755287, + "step": 9432 + }, + { + "epoch": 131.11, + "learning_rate": 3.0360000000000004e-05, + "loss": 0.4646, + "step": 9440 + }, + { + "epoch": 131.25, + "learning_rate": 3.034857142857143e-05, + "loss": 0.4493, + "step": 9450 + }, + { + "epoch": 131.39, + "learning_rate": 3.033714285714286e-05, + "loss": 0.4358, + "step": 9460 + }, + { + "epoch": 131.53, + "learning_rate": 3.0325714285714288e-05, + "loss": 0.4361, + "step": 9470 + }, + { + "epoch": 131.66, + "learning_rate": 3.0314285714285718e-05, + "loss": 0.4384, + "step": 9480 + }, + { + "epoch": 131.8, + "learning_rate": 3.0302857142857145e-05, + "loss": 0.4396, + "step": 9490 + }, + { + "epoch": 131.94, + "learning_rate": 3.0291428571428575e-05, + "loss": 0.4303, + "step": 9500 + }, + { + "epoch": 132.0, + "eval_loss": 0.5328178405761719, + "eval_runtime": 127.4601, + "eval_samples_per_second": 4.174, + "eval_steps_per_second": 0.526, + "eval_wer": 0.22620042424631998, + "step": 9504 + }, + { + "epoch": 132.08, + "learning_rate": 3.028e-05, + "loss": 0.4355, + "step": 9510 + }, + { + "epoch": 132.22, + "learning_rate": 3.0268571428571428e-05, + "loss": 0.4388, + "step": 9520 + }, + { + "epoch": 132.36, + "learning_rate": 3.0257142857142862e-05, + "loss": 0.4572, + "step": 9530 + }, + { + "epoch": 132.5, + "learning_rate": 3.024571428571429e-05, + "loss": 0.4593, + "step": 9540 + }, + { + "epoch": 132.64, + "learning_rate": 3.023428571428572e-05, + "loss": 0.4514, + "step": 9550 + }, + { + "epoch": 132.78, + "learning_rate": 3.0222857142857145e-05, + "loss": 0.4493, + "step": 9560 + }, + { + "epoch": 132.91, + "learning_rate": 3.0211428571428575e-05, + "loss": 0.4413, + "step": 9570 + }, + { + "epoch": 133.0, + "eval_loss": 0.5558308362960815, + "eval_runtime": 127.2236, + "eval_samples_per_second": 4.182, + "eval_steps_per_second": 0.527, + "eval_wer": 0.23622806453686443, + "step": 9576 + }, + { + "epoch": 133.06, + "learning_rate": 3.0200000000000002e-05, + "loss": 0.47, + "step": 9580 + }, + { + "epoch": 133.19, + "learning_rate": 3.018857142857143e-05, + "loss": 0.4472, + "step": 9590 + }, + { + "epoch": 133.33, + "learning_rate": 3.017714285714286e-05, + "loss": 0.4622, + "step": 9600 + }, + { + "epoch": 133.47, + "learning_rate": 3.0165714285714286e-05, + "loss": 0.4517, + "step": 9610 + }, + { + "epoch": 133.61, + "learning_rate": 3.015428571428572e-05, + "loss": 0.447, + "step": 9620 + }, + { + "epoch": 133.75, + "learning_rate": 3.0142857142857146e-05, + "loss": 0.4569, + "step": 9630 + }, + { + "epoch": 133.89, + "learning_rate": 3.0131428571428576e-05, + "loss": 0.4406, + "step": 9640 + }, + { + "epoch": 134.0, + "eval_loss": 0.5305873155593872, + "eval_runtime": 126.9175, + "eval_samples_per_second": 4.192, + "eval_steps_per_second": 0.528, + "eval_wer": 0.22735745966445972, + "step": 9648 + }, + { + "epoch": 134.03, + "learning_rate": 3.0120000000000003e-05, + "loss": 0.4634, + "step": 9650 + }, + { + "epoch": 134.17, + "learning_rate": 3.010857142857143e-05, + "loss": 0.4428, + "step": 9660 + }, + { + "epoch": 134.3, + "learning_rate": 3.009714285714286e-05, + "loss": 0.4375, + "step": 9670 + }, + { + "epoch": 134.44, + "learning_rate": 3.0085714285714287e-05, + "loss": 0.4561, + "step": 9680 + }, + { + "epoch": 134.58, + "learning_rate": 3.0074285714285717e-05, + "loss": 0.4467, + "step": 9690 + }, + { + "epoch": 134.72, + "learning_rate": 3.0062857142857143e-05, + "loss": 0.4381, + "step": 9700 + }, + { + "epoch": 134.86, + "learning_rate": 3.0051428571428577e-05, + "loss": 0.429, + "step": 9710 + }, + { + "epoch": 135.0, + "learning_rate": 3.0040000000000004e-05, + "loss": 0.4249, + "step": 9720 + }, + { + "epoch": 135.0, + "eval_loss": 0.5095993876457214, + "eval_runtime": 126.6382, + "eval_samples_per_second": 4.201, + "eval_steps_per_second": 0.529, + "eval_wer": 0.2191296522465771, + "step": 9720 + }, + { + "epoch": 135.14, + "learning_rate": 3.002857142857143e-05, + "loss": 0.4376, + "step": 9730 + }, + { + "epoch": 135.28, + "learning_rate": 3.001714285714286e-05, + "loss": 0.4492, + "step": 9740 + }, + { + "epoch": 135.42, + "learning_rate": 3.0005714285714287e-05, + "loss": 0.4302, + "step": 9750 + }, + { + "epoch": 135.55, + "learning_rate": 2.9994285714285718e-05, + "loss": 0.4409, + "step": 9760 + }, + { + "epoch": 135.69, + "learning_rate": 2.9982857142857144e-05, + "loss": 0.452, + "step": 9770 + }, + { + "epoch": 135.83, + "learning_rate": 2.9971428571428574e-05, + "loss": 0.4341, + "step": 9780 + }, + { + "epoch": 135.97, + "learning_rate": 2.996e-05, + "loss": 0.4359, + "step": 9790 + }, + { + "epoch": 136.0, + "eval_loss": 0.5437365174293518, + "eval_runtime": 126.924, + "eval_samples_per_second": 4.191, + "eval_steps_per_second": 0.528, + "eval_wer": 0.2240149129009449, + "step": 9792 + }, + { + "epoch": 136.11, + "learning_rate": 2.9948571428571428e-05, + "loss": 0.4474, + "step": 9800 + }, + { + "epoch": 136.25, + "learning_rate": 2.993714285714286e-05, + "loss": 0.4496, + "step": 9810 + }, + { + "epoch": 136.39, + "learning_rate": 2.9925714285714288e-05, + "loss": 0.443, + "step": 9820 + }, + { + "epoch": 136.53, + "learning_rate": 2.9914285714285718e-05, + "loss": 0.4673, + "step": 9830 + }, + { + "epoch": 136.66, + "learning_rate": 2.9902857142857145e-05, + "loss": 0.4483, + "step": 9840 + }, + { + "epoch": 136.8, + "learning_rate": 2.9891428571428575e-05, + "loss": 0.4416, + "step": 9850 + }, + { + "epoch": 136.94, + "learning_rate": 2.9880000000000002e-05, + "loss": 0.4535, + "step": 9860 + }, + { + "epoch": 137.0, + "eval_loss": 0.5400481224060059, + "eval_runtime": 127.3795, + "eval_samples_per_second": 4.176, + "eval_steps_per_second": 0.526, + "eval_wer": 0.23076428617342676, + "step": 9864 + }, + { + "epoch": 137.08, + "learning_rate": 2.986857142857143e-05, + "loss": 0.4738, + "step": 9870 + }, + { + "epoch": 137.22, + "learning_rate": 2.985714285714286e-05, + "loss": 0.4435, + "step": 9880 + }, + { + "epoch": 137.36, + "learning_rate": 2.9845714285714286e-05, + "loss": 0.4605, + "step": 9890 + }, + { + "epoch": 137.5, + "learning_rate": 2.983428571428572e-05, + "loss": 0.4504, + "step": 9900 + }, + { + "epoch": 137.64, + "learning_rate": 2.9822857142857146e-05, + "loss": 0.4461, + "step": 9910 + }, + { + "epoch": 137.78, + "learning_rate": 2.9811428571428576e-05, + "loss": 0.4411, + "step": 9920 + }, + { + "epoch": 137.91, + "learning_rate": 2.9800000000000003e-05, + "loss": 0.4366, + "step": 9930 + }, + { + "epoch": 138.0, + "eval_loss": 0.5375600457191467, + "eval_runtime": 126.626, + "eval_samples_per_second": 4.201, + "eval_steps_per_second": 0.529, + "eval_wer": 0.2270360609371987, + "step": 9936 + }, + { + "epoch": 138.06, + "learning_rate": 2.978857142857143e-05, + "loss": 0.437, + "step": 9940 + }, + { + "epoch": 138.19, + "learning_rate": 2.977714285714286e-05, + "loss": 0.4342, + "step": 9950 + }, + { + "epoch": 138.33, + "learning_rate": 2.9765714285714286e-05, + "loss": 0.436, + "step": 9960 + }, + { + "epoch": 138.47, + "learning_rate": 2.9754285714285716e-05, + "loss": 0.4488, + "step": 9970 + }, + { + "epoch": 138.61, + "learning_rate": 2.9742857142857143e-05, + "loss": 0.4509, + "step": 9980 + }, + { + "epoch": 138.75, + "learning_rate": 2.9731428571428577e-05, + "loss": 0.4292, + "step": 9990 + }, + { + "epoch": 138.89, + "learning_rate": 2.9720000000000003e-05, + "loss": 0.4312, + "step": 10000 + }, + { + "epoch": 139.0, + "eval_loss": 0.5271294713020325, + "eval_runtime": 127.0263, + "eval_samples_per_second": 4.188, + "eval_steps_per_second": 0.527, + "eval_wer": 0.22491482933727583, + "step": 10008 + }, + { + "epoch": 139.03, + "learning_rate": 2.970857142857143e-05, + "loss": 0.4448, + "step": 10010 + }, + { + "epoch": 139.17, + "learning_rate": 2.969714285714286e-05, + "loss": 0.4286, + "step": 10020 + }, + { + "epoch": 139.3, + "learning_rate": 2.9685714285714287e-05, + "loss": 0.4314, + "step": 10030 + }, + { + "epoch": 139.44, + "learning_rate": 2.9674285714285717e-05, + "loss": 0.436, + "step": 10040 + }, + { + "epoch": 139.58, + "learning_rate": 2.9662857142857144e-05, + "loss": 0.4355, + "step": 10050 + }, + { + "epoch": 139.72, + "learning_rate": 2.9651428571428574e-05, + "loss": 0.4355, + "step": 10060 + }, + { + "epoch": 139.86, + "learning_rate": 2.964e-05, + "loss": 0.4361, + "step": 10070 + }, + { + "epoch": 140.0, + "learning_rate": 2.9628571428571434e-05, + "loss": 0.4369, + "step": 10080 + }, + { + "epoch": 140.0, + "eval_loss": 0.5074235796928406, + "eval_runtime": 126.7888, + "eval_samples_per_second": 4.196, + "eval_steps_per_second": 0.528, + "eval_wer": 0.219708169955647, + "step": 10080 + }, + { + "epoch": 140.14, + "learning_rate": 2.961714285714286e-05, + "loss": 0.4327, + "step": 10090 + }, + { + "epoch": 140.28, + "learning_rate": 2.9605714285714288e-05, + "loss": 0.4317, + "step": 10100 + }, + { + "epoch": 140.42, + "learning_rate": 2.9594285714285718e-05, + "loss": 0.4337, + "step": 10110 + }, + { + "epoch": 140.55, + "learning_rate": 2.9582857142857145e-05, + "loss": 0.4343, + "step": 10120 + }, + { + "epoch": 140.69, + "learning_rate": 2.9571428571428575e-05, + "loss": 0.4366, + "step": 10130 + }, + { + "epoch": 140.83, + "learning_rate": 2.956e-05, + "loss": 0.4437, + "step": 10140 + }, + { + "epoch": 140.97, + "learning_rate": 2.9548571428571432e-05, + "loss": 0.4365, + "step": 10150 + }, + { + "epoch": 141.0, + "eval_loss": 0.5184508562088013, + "eval_runtime": 127.6636, + "eval_samples_per_second": 4.167, + "eval_steps_per_second": 0.525, + "eval_wer": 0.2325641190460886, + "step": 10152 + }, + { + "epoch": 141.11, + "learning_rate": 2.953714285714286e-05, + "loss": 0.445, + "step": 10160 + }, + { + "epoch": 141.25, + "learning_rate": 2.9525714285714285e-05, + "loss": 0.4424, + "step": 10170 + }, + { + "epoch": 141.39, + "learning_rate": 2.951428571428572e-05, + "loss": 0.4338, + "step": 10180 + }, + { + "epoch": 141.53, + "learning_rate": 2.9502857142857145e-05, + "loss": 0.44, + "step": 10190 + }, + { + "epoch": 141.66, + "learning_rate": 2.9491428571428576e-05, + "loss": 0.4254, + "step": 10200 + }, + { + "epoch": 141.8, + "learning_rate": 2.9480000000000002e-05, + "loss": 0.4273, + "step": 10210 + }, + { + "epoch": 141.94, + "learning_rate": 2.9468571428571432e-05, + "loss": 0.416, + "step": 10220 + }, + { + "epoch": 142.0, + "eval_loss": 0.49054965376853943, + "eval_runtime": 127.392, + "eval_samples_per_second": 4.176, + "eval_steps_per_second": 0.526, + "eval_wer": 0.22343639519187505, + "step": 10224 + }, + { + "epoch": 142.08, + "learning_rate": 2.945714285714286e-05, + "loss": 0.4325, + "step": 10230 + }, + { + "epoch": 142.22, + "learning_rate": 2.9445714285714286e-05, + "loss": 0.4264, + "step": 10240 + }, + { + "epoch": 142.36, + "learning_rate": 2.9434285714285716e-05, + "loss": 0.4335, + "step": 10250 + }, + { + "epoch": 142.5, + "learning_rate": 2.9422857142857143e-05, + "loss": 0.4266, + "step": 10260 + }, + { + "epoch": 142.64, + "learning_rate": 2.9411428571428576e-05, + "loss": 0.4172, + "step": 10270 + }, + { + "epoch": 142.78, + "learning_rate": 2.9400000000000003e-05, + "loss": 0.4494, + "step": 10280 + }, + { + "epoch": 142.91, + "learning_rate": 2.9388571428571433e-05, + "loss": 0.4306, + "step": 10290 + }, + { + "epoch": 143.0, + "eval_loss": 0.5001691579818726, + "eval_runtime": 127.4245, + "eval_samples_per_second": 4.175, + "eval_steps_per_second": 0.526, + "eval_wer": 0.22253647875554414, + "step": 10296 + }, + { + "epoch": 143.06, + "learning_rate": 2.937714285714286e-05, + "loss": 0.452, + "step": 10300 + }, + { + "epoch": 143.19, + "learning_rate": 2.9365714285714287e-05, + "loss": 0.4294, + "step": 10310 + }, + { + "epoch": 143.33, + "learning_rate": 2.9354285714285717e-05, + "loss": 0.4492, + "step": 10320 + }, + { + "epoch": 143.47, + "learning_rate": 2.9342857142857144e-05, + "loss": 0.4372, + "step": 10330 + }, + { + "epoch": 143.61, + "learning_rate": 2.9331428571428574e-05, + "loss": 0.4405, + "step": 10340 + }, + { + "epoch": 143.75, + "learning_rate": 2.932e-05, + "loss": 0.4411, + "step": 10350 + }, + { + "epoch": 143.89, + "learning_rate": 2.9308571428571434e-05, + "loss": 0.435, + "step": 10360 + }, + { + "epoch": 144.0, + "eval_loss": 0.4939168393611908, + "eval_runtime": 128.3749, + "eval_samples_per_second": 4.144, + "eval_steps_per_second": 0.522, + "eval_wer": 0.22427203188275374, + "step": 10368 + }, + { + "epoch": 144.03, + "learning_rate": 2.929714285714286e-05, + "loss": 0.4535, + "step": 10370 + }, + { + "epoch": 144.17, + "learning_rate": 2.9285714285714288e-05, + "loss": 0.4342, + "step": 10380 + }, + { + "epoch": 144.3, + "learning_rate": 2.9274285714285718e-05, + "loss": 0.4325, + "step": 10390 + }, + { + "epoch": 144.44, + "learning_rate": 2.9262857142857144e-05, + "loss": 0.4292, + "step": 10400 + }, + { + "epoch": 144.58, + "learning_rate": 2.9251428571428575e-05, + "loss": 0.4461, + "step": 10410 + }, + { + "epoch": 144.72, + "learning_rate": 2.924e-05, + "loss": 0.4284, + "step": 10420 + }, + { + "epoch": 144.86, + "learning_rate": 2.922857142857143e-05, + "loss": 0.435, + "step": 10430 + }, + { + "epoch": 145.0, + "learning_rate": 2.9217142857142858e-05, + "loss": 0.443, + "step": 10440 + }, + { + "epoch": 145.0, + "eval_loss": 0.5476204752922058, + "eval_runtime": 128.2741, + "eval_samples_per_second": 4.147, + "eval_steps_per_second": 0.522, + "eval_wer": 0.22658610271903323, + "step": 10440 + }, + { + "epoch": 145.14, + "learning_rate": 2.9205714285714285e-05, + "loss": 0.4497, + "step": 10450 + }, + { + "epoch": 145.28, + "learning_rate": 2.919428571428572e-05, + "loss": 0.4435, + "step": 10460 + }, + { + "epoch": 145.42, + "learning_rate": 2.9182857142857145e-05, + "loss": 0.4314, + "step": 10470 + }, + { + "epoch": 145.55, + "learning_rate": 2.9171428571428575e-05, + "loss": 0.4453, + "step": 10480 + }, + { + "epoch": 145.69, + "learning_rate": 2.9160000000000002e-05, + "loss": 0.4325, + "step": 10490 + }, + { + "epoch": 145.83, + "learning_rate": 2.9148571428571432e-05, + "loss": 0.4345, + "step": 10500 + }, + { + "epoch": 145.97, + "learning_rate": 2.913714285714286e-05, + "loss": 0.4478, + "step": 10510 + }, + { + "epoch": 146.0, + "eval_loss": 0.49572858214378357, + "eval_runtime": 127.3526, + "eval_samples_per_second": 4.177, + "eval_steps_per_second": 0.526, + "eval_wer": 0.2366137430095777, + "step": 10512 + }, + { + "epoch": 146.11, + "learning_rate": 2.9125714285714286e-05, + "loss": 0.4644, + "step": 10520 + }, + { + "epoch": 146.25, + "learning_rate": 2.9114285714285716e-05, + "loss": 0.4322, + "step": 10530 + }, + { + "epoch": 146.39, + "learning_rate": 2.9102857142857143e-05, + "loss": 0.4382, + "step": 10540 + }, + { + "epoch": 146.53, + "learning_rate": 2.9091428571428576e-05, + "loss": 0.4437, + "step": 10550 + }, + { + "epoch": 146.66, + "learning_rate": 2.9080000000000003e-05, + "loss": 0.4283, + "step": 10560 + }, + { + "epoch": 146.8, + "learning_rate": 2.9068571428571433e-05, + "loss": 0.4252, + "step": 10570 + }, + { + "epoch": 146.94, + "learning_rate": 2.905714285714286e-05, + "loss": 0.4211, + "step": 10580 + }, + { + "epoch": 147.0, + "eval_loss": 0.5512177348136902, + "eval_runtime": 127.098, + "eval_samples_per_second": 4.186, + "eval_steps_per_second": 0.527, + "eval_wer": 0.22272931799190074, + "step": 10584 + }, + { + "epoch": 147.08, + "learning_rate": 2.9045714285714286e-05, + "loss": 0.4544, + "step": 10590 + }, + { + "epoch": 147.22, + "learning_rate": 2.9034285714285717e-05, + "loss": 0.4377, + "step": 10600 + }, + { + "epoch": 147.36, + "learning_rate": 2.9022857142857143e-05, + "loss": 0.4196, + "step": 10610 + }, + { + "epoch": 147.5, + "learning_rate": 2.9011428571428573e-05, + "loss": 0.4308, + "step": 10620 + }, + { + "epoch": 147.64, + "learning_rate": 2.9e-05, + "loss": 0.4214, + "step": 10630 + }, + { + "epoch": 147.78, + "learning_rate": 2.8988571428571434e-05, + "loss": 0.4301, + "step": 10640 + }, + { + "epoch": 147.91, + "learning_rate": 2.897714285714286e-05, + "loss": 0.43, + "step": 10650 + }, + { + "epoch": 148.0, + "eval_loss": 0.5209096074104309, + "eval_runtime": 128.8457, + "eval_samples_per_second": 4.129, + "eval_steps_per_second": 0.52, + "eval_wer": 0.2270360609371987, + "step": 10656 + }, + { + "epoch": 148.06, + "learning_rate": 2.8965714285714287e-05, + "loss": 0.4403, + "step": 10660 + }, + { + "epoch": 148.19, + "learning_rate": 2.8954285714285717e-05, + "loss": 0.4238, + "step": 10670 + }, + { + "epoch": 148.33, + "learning_rate": 2.8942857142857144e-05, + "loss": 0.4324, + "step": 10680 + }, + { + "epoch": 148.47, + "learning_rate": 2.8931428571428574e-05, + "loss": 0.4417, + "step": 10690 + }, + { + "epoch": 148.61, + "learning_rate": 2.892e-05, + "loss": 0.4259, + "step": 10700 + }, + { + "epoch": 148.75, + "learning_rate": 2.890857142857143e-05, + "loss": 0.4357, + "step": 10710 + }, + { + "epoch": 148.89, + "learning_rate": 2.8897142857142858e-05, + "loss": 0.4305, + "step": 10720 + }, + { + "epoch": 149.0, + "eval_loss": 0.5511650443077087, + "eval_runtime": 126.9645, + "eval_samples_per_second": 4.19, + "eval_steps_per_second": 0.528, + "eval_wer": 0.22722890017355532, + "step": 10728 + }, + { + "epoch": 149.03, + "learning_rate": 2.888571428571429e-05, + "loss": 0.434, + "step": 10730 + }, + { + "epoch": 149.17, + "learning_rate": 2.8874285714285718e-05, + "loss": 0.4221, + "step": 10740 + }, + { + "epoch": 149.3, + "learning_rate": 2.8862857142857145e-05, + "loss": 0.4352, + "step": 10750 + }, + { + "epoch": 149.44, + "learning_rate": 2.8851428571428575e-05, + "loss": 0.4293, + "step": 10760 + }, + { + "epoch": 149.58, + "learning_rate": 2.8840000000000002e-05, + "loss": 0.4136, + "step": 10770 + }, + { + "epoch": 149.72, + "learning_rate": 2.8828571428571432e-05, + "loss": 0.4357, + "step": 10780 + }, + { + "epoch": 149.86, + "learning_rate": 2.881714285714286e-05, + "loss": 0.4165, + "step": 10790 + }, + { + "epoch": 150.0, + "learning_rate": 2.880571428571429e-05, + "loss": 0.4412, + "step": 10800 + }, + { + "epoch": 150.0, + "eval_loss": 0.5091713070869446, + "eval_runtime": 128.5386, + "eval_samples_per_second": 4.139, + "eval_steps_per_second": 0.521, + "eval_wer": 0.22028668766471685, + "step": 10800 + }, + { + "epoch": 150.14, + "learning_rate": 2.8794285714285715e-05, + "loss": 0.4319, + "step": 10810 + }, + { + "epoch": 150.28, + "learning_rate": 2.8782857142857142e-05, + "loss": 0.4335, + "step": 10820 + }, + { + "epoch": 150.42, + "learning_rate": 2.8771428571428576e-05, + "loss": 0.4272, + "step": 10830 + }, + { + "epoch": 150.55, + "learning_rate": 2.8760000000000002e-05, + "loss": 0.4361, + "step": 10840 + }, + { + "epoch": 150.69, + "learning_rate": 2.8748571428571433e-05, + "loss": 0.4508, + "step": 10850 + }, + { + "epoch": 150.83, + "learning_rate": 2.873714285714286e-05, + "loss": 0.4344, + "step": 10860 + }, + { + "epoch": 150.97, + "learning_rate": 2.872571428571429e-05, + "loss": 0.4301, + "step": 10870 + }, + { + "epoch": 151.0, + "eval_loss": 0.5206985473632812, + "eval_runtime": 127.0592, + "eval_samples_per_second": 4.187, + "eval_steps_per_second": 0.527, + "eval_wer": 0.22851449508259947, + "step": 10872 + }, + { + "epoch": 151.11, + "learning_rate": 2.8714285714285716e-05, + "loss": 0.441, + "step": 10880 + }, + { + "epoch": 151.25, + "learning_rate": 2.8702857142857143e-05, + "loss": 0.4335, + "step": 10890 + }, + { + "epoch": 151.39, + "learning_rate": 2.8691428571428573e-05, + "loss": 0.4404, + "step": 10900 + }, + { + "epoch": 151.53, + "learning_rate": 2.868e-05, + "loss": 0.4299, + "step": 10910 + }, + { + "epoch": 151.66, + "learning_rate": 2.8668571428571433e-05, + "loss": 0.4373, + "step": 10920 + }, + { + "epoch": 151.8, + "learning_rate": 2.865714285714286e-05, + "loss": 0.4284, + "step": 10930 + }, + { + "epoch": 151.94, + "learning_rate": 2.864571428571429e-05, + "loss": 0.4309, + "step": 10940 + }, + { + "epoch": 152.0, + "eval_loss": 0.5265570282936096, + "eval_runtime": 127.9954, + "eval_samples_per_second": 4.156, + "eval_steps_per_second": 0.523, + "eval_wer": 0.2253647875554413, + "step": 10944 + }, + { + "epoch": 152.08, + "learning_rate": 2.8634285714285717e-05, + "loss": 0.4518, + "step": 10950 + }, + { + "epoch": 152.22, + "learning_rate": 2.8622857142857144e-05, + "loss": 0.4337, + "step": 10960 + }, + { + "epoch": 152.36, + "learning_rate": 2.8611428571428574e-05, + "loss": 0.4168, + "step": 10970 + }, + { + "epoch": 152.5, + "learning_rate": 2.86e-05, + "loss": 0.4167, + "step": 10980 + }, + { + "epoch": 152.64, + "learning_rate": 2.858857142857143e-05, + "loss": 0.4066, + "step": 10990 + }, + { + "epoch": 152.78, + "learning_rate": 2.8577142857142857e-05, + "loss": 0.4271, + "step": 11000 + }, + { + "epoch": 152.91, + "learning_rate": 2.856571428571429e-05, + "loss": 0.424, + "step": 11010 + }, + { + "epoch": 153.0, + "eval_loss": 0.49600622057914734, + "eval_runtime": 126.9946, + "eval_samples_per_second": 4.189, + "eval_steps_per_second": 0.528, + "eval_wer": 0.22375779391913608, + "step": 11016 + }, + { + "epoch": 153.06, + "learning_rate": 2.8554285714285718e-05, + "loss": 0.4369, + "step": 11020 + }, + { + "epoch": 153.19, + "learning_rate": 2.8542857142857144e-05, + "loss": 0.431, + "step": 11030 + }, + { + "epoch": 153.33, + "learning_rate": 2.8531428571428575e-05, + "loss": 0.4373, + "step": 11040 + }, + { + "epoch": 153.47, + "learning_rate": 2.852e-05, + "loss": 0.4252, + "step": 11050 + }, + { + "epoch": 153.61, + "learning_rate": 2.850857142857143e-05, + "loss": 0.4108, + "step": 11060 + }, + { + "epoch": 153.75, + "learning_rate": 2.8497142857142858e-05, + "loss": 0.4162, + "step": 11070 + }, + { + "epoch": 153.89, + "learning_rate": 2.848571428571429e-05, + "loss": 0.4197, + "step": 11080 + }, + { + "epoch": 154.0, + "eval_loss": 0.5001970529556274, + "eval_runtime": 128.5772, + "eval_samples_per_second": 4.138, + "eval_steps_per_second": 0.521, + "eval_wer": 0.22002956868290802, + "step": 11088 + }, + { + "epoch": 154.03, + "learning_rate": 2.8474285714285715e-05, + "loss": 0.4353, + "step": 11090 + }, + { + "epoch": 154.17, + "learning_rate": 2.8462857142857142e-05, + "loss": 0.412, + "step": 11100 + }, + { + "epoch": 154.3, + "learning_rate": 2.8451428571428575e-05, + "loss": 0.4342, + "step": 11110 + }, + { + "epoch": 154.44, + "learning_rate": 2.8440000000000002e-05, + "loss": 0.4288, + "step": 11120 + }, + { + "epoch": 154.58, + "learning_rate": 2.8428571428571432e-05, + "loss": 0.4068, + "step": 11130 + }, + { + "epoch": 154.72, + "learning_rate": 2.841714285714286e-05, + "loss": 0.4138, + "step": 11140 + }, + { + "epoch": 154.86, + "learning_rate": 2.840571428571429e-05, + "loss": 0.4207, + "step": 11150 + }, + { + "epoch": 155.0, + "learning_rate": 2.8394285714285716e-05, + "loss": 0.4195, + "step": 11160 + }, + { + "epoch": 155.0, + "eval_loss": 0.5221587419509888, + "eval_runtime": 127.2928, + "eval_samples_per_second": 4.179, + "eval_steps_per_second": 0.526, + "eval_wer": 0.22350067493732725, + "step": 11160 + }, + { + "epoch": 155.14, + "learning_rate": 2.8382857142857143e-05, + "loss": 0.4173, + "step": 11170 + }, + { + "epoch": 155.28, + "learning_rate": 2.8371428571428573e-05, + "loss": 0.4144, + "step": 11180 + }, + { + "epoch": 155.42, + "learning_rate": 2.836e-05, + "loss": 0.4208, + "step": 11190 + }, + { + "epoch": 155.55, + "learning_rate": 2.8348571428571433e-05, + "loss": 0.4171, + "step": 11200 + }, + { + "epoch": 155.69, + "learning_rate": 2.833714285714286e-05, + "loss": 0.4226, + "step": 11210 + }, + { + "epoch": 155.83, + "learning_rate": 2.832571428571429e-05, + "loss": 0.4092, + "step": 11220 + }, + { + "epoch": 155.97, + "learning_rate": 2.8314285714285717e-05, + "loss": 0.4306, + "step": 11230 + }, + { + "epoch": 156.0, + "eval_loss": 0.5121257901191711, + "eval_runtime": 127.477, + "eval_samples_per_second": 4.173, + "eval_steps_per_second": 0.526, + "eval_wer": 0.2231792762100662, + "step": 11232 + }, + { + "epoch": 156.11, + "learning_rate": 2.8302857142857143e-05, + "loss": 0.4227, + "step": 11240 + }, + { + "epoch": 156.25, + "learning_rate": 2.8291428571428574e-05, + "loss": 0.4097, + "step": 11250 + }, + { + "epoch": 156.39, + "learning_rate": 2.828e-05, + "loss": 0.4169, + "step": 11260 + }, + { + "epoch": 156.53, + "learning_rate": 2.826857142857143e-05, + "loss": 0.4326, + "step": 11270 + }, + { + "epoch": 156.66, + "learning_rate": 2.8257142857142857e-05, + "loss": 0.4282, + "step": 11280 + }, + { + "epoch": 156.8, + "learning_rate": 2.824571428571429e-05, + "loss": 0.4188, + "step": 11290 + }, + { + "epoch": 156.94, + "learning_rate": 2.8234285714285717e-05, + "loss": 0.4122, + "step": 11300 + }, + { + "epoch": 157.0, + "eval_loss": 0.5221469402313232, + "eval_runtime": 126.7985, + "eval_samples_per_second": 4.196, + "eval_steps_per_second": 0.528, + "eval_wer": 0.229607250755287, + "step": 11304 + }, + { + "epoch": 157.08, + "learning_rate": 2.8224000000000003e-05, + "loss": 0.4303, + "step": 11310 + }, + { + "epoch": 157.22, + "learning_rate": 2.821257142857143e-05, + "loss": 0.4231, + "step": 11320 + }, + { + "epoch": 157.36, + "learning_rate": 2.820114285714286e-05, + "loss": 0.409, + "step": 11330 + }, + { + "epoch": 157.5, + "learning_rate": 2.8189714285714286e-05, + "loss": 0.4119, + "step": 11340 + }, + { + "epoch": 157.64, + "learning_rate": 2.8178285714285717e-05, + "loss": 0.4131, + "step": 11350 + }, + { + "epoch": 157.78, + "learning_rate": 2.8166857142857143e-05, + "loss": 0.4312, + "step": 11360 + }, + { + "epoch": 157.91, + "learning_rate": 2.8155428571428577e-05, + "loss": 0.4247, + "step": 11370 + }, + { + "epoch": 158.0, + "eval_loss": 0.5244585871696472, + "eval_runtime": 126.9746, + "eval_samples_per_second": 4.19, + "eval_steps_per_second": 0.528, + "eval_wer": 0.22221508002828308, + "step": 11376 + }, + { + "epoch": 158.06, + "learning_rate": 2.8144000000000004e-05, + "loss": 0.4362, + "step": 11380 + }, + { + "epoch": 158.19, + "learning_rate": 2.813257142857143e-05, + "loss": 0.4023, + "step": 11390 + }, + { + "epoch": 158.33, + "learning_rate": 2.812114285714286e-05, + "loss": 0.4151, + "step": 11400 + }, + { + "epoch": 158.47, + "learning_rate": 2.8109714285714287e-05, + "loss": 0.4229, + "step": 11410 + }, + { + "epoch": 158.61, + "learning_rate": 2.8098285714285717e-05, + "loss": 0.4217, + "step": 11420 + }, + { + "epoch": 158.75, + "learning_rate": 2.8086857142857144e-05, + "loss": 0.4322, + "step": 11430 + }, + { + "epoch": 158.89, + "learning_rate": 2.8075428571428574e-05, + "loss": 0.4103, + "step": 11440 + }, + { + "epoch": 159.0, + "eval_loss": 0.5090242028236389, + "eval_runtime": 127.2172, + "eval_samples_per_second": 4.182, + "eval_steps_per_second": 0.527, + "eval_wer": 0.22497910908272803, + "step": 11448 + }, + { + "epoch": 159.03, + "learning_rate": 2.8064e-05, + "loss": 0.4356, + "step": 11450 + }, + { + "epoch": 159.17, + "learning_rate": 2.8052571428571428e-05, + "loss": 0.3959, + "step": 11460 + }, + { + "epoch": 159.3, + "learning_rate": 2.804114285714286e-05, + "loss": 0.4066, + "step": 11470 + }, + { + "epoch": 159.44, + "learning_rate": 2.8029714285714288e-05, + "loss": 0.4221, + "step": 11480 + }, + { + "epoch": 159.58, + "learning_rate": 2.8018285714285718e-05, + "loss": 0.435, + "step": 11490 + }, + { + "epoch": 159.72, + "learning_rate": 2.8006857142857145e-05, + "loss": 0.4198, + "step": 11500 + }, + { + "epoch": 159.86, + "learning_rate": 2.7995428571428575e-05, + "loss": 0.4319, + "step": 11510 + }, + { + "epoch": 160.0, + "learning_rate": 2.7984000000000002e-05, + "loss": 0.435, + "step": 11520 + }, + { + "epoch": 160.0, + "eval_loss": 0.5126460790634155, + "eval_runtime": 127.041, + "eval_samples_per_second": 4.188, + "eval_steps_per_second": 0.527, + "eval_wer": 0.22909301279166935, + "step": 11520 + }, + { + "epoch": 160.14, + "learning_rate": 2.797257142857143e-05, + "loss": 0.4239, + "step": 11530 + }, + { + "epoch": 160.28, + "learning_rate": 2.796114285714286e-05, + "loss": 0.4305, + "step": 11540 + }, + { + "epoch": 160.42, + "learning_rate": 2.7949714285714285e-05, + "loss": 0.4266, + "step": 11550 + }, + { + "epoch": 160.55, + "learning_rate": 2.793828571428572e-05, + "loss": 0.4192, + "step": 11560 + }, + { + "epoch": 160.69, + "learning_rate": 2.7926857142857146e-05, + "loss": 0.4147, + "step": 11570 + }, + { + "epoch": 160.83, + "learning_rate": 2.7915428571428576e-05, + "loss": 0.431, + "step": 11580 + }, + { + "epoch": 160.97, + "learning_rate": 2.7904000000000003e-05, + "loss": 0.4191, + "step": 11590 + }, + { + "epoch": 161.0, + "eval_loss": 0.52158123254776, + "eval_runtime": 127.1778, + "eval_samples_per_second": 4.183, + "eval_steps_per_second": 0.527, + "eval_wer": 0.22935013177347818, + "step": 11592 + }, + { + "epoch": 161.11, + "learning_rate": 2.789257142857143e-05, + "loss": 0.4234, + "step": 11600 + }, + { + "epoch": 161.25, + "learning_rate": 2.788114285714286e-05, + "loss": 0.4249, + "step": 11610 + }, + { + "epoch": 161.39, + "learning_rate": 2.7869714285714286e-05, + "loss": 0.415, + "step": 11620 + }, + { + "epoch": 161.53, + "learning_rate": 2.7858285714285716e-05, + "loss": 0.4057, + "step": 11630 + }, + { + "epoch": 161.66, + "learning_rate": 2.7846857142857143e-05, + "loss": 0.4111, + "step": 11640 + }, + { + "epoch": 161.8, + "learning_rate": 2.7835428571428577e-05, + "loss": 0.4242, + "step": 11650 + }, + { + "epoch": 161.94, + "learning_rate": 2.7824000000000003e-05, + "loss": 0.4241, + "step": 11660 + }, + { + "epoch": 162.0, + "eval_loss": 0.5006119608879089, + "eval_runtime": 127.6966, + "eval_samples_per_second": 4.166, + "eval_steps_per_second": 0.525, + "eval_wer": 0.22157228257376102, + "step": 11664 + }, + { + "epoch": 162.08, + "learning_rate": 2.781257142857143e-05, + "loss": 0.4138, + "step": 11670 + }, + { + "epoch": 162.22, + "learning_rate": 2.780114285714286e-05, + "loss": 0.4173, + "step": 11680 + }, + { + "epoch": 162.36, + "learning_rate": 2.7789714285714287e-05, + "loss": 0.417, + "step": 11690 + }, + { + "epoch": 162.5, + "learning_rate": 2.7778285714285717e-05, + "loss": 0.4184, + "step": 11700 + }, + { + "epoch": 162.64, + "learning_rate": 2.7766857142857144e-05, + "loss": 0.4063, + "step": 11710 + }, + { + "epoch": 162.78, + "learning_rate": 2.7755428571428574e-05, + "loss": 0.42, + "step": 11720 + }, + { + "epoch": 162.91, + "learning_rate": 2.7744e-05, + "loss": 0.4179, + "step": 11730 + }, + { + "epoch": 163.0, + "eval_loss": 0.5012219548225403, + "eval_runtime": 127.4025, + "eval_samples_per_second": 4.176, + "eval_steps_per_second": 0.526, + "eval_wer": 0.2214437230828566, + "step": 11736 + }, + { + "epoch": 163.06, + "learning_rate": 2.7732571428571427e-05, + "loss": 0.4245, + "step": 11740 + }, + { + "epoch": 163.19, + "learning_rate": 2.772114285714286e-05, + "loss": 0.4202, + "step": 11750 + }, + { + "epoch": 163.33, + "learning_rate": 2.7709714285714288e-05, + "loss": 0.4303, + "step": 11760 + }, + { + "epoch": 163.47, + "learning_rate": 2.7698285714285718e-05, + "loss": 0.4141, + "step": 11770 + }, + { + "epoch": 163.61, + "learning_rate": 2.7686857142857145e-05, + "loss": 0.414, + "step": 11780 + }, + { + "epoch": 163.75, + "learning_rate": 2.7675428571428575e-05, + "loss": 0.4181, + "step": 11790 + }, + { + "epoch": 163.89, + "learning_rate": 2.7664e-05, + "loss": 0.4084, + "step": 11800 + }, + { + "epoch": 164.0, + "eval_loss": 0.5084073543548584, + "eval_runtime": 127.5479, + "eval_samples_per_second": 4.171, + "eval_steps_per_second": 0.525, + "eval_wer": 0.2240149129009449, + "step": 11808 + }, + { + "epoch": 164.03, + "learning_rate": 2.7652571428571428e-05, + "loss": 0.4429, + "step": 11810 + }, + { + "epoch": 164.17, + "learning_rate": 2.764114285714286e-05, + "loss": 0.4025, + "step": 11820 + }, + { + "epoch": 164.3, + "learning_rate": 2.7629714285714285e-05, + "loss": 0.4135, + "step": 11830 + }, + { + "epoch": 164.44, + "learning_rate": 2.761828571428572e-05, + "loss": 0.4127, + "step": 11840 + }, + { + "epoch": 164.58, + "learning_rate": 2.7606857142857145e-05, + "loss": 0.4159, + "step": 11850 + }, + { + "epoch": 164.72, + "learning_rate": 2.7595428571428575e-05, + "loss": 0.4112, + "step": 11860 + }, + { + "epoch": 164.86, + "learning_rate": 2.7584000000000002e-05, + "loss": 0.4122, + "step": 11870 + }, + { + "epoch": 165.0, + "learning_rate": 2.7572571428571432e-05, + "loss": 0.4254, + "step": 11880 + }, + { + "epoch": 165.0, + "eval_loss": 0.5040953755378723, + "eval_runtime": 127.1386, + "eval_samples_per_second": 4.184, + "eval_steps_per_second": 0.527, + "eval_wer": 0.23384971395513274, + "step": 11880 + }, + { + "epoch": 165.14, + "learning_rate": 2.756114285714286e-05, + "loss": 0.4037, + "step": 11890 + }, + { + "epoch": 165.28, + "learning_rate": 2.7549714285714286e-05, + "loss": 0.4163, + "step": 11900 + }, + { + "epoch": 165.42, + "learning_rate": 2.7538285714285716e-05, + "loss": 0.4204, + "step": 11910 + }, + { + "epoch": 165.55, + "learning_rate": 2.7526857142857143e-05, + "loss": 0.4184, + "step": 11920 + }, + { + "epoch": 165.69, + "learning_rate": 2.7515428571428576e-05, + "loss": 0.4065, + "step": 11930 + }, + { + "epoch": 165.83, + "learning_rate": 2.7504000000000003e-05, + "loss": 0.4118, + "step": 11940 + }, + { + "epoch": 165.97, + "learning_rate": 2.7492571428571433e-05, + "loss": 0.415, + "step": 11950 + }, + { + "epoch": 166.0, + "eval_loss": 0.5107947587966919, + "eval_runtime": 127.3843, + "eval_samples_per_second": 4.176, + "eval_steps_per_second": 0.526, + "eval_wer": 0.22131516359195216, + "step": 11952 + }, + { + "epoch": 166.11, + "learning_rate": 2.748114285714286e-05, + "loss": 0.4331, + "step": 11960 + }, + { + "epoch": 166.25, + "learning_rate": 2.7469714285714287e-05, + "loss": 0.4163, + "step": 11970 + }, + { + "epoch": 166.39, + "learning_rate": 2.7458285714285717e-05, + "loss": 0.4074, + "step": 11980 + }, + { + "epoch": 166.53, + "learning_rate": 2.7446857142857143e-05, + "loss": 0.4042, + "step": 11990 + }, + { + "epoch": 166.66, + "learning_rate": 2.7435428571428574e-05, + "loss": 0.4083, + "step": 12000 + }, + { + "epoch": 166.8, + "learning_rate": 2.7424e-05, + "loss": 0.4201, + "step": 12010 + }, + { + "epoch": 166.94, + "learning_rate": 2.7412571428571434e-05, + "loss": 0.4162, + "step": 12020 + }, + { + "epoch": 167.0, + "eval_loss": 0.506522536277771, + "eval_runtime": 127.174, + "eval_samples_per_second": 4.183, + "eval_steps_per_second": 0.527, + "eval_wer": 0.23712798097319535, + "step": 12024 + }, + { + "epoch": 167.08, + "learning_rate": 2.740114285714286e-05, + "loss": 0.4429, + "step": 12030 + }, + { + "epoch": 167.22, + "learning_rate": 2.7389714285714287e-05, + "loss": 0.4168, + "step": 12040 + }, + { + "epoch": 167.36, + "learning_rate": 2.7378285714285717e-05, + "loss": 0.4049, + "step": 12050 + }, + { + "epoch": 167.5, + "learning_rate": 2.7366857142857144e-05, + "loss": 0.4237, + "step": 12060 + }, + { + "epoch": 167.64, + "learning_rate": 2.7355428571428574e-05, + "loss": 0.421, + "step": 12070 + }, + { + "epoch": 167.78, + "learning_rate": 2.7344e-05, + "loss": 0.4223, + "step": 12080 + }, + { + "epoch": 167.91, + "learning_rate": 2.733257142857143e-05, + "loss": 0.4114, + "step": 12090 + }, + { + "epoch": 168.0, + "eval_loss": 0.5043089389801025, + "eval_runtime": 127.038, + "eval_samples_per_second": 4.188, + "eval_steps_per_second": 0.527, + "eval_wer": 0.22665038246448543, + "step": 12096 + }, + { + "epoch": 168.06, + "learning_rate": 2.7321142857142858e-05, + "loss": 0.4215, + "step": 12100 + }, + { + "epoch": 168.19, + "learning_rate": 2.7309714285714285e-05, + "loss": 0.4157, + "step": 12110 + }, + { + "epoch": 168.33, + "learning_rate": 2.7298285714285718e-05, + "loss": 0.4166, + "step": 12120 + }, + { + "epoch": 168.47, + "learning_rate": 2.7286857142857145e-05, + "loss": 0.4052, + "step": 12130 + }, + { + "epoch": 168.61, + "learning_rate": 2.7275428571428575e-05, + "loss": 0.4127, + "step": 12140 + }, + { + "epoch": 168.75, + "learning_rate": 2.7264000000000002e-05, + "loss": 0.4084, + "step": 12150 + }, + { + "epoch": 168.89, + "learning_rate": 2.7252571428571432e-05, + "loss": 0.4162, + "step": 12160 + }, + { + "epoch": 169.0, + "eval_loss": 0.5249109864234924, + "eval_runtime": 127.1493, + "eval_samples_per_second": 4.184, + "eval_steps_per_second": 0.527, + "eval_wer": 0.22909301279166935, + "step": 12168 + }, + { + "epoch": 169.03, + "learning_rate": 2.724114285714286e-05, + "loss": 0.4388, + "step": 12170 + }, + { + "epoch": 169.17, + "learning_rate": 2.7229714285714286e-05, + "loss": 0.4124, + "step": 12180 + }, + { + "epoch": 169.3, + "learning_rate": 2.7218285714285716e-05, + "loss": 0.4103, + "step": 12190 + }, + { + "epoch": 169.44, + "learning_rate": 2.7206857142857142e-05, + "loss": 0.4105, + "step": 12200 + }, + { + "epoch": 169.58, + "learning_rate": 2.7195428571428576e-05, + "loss": 0.4104, + "step": 12210 + }, + { + "epoch": 169.72, + "learning_rate": 2.7184000000000003e-05, + "loss": 0.4133, + "step": 12220 + }, + { + "epoch": 169.86, + "learning_rate": 2.7172571428571433e-05, + "loss": 0.4016, + "step": 12230 + }, + { + "epoch": 170.0, + "learning_rate": 2.716114285714286e-05, + "loss": 0.4163, + "step": 12240 + }, + { + "epoch": 170.0, + "eval_loss": 0.5167787075042725, + "eval_runtime": 126.5371, + "eval_samples_per_second": 4.204, + "eval_steps_per_second": 0.529, + "eval_wer": 0.22568618628270232, + "step": 12240 + }, + { + "epoch": 170.14, + "learning_rate": 2.7149714285714286e-05, + "loss": 0.3997, + "step": 12250 + }, + { + "epoch": 170.28, + "learning_rate": 2.7138285714285716e-05, + "loss": 0.408, + "step": 12260 + }, + { + "epoch": 170.42, + "learning_rate": 2.7126857142857143e-05, + "loss": 0.4101, + "step": 12270 + }, + { + "epoch": 170.55, + "learning_rate": 2.7115428571428573e-05, + "loss": 0.4148, + "step": 12280 + }, + { + "epoch": 170.69, + "learning_rate": 2.7104e-05, + "loss": 0.4183, + "step": 12290 + }, + { + "epoch": 170.83, + "learning_rate": 2.7092571428571434e-05, + "loss": 0.3985, + "step": 12300 + }, + { + "epoch": 170.97, + "learning_rate": 2.708114285714286e-05, + "loss": 0.4172, + "step": 12310 + }, + { + "epoch": 171.0, + "eval_loss": 0.5127407312393188, + "eval_runtime": 127.3272, + "eval_samples_per_second": 4.178, + "eval_steps_per_second": 0.526, + "eval_wer": 0.22292215722825737, + "step": 12312 + }, + { + "epoch": 171.11, + "learning_rate": 2.7069714285714287e-05, + "loss": 0.4135, + "step": 12320 + }, + { + "epoch": 171.25, + "learning_rate": 2.7058285714285717e-05, + "loss": 0.4147, + "step": 12330 + }, + { + "epoch": 171.39, + "learning_rate": 2.7046857142857144e-05, + "loss": 0.4036, + "step": 12340 + }, + { + "epoch": 171.53, + "learning_rate": 2.7035428571428574e-05, + "loss": 0.4081, + "step": 12350 + }, + { + "epoch": 171.66, + "learning_rate": 2.7024e-05, + "loss": 0.4205, + "step": 12360 + }, + { + "epoch": 171.8, + "learning_rate": 2.701257142857143e-05, + "loss": 0.4097, + "step": 12370 + }, + { + "epoch": 171.94, + "learning_rate": 2.7001142857142858e-05, + "loss": 0.4108, + "step": 12380 + }, + { + "epoch": 172.0, + "eval_loss": 0.5212448835372925, + "eval_runtime": 127.7703, + "eval_samples_per_second": 4.164, + "eval_steps_per_second": 0.524, + "eval_wer": 0.21874397377386384, + "step": 12384 + }, + { + "epoch": 172.08, + "learning_rate": 2.6989714285714284e-05, + "loss": 0.4308, + "step": 12390 + }, + { + "epoch": 172.22, + "learning_rate": 2.6978285714285718e-05, + "loss": 0.4069, + "step": 12400 + }, + { + "epoch": 172.36, + "learning_rate": 2.6966857142857145e-05, + "loss": 0.4058, + "step": 12410 + }, + { + "epoch": 172.5, + "learning_rate": 2.6955428571428575e-05, + "loss": 0.4013, + "step": 12420 + }, + { + "epoch": 172.64, + "learning_rate": 2.6944e-05, + "loss": 0.4071, + "step": 12430 + }, + { + "epoch": 172.78, + "learning_rate": 2.693257142857143e-05, + "loss": 0.4142, + "step": 12440 + }, + { + "epoch": 172.91, + "learning_rate": 2.692114285714286e-05, + "loss": 0.4022, + "step": 12450 + }, + { + "epoch": 173.0, + "eval_loss": 0.5032334923744202, + "eval_runtime": 127.2663, + "eval_samples_per_second": 4.18, + "eval_steps_per_second": 0.526, + "eval_wer": 0.2191939319920293, + "step": 12456 + }, + { + "epoch": 173.06, + "learning_rate": 2.690971428571429e-05, + "loss": 0.4217, + "step": 12460 + }, + { + "epoch": 173.19, + "learning_rate": 2.6898285714285715e-05, + "loss": 0.4056, + "step": 12470 + }, + { + "epoch": 173.33, + "learning_rate": 2.6886857142857142e-05, + "loss": 0.4074, + "step": 12480 + }, + { + "epoch": 173.47, + "learning_rate": 2.6875428571428576e-05, + "loss": 0.4092, + "step": 12490 + }, + { + "epoch": 173.61, + "learning_rate": 2.6864000000000002e-05, + "loss": 0.4033, + "step": 12500 + }, + { + "epoch": 173.75, + "learning_rate": 2.6852571428571432e-05, + "loss": 0.3967, + "step": 12510 + }, + { + "epoch": 173.89, + "learning_rate": 2.684114285714286e-05, + "loss": 0.4083, + "step": 12520 + }, + { + "epoch": 174.0, + "eval_loss": 0.5316658616065979, + "eval_runtime": 128.2651, + "eval_samples_per_second": 4.148, + "eval_steps_per_second": 0.522, + "eval_wer": 0.22774313813717298, + "step": 12528 + }, + { + "epoch": 174.03, + "learning_rate": 2.682971428571429e-05, + "loss": 0.4346, + "step": 12530 + }, + { + "epoch": 174.17, + "learning_rate": 2.6818285714285716e-05, + "loss": 0.407, + "step": 12540 + }, + { + "epoch": 174.3, + "learning_rate": 2.6806857142857143e-05, + "loss": 0.4146, + "step": 12550 + }, + { + "epoch": 174.44, + "learning_rate": 2.6795428571428573e-05, + "loss": 0.4259, + "step": 12560 + }, + { + "epoch": 174.58, + "learning_rate": 2.6784e-05, + "loss": 0.4149, + "step": 12570 + }, + { + "epoch": 174.72, + "learning_rate": 2.6772571428571433e-05, + "loss": 0.4208, + "step": 12580 + }, + { + "epoch": 174.86, + "learning_rate": 2.676114285714286e-05, + "loss": 0.4119, + "step": 12590 + }, + { + "epoch": 175.0, + "learning_rate": 2.674971428571429e-05, + "loss": 0.4149, + "step": 12600 + }, + { + "epoch": 175.0, + "eval_loss": 0.5320192575454712, + "eval_runtime": 127.0953, + "eval_samples_per_second": 4.186, + "eval_steps_per_second": 0.527, + "eval_wer": 0.21565854599215786, + "step": 12600 + }, + { + "epoch": 175.14, + "learning_rate": 2.6738285714285717e-05, + "loss": 0.4095, + "step": 12610 + }, + { + "epoch": 175.28, + "learning_rate": 2.6726857142857144e-05, + "loss": 0.4169, + "step": 12620 + }, + { + "epoch": 175.42, + "learning_rate": 2.6715428571428574e-05, + "loss": 0.4073, + "step": 12630 + }, + { + "epoch": 175.55, + "learning_rate": 2.6704e-05, + "loss": 0.3997, + "step": 12640 + }, + { + "epoch": 175.69, + "learning_rate": 2.669257142857143e-05, + "loss": 0.4117, + "step": 12650 + }, + { + "epoch": 175.83, + "learning_rate": 2.6681142857142857e-05, + "loss": 0.4096, + "step": 12660 + }, + { + "epoch": 175.97, + "learning_rate": 2.666971428571429e-05, + "loss": 0.4085, + "step": 12670 + }, + { + "epoch": 176.0, + "eval_loss": 0.5135429501533508, + "eval_runtime": 127.8136, + "eval_samples_per_second": 4.162, + "eval_steps_per_second": 0.524, + "eval_wer": 0.23076428617342676, + "step": 12672 + }, + { + "epoch": 176.11, + "learning_rate": 2.6658285714285718e-05, + "loss": 0.4286, + "step": 12680 + }, + { + "epoch": 176.25, + "learning_rate": 2.6646857142857144e-05, + "loss": 0.3963, + "step": 12690 + }, + { + "epoch": 176.39, + "learning_rate": 2.6635428571428574e-05, + "loss": 0.3936, + "step": 12700 + }, + { + "epoch": 176.53, + "learning_rate": 2.6624e-05, + "loss": 0.4149, + "step": 12710 + }, + { + "epoch": 176.66, + "learning_rate": 2.661257142857143e-05, + "loss": 0.4063, + "step": 12720 + }, + { + "epoch": 176.8, + "learning_rate": 2.6601142857142858e-05, + "loss": 0.3989, + "step": 12730 + }, + { + "epoch": 176.94, + "learning_rate": 2.6589714285714288e-05, + "loss": 0.3948, + "step": 12740 + }, + { + "epoch": 177.0, + "eval_loss": 0.5166184306144714, + "eval_runtime": 127.9318, + "eval_samples_per_second": 4.158, + "eval_steps_per_second": 0.524, + "eval_wer": 0.22092948511923893, + "step": 12744 + }, + { + "epoch": 177.08, + "learning_rate": 2.6578285714285715e-05, + "loss": 0.4124, + "step": 12750 + }, + { + "epoch": 177.22, + "learning_rate": 2.6566857142857142e-05, + "loss": 0.4071, + "step": 12760 + }, + { + "epoch": 177.36, + "learning_rate": 2.6555428571428575e-05, + "loss": 0.3976, + "step": 12770 + }, + { + "epoch": 177.5, + "learning_rate": 2.6544000000000002e-05, + "loss": 0.4021, + "step": 12780 + }, + { + "epoch": 177.64, + "learning_rate": 2.6532571428571432e-05, + "loss": 0.4009, + "step": 12790 + }, + { + "epoch": 177.78, + "learning_rate": 2.652114285714286e-05, + "loss": 0.4108, + "step": 12800 + }, + { + "epoch": 177.91, + "learning_rate": 2.650971428571429e-05, + "loss": 0.4198, + "step": 12810 + }, + { + "epoch": 178.0, + "eval_loss": 0.5269370675086975, + "eval_runtime": 126.437, + "eval_samples_per_second": 4.208, + "eval_steps_per_second": 0.53, + "eval_wer": 0.2240791926463971, + "step": 12816 + }, + { + "epoch": 178.06, + "learning_rate": 2.6498285714285716e-05, + "loss": 0.4099, + "step": 12820 + }, + { + "epoch": 178.19, + "learning_rate": 2.6486857142857143e-05, + "loss": 0.406, + "step": 12830 + }, + { + "epoch": 178.33, + "learning_rate": 2.6475428571428573e-05, + "loss": 0.4028, + "step": 12840 + }, + { + "epoch": 178.47, + "learning_rate": 2.6464e-05, + "loss": 0.3871, + "step": 12850 + }, + { + "epoch": 178.61, + "learning_rate": 2.6452571428571433e-05, + "loss": 0.3819, + "step": 12860 + }, + { + "epoch": 178.75, + "learning_rate": 2.644114285714286e-05, + "loss": 0.4125, + "step": 12870 + }, + { + "epoch": 178.89, + "learning_rate": 2.642971428571429e-05, + "loss": 0.4005, + "step": 12880 + }, + { + "epoch": 179.0, + "eval_loss": 0.5152977108955383, + "eval_runtime": 127.3194, + "eval_samples_per_second": 4.178, + "eval_steps_per_second": 0.526, + "eval_wer": 0.21996528893745582, + "step": 12888 + }, + { + "epoch": 179.03, + "learning_rate": 2.6418285714285717e-05, + "loss": 0.423, + "step": 12890 + }, + { + "epoch": 179.17, + "learning_rate": 2.6406857142857143e-05, + "loss": 0.4043, + "step": 12900 + }, + { + "epoch": 179.3, + "learning_rate": 2.6395428571428573e-05, + "loss": 0.4036, + "step": 12910 + }, + { + "epoch": 179.44, + "learning_rate": 2.6384e-05, + "loss": 0.4046, + "step": 12920 + }, + { + "epoch": 179.58, + "learning_rate": 2.637257142857143e-05, + "loss": 0.3982, + "step": 12930 + }, + { + "epoch": 179.72, + "learning_rate": 2.6361142857142857e-05, + "loss": 0.4061, + "step": 12940 + }, + { + "epoch": 179.86, + "learning_rate": 2.634971428571429e-05, + "loss": 0.4062, + "step": 12950 + }, + { + "epoch": 180.0, + "learning_rate": 2.6338285714285717e-05, + "loss": 0.4106, + "step": 12960 + }, + { + "epoch": 180.0, + "eval_loss": 0.5100762844085693, + "eval_runtime": 127.6735, + "eval_samples_per_second": 4.167, + "eval_steps_per_second": 0.525, + "eval_wer": 0.2262647039917722, + "step": 12960 + }, + { + "epoch": 180.14, + "learning_rate": 2.6326857142857144e-05, + "loss": 0.4149, + "step": 12970 + }, + { + "epoch": 180.28, + "learning_rate": 2.6315428571428574e-05, + "loss": 0.3974, + "step": 12980 + }, + { + "epoch": 180.42, + "learning_rate": 2.6304e-05, + "loss": 0.4125, + "step": 12990 + }, + { + "epoch": 180.55, + "learning_rate": 2.629257142857143e-05, + "loss": 0.4072, + "step": 13000 + }, + { + "epoch": 180.69, + "learning_rate": 2.6281142857142858e-05, + "loss": 0.3956, + "step": 13010 + }, + { + "epoch": 180.83, + "learning_rate": 2.6269714285714288e-05, + "loss": 0.4025, + "step": 13020 + }, + { + "epoch": 180.97, + "learning_rate": 2.6258285714285715e-05, + "loss": 0.4109, + "step": 13030 + }, + { + "epoch": 181.0, + "eval_loss": 0.49679335951805115, + "eval_runtime": 128.4583, + "eval_samples_per_second": 4.141, + "eval_steps_per_second": 0.522, + "eval_wer": 0.2159156649739667, + "step": 13032 + }, + { + "epoch": 181.11, + "learning_rate": 2.624685714285714e-05, + "loss": 0.3967, + "step": 13040 + }, + { + "epoch": 181.25, + "learning_rate": 2.6235428571428575e-05, + "loss": 0.3981, + "step": 13050 + }, + { + "epoch": 181.39, + "learning_rate": 2.6224e-05, + "loss": 0.3888, + "step": 13060 + }, + { + "epoch": 181.53, + "learning_rate": 2.6212571428571432e-05, + "loss": 0.3932, + "step": 13070 + }, + { + "epoch": 181.66, + "learning_rate": 2.620114285714286e-05, + "loss": 0.4056, + "step": 13080 + }, + { + "epoch": 181.8, + "learning_rate": 2.618971428571429e-05, + "loss": 0.3915, + "step": 13090 + }, + { + "epoch": 181.94, + "learning_rate": 2.6178285714285715e-05, + "loss": 0.4068, + "step": 13100 + }, + { + "epoch": 182.0, + "eval_loss": 0.5250499248504639, + "eval_runtime": 127.5608, + "eval_samples_per_second": 4.171, + "eval_steps_per_second": 0.525, + "eval_wer": 0.22157228257376102, + "step": 13104 + }, + { + "epoch": 182.08, + "learning_rate": 2.6166857142857146e-05, + "loss": 0.4049, + "step": 13110 + }, + { + "epoch": 182.22, + "learning_rate": 2.6155428571428572e-05, + "loss": 0.3982, + "step": 13120 + }, + { + "epoch": 182.36, + "learning_rate": 2.6144e-05, + "loss": 0.381, + "step": 13130 + }, + { + "epoch": 182.5, + "learning_rate": 2.6132571428571433e-05, + "loss": 0.4, + "step": 13140 + }, + { + "epoch": 182.64, + "learning_rate": 2.612114285714286e-05, + "loss": 0.3915, + "step": 13150 + }, + { + "epoch": 182.78, + "learning_rate": 2.610971428571429e-05, + "loss": 0.4057, + "step": 13160 + }, + { + "epoch": 182.91, + "learning_rate": 2.6098285714285716e-05, + "loss": 0.4082, + "step": 13170 + }, + { + "epoch": 183.0, + "eval_loss": 0.5206136703491211, + "eval_runtime": 127.5242, + "eval_samples_per_second": 4.172, + "eval_steps_per_second": 0.525, + "eval_wer": 0.22215080028283088, + "step": 13176 + }, + { + "epoch": 183.06, + "learning_rate": 2.6086857142857146e-05, + "loss": 0.4218, + "step": 13180 + }, + { + "epoch": 183.19, + "learning_rate": 2.6075428571428573e-05, + "loss": 0.421, + "step": 13190 + }, + { + "epoch": 183.33, + "learning_rate": 2.6064e-05, + "loss": 0.4152, + "step": 13200 + }, + { + "epoch": 183.47, + "learning_rate": 2.605257142857143e-05, + "loss": 0.4128, + "step": 13210 + }, + { + "epoch": 183.61, + "learning_rate": 2.6041142857142857e-05, + "loss": 0.4106, + "step": 13220 + }, + { + "epoch": 183.75, + "learning_rate": 2.602971428571429e-05, + "loss": 0.409, + "step": 13230 + }, + { + "epoch": 183.89, + "learning_rate": 2.6018285714285717e-05, + "loss": 0.4074, + "step": 13240 + }, + { + "epoch": 184.0, + "eval_loss": 0.5401894450187683, + "eval_runtime": 126.8416, + "eval_samples_per_second": 4.194, + "eval_steps_per_second": 0.528, + "eval_wer": 0.22369351417368388, + "step": 13248 + }, + { + "epoch": 184.03, + "learning_rate": 2.6006857142857147e-05, + "loss": 0.4277, + "step": 13250 + }, + { + "epoch": 184.17, + "learning_rate": 2.5995428571428574e-05, + "loss": 0.3986, + "step": 13260 + }, + { + "epoch": 184.3, + "learning_rate": 2.5984e-05, + "loss": 0.4051, + "step": 13270 + }, + { + "epoch": 184.44, + "learning_rate": 2.597257142857143e-05, + "loss": 0.4043, + "step": 13280 + }, + { + "epoch": 184.58, + "learning_rate": 2.5961142857142857e-05, + "loss": 0.4146, + "step": 13290 + }, + { + "epoch": 184.72, + "learning_rate": 2.5949714285714288e-05, + "loss": 0.4008, + "step": 13300 + }, + { + "epoch": 184.86, + "learning_rate": 2.5938285714285714e-05, + "loss": 0.4005, + "step": 13310 + }, + { + "epoch": 185.0, + "learning_rate": 2.5926857142857148e-05, + "loss": 0.403, + "step": 13320 + }, + { + "epoch": 185.0, + "eval_loss": 0.5174187421798706, + "eval_runtime": 127.5695, + "eval_samples_per_second": 4.17, + "eval_steps_per_second": 0.525, + "eval_wer": 0.21861541428295944, + "step": 13320 + }, + { + "epoch": 185.14, + "learning_rate": 2.5915428571428575e-05, + "loss": 0.406, + "step": 13330 + }, + { + "epoch": 185.28, + "learning_rate": 2.5904e-05, + "loss": 0.4181, + "step": 13340 + }, + { + "epoch": 185.42, + "learning_rate": 2.589257142857143e-05, + "loss": 0.4122, + "step": 13350 + }, + { + "epoch": 185.55, + "learning_rate": 2.5881142857142858e-05, + "loss": 0.4218, + "step": 13360 + }, + { + "epoch": 185.69, + "learning_rate": 2.586971428571429e-05, + "loss": 0.4237, + "step": 13370 + }, + { + "epoch": 185.83, + "learning_rate": 2.5858285714285715e-05, + "loss": 0.4013, + "step": 13380 + }, + { + "epoch": 185.97, + "learning_rate": 2.5846857142857145e-05, + "loss": 0.4026, + "step": 13390 + }, + { + "epoch": 186.0, + "eval_loss": 0.5516530871391296, + "eval_runtime": 126.5992, + "eval_samples_per_second": 4.202, + "eval_steps_per_second": 0.529, + "eval_wer": 0.2208009256283345, + "step": 13392 + }, + { + "epoch": 186.11, + "learning_rate": 2.5835428571428572e-05, + "loss": 0.4105, + "step": 13400 + }, + { + "epoch": 186.25, + "learning_rate": 2.5824e-05, + "loss": 0.4114, + "step": 13410 + }, + { + "epoch": 186.39, + "learning_rate": 2.5812571428571432e-05, + "loss": 0.3947, + "step": 13420 + }, + { + "epoch": 186.53, + "learning_rate": 2.580114285714286e-05, + "loss": 0.4133, + "step": 13430 + }, + { + "epoch": 186.66, + "learning_rate": 2.578971428571429e-05, + "loss": 0.3973, + "step": 13440 + }, + { + "epoch": 186.8, + "learning_rate": 2.5778285714285716e-05, + "loss": 0.4093, + "step": 13450 + }, + { + "epoch": 186.94, + "learning_rate": 2.5766857142857146e-05, + "loss": 0.4192, + "step": 13460 + }, + { + "epoch": 187.0, + "eval_loss": 0.564426064491272, + "eval_runtime": 128.0749, + "eval_samples_per_second": 4.154, + "eval_steps_per_second": 0.523, + "eval_wer": 0.22440059137365817, + "step": 13464 + }, + { + "epoch": 187.08, + "learning_rate": 2.5755428571428573e-05, + "loss": 0.4127, + "step": 13470 + }, + { + "epoch": 187.22, + "learning_rate": 2.5745142857142858e-05, + "loss": 0.4064, + "step": 13480 + }, + { + "epoch": 187.36, + "learning_rate": 2.5733714285714285e-05, + "loss": 0.4019, + "step": 13490 + }, + { + "epoch": 187.5, + "learning_rate": 2.572228571428572e-05, + "loss": 0.3931, + "step": 13500 + }, + { + "epoch": 187.64, + "learning_rate": 2.5710857142857145e-05, + "loss": 0.4102, + "step": 13510 + }, + { + "epoch": 187.78, + "learning_rate": 2.5699428571428575e-05, + "loss": 0.4068, + "step": 13520 + }, + { + "epoch": 187.91, + "learning_rate": 2.5688000000000002e-05, + "loss": 0.3928, + "step": 13530 + }, + { + "epoch": 188.0, + "eval_loss": 0.5148659348487854, + "eval_runtime": 127.7843, + "eval_samples_per_second": 4.163, + "eval_steps_per_second": 0.524, + "eval_wer": 0.22324355595551842, + "step": 13536 + }, + { + "epoch": 188.06, + "learning_rate": 2.567657142857143e-05, + "loss": 0.4139, + "step": 13540 + }, + { + "epoch": 188.19, + "learning_rate": 2.566514285714286e-05, + "loss": 0.4006, + "step": 13550 + }, + { + "epoch": 188.33, + "learning_rate": 2.5653714285714286e-05, + "loss": 0.3955, + "step": 13560 + }, + { + "epoch": 188.47, + "learning_rate": 2.5642285714285716e-05, + "loss": 0.391, + "step": 13570 + }, + { + "epoch": 188.61, + "learning_rate": 2.5630857142857143e-05, + "loss": 0.3826, + "step": 13580 + }, + { + "epoch": 188.75, + "learning_rate": 2.5619428571428576e-05, + "loss": 0.3967, + "step": 13590 + }, + { + "epoch": 188.89, + "learning_rate": 2.5608000000000003e-05, + "loss": 0.3869, + "step": 13600 + }, + { + "epoch": 189.0, + "eval_loss": 0.5339820384979248, + "eval_runtime": 127.4403, + "eval_samples_per_second": 4.175, + "eval_steps_per_second": 0.526, + "eval_wer": 0.21463007006492255, + "step": 13608 + }, + { + "epoch": 189.03, + "learning_rate": 2.5596571428571433e-05, + "loss": 0.4009, + "step": 13610 + }, + { + "epoch": 189.17, + "learning_rate": 2.558514285714286e-05, + "loss": 0.3911, + "step": 13620 + }, + { + "epoch": 189.3, + "learning_rate": 2.5573714285714286e-05, + "loss": 0.4028, + "step": 13630 + }, + { + "epoch": 189.44, + "learning_rate": 2.5562285714285717e-05, + "loss": 0.4038, + "step": 13640 + }, + { + "epoch": 189.58, + "learning_rate": 2.5550857142857143e-05, + "loss": 0.3953, + "step": 13650 + }, + { + "epoch": 189.72, + "learning_rate": 2.5539428571428573e-05, + "loss": 0.4026, + "step": 13660 + }, + { + "epoch": 189.86, + "learning_rate": 2.5528e-05, + "loss": 0.385, + "step": 13670 + }, + { + "epoch": 190.0, + "learning_rate": 2.5516571428571434e-05, + "loss": 0.4126, + "step": 13680 + }, + { + "epoch": 190.0, + "eval_loss": 0.5000819563865662, + "eval_runtime": 127.7665, + "eval_samples_per_second": 4.164, + "eval_steps_per_second": 0.524, + "eval_wer": 0.22555762679179792, + "step": 13680 + }, + { + "epoch": 190.14, + "learning_rate": 2.550514285714286e-05, + "loss": 0.3955, + "step": 13690 + }, + { + "epoch": 190.28, + "learning_rate": 2.5493714285714287e-05, + "loss": 0.407, + "step": 13700 + }, + { + "epoch": 190.42, + "learning_rate": 2.5482285714285717e-05, + "loss": 0.3828, + "step": 13710 + }, + { + "epoch": 190.55, + "learning_rate": 2.5470857142857144e-05, + "loss": 0.3944, + "step": 13720 + }, + { + "epoch": 190.69, + "learning_rate": 2.5459428571428574e-05, + "loss": 0.3957, + "step": 13730 + }, + { + "epoch": 190.83, + "learning_rate": 2.5448e-05, + "loss": 0.3928, + "step": 13740 + }, + { + "epoch": 190.97, + "learning_rate": 2.543657142857143e-05, + "loss": 0.4021, + "step": 13750 + }, + { + "epoch": 191.0, + "eval_loss": 0.5159122943878174, + "eval_runtime": 129.2956, + "eval_samples_per_second": 4.115, + "eval_steps_per_second": 0.518, + "eval_wer": 0.218486854792055, + "step": 13752 + }, + { + "epoch": 191.11, + "learning_rate": 2.5425142857142858e-05, + "loss": 0.4122, + "step": 13760 + }, + { + "epoch": 191.25, + "learning_rate": 2.5413714285714285e-05, + "loss": 0.3922, + "step": 13770 + }, + { + "epoch": 191.39, + "learning_rate": 2.5402285714285718e-05, + "loss": 0.4, + "step": 13780 + }, + { + "epoch": 191.53, + "learning_rate": 2.5390857142857145e-05, + "loss": 0.4067, + "step": 13790 + }, + { + "epoch": 191.66, + "learning_rate": 2.5379428571428575e-05, + "loss": 0.4138, + "step": 13800 + }, + { + "epoch": 191.8, + "learning_rate": 2.5368000000000002e-05, + "loss": 0.4083, + "step": 13810 + }, + { + "epoch": 191.94, + "learning_rate": 2.5356571428571432e-05, + "loss": 0.4105, + "step": 13820 + }, + { + "epoch": 192.0, + "eval_loss": 0.5466117858886719, + "eval_runtime": 127.1575, + "eval_samples_per_second": 4.184, + "eval_steps_per_second": 0.527, + "eval_wer": 0.22208652053737868, + "step": 13824 + }, + { + "epoch": 192.08, + "learning_rate": 2.534514285714286e-05, + "loss": 0.4197, + "step": 13830 + }, + { + "epoch": 192.22, + "learning_rate": 2.5333714285714285e-05, + "loss": 0.4086, + "step": 13840 + }, + { + "epoch": 192.36, + "learning_rate": 2.5322285714285715e-05, + "loss": 0.4015, + "step": 13850 + }, + { + "epoch": 192.5, + "learning_rate": 2.5310857142857142e-05, + "loss": 0.4102, + "step": 13860 + }, + { + "epoch": 192.64, + "learning_rate": 2.5299428571428576e-05, + "loss": 0.4043, + "step": 13870 + }, + { + "epoch": 192.78, + "learning_rate": 2.5288000000000003e-05, + "loss": 0.4162, + "step": 13880 + }, + { + "epoch": 192.91, + "learning_rate": 2.5276571428571433e-05, + "loss": 0.4144, + "step": 13890 + }, + { + "epoch": 193.0, + "eval_loss": 0.5516180992126465, + "eval_runtime": 127.8, + "eval_samples_per_second": 4.163, + "eval_steps_per_second": 0.524, + "eval_wer": 0.2240791926463971, + "step": 13896 + }, + { + "epoch": 193.06, + "learning_rate": 2.526514285714286e-05, + "loss": 0.4174, + "step": 13900 + }, + { + "epoch": 193.19, + "learning_rate": 2.5253714285714286e-05, + "loss": 0.3975, + "step": 13910 + }, + { + "epoch": 193.33, + "learning_rate": 2.5242285714285716e-05, + "loss": 0.4049, + "step": 13920 + }, + { + "epoch": 193.47, + "learning_rate": 2.5230857142857143e-05, + "loss": 0.4013, + "step": 13930 + }, + { + "epoch": 193.61, + "learning_rate": 2.5219428571428573e-05, + "loss": 0.3919, + "step": 13940 + }, + { + "epoch": 193.75, + "learning_rate": 2.5208e-05, + "loss": 0.4056, + "step": 13950 + }, + { + "epoch": 193.89, + "learning_rate": 2.5196571428571433e-05, + "loss": 0.3861, + "step": 13960 + }, + { + "epoch": 194.0, + "eval_loss": 0.5103843808174133, + "eval_runtime": 126.7492, + "eval_samples_per_second": 4.197, + "eval_steps_per_second": 0.529, + "eval_wer": 0.22440059137365817, + "step": 13968 + }, + { + "epoch": 194.03, + "learning_rate": 2.518514285714286e-05, + "loss": 0.4035, + "step": 13970 + }, + { + "epoch": 194.17, + "learning_rate": 2.5173714285714287e-05, + "loss": 0.4052, + "step": 13980 + }, + { + "epoch": 194.3, + "learning_rate": 2.5162285714285717e-05, + "loss": 0.4067, + "step": 13990 + }, + { + "epoch": 194.44, + "learning_rate": 2.5150857142857144e-05, + "loss": 0.4033, + "step": 14000 + }, + { + "epoch": 194.58, + "learning_rate": 2.5139428571428574e-05, + "loss": 0.4022, + "step": 14010 + }, + { + "epoch": 194.72, + "learning_rate": 2.5128e-05, + "loss": 0.3968, + "step": 14020 + }, + { + "epoch": 194.86, + "learning_rate": 2.511657142857143e-05, + "loss": 0.3857, + "step": 14030 + }, + { + "epoch": 195.0, + "learning_rate": 2.5105142857142858e-05, + "loss": 0.4141, + "step": 14040 + }, + { + "epoch": 195.0, + "eval_loss": 0.5754216909408569, + "eval_runtime": 126.7389, + "eval_samples_per_second": 4.198, + "eval_steps_per_second": 0.529, + "eval_wer": 0.2240791926463971, + "step": 14040 + }, + { + "epoch": 195.14, + "learning_rate": 2.5093714285714284e-05, + "loss": 0.4004, + "step": 14050 + }, + { + "epoch": 195.28, + "learning_rate": 2.5082285714285718e-05, + "loss": 0.3963, + "step": 14060 + }, + { + "epoch": 195.42, + "learning_rate": 2.5070857142857145e-05, + "loss": 0.4018, + "step": 14070 + }, + { + "epoch": 195.55, + "learning_rate": 2.5059428571428575e-05, + "loss": 0.4029, + "step": 14080 + }, + { + "epoch": 195.69, + "learning_rate": 2.5048e-05, + "loss": 0.3987, + "step": 14090 + }, + { + "epoch": 195.83, + "learning_rate": 2.503657142857143e-05, + "loss": 0.3961, + "step": 14100 + }, + { + "epoch": 195.97, + "learning_rate": 2.5025142857142858e-05, + "loss": 0.4053, + "step": 14110 + }, + { + "epoch": 196.0, + "eval_loss": 0.5560808181762695, + "eval_runtime": 126.8825, + "eval_samples_per_second": 4.193, + "eval_steps_per_second": 0.528, + "eval_wer": 0.22420775213730154, + "step": 14112 + }, + { + "epoch": 196.11, + "learning_rate": 2.5013714285714285e-05, + "loss": 0.4202, + "step": 14120 + }, + { + "epoch": 196.25, + "learning_rate": 2.5002285714285715e-05, + "loss": 0.4187, + "step": 14130 + }, + { + "epoch": 196.39, + "learning_rate": 2.4990857142857142e-05, + "loss": 0.4128, + "step": 14140 + }, + { + "epoch": 196.53, + "learning_rate": 2.4979428571428575e-05, + "loss": 0.4069, + "step": 14150 + }, + { + "epoch": 196.66, + "learning_rate": 2.4968000000000002e-05, + "loss": 0.4, + "step": 14160 + }, + { + "epoch": 196.8, + "learning_rate": 2.4956571428571432e-05, + "loss": 0.3941, + "step": 14170 + }, + { + "epoch": 196.94, + "learning_rate": 2.494514285714286e-05, + "loss": 0.421, + "step": 14180 + }, + { + "epoch": 197.0, + "eval_loss": 0.5242465734481812, + "eval_runtime": 128.0943, + "eval_samples_per_second": 4.153, + "eval_steps_per_second": 0.523, + "eval_wer": 0.22774313813717298, + "step": 14184 + }, + { + "epoch": 197.08, + "learning_rate": 2.4933714285714286e-05, + "loss": 0.4313, + "step": 14190 + }, + { + "epoch": 197.22, + "learning_rate": 2.4922285714285716e-05, + "loss": 0.4142, + "step": 14200 + }, + { + "epoch": 197.36, + "learning_rate": 2.4910857142857143e-05, + "loss": 0.4052, + "step": 14210 + }, + { + "epoch": 197.5, + "learning_rate": 2.4899428571428573e-05, + "loss": 0.4005, + "step": 14220 + }, + { + "epoch": 197.64, + "learning_rate": 2.4888e-05, + "loss": 0.3993, + "step": 14230 + }, + { + "epoch": 197.78, + "learning_rate": 2.4876571428571433e-05, + "loss": 0.4046, + "step": 14240 + }, + { + "epoch": 197.91, + "learning_rate": 2.486514285714286e-05, + "loss": 0.397, + "step": 14250 + }, + { + "epoch": 198.0, + "eval_loss": 0.5273396372795105, + "eval_runtime": 127.0167, + "eval_samples_per_second": 4.188, + "eval_steps_per_second": 0.527, + "eval_wer": 0.22510766857363246, + "step": 14256 + }, + { + "epoch": 198.06, + "learning_rate": 2.485371428571429e-05, + "loss": 0.4213, + "step": 14260 + }, + { + "epoch": 198.19, + "learning_rate": 2.4842285714285717e-05, + "loss": 0.4053, + "step": 14270 + }, + { + "epoch": 198.33, + "learning_rate": 2.4830857142857143e-05, + "loss": 0.3978, + "step": 14280 + }, + { + "epoch": 198.47, + "learning_rate": 2.4819428571428574e-05, + "loss": 0.3965, + "step": 14290 + }, + { + "epoch": 198.61, + "learning_rate": 2.4808e-05, + "loss": 0.3828, + "step": 14300 + }, + { + "epoch": 198.75, + "learning_rate": 2.479657142857143e-05, + "loss": 0.3982, + "step": 14310 + }, + { + "epoch": 198.89, + "learning_rate": 2.4785142857142857e-05, + "loss": 0.405, + "step": 14320 + }, + { + "epoch": 199.0, + "eval_loss": 0.5428474545478821, + "eval_runtime": 126.5539, + "eval_samples_per_second": 4.204, + "eval_steps_per_second": 0.529, + "eval_wer": 0.22575046602815452, + "step": 14328 + }, + { + "epoch": 199.03, + "learning_rate": 2.477371428571429e-05, + "loss": 0.4208, + "step": 14330 + }, + { + "epoch": 199.17, + "learning_rate": 2.4762285714285717e-05, + "loss": 0.3896, + "step": 14340 + }, + { + "epoch": 199.3, + "learning_rate": 2.4750857142857144e-05, + "loss": 0.3862, + "step": 14350 + }, + { + "epoch": 199.44, + "learning_rate": 2.4739428571428574e-05, + "loss": 0.3953, + "step": 14360 + }, + { + "epoch": 199.58, + "learning_rate": 2.4728e-05, + "loss": 0.3884, + "step": 14370 + }, + { + "epoch": 199.72, + "learning_rate": 2.471657142857143e-05, + "loss": 0.3968, + "step": 14380 + }, + { + "epoch": 199.86, + "learning_rate": 2.4705142857142858e-05, + "loss": 0.3959, + "step": 14390 + }, + { + "epoch": 200.0, + "learning_rate": 2.4693714285714288e-05, + "loss": 0.3915, + "step": 14400 + }, + { + "epoch": 200.0, + "eval_loss": 0.5354220867156982, + "eval_runtime": 127.3795, + "eval_samples_per_second": 4.176, + "eval_steps_per_second": 0.526, + "eval_wer": 0.2198367294465514, + "step": 14400 + }, + { + "epoch": 200.14, + "learning_rate": 2.4682285714285715e-05, + "loss": 0.4045, + "step": 14410 + }, + { + "epoch": 200.28, + "learning_rate": 2.467085714285714e-05, + "loss": 0.3774, + "step": 14420 + }, + { + "epoch": 200.42, + "learning_rate": 2.4659428571428575e-05, + "loss": 0.3959, + "step": 14430 + }, + { + "epoch": 200.55, + "learning_rate": 2.4648000000000002e-05, + "loss": 0.4019, + "step": 14440 + }, + { + "epoch": 200.69, + "learning_rate": 2.4636571428571432e-05, + "loss": 0.3907, + "step": 14450 + }, + { + "epoch": 200.83, + "learning_rate": 2.462514285714286e-05, + "loss": 0.3856, + "step": 14460 + }, + { + "epoch": 200.97, + "learning_rate": 2.461371428571429e-05, + "loss": 0.4005, + "step": 14470 + }, + { + "epoch": 201.0, + "eval_loss": 0.5071948170661926, + "eval_runtime": 127.5448, + "eval_samples_per_second": 4.171, + "eval_steps_per_second": 0.525, + "eval_wer": 0.21482290930127917, + "step": 14472 + }, + { + "epoch": 201.11, + "learning_rate": 2.4602285714285716e-05, + "loss": 0.4015, + "step": 14480 + }, + { + "epoch": 201.25, + "learning_rate": 2.4590857142857142e-05, + "loss": 0.3985, + "step": 14490 + }, + { + "epoch": 201.39, + "learning_rate": 2.4579428571428572e-05, + "loss": 0.3819, + "step": 14500 + }, + { + "epoch": 201.53, + "learning_rate": 2.4568e-05, + "loss": 0.3951, + "step": 14510 + }, + { + "epoch": 201.66, + "learning_rate": 2.4556571428571433e-05, + "loss": 0.3966, + "step": 14520 + }, + { + "epoch": 201.8, + "learning_rate": 2.454514285714286e-05, + "loss": 0.3948, + "step": 14530 + }, + { + "epoch": 201.94, + "learning_rate": 2.453371428571429e-05, + "loss": 0.3947, + "step": 14540 + }, + { + "epoch": 202.0, + "eval_loss": 0.5165221691131592, + "eval_runtime": 127.3841, + "eval_samples_per_second": 4.176, + "eval_steps_per_second": 0.526, + "eval_wer": 0.2141158321013049, + "step": 14544 + }, + { + "epoch": 202.08, + "learning_rate": 2.4522285714285716e-05, + "loss": 0.4134, + "step": 14550 + }, + { + "epoch": 202.22, + "learning_rate": 2.4510857142857143e-05, + "loss": 0.3991, + "step": 14560 + }, + { + "epoch": 202.36, + "learning_rate": 2.4499428571428573e-05, + "loss": 0.3891, + "step": 14570 + }, + { + "epoch": 202.5, + "learning_rate": 2.4488e-05, + "loss": 0.3922, + "step": 14580 + }, + { + "epoch": 202.64, + "learning_rate": 2.447657142857143e-05, + "loss": 0.3831, + "step": 14590 + }, + { + "epoch": 202.78, + "learning_rate": 2.4465142857142857e-05, + "loss": 0.384, + "step": 14600 + }, + { + "epoch": 202.91, + "learning_rate": 2.445371428571429e-05, + "loss": 0.38, + "step": 14610 + }, + { + "epoch": 203.0, + "eval_loss": 0.5260880589485168, + "eval_runtime": 127.624, + "eval_samples_per_second": 4.168, + "eval_steps_per_second": 0.525, + "eval_wer": 0.21328019541042617, + "step": 14616 + }, + { + "epoch": 203.06, + "learning_rate": 2.4442285714285717e-05, + "loss": 0.3908, + "step": 14620 + }, + { + "epoch": 203.19, + "learning_rate": 2.4430857142857144e-05, + "loss": 0.383, + "step": 14630 + }, + { + "epoch": 203.33, + "learning_rate": 2.4419428571428574e-05, + "loss": 0.396, + "step": 14640 + }, + { + "epoch": 203.47, + "learning_rate": 2.4408e-05, + "loss": 0.4059, + "step": 14650 + }, + { + "epoch": 203.61, + "learning_rate": 2.439657142857143e-05, + "loss": 0.3888, + "step": 14660 + }, + { + "epoch": 203.75, + "learning_rate": 2.4385142857142858e-05, + "loss": 0.3719, + "step": 14670 + }, + { + "epoch": 203.89, + "learning_rate": 2.4373714285714288e-05, + "loss": 0.3818, + "step": 14680 + }, + { + "epoch": 204.0, + "eval_loss": 0.523131251335144, + "eval_runtime": 127.6827, + "eval_samples_per_second": 4.167, + "eval_steps_per_second": 0.525, + "eval_wer": 0.21302307642861734, + "step": 14688 + }, + { + "epoch": 204.03, + "learning_rate": 2.4362285714285715e-05, + "loss": 0.3938, + "step": 14690 + }, + { + "epoch": 204.17, + "learning_rate": 2.435085714285714e-05, + "loss": 0.3906, + "step": 14700 + }, + { + "epoch": 204.3, + "learning_rate": 2.4339428571428575e-05, + "loss": 0.3778, + "step": 14710 + }, + { + "epoch": 204.44, + "learning_rate": 2.4328e-05, + "loss": 0.3911, + "step": 14720 + }, + { + "epoch": 204.58, + "learning_rate": 2.431657142857143e-05, + "loss": 0.3983, + "step": 14730 + }, + { + "epoch": 204.72, + "learning_rate": 2.430514285714286e-05, + "loss": 0.3912, + "step": 14740 + }, + { + "epoch": 204.86, + "learning_rate": 2.429371428571429e-05, + "loss": 0.3843, + "step": 14750 + }, + { + "epoch": 205.0, + "learning_rate": 2.4282285714285715e-05, + "loss": 0.3969, + "step": 14760 + }, + { + "epoch": 205.0, + "eval_loss": 0.5149098038673401, + "eval_runtime": 126.6947, + "eval_samples_per_second": 4.199, + "eval_steps_per_second": 0.529, + "eval_wer": 0.218486854792055, + "step": 14760 + }, + { + "epoch": 205.14, + "learning_rate": 2.4270857142857142e-05, + "loss": 0.3879, + "step": 14770 + }, + { + "epoch": 205.28, + "learning_rate": 2.4259428571428572e-05, + "loss": 0.3884, + "step": 14780 + }, + { + "epoch": 205.42, + "learning_rate": 2.4248e-05, + "loss": 0.3928, + "step": 14790 + }, + { + "epoch": 205.55, + "learning_rate": 2.4236571428571432e-05, + "loss": 0.3855, + "step": 14800 + }, + { + "epoch": 205.69, + "learning_rate": 2.422514285714286e-05, + "loss": 0.3773, + "step": 14810 + }, + { + "epoch": 205.83, + "learning_rate": 2.421371428571429e-05, + "loss": 0.4001, + "step": 14820 + }, + { + "epoch": 205.97, + "learning_rate": 2.4202285714285716e-05, + "loss": 0.398, + "step": 14830 + }, + { + "epoch": 206.0, + "eval_loss": 0.5272911787033081, + "eval_runtime": 127.6597, + "eval_samples_per_second": 4.167, + "eval_steps_per_second": 0.525, + "eval_wer": 0.2271646204281031, + "step": 14832 + }, + { + "epoch": 206.11, + "learning_rate": 2.4190857142857146e-05, + "loss": 0.3972, + "step": 14840 + }, + { + "epoch": 206.25, + "learning_rate": 2.4179428571428573e-05, + "loss": 0.3885, + "step": 14850 + }, + { + "epoch": 206.39, + "learning_rate": 2.4168e-05, + "loss": 0.3912, + "step": 14860 + }, + { + "epoch": 206.53, + "learning_rate": 2.415657142857143e-05, + "loss": 0.3981, + "step": 14870 + }, + { + "epoch": 206.66, + "learning_rate": 2.4145142857142857e-05, + "loss": 0.3858, + "step": 14880 + }, + { + "epoch": 206.8, + "learning_rate": 2.4134857142857145e-05, + "loss": 0.4078, + "step": 14890 + }, + { + "epoch": 206.94, + "learning_rate": 2.4123428571428576e-05, + "loss": 0.3968, + "step": 14900 + }, + { + "epoch": 207.0, + "eval_loss": 0.541669487953186, + "eval_runtime": 128.4083, + "eval_samples_per_second": 4.143, + "eval_steps_per_second": 0.522, + "eval_wer": 0.2240149129009449, + "step": 14904 + }, + { + "epoch": 207.08, + "learning_rate": 2.4112000000000002e-05, + "loss": 0.4084, + "step": 14910 + }, + { + "epoch": 207.22, + "learning_rate": 2.410057142857143e-05, + "loss": 0.3817, + "step": 14920 + }, + { + "epoch": 207.36, + "learning_rate": 2.408914285714286e-05, + "loss": 0.3848, + "step": 14930 + }, + { + "epoch": 207.5, + "learning_rate": 2.4077714285714286e-05, + "loss": 0.3853, + "step": 14940 + }, + { + "epoch": 207.64, + "learning_rate": 2.4066285714285716e-05, + "loss": 0.3866, + "step": 14950 + }, + { + "epoch": 207.78, + "learning_rate": 2.4054857142857143e-05, + "loss": 0.3928, + "step": 14960 + }, + { + "epoch": 207.91, + "learning_rate": 2.4043428571428576e-05, + "loss": 0.3851, + "step": 14970 + }, + { + "epoch": 208.0, + "eval_loss": 0.5208941102027893, + "eval_runtime": 127.3223, + "eval_samples_per_second": 4.178, + "eval_steps_per_second": 0.526, + "eval_wer": 0.2159156649739667, + "step": 14976 + }, + { + "epoch": 208.06, + "learning_rate": 2.4032000000000003e-05, + "loss": 0.4015, + "step": 14980 + }, + { + "epoch": 208.19, + "learning_rate": 2.402057142857143e-05, + "loss": 0.3934, + "step": 14990 + }, + { + "epoch": 208.33, + "learning_rate": 2.400914285714286e-05, + "loss": 0.3866, + "step": 15000 + }, + { + "epoch": 208.47, + "learning_rate": 2.3997714285714287e-05, + "loss": 0.3785, + "step": 15010 + }, + { + "epoch": 208.61, + "learning_rate": 2.3986285714285717e-05, + "loss": 0.3869, + "step": 15020 + }, + { + "epoch": 208.75, + "learning_rate": 2.3974857142857144e-05, + "loss": 0.3955, + "step": 15030 + }, + { + "epoch": 208.89, + "learning_rate": 2.3963428571428574e-05, + "loss": 0.382, + "step": 15040 + }, + { + "epoch": 209.0, + "eval_loss": 0.5109542608261108, + "eval_runtime": 127.681, + "eval_samples_per_second": 4.167, + "eval_steps_per_second": 0.525, + "eval_wer": 0.21546570675580123, + "step": 15048 + }, + { + "epoch": 209.03, + "learning_rate": 2.3952e-05, + "loss": 0.4053, + "step": 15050 + }, + { + "epoch": 209.17, + "learning_rate": 2.3940571428571427e-05, + "loss": 0.3793, + "step": 15060 + }, + { + "epoch": 209.3, + "learning_rate": 2.392914285714286e-05, + "loss": 0.3878, + "step": 15070 + }, + { + "epoch": 209.44, + "learning_rate": 2.3917714285714287e-05, + "loss": 0.3934, + "step": 15080 + }, + { + "epoch": 209.58, + "learning_rate": 2.3906285714285718e-05, + "loss": 0.3937, + "step": 15090 + }, + { + "epoch": 209.72, + "learning_rate": 2.3894857142857144e-05, + "loss": 0.389, + "step": 15100 + }, + { + "epoch": 209.86, + "learning_rate": 2.3883428571428574e-05, + "loss": 0.3825, + "step": 15110 + }, + { + "epoch": 210.0, + "learning_rate": 2.3872e-05, + "loss": 0.3948, + "step": 15120 + }, + { + "epoch": 210.0, + "eval_loss": 0.5414634346961975, + "eval_runtime": 127.0964, + "eval_samples_per_second": 4.186, + "eval_steps_per_second": 0.527, + "eval_wer": 0.2198367294465514, + "step": 15120 + }, + { + "epoch": 210.14, + "learning_rate": 2.3860571428571428e-05, + "loss": 0.3957, + "step": 15130 + }, + { + "epoch": 210.28, + "learning_rate": 2.3849142857142858e-05, + "loss": 0.3914, + "step": 15140 + }, + { + "epoch": 210.42, + "learning_rate": 2.3837714285714285e-05, + "loss": 0.3972, + "step": 15150 + }, + { + "epoch": 210.55, + "learning_rate": 2.3826285714285718e-05, + "loss": 0.3871, + "step": 15160 + }, + { + "epoch": 210.69, + "learning_rate": 2.3814857142857145e-05, + "loss": 0.3884, + "step": 15170 + }, + { + "epoch": 210.83, + "learning_rate": 2.3803428571428575e-05, + "loss": 0.3883, + "step": 15180 + }, + { + "epoch": 210.97, + "learning_rate": 2.3792000000000002e-05, + "loss": 0.3956, + "step": 15190 + }, + { + "epoch": 211.0, + "eval_loss": 0.5356243848800659, + "eval_runtime": 127.0016, + "eval_samples_per_second": 4.189, + "eval_steps_per_second": 0.528, + "eval_wer": 0.22157228257376102, + "step": 15192 + }, + { + "epoch": 211.11, + "learning_rate": 2.378057142857143e-05, + "loss": 0.4, + "step": 15200 + }, + { + "epoch": 211.25, + "learning_rate": 2.376914285714286e-05, + "loss": 0.4111, + "step": 15210 + }, + { + "epoch": 211.39, + "learning_rate": 2.3757714285714286e-05, + "loss": 0.3937, + "step": 15220 + }, + { + "epoch": 211.53, + "learning_rate": 2.3746285714285716e-05, + "loss": 0.4102, + "step": 15230 + }, + { + "epoch": 211.66, + "learning_rate": 2.3734857142857142e-05, + "loss": 0.4125, + "step": 15240 + }, + { + "epoch": 211.8, + "learning_rate": 2.3723428571428576e-05, + "loss": 0.424, + "step": 15250 + }, + { + "epoch": 211.94, + "learning_rate": 2.3712000000000003e-05, + "loss": 0.4069, + "step": 15260 + }, + { + "epoch": 212.0, + "eval_loss": 0.5360356569290161, + "eval_runtime": 127.0581, + "eval_samples_per_second": 4.187, + "eval_steps_per_second": 0.527, + "eval_wer": 0.22125088384649996, + "step": 15264 + }, + { + "epoch": 212.08, + "learning_rate": 2.370057142857143e-05, + "loss": 0.4226, + "step": 15270 + }, + { + "epoch": 212.22, + "learning_rate": 2.368914285714286e-05, + "loss": 0.3931, + "step": 15280 + }, + { + "epoch": 212.36, + "learning_rate": 2.3677714285714286e-05, + "loss": 0.3989, + "step": 15290 + }, + { + "epoch": 212.5, + "learning_rate": 2.3666285714285716e-05, + "loss": 0.3985, + "step": 15300 + }, + { + "epoch": 212.64, + "learning_rate": 2.3654857142857143e-05, + "loss": 0.432, + "step": 15310 + }, + { + "epoch": 212.78, + "learning_rate": 2.3643428571428573e-05, + "loss": 0.4059, + "step": 15320 + }, + { + "epoch": 212.91, + "learning_rate": 2.3632e-05, + "loss": 0.4019, + "step": 15330 + }, + { + "epoch": 213.0, + "eval_loss": 0.539585530757904, + "eval_runtime": 127.9801, + "eval_samples_per_second": 4.157, + "eval_steps_per_second": 0.524, + "eval_wer": 0.21951533071929036, + "step": 15336 + }, + { + "epoch": 213.06, + "learning_rate": 2.3620571428571434e-05, + "loss": 0.4063, + "step": 15340 + }, + { + "epoch": 213.19, + "learning_rate": 2.360914285714286e-05, + "loss": 0.3971, + "step": 15350 + }, + { + "epoch": 213.33, + "learning_rate": 2.3597714285714287e-05, + "loss": 0.3807, + "step": 15360 + }, + { + "epoch": 213.47, + "learning_rate": 2.3586285714285717e-05, + "loss": 0.4047, + "step": 15370 + }, + { + "epoch": 213.61, + "learning_rate": 2.3574857142857144e-05, + "loss": 0.3996, + "step": 15380 + }, + { + "epoch": 213.75, + "learning_rate": 2.3563428571428574e-05, + "loss": 0.3939, + "step": 15390 + }, + { + "epoch": 213.89, + "learning_rate": 2.3552e-05, + "loss": 0.3954, + "step": 15400 + }, + { + "epoch": 214.0, + "eval_loss": 0.5369138121604919, + "eval_runtime": 127.0549, + "eval_samples_per_second": 4.187, + "eval_steps_per_second": 0.527, + "eval_wer": 0.2199010091920036, + "step": 15408 + }, + { + "epoch": 214.03, + "learning_rate": 2.354057142857143e-05, + "loss": 0.4054, + "step": 15410 + }, + { + "epoch": 214.17, + "learning_rate": 2.3529142857142858e-05, + "loss": 0.3985, + "step": 15420 + }, + { + "epoch": 214.3, + "learning_rate": 2.3517714285714284e-05, + "loss": 0.4083, + "step": 15430 + }, + { + "epoch": 214.44, + "learning_rate": 2.3506285714285718e-05, + "loss": 0.4104, + "step": 15440 + }, + { + "epoch": 214.58, + "learning_rate": 2.3494857142857145e-05, + "loss": 0.3968, + "step": 15450 + }, + { + "epoch": 214.72, + "learning_rate": 2.3483428571428575e-05, + "loss": 0.4049, + "step": 15460 + }, + { + "epoch": 214.86, + "learning_rate": 2.3472e-05, + "loss": 0.3865, + "step": 15470 + }, + { + "epoch": 215.0, + "learning_rate": 2.3460571428571432e-05, + "loss": 0.3942, + "step": 15480 + }, + { + "epoch": 215.0, + "eval_loss": 0.5369403958320618, + "eval_runtime": 127.3171, + "eval_samples_per_second": 4.179, + "eval_steps_per_second": 0.526, + "eval_wer": 0.22176512181011762, + "step": 15480 + }, + { + "epoch": 215.14, + "learning_rate": 2.344914285714286e-05, + "loss": 0.4099, + "step": 15490 + }, + { + "epoch": 215.28, + "learning_rate": 2.3437714285714285e-05, + "loss": 0.4002, + "step": 15500 + }, + { + "epoch": 215.42, + "learning_rate": 2.3426285714285715e-05, + "loss": 0.3907, + "step": 15510 + }, + { + "epoch": 215.55, + "learning_rate": 2.3414857142857142e-05, + "loss": 0.3832, + "step": 15520 + }, + { + "epoch": 215.69, + "learning_rate": 2.3403428571428576e-05, + "loss": 0.3933, + "step": 15530 + }, + { + "epoch": 215.83, + "learning_rate": 2.3392000000000002e-05, + "loss": 0.3892, + "step": 15540 + }, + { + "epoch": 215.97, + "learning_rate": 2.3380571428571432e-05, + "loss": 0.3916, + "step": 15550 + }, + { + "epoch": 216.0, + "eval_loss": 0.5501964688301086, + "eval_runtime": 126.9278, + "eval_samples_per_second": 4.191, + "eval_steps_per_second": 0.528, + "eval_wer": 0.2166870219193932, + "step": 15552 + }, + { + "epoch": 216.11, + "learning_rate": 2.336914285714286e-05, + "loss": 0.3875, + "step": 15560 + }, + { + "epoch": 216.25, + "learning_rate": 2.3357714285714286e-05, + "loss": 0.3972, + "step": 15570 + }, + { + "epoch": 216.39, + "learning_rate": 2.3346285714285716e-05, + "loss": 0.3932, + "step": 15580 + }, + { + "epoch": 216.53, + "learning_rate": 2.3334857142857143e-05, + "loss": 0.3922, + "step": 15590 + }, + { + "epoch": 216.66, + "learning_rate": 2.3323428571428573e-05, + "loss": 0.3913, + "step": 15600 + }, + { + "epoch": 216.8, + "learning_rate": 2.3312e-05, + "loss": 0.3907, + "step": 15610 + }, + { + "epoch": 216.94, + "learning_rate": 2.3300571428571433e-05, + "loss": 0.3955, + "step": 15620 + }, + { + "epoch": 217.0, + "eval_loss": 0.5321688055992126, + "eval_runtime": 127.6819, + "eval_samples_per_second": 4.167, + "eval_steps_per_second": 0.525, + "eval_wer": 0.2142443915922093, + "step": 15624 + }, + { + "epoch": 217.08, + "learning_rate": 2.328914285714286e-05, + "loss": 0.4039, + "step": 15630 + }, + { + "epoch": 217.22, + "learning_rate": 2.3277714285714287e-05, + "loss": 0.3947, + "step": 15640 + }, + { + "epoch": 217.36, + "learning_rate": 2.3266285714285717e-05, + "loss": 0.3859, + "step": 15650 + }, + { + "epoch": 217.5, + "learning_rate": 2.3254857142857144e-05, + "loss": 0.382, + "step": 15660 + }, + { + "epoch": 217.64, + "learning_rate": 2.3243428571428574e-05, + "loss": 0.3756, + "step": 15670 + }, + { + "epoch": 217.78, + "learning_rate": 2.3232e-05, + "loss": 0.3834, + "step": 15680 + }, + { + "epoch": 217.91, + "learning_rate": 2.322057142857143e-05, + "loss": 0.394, + "step": 15690 + }, + { + "epoch": 218.0, + "eval_loss": 0.5397269129753113, + "eval_runtime": 127.3826, + "eval_samples_per_second": 4.176, + "eval_steps_per_second": 0.526, + "eval_wer": 0.22350067493732725, + "step": 15696 + }, + { + "epoch": 218.06, + "learning_rate": 2.3209142857142857e-05, + "loss": 0.416, + "step": 15700 + }, + { + "epoch": 218.19, + "learning_rate": 2.3197714285714284e-05, + "loss": 0.3871, + "step": 15710 + }, + { + "epoch": 218.33, + "learning_rate": 2.3186285714285718e-05, + "loss": 0.3857, + "step": 15720 + }, + { + "epoch": 218.47, + "learning_rate": 2.3174857142857144e-05, + "loss": 0.3968, + "step": 15730 + }, + { + "epoch": 218.61, + "learning_rate": 2.3163428571428575e-05, + "loss": 0.3794, + "step": 15740 + }, + { + "epoch": 218.75, + "learning_rate": 2.3152e-05, + "loss": 0.3811, + "step": 15750 + }, + { + "epoch": 218.89, + "learning_rate": 2.314057142857143e-05, + "loss": 0.3831, + "step": 15760 + }, + { + "epoch": 219.0, + "eval_loss": 0.5671437382698059, + "eval_runtime": 128.5451, + "eval_samples_per_second": 4.139, + "eval_steps_per_second": 0.521, + "eval_wer": 0.22022240791926465, + "step": 15768 + }, + { + "epoch": 219.03, + "learning_rate": 2.3129142857142858e-05, + "loss": 0.3876, + "step": 15770 + }, + { + "epoch": 219.17, + "learning_rate": 2.3117714285714285e-05, + "loss": 0.3828, + "step": 15780 + }, + { + "epoch": 219.3, + "learning_rate": 2.3106285714285715e-05, + "loss": 0.3922, + "step": 15790 + }, + { + "epoch": 219.44, + "learning_rate": 2.3094857142857142e-05, + "loss": 0.3816, + "step": 15800 + }, + { + "epoch": 219.58, + "learning_rate": 2.3083428571428575e-05, + "loss": 0.3737, + "step": 15810 + }, + { + "epoch": 219.72, + "learning_rate": 2.3072000000000002e-05, + "loss": 0.3986, + "step": 15820 + }, + { + "epoch": 219.86, + "learning_rate": 2.3060571428571432e-05, + "loss": 0.3789, + "step": 15830 + }, + { + "epoch": 220.0, + "learning_rate": 2.304914285714286e-05, + "loss": 0.3765, + "step": 15840 + }, + { + "epoch": 220.0, + "eval_loss": 0.5617607235908508, + "eval_runtime": 127.3793, + "eval_samples_per_second": 4.177, + "eval_steps_per_second": 0.526, + "eval_wer": 0.21597994471941892, + "step": 15840 + }, + { + "epoch": 220.14, + "learning_rate": 2.3037714285714286e-05, + "loss": 0.3871, + "step": 15850 + }, + { + "epoch": 220.28, + "learning_rate": 2.3026285714285716e-05, + "loss": 0.3947, + "step": 15860 + }, + { + "epoch": 220.42, + "learning_rate": 2.3014857142857143e-05, + "loss": 0.3818, + "step": 15870 + }, + { + "epoch": 220.55, + "learning_rate": 2.3003428571428573e-05, + "loss": 0.3721, + "step": 15880 + }, + { + "epoch": 220.69, + "learning_rate": 2.2992e-05, + "loss": 0.3883, + "step": 15890 + }, + { + "epoch": 220.83, + "learning_rate": 2.2980571428571433e-05, + "loss": 0.4033, + "step": 15900 + }, + { + "epoch": 220.97, + "learning_rate": 2.296914285714286e-05, + "loss": 0.3981, + "step": 15910 + }, + { + "epoch": 221.0, + "eval_loss": 0.5713575482368469, + "eval_runtime": 126.5742, + "eval_samples_per_second": 4.203, + "eval_steps_per_second": 0.529, + "eval_wer": 0.22324355595551842, + "step": 15912 + }, + { + "epoch": 221.11, + "learning_rate": 2.2957714285714286e-05, + "loss": 0.3892, + "step": 15920 + }, + { + "epoch": 221.25, + "learning_rate": 2.2946285714285717e-05, + "loss": 0.3892, + "step": 15930 + }, + { + "epoch": 221.39, + "learning_rate": 2.2934857142857143e-05, + "loss": 0.3867, + "step": 15940 + }, + { + "epoch": 221.53, + "learning_rate": 2.2923428571428573e-05, + "loss": 0.3921, + "step": 15950 + }, + { + "epoch": 221.66, + "learning_rate": 2.2912e-05, + "loss": 0.3886, + "step": 15960 + }, + { + "epoch": 221.8, + "learning_rate": 2.290057142857143e-05, + "loss": 0.3905, + "step": 15970 + }, + { + "epoch": 221.94, + "learning_rate": 2.2889142857142857e-05, + "loss": 0.4021, + "step": 15980 + }, + { + "epoch": 222.0, + "eval_loss": 0.5142927169799805, + "eval_runtime": 127.2639, + "eval_samples_per_second": 4.18, + "eval_steps_per_second": 0.526, + "eval_wer": 0.22112232435559556, + "step": 15984 + }, + { + "epoch": 222.08, + "learning_rate": 2.287771428571429e-05, + "loss": 0.3982, + "step": 15990 + }, + { + "epoch": 222.22, + "learning_rate": 2.2866285714285717e-05, + "loss": 0.3925, + "step": 16000 + }, + { + "epoch": 222.36, + "learning_rate": 2.2854857142857144e-05, + "loss": 0.3915, + "step": 16010 + }, + { + "epoch": 222.5, + "learning_rate": 2.2843428571428574e-05, + "loss": 0.3783, + "step": 16020 + }, + { + "epoch": 222.64, + "learning_rate": 2.2832e-05, + "loss": 0.3833, + "step": 16030 + }, + { + "epoch": 222.78, + "learning_rate": 2.282057142857143e-05, + "loss": 0.3953, + "step": 16040 + }, + { + "epoch": 222.91, + "learning_rate": 2.2809142857142858e-05, + "loss": 0.3818, + "step": 16050 + }, + { + "epoch": 223.0, + "eval_loss": 0.5358201861381531, + "eval_runtime": 127.528, + "eval_samples_per_second": 4.172, + "eval_steps_per_second": 0.525, + "eval_wer": 0.22022240791926465, + "step": 16056 + }, + { + "epoch": 223.06, + "learning_rate": 2.279771428571429e-05, + "loss": 0.4022, + "step": 16060 + }, + { + "epoch": 223.19, + "learning_rate": 2.2786285714285715e-05, + "loss": 0.3842, + "step": 16070 + }, + { + "epoch": 223.33, + "learning_rate": 2.277485714285714e-05, + "loss": 0.3812, + "step": 16080 + }, + { + "epoch": 223.47, + "learning_rate": 2.2763428571428575e-05, + "loss": 0.3936, + "step": 16090 + }, + { + "epoch": 223.61, + "learning_rate": 2.2752000000000002e-05, + "loss": 0.3716, + "step": 16100 + }, + { + "epoch": 223.75, + "learning_rate": 2.2740571428571432e-05, + "loss": 0.3698, + "step": 16110 + }, + { + "epoch": 223.89, + "learning_rate": 2.272914285714286e-05, + "loss": 0.3828, + "step": 16120 + }, + { + "epoch": 224.0, + "eval_loss": 0.5450764298439026, + "eval_runtime": 126.5777, + "eval_samples_per_second": 4.203, + "eval_steps_per_second": 0.529, + "eval_wer": 0.2157228257376101, + "step": 16128 + }, + { + "epoch": 224.03, + "learning_rate": 2.271771428571429e-05, + "loss": 0.3967, + "step": 16130 + }, + { + "epoch": 224.17, + "learning_rate": 2.2706285714285715e-05, + "loss": 0.3818, + "step": 16140 + }, + { + "epoch": 224.3, + "learning_rate": 2.2694857142857142e-05, + "loss": 0.3762, + "step": 16150 + }, + { + "epoch": 224.44, + "learning_rate": 2.2683428571428572e-05, + "loss": 0.3738, + "step": 16160 + }, + { + "epoch": 224.58, + "learning_rate": 2.2672e-05, + "loss": 0.3877, + "step": 16170 + }, + { + "epoch": 224.72, + "learning_rate": 2.2660571428571433e-05, + "loss": 0.3896, + "step": 16180 + }, + { + "epoch": 224.86, + "learning_rate": 2.264914285714286e-05, + "loss": 0.3784, + "step": 16190 + }, + { + "epoch": 225.0, + "learning_rate": 2.263771428571429e-05, + "loss": 0.3783, + "step": 16200 + }, + { + "epoch": 225.0, + "eval_loss": 0.5434143543243408, + "eval_runtime": 127.518, + "eval_samples_per_second": 4.172, + "eval_steps_per_second": 0.525, + "eval_wer": 0.21861541428295944, + "step": 16200 + }, + { + "epoch": 225.14, + "learning_rate": 2.2626285714285716e-05, + "loss": 0.3869, + "step": 16210 + }, + { + "epoch": 225.28, + "learning_rate": 2.2614857142857143e-05, + "loss": 0.3874, + "step": 16220 + }, + { + "epoch": 225.42, + "learning_rate": 2.2603428571428573e-05, + "loss": 0.3839, + "step": 16230 + }, + { + "epoch": 225.55, + "learning_rate": 2.2592e-05, + "loss": 0.3919, + "step": 16240 + }, + { + "epoch": 225.69, + "learning_rate": 2.2580571428571433e-05, + "loss": 0.3909, + "step": 16250 + }, + { + "epoch": 225.83, + "learning_rate": 2.2569142857142857e-05, + "loss": 0.3762, + "step": 16260 + }, + { + "epoch": 225.97, + "learning_rate": 2.255771428571429e-05, + "loss": 0.3915, + "step": 16270 + }, + { + "epoch": 226.0, + "eval_loss": 0.530297040939331, + "eval_runtime": 128.081, + "eval_samples_per_second": 4.154, + "eval_steps_per_second": 0.523, + "eval_wer": 0.21662274217394098, + "step": 16272 + }, + { + "epoch": 226.11, + "learning_rate": 2.2546285714285717e-05, + "loss": 0.3744, + "step": 16280 + }, + { + "epoch": 226.25, + "learning_rate": 2.2534857142857144e-05, + "loss": 0.3863, + "step": 16290 + }, + { + "epoch": 226.39, + "learning_rate": 2.2523428571428574e-05, + "loss": 0.3839, + "step": 16300 + }, + { + "epoch": 226.53, + "learning_rate": 2.2512e-05, + "loss": 0.3845, + "step": 16310 + }, + { + "epoch": 226.66, + "learning_rate": 2.250057142857143e-05, + "loss": 0.3789, + "step": 16320 + }, + { + "epoch": 226.8, + "learning_rate": 2.2489142857142858e-05, + "loss": 0.37, + "step": 16330 + }, + { + "epoch": 226.94, + "learning_rate": 2.247771428571429e-05, + "loss": 0.3892, + "step": 16340 + }, + { + "epoch": 227.0, + "eval_loss": 0.527522623538971, + "eval_runtime": 126.2931, + "eval_samples_per_second": 4.212, + "eval_steps_per_second": 0.531, + "eval_wer": 0.2174583788648197, + "step": 16344 + }, + { + "epoch": 227.08, + "learning_rate": 2.2466285714285714e-05, + "loss": 0.3844, + "step": 16350 + }, + { + "epoch": 227.22, + "learning_rate": 2.245485714285714e-05, + "loss": 0.3787, + "step": 16360 + }, + { + "epoch": 227.36, + "learning_rate": 2.2443428571428575e-05, + "loss": 0.3882, + "step": 16370 + }, + { + "epoch": 227.5, + "learning_rate": 2.2432e-05, + "loss": 0.3859, + "step": 16380 + }, + { + "epoch": 227.64, + "learning_rate": 2.242057142857143e-05, + "loss": 0.3873, + "step": 16390 + }, + { + "epoch": 227.78, + "learning_rate": 2.2409142857142858e-05, + "loss": 0.3734, + "step": 16400 + }, + { + "epoch": 227.91, + "learning_rate": 2.239771428571429e-05, + "loss": 0.3798, + "step": 16410 + }, + { + "epoch": 228.0, + "eval_loss": 0.5114896297454834, + "eval_runtime": 127.8208, + "eval_samples_per_second": 4.162, + "eval_steps_per_second": 0.524, + "eval_wer": 0.2111589638105033, + "step": 16416 + }, + { + "epoch": 228.06, + "learning_rate": 2.2386285714285715e-05, + "loss": 0.3844, + "step": 16420 + }, + { + "epoch": 228.19, + "learning_rate": 2.2374857142857142e-05, + "loss": 0.3793, + "step": 16430 + }, + { + "epoch": 228.33, + "learning_rate": 2.2363428571428572e-05, + "loss": 0.3727, + "step": 16440 + }, + { + "epoch": 228.47, + "learning_rate": 2.2352e-05, + "loss": 0.3816, + "step": 16450 + }, + { + "epoch": 228.61, + "learning_rate": 2.2340571428571432e-05, + "loss": 0.3725, + "step": 16460 + }, + { + "epoch": 228.75, + "learning_rate": 2.232914285714286e-05, + "loss": 0.3943, + "step": 16470 + }, + { + "epoch": 228.89, + "learning_rate": 2.231771428571429e-05, + "loss": 0.3705, + "step": 16480 + }, + { + "epoch": 229.0, + "eval_loss": 0.5377914309501648, + "eval_runtime": 126.7115, + "eval_samples_per_second": 4.199, + "eval_steps_per_second": 0.529, + "eval_wer": 0.218486854792055, + "step": 16488 + }, + { + "epoch": 229.03, + "learning_rate": 2.2306285714285716e-05, + "loss": 0.3983, + "step": 16490 + }, + { + "epoch": 229.17, + "learning_rate": 2.2294857142857143e-05, + "loss": 0.3833, + "step": 16500 + }, + { + "epoch": 229.3, + "learning_rate": 2.2283428571428573e-05, + "loss": 0.3674, + "step": 16510 + }, + { + "epoch": 229.44, + "learning_rate": 2.2272e-05, + "loss": 0.3739, + "step": 16520 + }, + { + "epoch": 229.58, + "learning_rate": 2.2260571428571433e-05, + "loss": 0.3735, + "step": 16530 + }, + { + "epoch": 229.72, + "learning_rate": 2.2249142857142856e-05, + "loss": 0.3786, + "step": 16540 + }, + { + "epoch": 229.86, + "learning_rate": 2.223771428571429e-05, + "loss": 0.3694, + "step": 16550 + }, + { + "epoch": 230.0, + "learning_rate": 2.2226285714285717e-05, + "loss": 0.3835, + "step": 16560 + }, + { + "epoch": 230.0, + "eval_loss": 0.5216724276542664, + "eval_runtime": 127.2271, + "eval_samples_per_second": 4.181, + "eval_steps_per_second": 0.527, + "eval_wer": 0.21257311821045188, + "step": 16560 + }, + { + "epoch": 230.14, + "learning_rate": 2.2214857142857143e-05, + "loss": 0.3745, + "step": 16570 + }, + { + "epoch": 230.28, + "learning_rate": 2.2203428571428574e-05, + "loss": 0.3798, + "step": 16580 + }, + { + "epoch": 230.42, + "learning_rate": 2.2192e-05, + "loss": 0.3752, + "step": 16590 + }, + { + "epoch": 230.55, + "learning_rate": 2.218057142857143e-05, + "loss": 0.3647, + "step": 16600 + }, + { + "epoch": 230.69, + "learning_rate": 2.2169142857142857e-05, + "loss": 0.3739, + "step": 16610 + }, + { + "epoch": 230.83, + "learning_rate": 2.215771428571429e-05, + "loss": 0.3849, + "step": 16620 + }, + { + "epoch": 230.97, + "learning_rate": 2.2146285714285714e-05, + "loss": 0.3832, + "step": 16630 + }, + { + "epoch": 231.0, + "eval_loss": 0.5503403544425964, + "eval_runtime": 126.4784, + "eval_samples_per_second": 4.206, + "eval_steps_per_second": 0.53, + "eval_wer": 0.2207366458828823, + "step": 16632 + }, + { + "epoch": 231.11, + "learning_rate": 2.2134857142857148e-05, + "loss": 0.3927, + "step": 16640 + }, + { + "epoch": 231.25, + "learning_rate": 2.2123428571428574e-05, + "loss": 0.3767, + "step": 16650 + }, + { + "epoch": 231.39, + "learning_rate": 2.2112e-05, + "loss": 0.3856, + "step": 16660 + }, + { + "epoch": 231.53, + "learning_rate": 2.210057142857143e-05, + "loss": 0.3707, + "step": 16670 + }, + { + "epoch": 231.66, + "learning_rate": 2.2089142857142858e-05, + "loss": 0.3756, + "step": 16680 + }, + { + "epoch": 231.8, + "learning_rate": 2.2077714285714288e-05, + "loss": 0.387, + "step": 16690 + }, + { + "epoch": 231.94, + "learning_rate": 2.2066285714285715e-05, + "loss": 0.3907, + "step": 16700 + }, + { + "epoch": 232.0, + "eval_loss": 0.5515126585960388, + "eval_runtime": 126.8614, + "eval_samples_per_second": 4.194, + "eval_steps_per_second": 0.528, + "eval_wer": 0.21777977759208073, + "step": 16704 + }, + { + "epoch": 232.08, + "learning_rate": 2.205485714285715e-05, + "loss": 0.413, + "step": 16710 + }, + { + "epoch": 232.22, + "learning_rate": 2.2043428571428575e-05, + "loss": 0.4042, + "step": 16720 + }, + { + "epoch": 232.36, + "learning_rate": 2.2032e-05, + "loss": 0.3902, + "step": 16730 + }, + { + "epoch": 232.5, + "learning_rate": 2.2020571428571432e-05, + "loss": 0.4067, + "step": 16740 + }, + { + "epoch": 232.64, + "learning_rate": 2.200914285714286e-05, + "loss": 0.3891, + "step": 16750 + }, + { + "epoch": 232.78, + "learning_rate": 2.199771428571429e-05, + "loss": 0.3868, + "step": 16760 + }, + { + "epoch": 232.91, + "learning_rate": 2.1986285714285716e-05, + "loss": 0.3988, + "step": 16770 + }, + { + "epoch": 233.0, + "eval_loss": 0.5221549868583679, + "eval_runtime": 126.9494, + "eval_samples_per_second": 4.191, + "eval_steps_per_second": 0.528, + "eval_wer": 0.2224079192646397, + "step": 16776 + }, + { + "epoch": 233.06, + "learning_rate": 2.1974857142857146e-05, + "loss": 0.3965, + "step": 16780 + }, + { + "epoch": 233.19, + "learning_rate": 2.1963428571428572e-05, + "loss": 0.3933, + "step": 16790 + }, + { + "epoch": 233.33, + "learning_rate": 2.1952e-05, + "loss": 0.3846, + "step": 16800 + }, + { + "epoch": 233.47, + "learning_rate": 2.1940571428571433e-05, + "loss": 0.3735, + "step": 16810 + }, + { + "epoch": 233.61, + "learning_rate": 2.1929142857142856e-05, + "loss": 0.3728, + "step": 16820 + }, + { + "epoch": 233.75, + "learning_rate": 2.191771428571429e-05, + "loss": 0.3789, + "step": 16830 + }, + { + "epoch": 233.89, + "learning_rate": 2.1906285714285716e-05, + "loss": 0.3785, + "step": 16840 + }, + { + "epoch": 234.0, + "eval_loss": 0.5288335680961609, + "eval_runtime": 127.0623, + "eval_samples_per_second": 4.187, + "eval_steps_per_second": 0.527, + "eval_wer": 0.21263739795590408, + "step": 16848 + }, + { + "epoch": 234.03, + "learning_rate": 2.1894857142857146e-05, + "loss": 0.3944, + "step": 16850 + }, + { + "epoch": 234.17, + "learning_rate": 2.1883428571428573e-05, + "loss": 0.3909, + "step": 16860 + }, + { + "epoch": 234.3, + "learning_rate": 2.1872e-05, + "loss": 0.3829, + "step": 16870 + }, + { + "epoch": 234.44, + "learning_rate": 2.186057142857143e-05, + "loss": 0.3774, + "step": 16880 + }, + { + "epoch": 234.58, + "learning_rate": 2.1849142857142857e-05, + "loss": 0.3926, + "step": 16890 + }, + { + "epoch": 234.72, + "learning_rate": 2.183771428571429e-05, + "loss": 0.3868, + "step": 16900 + }, + { + "epoch": 234.86, + "learning_rate": 2.1826285714285714e-05, + "loss": 0.3796, + "step": 16910 + }, + { + "epoch": 235.0, + "learning_rate": 2.1814857142857147e-05, + "loss": 0.3839, + "step": 16920 + }, + { + "epoch": 235.0, + "eval_loss": 0.5226218104362488, + "eval_runtime": 126.6897, + "eval_samples_per_second": 4.199, + "eval_steps_per_second": 0.529, + "eval_wer": 0.21392299286494826, + "step": 16920 + }, + { + "epoch": 235.14, + "learning_rate": 2.1803428571428574e-05, + "loss": 0.3934, + "step": 16930 + }, + { + "epoch": 235.28, + "learning_rate": 2.1792e-05, + "loss": 0.3779, + "step": 16940 + }, + { + "epoch": 235.42, + "learning_rate": 2.178057142857143e-05, + "loss": 0.3731, + "step": 16950 + }, + { + "epoch": 235.55, + "learning_rate": 2.1769142857142858e-05, + "loss": 0.3796, + "step": 16960 + }, + { + "epoch": 235.69, + "learning_rate": 2.1757714285714288e-05, + "loss": 0.3784, + "step": 16970 + }, + { + "epoch": 235.83, + "learning_rate": 2.1746285714285714e-05, + "loss": 0.3918, + "step": 16980 + }, + { + "epoch": 235.97, + "learning_rate": 2.1734857142857148e-05, + "loss": 0.3998, + "step": 16990 + }, + { + "epoch": 236.0, + "eval_loss": 0.5478945374488831, + "eval_runtime": 127.5527, + "eval_samples_per_second": 4.171, + "eval_steps_per_second": 0.525, + "eval_wer": 0.21822973581024618, + "step": 16992 + }, + { + "epoch": 236.11, + "learning_rate": 2.1723428571428575e-05, + "loss": 0.3811, + "step": 17000 + }, + { + "epoch": 236.25, + "learning_rate": 2.1711999999999998e-05, + "loss": 0.3847, + "step": 17010 + }, + { + "epoch": 236.39, + "learning_rate": 2.170057142857143e-05, + "loss": 0.3803, + "step": 17020 + }, + { + "epoch": 236.53, + "learning_rate": 2.168914285714286e-05, + "loss": 0.3816, + "step": 17030 + }, + { + "epoch": 236.66, + "learning_rate": 2.167771428571429e-05, + "loss": 0.3836, + "step": 17040 + }, + { + "epoch": 236.8, + "learning_rate": 2.1666285714285715e-05, + "loss": 0.377, + "step": 17050 + }, + { + "epoch": 236.94, + "learning_rate": 2.1654857142857145e-05, + "loss": 0.3792, + "step": 17060 + }, + { + "epoch": 237.0, + "eval_loss": 0.5297938585281372, + "eval_runtime": 127.4494, + "eval_samples_per_second": 4.174, + "eval_steps_per_second": 0.526, + "eval_wer": 0.22285787748280517, + "step": 17064 + }, + { + "epoch": 237.08, + "learning_rate": 2.1643428571428572e-05, + "loss": 0.3822, + "step": 17070 + }, + { + "epoch": 237.22, + "learning_rate": 2.1632e-05, + "loss": 0.3792, + "step": 17080 + }, + { + "epoch": 237.36, + "learning_rate": 2.1620571428571432e-05, + "loss": 0.3734, + "step": 17090 + }, + { + "epoch": 237.5, + "learning_rate": 2.1609142857142856e-05, + "loss": 0.3717, + "step": 17100 + }, + { + "epoch": 237.64, + "learning_rate": 2.159771428571429e-05, + "loss": 0.3774, + "step": 17110 + }, + { + "epoch": 237.78, + "learning_rate": 2.1586285714285716e-05, + "loss": 0.3773, + "step": 17120 + }, + { + "epoch": 237.91, + "learning_rate": 2.1574857142857146e-05, + "loss": 0.3791, + "step": 17130 + }, + { + "epoch": 238.0, + "eval_loss": 0.539785623550415, + "eval_runtime": 127.0733, + "eval_samples_per_second": 4.187, + "eval_steps_per_second": 0.527, + "eval_wer": 0.21463007006492255, + "step": 17136 + }, + { + "epoch": 238.06, + "learning_rate": 2.1563428571428573e-05, + "loss": 0.383, + "step": 17140 + }, + { + "epoch": 238.19, + "learning_rate": 2.1552e-05, + "loss": 0.3684, + "step": 17150 + }, + { + "epoch": 238.33, + "learning_rate": 2.154057142857143e-05, + "loss": 0.3665, + "step": 17160 + }, + { + "epoch": 238.47, + "learning_rate": 2.1529142857142857e-05, + "loss": 0.3815, + "step": 17170 + }, + { + "epoch": 238.61, + "learning_rate": 2.151771428571429e-05, + "loss": 0.3755, + "step": 17180 + }, + { + "epoch": 238.75, + "learning_rate": 2.1506285714285713e-05, + "loss": 0.3757, + "step": 17190 + }, + { + "epoch": 238.89, + "learning_rate": 2.1494857142857147e-05, + "loss": 0.3673, + "step": 17200 + }, + { + "epoch": 239.0, + "eval_loss": 0.5475865006446838, + "eval_runtime": 127.6236, + "eval_samples_per_second": 4.169, + "eval_steps_per_second": 0.525, + "eval_wer": 0.2152085877739924, + "step": 17208 + }, + { + "epoch": 239.03, + "learning_rate": 2.1483428571428574e-05, + "loss": 0.3767, + "step": 17210 + }, + { + "epoch": 239.17, + "learning_rate": 2.1472000000000004e-05, + "loss": 0.3712, + "step": 17220 + }, + { + "epoch": 239.3, + "learning_rate": 2.146057142857143e-05, + "loss": 0.3845, + "step": 17230 + }, + { + "epoch": 239.44, + "learning_rate": 2.1449142857142857e-05, + "loss": 0.3722, + "step": 17240 + }, + { + "epoch": 239.58, + "learning_rate": 2.1437714285714287e-05, + "loss": 0.3766, + "step": 17250 + }, + { + "epoch": 239.72, + "learning_rate": 2.1426285714285714e-05, + "loss": 0.3854, + "step": 17260 + }, + { + "epoch": 239.86, + "learning_rate": 2.1414857142857148e-05, + "loss": 0.3791, + "step": 17270 + }, + { + "epoch": 240.0, + "learning_rate": 2.1403428571428574e-05, + "loss": 0.3697, + "step": 17280 + }, + { + "epoch": 240.0, + "eval_loss": 0.5310242176055908, + "eval_runtime": 127.5358, + "eval_samples_per_second": 4.171, + "eval_steps_per_second": 0.525, + "eval_wer": 0.2182940155556984, + "step": 17280 + }, + { + "epoch": 240.14, + "learning_rate": 2.1392000000000005e-05, + "loss": 0.3814, + "step": 17290 + }, + { + "epoch": 240.28, + "learning_rate": 2.138057142857143e-05, + "loss": 0.3737, + "step": 17300 + }, + { + "epoch": 240.42, + "learning_rate": 2.1369142857142858e-05, + "loss": 0.3751, + "step": 17310 + }, + { + "epoch": 240.55, + "learning_rate": 2.1357714285714288e-05, + "loss": 0.3633, + "step": 17320 + }, + { + "epoch": 240.69, + "learning_rate": 2.1346285714285715e-05, + "loss": 0.3752, + "step": 17330 + }, + { + "epoch": 240.83, + "learning_rate": 2.1334857142857145e-05, + "loss": 0.3813, + "step": 17340 + }, + { + "epoch": 240.97, + "learning_rate": 2.1323428571428572e-05, + "loss": 0.3855, + "step": 17350 + }, + { + "epoch": 241.0, + "eval_loss": 0.5410667657852173, + "eval_runtime": 127.4511, + "eval_samples_per_second": 4.174, + "eval_steps_per_second": 0.526, + "eval_wer": 0.22131516359195216, + "step": 17352 + }, + { + "epoch": 241.11, + "learning_rate": 2.1312000000000005e-05, + "loss": 0.3842, + "step": 17360 + }, + { + "epoch": 241.25, + "learning_rate": 2.1300571428571432e-05, + "loss": 0.3719, + "step": 17370 + }, + { + "epoch": 241.39, + "learning_rate": 2.1289142857142855e-05, + "loss": 0.3669, + "step": 17380 + }, + { + "epoch": 241.53, + "learning_rate": 2.127771428571429e-05, + "loss": 0.3697, + "step": 17390 + }, + { + "epoch": 241.66, + "learning_rate": 2.1266285714285716e-05, + "loss": 0.3787, + "step": 17400 + }, + { + "epoch": 241.8, + "learning_rate": 2.1254857142857146e-05, + "loss": 0.3762, + "step": 17410 + }, + { + "epoch": 241.94, + "learning_rate": 2.1243428571428573e-05, + "loss": 0.3775, + "step": 17420 + }, + { + "epoch": 242.0, + "eval_loss": 0.5311770439147949, + "eval_runtime": 127.1239, + "eval_samples_per_second": 4.185, + "eval_steps_per_second": 0.527, + "eval_wer": 0.2183582953011506, + "step": 17424 + }, + { + "epoch": 242.08, + "learning_rate": 2.1232000000000003e-05, + "loss": 0.3688, + "step": 17430 + }, + { + "epoch": 242.22, + "learning_rate": 2.122057142857143e-05, + "loss": 0.3667, + "step": 17440 + }, + { + "epoch": 242.36, + "learning_rate": 2.1209142857142856e-05, + "loss": 0.3672, + "step": 17450 + }, + { + "epoch": 242.5, + "learning_rate": 2.119771428571429e-05, + "loss": 0.3739, + "step": 17460 + }, + { + "epoch": 242.64, + "learning_rate": 2.1186285714285716e-05, + "loss": 0.3708, + "step": 17470 + }, + { + "epoch": 242.78, + "learning_rate": 2.1174857142857147e-05, + "loss": 0.3725, + "step": 17480 + }, + { + "epoch": 242.91, + "learning_rate": 2.1163428571428573e-05, + "loss": 0.3789, + "step": 17490 + }, + { + "epoch": 243.0, + "eval_loss": 0.5228763222694397, + "eval_runtime": 127.1414, + "eval_samples_per_second": 4.184, + "eval_steps_per_second": 0.527, + "eval_wer": 0.21565854599215786, + "step": 17496 + }, + { + "epoch": 243.06, + "learning_rate": 2.1152000000000003e-05, + "loss": 0.3899, + "step": 17500 + }, + { + "epoch": 243.19, + "learning_rate": 2.114057142857143e-05, + "loss": 0.361, + "step": 17510 + }, + { + "epoch": 243.33, + "learning_rate": 2.1129142857142857e-05, + "loss": 0.3783, + "step": 17520 + }, + { + "epoch": 243.47, + "learning_rate": 2.1117714285714287e-05, + "loss": 0.3716, + "step": 17530 + }, + { + "epoch": 243.61, + "learning_rate": 2.1106285714285714e-05, + "loss": 0.3682, + "step": 17540 + }, + { + "epoch": 243.75, + "learning_rate": 2.1094857142857147e-05, + "loss": 0.3562, + "step": 17550 + }, + { + "epoch": 243.89, + "learning_rate": 2.1083428571428574e-05, + "loss": 0.3733, + "step": 17560 + }, + { + "epoch": 244.0, + "eval_loss": 0.5239570140838623, + "eval_runtime": 127.2839, + "eval_samples_per_second": 4.18, + "eval_steps_per_second": 0.526, + "eval_wer": 0.2182940155556984, + "step": 17568 + }, + { + "epoch": 244.03, + "learning_rate": 2.1072000000000004e-05, + "loss": 0.3958, + "step": 17570 + }, + { + "epoch": 244.17, + "learning_rate": 2.106057142857143e-05, + "loss": 0.3679, + "step": 17580 + }, + { + "epoch": 244.3, + "learning_rate": 2.1049142857142858e-05, + "loss": 0.3655, + "step": 17590 + }, + { + "epoch": 244.44, + "learning_rate": 2.1037714285714288e-05, + "loss": 0.3695, + "step": 17600 + }, + { + "epoch": 244.58, + "learning_rate": 2.1026285714285715e-05, + "loss": 0.3638, + "step": 17610 + }, + { + "epoch": 244.72, + "learning_rate": 2.1014857142857145e-05, + "loss": 0.3743, + "step": 17620 + }, + { + "epoch": 244.86, + "learning_rate": 2.100342857142857e-05, + "loss": 0.3629, + "step": 17630 + }, + { + "epoch": 245.0, + "learning_rate": 2.0992000000000005e-05, + "loss": 0.3632, + "step": 17640 + }, + { + "epoch": 245.0, + "eval_loss": 0.5427106618881226, + "eval_runtime": 126.9592, + "eval_samples_per_second": 4.19, + "eval_steps_per_second": 0.528, + "eval_wer": 0.21951533071929036, + "step": 17640 + }, + { + "epoch": 245.14, + "learning_rate": 2.0980571428571432e-05, + "loss": 0.3745, + "step": 17650 + }, + { + "epoch": 245.28, + "learning_rate": 2.0969142857142855e-05, + "loss": 0.3814, + "step": 17660 + }, + { + "epoch": 245.42, + "learning_rate": 2.095771428571429e-05, + "loss": 0.3704, + "step": 17670 + }, + { + "epoch": 245.55, + "learning_rate": 2.0946285714285715e-05, + "loss": 0.3802, + "step": 17680 + }, + { + "epoch": 245.69, + "learning_rate": 2.0934857142857146e-05, + "loss": 0.3632, + "step": 17690 + }, + { + "epoch": 245.83, + "learning_rate": 2.0923428571428572e-05, + "loss": 0.3597, + "step": 17700 + }, + { + "epoch": 245.97, + "learning_rate": 2.0912000000000002e-05, + "loss": 0.3716, + "step": 17710 + }, + { + "epoch": 246.0, + "eval_loss": 0.52333664894104, + "eval_runtime": 126.6309, + "eval_samples_per_second": 4.201, + "eval_steps_per_second": 0.529, + "eval_wer": 0.21694414090120204, + "step": 17712 + }, + { + "epoch": 246.11, + "learning_rate": 2.090057142857143e-05, + "loss": 0.3573, + "step": 17720 + }, + { + "epoch": 246.25, + "learning_rate": 2.0889142857142856e-05, + "loss": 0.3728, + "step": 17730 + }, + { + "epoch": 246.39, + "learning_rate": 2.087771428571429e-05, + "loss": 0.364, + "step": 17740 + }, + { + "epoch": 246.53, + "learning_rate": 2.0866285714285716e-05, + "loss": 0.368, + "step": 17750 + }, + { + "epoch": 246.66, + "learning_rate": 2.0854857142857146e-05, + "loss": 0.3642, + "step": 17760 + }, + { + "epoch": 246.8, + "learning_rate": 2.0843428571428573e-05, + "loss": 0.3624, + "step": 17770 + }, + { + "epoch": 246.94, + "learning_rate": 2.0832000000000003e-05, + "loss": 0.3773, + "step": 17780 + }, + { + "epoch": 247.0, + "eval_loss": 0.5474402904510498, + "eval_runtime": 127.2514, + "eval_samples_per_second": 4.181, + "eval_steps_per_second": 0.527, + "eval_wer": 0.21488718904673137, + "step": 17784 + }, + { + "epoch": 247.08, + "learning_rate": 2.082057142857143e-05, + "loss": 0.3685, + "step": 17790 + }, + { + "epoch": 247.22, + "learning_rate": 2.0809142857142857e-05, + "loss": 0.3626, + "step": 17800 + }, + { + "epoch": 247.36, + "learning_rate": 2.0797714285714287e-05, + "loss": 0.366, + "step": 17810 + }, + { + "epoch": 247.5, + "learning_rate": 2.0786285714285714e-05, + "loss": 0.3605, + "step": 17820 + }, + { + "epoch": 247.64, + "learning_rate": 2.0774857142857147e-05, + "loss": 0.3599, + "step": 17830 + }, + { + "epoch": 247.78, + "learning_rate": 2.0763428571428574e-05, + "loss": 0.3649, + "step": 17840 + }, + { + "epoch": 247.91, + "learning_rate": 2.0752000000000004e-05, + "loss": 0.3736, + "step": 17850 + }, + { + "epoch": 248.0, + "eval_loss": 0.551371157169342, + "eval_runtime": 127.1921, + "eval_samples_per_second": 4.183, + "eval_steps_per_second": 0.527, + "eval_wer": 0.2263932634826766, + "step": 17856 + }, + { + "epoch": 248.06, + "learning_rate": 2.074057142857143e-05, + "loss": 0.3745, + "step": 17860 + }, + { + "epoch": 248.19, + "learning_rate": 2.072914285714286e-05, + "loss": 0.3715, + "step": 17870 + }, + { + "epoch": 248.33, + "learning_rate": 2.0717714285714288e-05, + "loss": 0.3635, + "step": 17880 + }, + { + "epoch": 248.47, + "learning_rate": 2.0706285714285714e-05, + "loss": 0.375, + "step": 17890 + }, + { + "epoch": 248.61, + "learning_rate": 2.0694857142857144e-05, + "loss": 0.3646, + "step": 17900 + }, + { + "epoch": 248.75, + "learning_rate": 2.068342857142857e-05, + "loss": 0.3685, + "step": 17910 + }, + { + "epoch": 248.89, + "learning_rate": 2.0672000000000005e-05, + "loss": 0.3635, + "step": 17920 + }, + { + "epoch": 249.0, + "eval_loss": 0.5074180364608765, + "eval_runtime": 127.0945, + "eval_samples_per_second": 4.186, + "eval_steps_per_second": 0.527, + "eval_wer": 0.21867969402841164, + "step": 17928 + }, + { + "epoch": 249.03, + "learning_rate": 2.066057142857143e-05, + "loss": 0.3718, + "step": 17930 + }, + { + "epoch": 249.17, + "learning_rate": 2.064914285714286e-05, + "loss": 0.3672, + "step": 17940 + }, + { + "epoch": 249.3, + "learning_rate": 2.063771428571429e-05, + "loss": 0.3569, + "step": 17950 + }, + { + "epoch": 249.44, + "learning_rate": 2.0626285714285715e-05, + "loss": 0.3723, + "step": 17960 + }, + { + "epoch": 249.58, + "learning_rate": 2.0614857142857145e-05, + "loss": 0.3632, + "step": 17970 + }, + { + "epoch": 249.72, + "learning_rate": 2.0603428571428572e-05, + "loss": 0.376, + "step": 17980 + }, + { + "epoch": 249.86, + "learning_rate": 2.0592000000000002e-05, + "loss": 0.3599, + "step": 17990 + }, + { + "epoch": 250.0, + "learning_rate": 2.058057142857143e-05, + "loss": 0.3746, + "step": 18000 + }, + { + "epoch": 250.0, + "eval_loss": 0.5194135904312134, + "eval_runtime": 126.8277, + "eval_samples_per_second": 4.195, + "eval_steps_per_second": 0.528, + "eval_wer": 0.21925821173748153, + "step": 18000 + }, + { + "epoch": 250.14, + "learning_rate": 2.0569142857142862e-05, + "loss": 0.3784, + "step": 18010 + }, + { + "epoch": 250.28, + "learning_rate": 2.055771428571429e-05, + "loss": 0.3631, + "step": 18020 + }, + { + "epoch": 250.42, + "learning_rate": 2.0546285714285716e-05, + "loss": 0.3666, + "step": 18030 + }, + { + "epoch": 250.55, + "learning_rate": 2.0534857142857146e-05, + "loss": 0.3698, + "step": 18040 + }, + { + "epoch": 250.69, + "learning_rate": 2.0523428571428573e-05, + "loss": 0.3842, + "step": 18050 + }, + { + "epoch": 250.83, + "learning_rate": 2.0512000000000003e-05, + "loss": 0.3751, + "step": 18060 + }, + { + "epoch": 250.97, + "learning_rate": 2.050057142857143e-05, + "loss": 0.381, + "step": 18070 + }, + { + "epoch": 251.0, + "eval_loss": 0.5410602688789368, + "eval_runtime": 127.1031, + "eval_samples_per_second": 4.186, + "eval_steps_per_second": 0.527, + "eval_wer": 0.21932249148293373, + "step": 18072 + }, + { + "epoch": 251.11, + "learning_rate": 2.048914285714286e-05, + "loss": 0.3734, + "step": 18080 + }, + { + "epoch": 251.25, + "learning_rate": 2.0477714285714286e-05, + "loss": 0.3835, + "step": 18090 + }, + { + "epoch": 251.39, + "learning_rate": 2.0466285714285713e-05, + "loss": 0.371, + "step": 18100 + }, + { + "epoch": 251.53, + "learning_rate": 2.0454857142857147e-05, + "loss": 0.3632, + "step": 18110 + }, + { + "epoch": 251.66, + "learning_rate": 2.0443428571428573e-05, + "loss": 0.3697, + "step": 18120 + }, + { + "epoch": 251.8, + "learning_rate": 2.0432000000000004e-05, + "loss": 0.3577, + "step": 18130 + }, + { + "epoch": 251.94, + "learning_rate": 2.042057142857143e-05, + "loss": 0.3762, + "step": 18140 + }, + { + "epoch": 252.0, + "eval_loss": 0.5317391753196716, + "eval_runtime": 126.6971, + "eval_samples_per_second": 4.199, + "eval_steps_per_second": 0.529, + "eval_wer": 0.2152085877739924, + "step": 18144 + }, + { + "epoch": 252.08, + "learning_rate": 2.040914285714286e-05, + "loss": 0.3649, + "step": 18150 + }, + { + "epoch": 252.22, + "learning_rate": 2.0397714285714287e-05, + "loss": 0.3568, + "step": 18160 + }, + { + "epoch": 252.36, + "learning_rate": 2.0386285714285714e-05, + "loss": 0.3589, + "step": 18170 + }, + { + "epoch": 252.5, + "learning_rate": 2.0374857142857144e-05, + "loss": 0.3588, + "step": 18180 + }, + { + "epoch": 252.64, + "learning_rate": 2.036342857142857e-05, + "loss": 0.369, + "step": 18190 + }, + { + "epoch": 252.78, + "learning_rate": 2.0352000000000004e-05, + "loss": 0.3783, + "step": 18200 + }, + { + "epoch": 252.91, + "learning_rate": 2.034057142857143e-05, + "loss": 0.3765, + "step": 18210 + }, + { + "epoch": 253.0, + "eval_loss": 0.5382375121116638, + "eval_runtime": 126.5891, + "eval_samples_per_second": 4.203, + "eval_steps_per_second": 0.529, + "eval_wer": 0.21630134344667995, + "step": 18216 + }, + { + "epoch": 253.06, + "learning_rate": 2.032914285714286e-05, + "loss": 0.3659, + "step": 18220 + }, + { + "epoch": 253.19, + "learning_rate": 2.0317714285714288e-05, + "loss": 0.3708, + "step": 18230 + }, + { + "epoch": 253.33, + "learning_rate": 2.0306285714285715e-05, + "loss": 0.3644, + "step": 18240 + }, + { + "epoch": 253.47, + "learning_rate": 2.0294857142857145e-05, + "loss": 0.3636, + "step": 18250 + }, + { + "epoch": 253.61, + "learning_rate": 2.028342857142857e-05, + "loss": 0.3588, + "step": 18260 + }, + { + "epoch": 253.75, + "learning_rate": 2.0272000000000002e-05, + "loss": 0.3673, + "step": 18270 + }, + { + "epoch": 253.89, + "learning_rate": 2.026057142857143e-05, + "loss": 0.3562, + "step": 18280 + }, + { + "epoch": 254.0, + "eval_loss": 0.5186808705329895, + "eval_runtime": 127.1972, + "eval_samples_per_second": 4.182, + "eval_steps_per_second": 0.527, + "eval_wer": 0.21810117631934178, + "step": 18288 + }, + { + "epoch": 254.03, + "learning_rate": 2.0249142857142862e-05, + "loss": 0.3845, + "step": 18290 + }, + { + "epoch": 254.17, + "learning_rate": 2.023771428571429e-05, + "loss": 0.358, + "step": 18300 + }, + { + "epoch": 254.3, + "learning_rate": 2.0226285714285715e-05, + "loss": 0.3647, + "step": 18310 + }, + { + "epoch": 254.44, + "learning_rate": 2.0214857142857146e-05, + "loss": 0.3598, + "step": 18320 + }, + { + "epoch": 254.58, + "learning_rate": 2.0203428571428572e-05, + "loss": 0.3679, + "step": 18330 + }, + { + "epoch": 254.72, + "learning_rate": 2.0192000000000003e-05, + "loss": 0.3694, + "step": 18340 + }, + { + "epoch": 254.86, + "learning_rate": 2.018057142857143e-05, + "loss": 0.3714, + "step": 18350 + }, + { + "epoch": 255.0, + "learning_rate": 2.016914285714286e-05, + "loss": 0.3697, + "step": 18360 + }, + { + "epoch": 255.0, + "eval_loss": 0.5303229689598083, + "eval_runtime": 126.8978, + "eval_samples_per_second": 4.192, + "eval_steps_per_second": 0.528, + "eval_wer": 0.21777977759208073, + "step": 18360 + }, + { + "epoch": 255.14, + "learning_rate": 2.0157714285714286e-05, + "loss": 0.3713, + "step": 18370 + }, + { + "epoch": 255.28, + "learning_rate": 2.0146285714285713e-05, + "loss": 0.3725, + "step": 18380 + }, + { + "epoch": 255.42, + "learning_rate": 2.0134857142857146e-05, + "loss": 0.3864, + "step": 18390 + }, + { + "epoch": 255.55, + "learning_rate": 2.0123428571428573e-05, + "loss": 0.3863, + "step": 18400 + }, + { + "epoch": 255.69, + "learning_rate": 2.0112000000000003e-05, + "loss": 0.3753, + "step": 18410 + }, + { + "epoch": 255.83, + "learning_rate": 2.010057142857143e-05, + "loss": 0.3759, + "step": 18420 + }, + { + "epoch": 255.97, + "learning_rate": 2.008914285714286e-05, + "loss": 0.3693, + "step": 18430 + }, + { + "epoch": 256.0, + "eval_loss": 0.5515403151512146, + "eval_runtime": 126.9666, + "eval_samples_per_second": 4.19, + "eval_steps_per_second": 0.528, + "eval_wer": 0.22060808639197788, + "step": 18432 + }, + { + "epoch": 256.11, + "learning_rate": 2.0077714285714287e-05, + "loss": 0.3638, + "step": 18440 + }, + { + "epoch": 256.25, + "learning_rate": 2.0066285714285717e-05, + "loss": 0.3735, + "step": 18450 + }, + { + "epoch": 256.39, + "learning_rate": 2.0054857142857144e-05, + "loss": 0.3553, + "step": 18460 + }, + { + "epoch": 256.53, + "learning_rate": 2.004342857142857e-05, + "loss": 0.374, + "step": 18470 + }, + { + "epoch": 256.66, + "learning_rate": 2.0032000000000004e-05, + "loss": 0.3697, + "step": 18480 + }, + { + "epoch": 256.8, + "learning_rate": 2.002057142857143e-05, + "loss": 0.3592, + "step": 18490 + }, + { + "epoch": 256.94, + "learning_rate": 2.000914285714286e-05, + "loss": 0.3691, + "step": 18500 + }, + { + "epoch": 257.0, + "eval_loss": 0.524605929851532, + "eval_runtime": 126.5804, + "eval_samples_per_second": 4.203, + "eval_steps_per_second": 0.529, + "eval_wer": 0.2183582953011506, + "step": 18504 + }, + { + "epoch": 257.08, + "learning_rate": 1.9997714285714288e-05, + "loss": 0.3715, + "step": 18510 + }, + { + "epoch": 257.22, + "learning_rate": 1.9986285714285714e-05, + "loss": 0.3676, + "step": 18520 + }, + { + "epoch": 257.36, + "learning_rate": 1.9974857142857145e-05, + "loss": 0.3593, + "step": 18530 + }, + { + "epoch": 257.5, + "learning_rate": 1.9963428571428575e-05, + "loss": 0.3599, + "step": 18540 + }, + { + "epoch": 257.64, + "learning_rate": 1.9952e-05, + "loss": 0.3556, + "step": 18550 + }, + { + "epoch": 257.78, + "learning_rate": 1.9940571428571428e-05, + "loss": 0.3667, + "step": 18560 + }, + { + "epoch": 257.91, + "learning_rate": 1.9929142857142858e-05, + "loss": 0.3473, + "step": 18570 + }, + { + "epoch": 258.0, + "eval_loss": 0.5581291317939758, + "eval_runtime": 126.9248, + "eval_samples_per_second": 4.191, + "eval_steps_per_second": 0.528, + "eval_wer": 0.2159156649739667, + "step": 18576 + }, + { + "epoch": 258.06, + "learning_rate": 1.991771428571429e-05, + "loss": 0.3741, + "step": 18580 + }, + { + "epoch": 258.19, + "learning_rate": 1.9906285714285715e-05, + "loss": 0.3607, + "step": 18590 + }, + { + "epoch": 258.33, + "learning_rate": 1.9894857142857145e-05, + "loss": 0.3493, + "step": 18600 + }, + { + "epoch": 258.47, + "learning_rate": 1.9883428571428572e-05, + "loss": 0.3548, + "step": 18610 + }, + { + "epoch": 258.61, + "learning_rate": 1.9872000000000002e-05, + "loss": 0.3521, + "step": 18620 + }, + { + "epoch": 258.75, + "learning_rate": 1.9860571428571432e-05, + "loss": 0.3591, + "step": 18630 + }, + { + "epoch": 258.89, + "learning_rate": 1.984914285714286e-05, + "loss": 0.3622, + "step": 18640 + }, + { + "epoch": 259.0, + "eval_loss": 0.5329124927520752, + "eval_runtime": 126.9512, + "eval_samples_per_second": 4.191, + "eval_steps_per_second": 0.528, + "eval_wer": 0.21996528893745582, + "step": 18648 + }, + { + "epoch": 259.03, + "learning_rate": 1.9837714285714286e-05, + "loss": 0.3611, + "step": 18650 + }, + { + "epoch": 259.17, + "learning_rate": 1.9826285714285716e-05, + "loss": 0.3542, + "step": 18660 + }, + { + "epoch": 259.3, + "learning_rate": 1.9814857142857146e-05, + "loss": 0.3711, + "step": 18670 + }, + { + "epoch": 259.44, + "learning_rate": 1.9803428571428573e-05, + "loss": 0.3646, + "step": 18680 + }, + { + "epoch": 259.58, + "learning_rate": 1.9792000000000003e-05, + "loss": 0.3659, + "step": 18690 + }, + { + "epoch": 259.72, + "learning_rate": 1.978057142857143e-05, + "loss": 0.3672, + "step": 18700 + }, + { + "epoch": 259.86, + "learning_rate": 1.9769142857142856e-05, + "loss": 0.3544, + "step": 18710 + }, + { + "epoch": 260.0, + "learning_rate": 1.9757714285714287e-05, + "loss": 0.3677, + "step": 18720 + }, + { + "epoch": 260.0, + "eval_loss": 0.539287805557251, + "eval_runtime": 127.4006, + "eval_samples_per_second": 4.176, + "eval_steps_per_second": 0.526, + "eval_wer": 0.21810117631934178, + "step": 18720 + }, + { + "epoch": 260.14, + "learning_rate": 1.9746285714285717e-05, + "loss": 0.3627, + "step": 18730 + }, + { + "epoch": 260.28, + "learning_rate": 1.9734857142857143e-05, + "loss": 0.36, + "step": 18740 + }, + { + "epoch": 260.42, + "learning_rate": 1.9723428571428574e-05, + "loss": 0.3572, + "step": 18750 + }, + { + "epoch": 260.55, + "learning_rate": 1.9712000000000004e-05, + "loss": 0.3533, + "step": 18760 + }, + { + "epoch": 260.69, + "learning_rate": 1.970057142857143e-05, + "loss": 0.3561, + "step": 18770 + }, + { + "epoch": 260.83, + "learning_rate": 1.9689142857142857e-05, + "loss": 0.3552, + "step": 18780 + }, + { + "epoch": 260.97, + "learning_rate": 1.9677714285714287e-05, + "loss": 0.3593, + "step": 18790 + }, + { + "epoch": 261.0, + "eval_loss": 0.5371309518814087, + "eval_runtime": 126.9581, + "eval_samples_per_second": 4.19, + "eval_steps_per_second": 0.528, + "eval_wer": 0.2247862698463714, + "step": 18792 + }, + { + "epoch": 261.11, + "learning_rate": 1.9666285714285714e-05, + "loss": 0.3667, + "step": 18800 + }, + { + "epoch": 261.25, + "learning_rate": 1.9654857142857144e-05, + "loss": 0.3562, + "step": 18810 + }, + { + "epoch": 261.39, + "learning_rate": 1.9643428571428574e-05, + "loss": 0.3569, + "step": 18820 + }, + { + "epoch": 261.53, + "learning_rate": 1.9632e-05, + "loss": 0.3616, + "step": 18830 + }, + { + "epoch": 261.66, + "learning_rate": 1.962057142857143e-05, + "loss": 0.3511, + "step": 18840 + }, + { + "epoch": 261.8, + "learning_rate": 1.9609142857142858e-05, + "loss": 0.3633, + "step": 18850 + }, + { + "epoch": 261.94, + "learning_rate": 1.9597714285714288e-05, + "loss": 0.3623, + "step": 18860 + }, + { + "epoch": 262.0, + "eval_loss": 0.5376772880554199, + "eval_runtime": 128.7807, + "eval_samples_per_second": 4.131, + "eval_steps_per_second": 0.52, + "eval_wer": 0.21559426624670566, + "step": 18864 + }, + { + "epoch": 262.08, + "learning_rate": 1.9586285714285715e-05, + "loss": 0.3692, + "step": 18870 + }, + { + "epoch": 262.22, + "learning_rate": 1.9574857142857145e-05, + "loss": 0.3574, + "step": 18880 + }, + { + "epoch": 262.36, + "learning_rate": 1.9563428571428572e-05, + "loss": 0.3533, + "step": 18890 + }, + { + "epoch": 262.5, + "learning_rate": 1.9552000000000002e-05, + "loss": 0.3591, + "step": 18900 + }, + { + "epoch": 262.64, + "learning_rate": 1.9540571428571432e-05, + "loss": 0.3548, + "step": 18910 + }, + { + "epoch": 262.78, + "learning_rate": 1.952914285714286e-05, + "loss": 0.3616, + "step": 18920 + }, + { + "epoch": 262.91, + "learning_rate": 1.9517714285714285e-05, + "loss": 0.364, + "step": 18930 + }, + { + "epoch": 263.0, + "eval_loss": 0.528795599937439, + "eval_runtime": 126.9855, + "eval_samples_per_second": 4.189, + "eval_steps_per_second": 0.528, + "eval_wer": 0.2198367294465514, + "step": 18936 + }, + { + "epoch": 263.06, + "learning_rate": 1.9506285714285716e-05, + "loss": 0.3604, + "step": 18940 + }, + { + "epoch": 263.19, + "learning_rate": 1.9494857142857146e-05, + "loss": 0.3568, + "step": 18950 + }, + { + "epoch": 263.33, + "learning_rate": 1.9483428571428572e-05, + "loss": 0.3486, + "step": 18960 + }, + { + "epoch": 263.47, + "learning_rate": 1.9472000000000003e-05, + "loss": 0.3509, + "step": 18970 + }, + { + "epoch": 263.61, + "learning_rate": 1.946057142857143e-05, + "loss": 0.3503, + "step": 18980 + }, + { + "epoch": 263.75, + "learning_rate": 1.944914285714286e-05, + "loss": 0.3699, + "step": 18990 + }, + { + "epoch": 263.89, + "learning_rate": 1.9437714285714286e-05, + "loss": 0.3625, + "step": 19000 + }, + { + "epoch": 264.0, + "eval_loss": 0.5822650194168091, + "eval_runtime": 128.8366, + "eval_samples_per_second": 4.129, + "eval_steps_per_second": 0.52, + "eval_wer": 0.223114996464614, + "step": 19008 + }, + { + "epoch": 264.03, + "learning_rate": 1.9426285714285716e-05, + "loss": 0.373, + "step": 19010 + }, + { + "epoch": 264.17, + "learning_rate": 1.9414857142857143e-05, + "loss": 0.3642, + "step": 19020 + }, + { + "epoch": 264.3, + "learning_rate": 1.9403428571428573e-05, + "loss": 0.3596, + "step": 19030 + }, + { + "epoch": 264.44, + "learning_rate": 1.9392000000000003e-05, + "loss": 0.3698, + "step": 19040 + }, + { + "epoch": 264.58, + "learning_rate": 1.938057142857143e-05, + "loss": 0.3577, + "step": 19050 + }, + { + "epoch": 264.72, + "learning_rate": 1.936914285714286e-05, + "loss": 0.3605, + "step": 19060 + }, + { + "epoch": 264.86, + "learning_rate": 1.9358857142857142e-05, + "loss": 0.357, + "step": 19070 + }, + { + "epoch": 265.0, + "learning_rate": 1.9347428571428572e-05, + "loss": 0.3667, + "step": 19080 + }, + { + "epoch": 265.0, + "eval_loss": 0.524042546749115, + "eval_runtime": 126.7057, + "eval_samples_per_second": 4.199, + "eval_steps_per_second": 0.529, + "eval_wer": 0.22022240791926465, + "step": 19080 + }, + { + "epoch": 265.14, + "learning_rate": 1.9336000000000003e-05, + "loss": 0.3678, + "step": 19090 + }, + { + "epoch": 265.28, + "learning_rate": 1.932457142857143e-05, + "loss": 0.3707, + "step": 19100 + }, + { + "epoch": 265.42, + "learning_rate": 1.931314285714286e-05, + "loss": 0.3548, + "step": 19110 + }, + { + "epoch": 265.55, + "learning_rate": 1.930171428571429e-05, + "loss": 0.3551, + "step": 19120 + }, + { + "epoch": 265.69, + "learning_rate": 1.9290285714285716e-05, + "loss": 0.3801, + "step": 19130 + }, + { + "epoch": 265.83, + "learning_rate": 1.9278857142857143e-05, + "loss": 0.3518, + "step": 19140 + }, + { + "epoch": 265.97, + "learning_rate": 1.9267428571428573e-05, + "loss": 0.3703, + "step": 19150 + }, + { + "epoch": 266.0, + "eval_loss": 0.5182125568389893, + "eval_runtime": 127.5664, + "eval_samples_per_second": 4.17, + "eval_steps_per_second": 0.525, + "eval_wer": 0.21373015362859163, + "step": 19152 + }, + { + "epoch": 266.11, + "learning_rate": 1.9256e-05, + "loss": 0.3655, + "step": 19160 + }, + { + "epoch": 266.25, + "learning_rate": 1.924457142857143e-05, + "loss": 0.3621, + "step": 19170 + }, + { + "epoch": 266.39, + "learning_rate": 1.923314285714286e-05, + "loss": 0.3555, + "step": 19180 + }, + { + "epoch": 266.53, + "learning_rate": 1.9221714285714287e-05, + "loss": 0.3666, + "step": 19190 + }, + { + "epoch": 266.66, + "learning_rate": 1.9210285714285717e-05, + "loss": 0.3609, + "step": 19200 + }, + { + "epoch": 266.8, + "learning_rate": 1.9198857142857144e-05, + "loss": 0.3512, + "step": 19210 + }, + { + "epoch": 266.94, + "learning_rate": 1.9187428571428574e-05, + "loss": 0.3646, + "step": 19220 + }, + { + "epoch": 267.0, + "eval_loss": 0.5210974216461182, + "eval_runtime": 128.3173, + "eval_samples_per_second": 4.146, + "eval_steps_per_second": 0.522, + "eval_wer": 0.2253647875554413, + "step": 19224 + }, + { + "epoch": 267.08, + "learning_rate": 1.9176e-05, + "loss": 0.3745, + "step": 19230 + }, + { + "epoch": 267.22, + "learning_rate": 1.916457142857143e-05, + "loss": 0.3551, + "step": 19240 + }, + { + "epoch": 267.36, + "learning_rate": 1.9153142857142858e-05, + "loss": 0.3442, + "step": 19250 + }, + { + "epoch": 267.5, + "learning_rate": 1.9141714285714288e-05, + "loss": 0.3627, + "step": 19260 + }, + { + "epoch": 267.64, + "learning_rate": 1.9130285714285718e-05, + "loss": 0.3623, + "step": 19270 + }, + { + "epoch": 267.78, + "learning_rate": 1.9118857142857145e-05, + "loss": 0.3599, + "step": 19280 + }, + { + "epoch": 267.91, + "learning_rate": 1.910742857142857e-05, + "loss": 0.3724, + "step": 19290 + }, + { + "epoch": 268.0, + "eval_loss": 0.5475848317146301, + "eval_runtime": 126.8228, + "eval_samples_per_second": 4.195, + "eval_steps_per_second": 0.528, + "eval_wer": 0.21552998650125346, + "step": 19296 + }, + { + "epoch": 268.06, + "learning_rate": 1.9096e-05, + "loss": 0.3527, + "step": 19300 + }, + { + "epoch": 268.19, + "learning_rate": 1.908457142857143e-05, + "loss": 0.3585, + "step": 19310 + }, + { + "epoch": 268.33, + "learning_rate": 1.907314285714286e-05, + "loss": 0.3658, + "step": 19320 + }, + { + "epoch": 268.47, + "learning_rate": 1.906171428571429e-05, + "loss": 0.3594, + "step": 19330 + }, + { + "epoch": 268.61, + "learning_rate": 1.9050285714285715e-05, + "loss": 0.3521, + "step": 19340 + }, + { + "epoch": 268.75, + "learning_rate": 1.9038857142857142e-05, + "loss": 0.3736, + "step": 19350 + }, + { + "epoch": 268.89, + "learning_rate": 1.9027428571428572e-05, + "loss": 0.3767, + "step": 19360 + }, + { + "epoch": 269.0, + "eval_loss": 0.5431725978851318, + "eval_runtime": 126.9814, + "eval_samples_per_second": 4.19, + "eval_steps_per_second": 0.528, + "eval_wer": 0.2184225750466028, + "step": 19368 + }, + { + "epoch": 269.03, + "learning_rate": 1.9016000000000002e-05, + "loss": 0.37, + "step": 19370 + }, + { + "epoch": 269.17, + "learning_rate": 1.900457142857143e-05, + "loss": 0.3706, + "step": 19380 + }, + { + "epoch": 269.3, + "learning_rate": 1.899314285714286e-05, + "loss": 0.3595, + "step": 19390 + }, + { + "epoch": 269.44, + "learning_rate": 1.898171428571429e-05, + "loss": 0.3617, + "step": 19400 + }, + { + "epoch": 269.58, + "learning_rate": 1.8970285714285716e-05, + "loss": 0.3511, + "step": 19410 + }, + { + "epoch": 269.72, + "learning_rate": 1.8958857142857146e-05, + "loss": 0.3618, + "step": 19420 + }, + { + "epoch": 269.86, + "learning_rate": 1.8947428571428573e-05, + "loss": 0.368, + "step": 19430 + }, + { + "epoch": 270.0, + "learning_rate": 1.8936e-05, + "loss": 0.3732, + "step": 19440 + }, + { + "epoch": 270.0, + "eval_loss": 0.5332251191139221, + "eval_runtime": 127.2781, + "eval_samples_per_second": 4.18, + "eval_steps_per_second": 0.526, + "eval_wer": 0.21597994471941892, + "step": 19440 + }, + { + "epoch": 270.14, + "learning_rate": 1.892457142857143e-05, + "loss": 0.362, + "step": 19450 + }, + { + "epoch": 270.28, + "learning_rate": 1.891314285714286e-05, + "loss": 0.366, + "step": 19460 + }, + { + "epoch": 270.42, + "learning_rate": 1.8901714285714287e-05, + "loss": 0.3726, + "step": 19470 + }, + { + "epoch": 270.55, + "learning_rate": 1.8890285714285717e-05, + "loss": 0.3604, + "step": 19480 + }, + { + "epoch": 270.69, + "learning_rate": 1.8878857142857147e-05, + "loss": 0.3519, + "step": 19490 + }, + { + "epoch": 270.83, + "learning_rate": 1.8867428571428574e-05, + "loss": 0.3619, + "step": 19500 + }, + { + "epoch": 270.97, + "learning_rate": 1.8856e-05, + "loss": 0.3511, + "step": 19510 + }, + { + "epoch": 271.0, + "eval_loss": 0.5079948902130127, + "eval_runtime": 127.6184, + "eval_samples_per_second": 4.169, + "eval_steps_per_second": 0.525, + "eval_wer": 0.21546570675580123, + "step": 19512 + }, + { + "epoch": 271.11, + "learning_rate": 1.884457142857143e-05, + "loss": 0.3501, + "step": 19520 + }, + { + "epoch": 271.25, + "learning_rate": 1.8833142857142857e-05, + "loss": 0.3549, + "step": 19530 + }, + { + "epoch": 271.39, + "learning_rate": 1.8821714285714287e-05, + "loss": 0.3494, + "step": 19540 + }, + { + "epoch": 271.53, + "learning_rate": 1.8810285714285718e-05, + "loss": 0.3528, + "step": 19550 + }, + { + "epoch": 271.66, + "learning_rate": 1.8798857142857144e-05, + "loss": 0.3547, + "step": 19560 + }, + { + "epoch": 271.8, + "learning_rate": 1.878742857142857e-05, + "loss": 0.3627, + "step": 19570 + }, + { + "epoch": 271.94, + "learning_rate": 1.8776e-05, + "loss": 0.3611, + "step": 19580 + }, + { + "epoch": 272.0, + "eval_loss": 0.5135419964790344, + "eval_runtime": 127.2161, + "eval_samples_per_second": 4.182, + "eval_steps_per_second": 0.527, + "eval_wer": 0.2152085877739924, + "step": 19584 + }, + { + "epoch": 272.08, + "learning_rate": 1.876457142857143e-05, + "loss": 0.3659, + "step": 19590 + }, + { + "epoch": 272.22, + "learning_rate": 1.8753142857142858e-05, + "loss": 0.365, + "step": 19600 + }, + { + "epoch": 272.36, + "learning_rate": 1.8741714285714288e-05, + "loss": 0.3593, + "step": 19610 + }, + { + "epoch": 272.5, + "learning_rate": 1.8730285714285715e-05, + "loss": 0.361, + "step": 19620 + }, + { + "epoch": 272.64, + "learning_rate": 1.8718857142857145e-05, + "loss": 0.3517, + "step": 19630 + }, + { + "epoch": 272.78, + "learning_rate": 1.8707428571428572e-05, + "loss": 0.3576, + "step": 19640 + }, + { + "epoch": 272.91, + "learning_rate": 1.8696000000000002e-05, + "loss": 0.3644, + "step": 19650 + }, + { + "epoch": 273.0, + "eval_loss": 0.5191617012023926, + "eval_runtime": 128.3341, + "eval_samples_per_second": 4.145, + "eval_steps_per_second": 0.522, + "eval_wer": 0.21225171948319085, + "step": 19656 + }, + { + "epoch": 273.06, + "learning_rate": 1.868457142857143e-05, + "loss": 0.3625, + "step": 19660 + }, + { + "epoch": 273.19, + "learning_rate": 1.867314285714286e-05, + "loss": 0.3509, + "step": 19670 + }, + { + "epoch": 273.33, + "learning_rate": 1.866171428571429e-05, + "loss": 0.346, + "step": 19680 + }, + { + "epoch": 273.47, + "learning_rate": 1.8650285714285716e-05, + "loss": 0.3687, + "step": 19690 + }, + { + "epoch": 273.61, + "learning_rate": 1.8638857142857146e-05, + "loss": 0.3559, + "step": 19700 + }, + { + "epoch": 273.75, + "learning_rate": 1.8627428571428573e-05, + "loss": 0.353, + "step": 19710 + }, + { + "epoch": 273.89, + "learning_rate": 1.8616e-05, + "loss": 0.3532, + "step": 19720 + }, + { + "epoch": 274.0, + "eval_loss": 0.5227620601654053, + "eval_runtime": 127.3304, + "eval_samples_per_second": 4.178, + "eval_steps_per_second": 0.526, + "eval_wer": 0.2158513852285145, + "step": 19728 + }, + { + "epoch": 274.03, + "learning_rate": 1.860457142857143e-05, + "loss": 0.3729, + "step": 19730 + }, + { + "epoch": 274.17, + "learning_rate": 1.859314285714286e-05, + "loss": 0.3517, + "step": 19740 + }, + { + "epoch": 274.3, + "learning_rate": 1.8581714285714286e-05, + "loss": 0.3456, + "step": 19750 + }, + { + "epoch": 274.44, + "learning_rate": 1.8570285714285716e-05, + "loss": 0.3637, + "step": 19760 + }, + { + "epoch": 274.58, + "learning_rate": 1.8558857142857147e-05, + "loss": 0.3711, + "step": 19770 + }, + { + "epoch": 274.72, + "learning_rate": 1.8547428571428573e-05, + "loss": 0.3538, + "step": 19780 + }, + { + "epoch": 274.86, + "learning_rate": 1.8536e-05, + "loss": 0.3454, + "step": 19790 + }, + { + "epoch": 275.0, + "learning_rate": 1.852457142857143e-05, + "loss": 0.3502, + "step": 19800 + }, + { + "epoch": 275.0, + "eval_loss": 0.5399640202522278, + "eval_runtime": 127.5492, + "eval_samples_per_second": 4.171, + "eval_steps_per_second": 0.525, + "eval_wer": 0.21250883846499968, + "step": 19800 + }, + { + "epoch": 275.14, + "learning_rate": 1.8513142857142857e-05, + "loss": 0.3709, + "step": 19810 + }, + { + "epoch": 275.28, + "learning_rate": 1.8501714285714287e-05, + "loss": 0.3538, + "step": 19820 + }, + { + "epoch": 275.42, + "learning_rate": 1.8490285714285717e-05, + "loss": 0.3431, + "step": 19830 + }, + { + "epoch": 275.55, + "learning_rate": 1.8478857142857144e-05, + "loss": 0.3633, + "step": 19840 + }, + { + "epoch": 275.69, + "learning_rate": 1.8467428571428574e-05, + "loss": 0.3642, + "step": 19850 + }, + { + "epoch": 275.83, + "learning_rate": 1.8456e-05, + "loss": 0.3459, + "step": 19860 + }, + { + "epoch": 275.97, + "learning_rate": 1.844457142857143e-05, + "loss": 0.3465, + "step": 19870 + }, + { + "epoch": 276.0, + "eval_loss": 0.5167775750160217, + "eval_runtime": 129.2606, + "eval_samples_per_second": 4.116, + "eval_steps_per_second": 0.518, + "eval_wer": 0.2128302371922607, + "step": 19872 + }, + { + "epoch": 276.11, + "learning_rate": 1.8433142857142858e-05, + "loss": 0.3529, + "step": 19880 + }, + { + "epoch": 276.25, + "learning_rate": 1.8421714285714288e-05, + "loss": 0.3605, + "step": 19890 + }, + { + "epoch": 276.39, + "learning_rate": 1.8410285714285715e-05, + "loss": 0.3572, + "step": 19900 + }, + { + "epoch": 276.53, + "learning_rate": 1.8398857142857145e-05, + "loss": 0.3574, + "step": 19910 + }, + { + "epoch": 276.66, + "learning_rate": 1.8387428571428575e-05, + "loss": 0.3538, + "step": 19920 + }, + { + "epoch": 276.8, + "learning_rate": 1.8376e-05, + "loss": 0.3451, + "step": 19930 + }, + { + "epoch": 276.94, + "learning_rate": 1.836457142857143e-05, + "loss": 0.3511, + "step": 19940 + }, + { + "epoch": 277.0, + "eval_loss": 0.5247382521629333, + "eval_runtime": 127.0619, + "eval_samples_per_second": 4.187, + "eval_steps_per_second": 0.527, + "eval_wer": 0.2119303207559298, + "step": 19944 + }, + { + "epoch": 277.08, + "learning_rate": 1.835314285714286e-05, + "loss": 0.3567, + "step": 19950 + }, + { + "epoch": 277.22, + "learning_rate": 1.834171428571429e-05, + "loss": 0.3639, + "step": 19960 + }, + { + "epoch": 277.36, + "learning_rate": 1.8330285714285715e-05, + "loss": 0.3497, + "step": 19970 + }, + { + "epoch": 277.5, + "learning_rate": 1.8318857142857145e-05, + "loss": 0.3554, + "step": 19980 + }, + { + "epoch": 277.64, + "learning_rate": 1.8307428571428572e-05, + "loss": 0.3615, + "step": 19990 + }, + { + "epoch": 277.78, + "learning_rate": 1.8296e-05, + "loss": 0.3478, + "step": 20000 + }, + { + "epoch": 277.91, + "learning_rate": 1.828457142857143e-05, + "loss": 0.3678, + "step": 20010 + }, + { + "epoch": 278.0, + "eval_loss": 0.540915310382843, + "eval_runtime": 127.3382, + "eval_samples_per_second": 4.178, + "eval_steps_per_second": 0.526, + "eval_wer": 0.21231599922864305, + "step": 20016 + }, + { + "epoch": 278.06, + "learning_rate": 1.827314285714286e-05, + "loss": 0.3747, + "step": 20020 + }, + { + "epoch": 278.19, + "learning_rate": 1.8261714285714286e-05, + "loss": 0.3632, + "step": 20030 + }, + { + "epoch": 278.33, + "learning_rate": 1.8250285714285716e-05, + "loss": 0.363, + "step": 20040 + }, + { + "epoch": 278.47, + "learning_rate": 1.8238857142857146e-05, + "loss": 0.3707, + "step": 20050 + }, + { + "epoch": 278.61, + "learning_rate": 1.8227428571428573e-05, + "loss": 0.3448, + "step": 20060 + }, + { + "epoch": 278.75, + "learning_rate": 1.8216000000000003e-05, + "loss": 0.3649, + "step": 20070 + }, + { + "epoch": 278.89, + "learning_rate": 1.820457142857143e-05, + "loss": 0.3622, + "step": 20080 + }, + { + "epoch": 279.0, + "eval_loss": 0.5203441977500916, + "eval_runtime": 127.0306, + "eval_samples_per_second": 4.188, + "eval_steps_per_second": 0.527, + "eval_wer": 0.21597994471941892, + "step": 20088 + }, + { + "epoch": 279.03, + "learning_rate": 1.8193142857142857e-05, + "loss": 0.3622, + "step": 20090 + }, + { + "epoch": 279.17, + "learning_rate": 1.8181714285714287e-05, + "loss": 0.372, + "step": 20100 + }, + { + "epoch": 279.3, + "learning_rate": 1.8170285714285717e-05, + "loss": 0.3685, + "step": 20110 + }, + { + "epoch": 279.44, + "learning_rate": 1.8158857142857144e-05, + "loss": 0.3536, + "step": 20120 + }, + { + "epoch": 279.58, + "learning_rate": 1.8147428571428574e-05, + "loss": 0.3708, + "step": 20130 + }, + { + "epoch": 279.72, + "learning_rate": 1.8136000000000004e-05, + "loss": 0.3632, + "step": 20140 + }, + { + "epoch": 279.86, + "learning_rate": 1.812457142857143e-05, + "loss": 0.351, + "step": 20150 + }, + { + "epoch": 280.0, + "learning_rate": 1.8113142857142857e-05, + "loss": 0.3438, + "step": 20160 + }, + { + "epoch": 280.0, + "eval_loss": 0.5173397064208984, + "eval_runtime": 127.4311, + "eval_samples_per_second": 4.175, + "eval_steps_per_second": 0.526, + "eval_wer": 0.20839493475605836, + "step": 20160 + }, + { + "epoch": 280.14, + "learning_rate": 1.8101714285714288e-05, + "loss": 0.3658, + "step": 20170 + }, + { + "epoch": 280.28, + "learning_rate": 1.8090285714285714e-05, + "loss": 0.3661, + "step": 20180 + }, + { + "epoch": 280.42, + "learning_rate": 1.8078857142857144e-05, + "loss": 0.3424, + "step": 20190 + }, + { + "epoch": 280.55, + "learning_rate": 1.8067428571428575e-05, + "loss": 0.3609, + "step": 20200 + }, + { + "epoch": 280.69, + "learning_rate": 1.8056e-05, + "loss": 0.3498, + "step": 20210 + }, + { + "epoch": 280.83, + "learning_rate": 1.8044571428571428e-05, + "loss": 0.3478, + "step": 20220 + }, + { + "epoch": 280.97, + "learning_rate": 1.8033142857142858e-05, + "loss": 0.3533, + "step": 20230 + }, + { + "epoch": 281.0, + "eval_loss": 0.5533133745193481, + "eval_runtime": 126.8352, + "eval_samples_per_second": 4.194, + "eval_steps_per_second": 0.528, + "eval_wer": 0.21321591566497397, + "step": 20232 + }, + { + "epoch": 281.11, + "learning_rate": 1.8021714285714288e-05, + "loss": 0.3521, + "step": 20240 + }, + { + "epoch": 281.25, + "learning_rate": 1.8010285714285715e-05, + "loss": 0.355, + "step": 20250 + }, + { + "epoch": 281.39, + "learning_rate": 1.7998857142857145e-05, + "loss": 0.3579, + "step": 20260 + }, + { + "epoch": 281.53, + "learning_rate": 1.7987428571428572e-05, + "loss": 0.3642, + "step": 20270 + }, + { + "epoch": 281.66, + "learning_rate": 1.7976000000000002e-05, + "loss": 0.3551, + "step": 20280 + }, + { + "epoch": 281.8, + "learning_rate": 1.796457142857143e-05, + "loss": 0.3513, + "step": 20290 + }, + { + "epoch": 281.94, + "learning_rate": 1.795314285714286e-05, + "loss": 0.3499, + "step": 20300 + }, + { + "epoch": 282.0, + "eval_loss": 0.5304237008094788, + "eval_runtime": 127.3045, + "eval_samples_per_second": 4.179, + "eval_steps_per_second": 0.526, + "eval_wer": 0.21321591566497397, + "step": 20304 + }, + { + "epoch": 282.08, + "learning_rate": 1.7941714285714286e-05, + "loss": 0.3627, + "step": 20310 + }, + { + "epoch": 282.22, + "learning_rate": 1.7930285714285716e-05, + "loss": 0.3503, + "step": 20320 + }, + { + "epoch": 282.36, + "learning_rate": 1.7918857142857146e-05, + "loss": 0.3462, + "step": 20330 + }, + { + "epoch": 282.5, + "learning_rate": 1.7907428571428573e-05, + "loss": 0.3515, + "step": 20340 + }, + { + "epoch": 282.64, + "learning_rate": 1.7896000000000003e-05, + "loss": 0.3566, + "step": 20350 + }, + { + "epoch": 282.78, + "learning_rate": 1.788457142857143e-05, + "loss": 0.357, + "step": 20360 + }, + { + "epoch": 282.91, + "learning_rate": 1.7873142857142856e-05, + "loss": 0.3573, + "step": 20370 + }, + { + "epoch": 283.0, + "eval_loss": 0.539974570274353, + "eval_runtime": 126.8021, + "eval_samples_per_second": 4.196, + "eval_steps_per_second": 0.528, + "eval_wer": 0.20968052966510253, + "step": 20376 + }, + { + "epoch": 283.06, + "learning_rate": 1.7861714285714286e-05, + "loss": 0.3692, + "step": 20380 + }, + { + "epoch": 283.19, + "learning_rate": 1.7850285714285717e-05, + "loss": 0.3654, + "step": 20390 + }, + { + "epoch": 283.33, + "learning_rate": 1.7838857142857143e-05, + "loss": 0.3614, + "step": 20400 + }, + { + "epoch": 283.47, + "learning_rate": 1.7827428571428573e-05, + "loss": 0.361, + "step": 20410 + }, + { + "epoch": 283.61, + "learning_rate": 1.7816000000000004e-05, + "loss": 0.3479, + "step": 20420 + }, + { + "epoch": 283.75, + "learning_rate": 1.780457142857143e-05, + "loss": 0.3599, + "step": 20430 + }, + { + "epoch": 283.89, + "learning_rate": 1.7793142857142857e-05, + "loss": 0.3575, + "step": 20440 + }, + { + "epoch": 284.0, + "eval_loss": 0.5404777526855469, + "eval_runtime": 127.5484, + "eval_samples_per_second": 4.171, + "eval_steps_per_second": 0.525, + "eval_wer": 0.21154464228321657, + "step": 20448 + }, + { + "epoch": 284.03, + "learning_rate": 1.7781714285714287e-05, + "loss": 0.3489, + "step": 20450 + }, + { + "epoch": 284.17, + "learning_rate": 1.7770285714285714e-05, + "loss": 0.3606, + "step": 20460 + }, + { + "epoch": 284.3, + "learning_rate": 1.7758857142857144e-05, + "loss": 0.3541, + "step": 20470 + }, + { + "epoch": 284.44, + "learning_rate": 1.7747428571428574e-05, + "loss": 0.3759, + "step": 20480 + }, + { + "epoch": 284.58, + "learning_rate": 1.7736e-05, + "loss": 0.3642, + "step": 20490 + }, + { + "epoch": 284.72, + "learning_rate": 1.772457142857143e-05, + "loss": 0.3587, + "step": 20500 + }, + { + "epoch": 284.86, + "learning_rate": 1.7713142857142858e-05, + "loss": 0.3567, + "step": 20510 + }, + { + "epoch": 285.0, + "learning_rate": 1.7701714285714288e-05, + "loss": 0.3712, + "step": 20520 + }, + { + "epoch": 285.0, + "eval_loss": 0.5472289323806763, + "eval_runtime": 127.2476, + "eval_samples_per_second": 4.181, + "eval_steps_per_second": 0.527, + "eval_wer": 0.2174583788648197, + "step": 20520 + }, + { + "epoch": 285.14, + "learning_rate": 1.7690285714285715e-05, + "loss": 0.365, + "step": 20530 + }, + { + "epoch": 285.28, + "learning_rate": 1.7678857142857145e-05, + "loss": 0.3548, + "step": 20540 + }, + { + "epoch": 285.42, + "learning_rate": 1.766742857142857e-05, + "loss": 0.361, + "step": 20550 + }, + { + "epoch": 285.55, + "learning_rate": 1.7656000000000002e-05, + "loss": 0.3403, + "step": 20560 + }, + { + "epoch": 285.69, + "learning_rate": 1.7644571428571432e-05, + "loss": 0.3593, + "step": 20570 + }, + { + "epoch": 285.83, + "learning_rate": 1.763314285714286e-05, + "loss": 0.3485, + "step": 20580 + }, + { + "epoch": 285.97, + "learning_rate": 1.7621714285714285e-05, + "loss": 0.3605, + "step": 20590 + }, + { + "epoch": 286.0, + "eval_loss": 0.5307502746582031, + "eval_runtime": 127.1794, + "eval_samples_per_second": 4.183, + "eval_steps_per_second": 0.527, + "eval_wer": 0.2085234942469628, + "step": 20592 + }, + { + "epoch": 286.11, + "learning_rate": 1.7611428571428574e-05, + "loss": 0.3507, + "step": 20600 + }, + { + "epoch": 286.25, + "learning_rate": 1.76e-05, + "loss": 0.3663, + "step": 20610 + }, + { + "epoch": 286.39, + "learning_rate": 1.758857142857143e-05, + "loss": 0.362, + "step": 20620 + }, + { + "epoch": 286.53, + "learning_rate": 1.7577142857142858e-05, + "loss": 0.3645, + "step": 20630 + }, + { + "epoch": 286.66, + "learning_rate": 1.7565714285714288e-05, + "loss": 0.342, + "step": 20640 + }, + { + "epoch": 286.8, + "learning_rate": 1.7554285714285715e-05, + "loss": 0.346, + "step": 20650 + }, + { + "epoch": 286.94, + "learning_rate": 1.7542857142857145e-05, + "loss": 0.3453, + "step": 20660 + }, + { + "epoch": 287.0, + "eval_loss": 0.520065188407898, + "eval_runtime": 127.137, + "eval_samples_per_second": 4.184, + "eval_steps_per_second": 0.527, + "eval_wer": 0.2128945169377129, + "step": 20664 + }, + { + "epoch": 287.08, + "learning_rate": 1.753142857142857e-05, + "loss": 0.3482, + "step": 20670 + }, + { + "epoch": 287.22, + "learning_rate": 1.752e-05, + "loss": 0.3502, + "step": 20680 + }, + { + "epoch": 287.36, + "learning_rate": 1.7508571428571432e-05, + "loss": 0.3568, + "step": 20690 + }, + { + "epoch": 287.5, + "learning_rate": 1.749714285714286e-05, + "loss": 0.354, + "step": 20700 + }, + { + "epoch": 287.64, + "learning_rate": 1.748571428571429e-05, + "loss": 0.3517, + "step": 20710 + }, + { + "epoch": 287.78, + "learning_rate": 1.7474285714285715e-05, + "loss": 0.356, + "step": 20720 + }, + { + "epoch": 287.91, + "learning_rate": 1.7462857142857142e-05, + "loss": 0.3518, + "step": 20730 + }, + { + "epoch": 288.0, + "eval_loss": 0.5606381893157959, + "eval_runtime": 128.5235, + "eval_samples_per_second": 4.139, + "eval_steps_per_second": 0.521, + "eval_wer": 0.21070900559233785, + "step": 20736 + }, + { + "epoch": 288.06, + "learning_rate": 1.7451428571428572e-05, + "loss": 0.361, + "step": 20740 + }, + { + "epoch": 288.19, + "learning_rate": 1.7440000000000002e-05, + "loss": 0.3486, + "step": 20750 + }, + { + "epoch": 288.33, + "learning_rate": 1.742857142857143e-05, + "loss": 0.3447, + "step": 20760 + }, + { + "epoch": 288.47, + "learning_rate": 1.741714285714286e-05, + "loss": 0.3478, + "step": 20770 + }, + { + "epoch": 288.61, + "learning_rate": 1.740571428571429e-05, + "loss": 0.3517, + "step": 20780 + }, + { + "epoch": 288.75, + "learning_rate": 1.7394285714285716e-05, + "loss": 0.3579, + "step": 20790 + }, + { + "epoch": 288.89, + "learning_rate": 1.7382857142857143e-05, + "loss": 0.3448, + "step": 20800 + }, + { + "epoch": 289.0, + "eval_loss": 0.5287786722183228, + "eval_runtime": 127.502, + "eval_samples_per_second": 4.172, + "eval_steps_per_second": 0.525, + "eval_wer": 0.20672366137430095, + "step": 20808 + }, + { + "epoch": 289.03, + "learning_rate": 1.7371428571428573e-05, + "loss": 0.351, + "step": 20810 + }, + { + "epoch": 289.17, + "learning_rate": 1.736e-05, + "loss": 0.3395, + "step": 20820 + }, + { + "epoch": 289.3, + "learning_rate": 1.734857142857143e-05, + "loss": 0.3343, + "step": 20830 + }, + { + "epoch": 289.44, + "learning_rate": 1.733714285714286e-05, + "loss": 0.3472, + "step": 20840 + }, + { + "epoch": 289.58, + "learning_rate": 1.7325714285714287e-05, + "loss": 0.3489, + "step": 20850 + }, + { + "epoch": 289.72, + "learning_rate": 1.7314285714285717e-05, + "loss": 0.3609, + "step": 20860 + }, + { + "epoch": 289.86, + "learning_rate": 1.7302857142857144e-05, + "loss": 0.3651, + "step": 20870 + }, + { + "epoch": 290.0, + "learning_rate": 1.7291428571428574e-05, + "loss": 0.3509, + "step": 20880 + }, + { + "epoch": 290.0, + "eval_loss": 0.5383898019790649, + "eval_runtime": 128.542, + "eval_samples_per_second": 4.139, + "eval_steps_per_second": 0.521, + "eval_wer": 0.21308735617406954, + "step": 20880 + }, + { + "epoch": 290.14, + "learning_rate": 1.728e-05, + "loss": 0.3531, + "step": 20890 + }, + { + "epoch": 290.28, + "learning_rate": 1.726857142857143e-05, + "loss": 0.3448, + "step": 20900 + }, + { + "epoch": 290.42, + "learning_rate": 1.7257142857142857e-05, + "loss": 0.3492, + "step": 20910 + }, + { + "epoch": 290.55, + "learning_rate": 1.7245714285714288e-05, + "loss": 0.3425, + "step": 20920 + }, + { + "epoch": 290.69, + "learning_rate": 1.7234285714285718e-05, + "loss": 0.3542, + "step": 20930 + }, + { + "epoch": 290.83, + "learning_rate": 1.7222857142857144e-05, + "loss": 0.3422, + "step": 20940 + }, + { + "epoch": 290.97, + "learning_rate": 1.721142857142857e-05, + "loss": 0.3556, + "step": 20950 + }, + { + "epoch": 291.0, + "eval_loss": 0.5217521786689758, + "eval_runtime": 127.3438, + "eval_samples_per_second": 4.178, + "eval_steps_per_second": 0.526, + "eval_wer": 0.21225171948319085, + "step": 20952 + }, + { + "epoch": 291.11, + "learning_rate": 1.72e-05, + "loss": 0.3533, + "step": 20960 + }, + { + "epoch": 291.25, + "learning_rate": 1.718857142857143e-05, + "loss": 0.3515, + "step": 20970 + }, + { + "epoch": 291.39, + "learning_rate": 1.7177142857142858e-05, + "loss": 0.3405, + "step": 20980 + }, + { + "epoch": 291.53, + "learning_rate": 1.716571428571429e-05, + "loss": 0.3434, + "step": 20990 + }, + { + "epoch": 291.66, + "learning_rate": 1.7154285714285715e-05, + "loss": 0.3492, + "step": 21000 + }, + { + "epoch": 291.8, + "learning_rate": 1.7142857142857142e-05, + "loss": 0.3493, + "step": 21010 + }, + { + "epoch": 291.94, + "learning_rate": 1.7131428571428572e-05, + "loss": 0.35, + "step": 21020 + }, + { + "epoch": 292.0, + "eval_loss": 0.5636931657791138, + "eval_runtime": 128.2735, + "eval_samples_per_second": 4.147, + "eval_steps_per_second": 0.522, + "eval_wer": 0.2077521373015363, + "step": 21024 + }, + { + "epoch": 292.08, + "learning_rate": 1.7120000000000002e-05, + "loss": 0.3516, + "step": 21030 + }, + { + "epoch": 292.22, + "learning_rate": 1.710857142857143e-05, + "loss": 0.3451, + "step": 21040 + }, + { + "epoch": 292.36, + "learning_rate": 1.709714285714286e-05, + "loss": 0.3512, + "step": 21050 + }, + { + "epoch": 292.5, + "learning_rate": 1.708571428571429e-05, + "loss": 0.3478, + "step": 21060 + }, + { + "epoch": 292.64, + "learning_rate": 1.7074285714285716e-05, + "loss": 0.3458, + "step": 21070 + }, + { + "epoch": 292.78, + "learning_rate": 1.7062857142857143e-05, + "loss": 0.355, + "step": 21080 + }, + { + "epoch": 292.91, + "learning_rate": 1.7051428571428573e-05, + "loss": 0.3477, + "step": 21090 + }, + { + "epoch": 293.0, + "eval_loss": 0.5156041979789734, + "eval_runtime": 127.172, + "eval_samples_per_second": 4.183, + "eval_steps_per_second": 0.527, + "eval_wer": 0.20890917271967602, + "step": 21096 + }, + { + "epoch": 293.06, + "learning_rate": 1.704e-05, + "loss": 0.3541, + "step": 21100 + }, + { + "epoch": 293.19, + "learning_rate": 1.702857142857143e-05, + "loss": 0.3451, + "step": 21110 + }, + { + "epoch": 293.33, + "learning_rate": 1.701714285714286e-05, + "loss": 0.3389, + "step": 21120 + }, + { + "epoch": 293.47, + "learning_rate": 1.7005714285714286e-05, + "loss": 0.3594, + "step": 21130 + }, + { + "epoch": 293.61, + "learning_rate": 1.6994285714285717e-05, + "loss": 0.3276, + "step": 21140 + }, + { + "epoch": 293.75, + "learning_rate": 1.6982857142857143e-05, + "loss": 0.3441, + "step": 21150 + }, + { + "epoch": 293.89, + "learning_rate": 1.6971428571428574e-05, + "loss": 0.3434, + "step": 21160 + }, + { + "epoch": 294.0, + "eval_loss": 0.5256971120834351, + "eval_runtime": 127.9906, + "eval_samples_per_second": 4.157, + "eval_steps_per_second": 0.523, + "eval_wer": 0.2112232435559555, + "step": 21168 + }, + { + "epoch": 294.03, + "learning_rate": 1.696e-05, + "loss": 0.351, + "step": 21170 + }, + { + "epoch": 294.17, + "learning_rate": 1.694857142857143e-05, + "loss": 0.3497, + "step": 21180 + }, + { + "epoch": 294.3, + "learning_rate": 1.6937142857142857e-05, + "loss": 0.3508, + "step": 21190 + }, + { + "epoch": 294.44, + "learning_rate": 1.6925714285714287e-05, + "loss": 0.3421, + "step": 21200 + }, + { + "epoch": 294.58, + "learning_rate": 1.6914285714285717e-05, + "loss": 0.3302, + "step": 21210 + }, + { + "epoch": 294.72, + "learning_rate": 1.6902857142857144e-05, + "loss": 0.352, + "step": 21220 + }, + { + "epoch": 294.86, + "learning_rate": 1.689142857142857e-05, + "loss": 0.3493, + "step": 21230 + }, + { + "epoch": 295.0, + "learning_rate": 1.688e-05, + "loss": 0.3387, + "step": 21240 + }, + { + "epoch": 295.0, + "eval_loss": 0.530138373374939, + "eval_runtime": 127.4784, + "eval_samples_per_second": 4.173, + "eval_steps_per_second": 0.526, + "eval_wer": 0.21623706370122775, + "step": 21240 + }, + { + "epoch": 295.14, + "learning_rate": 1.686857142857143e-05, + "loss": 0.365, + "step": 21250 + }, + { + "epoch": 295.28, + "learning_rate": 1.6857142857142858e-05, + "loss": 0.3434, + "step": 21260 + }, + { + "epoch": 295.42, + "learning_rate": 1.6845714285714288e-05, + "loss": 0.3437, + "step": 21270 + }, + { + "epoch": 295.55, + "learning_rate": 1.6834285714285715e-05, + "loss": 0.3491, + "step": 21280 + }, + { + "epoch": 295.69, + "learning_rate": 1.6822857142857145e-05, + "loss": 0.3439, + "step": 21290 + }, + { + "epoch": 295.83, + "learning_rate": 1.681142857142857e-05, + "loss": 0.3376, + "step": 21300 + }, + { + "epoch": 295.97, + "learning_rate": 1.6800000000000002e-05, + "loss": 0.3435, + "step": 21310 + }, + { + "epoch": 296.0, + "eval_loss": 0.5422194600105286, + "eval_runtime": 127.4491, + "eval_samples_per_second": 4.174, + "eval_steps_per_second": 0.526, + "eval_wer": 0.21617278395577552, + "step": 21312 + }, + { + "epoch": 296.11, + "learning_rate": 1.678857142857143e-05, + "loss": 0.3357, + "step": 21320 + }, + { + "epoch": 296.25, + "learning_rate": 1.677714285714286e-05, + "loss": 0.3418, + "step": 21330 + }, + { + "epoch": 296.39, + "learning_rate": 1.676571428571429e-05, + "loss": 0.3393, + "step": 21340 + }, + { + "epoch": 296.53, + "learning_rate": 1.6754285714285716e-05, + "loss": 0.3425, + "step": 21350 + }, + { + "epoch": 296.66, + "learning_rate": 1.6742857142857146e-05, + "loss": 0.3447, + "step": 21360 + }, + { + "epoch": 296.8, + "learning_rate": 1.6731428571428572e-05, + "loss": 0.3429, + "step": 21370 + }, + { + "epoch": 296.94, + "learning_rate": 1.672e-05, + "loss": 0.3547, + "step": 21380 + }, + { + "epoch": 297.0, + "eval_loss": 0.5458853840827942, + "eval_runtime": 127.0966, + "eval_samples_per_second": 4.186, + "eval_steps_per_second": 0.527, + "eval_wer": 0.21064472584688565, + "step": 21384 + }, + { + "epoch": 297.08, + "learning_rate": 1.670857142857143e-05, + "loss": 0.3561, + "step": 21390 + }, + { + "epoch": 297.22, + "learning_rate": 1.669714285714286e-05, + "loss": 0.3479, + "step": 21400 + }, + { + "epoch": 297.36, + "learning_rate": 1.6685714285714286e-05, + "loss": 0.3294, + "step": 21410 + }, + { + "epoch": 297.5, + "learning_rate": 1.6674285714285716e-05, + "loss": 0.3351, + "step": 21420 + }, + { + "epoch": 297.64, + "learning_rate": 1.6662857142857146e-05, + "loss": 0.3399, + "step": 21430 + }, + { + "epoch": 297.78, + "learning_rate": 1.6651428571428573e-05, + "loss": 0.3554, + "step": 21440 + }, + { + "epoch": 297.91, + "learning_rate": 1.664e-05, + "loss": 0.3321, + "step": 21450 + }, + { + "epoch": 298.0, + "eval_loss": 0.5524464249610901, + "eval_runtime": 127.5275, + "eval_samples_per_second": 4.172, + "eval_steps_per_second": 0.525, + "eval_wer": 0.20820209551970173, + "step": 21456 + }, + { + "epoch": 298.06, + "learning_rate": 1.662857142857143e-05, + "loss": 0.3653, + "step": 21460 + }, + { + "epoch": 298.19, + "learning_rate": 1.6617142857142857e-05, + "loss": 0.3558, + "step": 21470 + }, + { + "epoch": 298.33, + "learning_rate": 1.6605714285714287e-05, + "loss": 0.331, + "step": 21480 + }, + { + "epoch": 298.47, + "learning_rate": 1.6594285714285717e-05, + "loss": 0.3437, + "step": 21490 + }, + { + "epoch": 298.61, + "learning_rate": 1.6582857142857144e-05, + "loss": 0.3489, + "step": 21500 + }, + { + "epoch": 298.75, + "learning_rate": 1.6571428571428574e-05, + "loss": 0.3478, + "step": 21510 + }, + { + "epoch": 298.89, + "learning_rate": 1.656e-05, + "loss": 0.3428, + "step": 21520 + }, + { + "epoch": 299.0, + "eval_loss": 0.5319285988807678, + "eval_runtime": 128.6276, + "eval_samples_per_second": 4.136, + "eval_steps_per_second": 0.521, + "eval_wer": 0.2141158321013049, + "step": 21528 + }, + { + "epoch": 299.03, + "learning_rate": 1.654857142857143e-05, + "loss": 0.3544, + "step": 21530 + }, + { + "epoch": 299.17, + "learning_rate": 1.6537142857142858e-05, + "loss": 0.3398, + "step": 21540 + }, + { + "epoch": 299.3, + "learning_rate": 1.6525714285714288e-05, + "loss": 0.3388, + "step": 21550 + }, + { + "epoch": 299.44, + "learning_rate": 1.6514285714285714e-05, + "loss": 0.3553, + "step": 21560 + }, + { + "epoch": 299.58, + "learning_rate": 1.6502857142857145e-05, + "loss": 0.333, + "step": 21570 + }, + { + "epoch": 299.72, + "learning_rate": 1.6491428571428575e-05, + "loss": 0.3412, + "step": 21580 + }, + { + "epoch": 299.86, + "learning_rate": 1.648e-05, + "loss": 0.3386, + "step": 21590 + }, + { + "epoch": 300.0, + "learning_rate": 1.6468571428571428e-05, + "loss": 0.3417, + "step": 21600 + }, + { + "epoch": 300.0, + "eval_loss": 0.5320257544517517, + "eval_runtime": 127.0634, + "eval_samples_per_second": 4.187, + "eval_steps_per_second": 0.527, + "eval_wer": 0.21302307642861734, + "step": 21600 + }, + { + "epoch": 300.14, + "learning_rate": 1.645714285714286e-05, + "loss": 0.3276, + "step": 21610 + }, + { + "epoch": 300.28, + "learning_rate": 1.644571428571429e-05, + "loss": 0.3397, + "step": 21620 + }, + { + "epoch": 300.42, + "learning_rate": 1.6434285714285715e-05, + "loss": 0.3452, + "step": 21630 + }, + { + "epoch": 300.55, + "learning_rate": 1.6422857142857145e-05, + "loss": 0.3493, + "step": 21640 + }, + { + "epoch": 300.69, + "learning_rate": 1.6411428571428572e-05, + "loss": 0.3432, + "step": 21650 + }, + { + "epoch": 300.83, + "learning_rate": 1.64e-05, + "loss": 0.3439, + "step": 21660 + }, + { + "epoch": 300.97, + "learning_rate": 1.638857142857143e-05, + "loss": 0.342, + "step": 21670 + }, + { + "epoch": 301.0, + "eval_loss": 0.5574966073036194, + "eval_runtime": 127.8319, + "eval_samples_per_second": 4.162, + "eval_steps_per_second": 0.524, + "eval_wer": 0.21475862955582695, + "step": 21672 + }, + { + "epoch": 301.11, + "learning_rate": 1.637714285714286e-05, + "loss": 0.338, + "step": 21680 + }, + { + "epoch": 301.25, + "learning_rate": 1.6365714285714286e-05, + "loss": 0.3405, + "step": 21690 + }, + { + "epoch": 301.39, + "learning_rate": 1.6354285714285716e-05, + "loss": 0.3345, + "step": 21700 + }, + { + "epoch": 301.53, + "learning_rate": 1.6342857142857146e-05, + "loss": 0.344, + "step": 21710 + }, + { + "epoch": 301.66, + "learning_rate": 1.6331428571428573e-05, + "loss": 0.3445, + "step": 21720 + }, + { + "epoch": 301.8, + "learning_rate": 1.632e-05, + "loss": 0.3389, + "step": 21730 + }, + { + "epoch": 301.94, + "learning_rate": 1.630857142857143e-05, + "loss": 0.3405, + "step": 21740 + }, + { + "epoch": 302.0, + "eval_loss": 0.5350791215896606, + "eval_runtime": 127.9411, + "eval_samples_per_second": 4.158, + "eval_steps_per_second": 0.524, + "eval_wer": 0.21038760686507682, + "step": 21744 + }, + { + "epoch": 302.08, + "learning_rate": 1.6297142857142856e-05, + "loss": 0.3465, + "step": 21750 + }, + { + "epoch": 302.22, + "learning_rate": 1.6285714285714287e-05, + "loss": 0.3492, + "step": 21760 + }, + { + "epoch": 302.36, + "learning_rate": 1.6274285714285717e-05, + "loss": 0.3287, + "step": 21770 + }, + { + "epoch": 302.5, + "learning_rate": 1.6262857142857143e-05, + "loss": 0.3462, + "step": 21780 + }, + { + "epoch": 302.64, + "learning_rate": 1.6251428571428574e-05, + "loss": 0.338, + "step": 21790 + }, + { + "epoch": 302.78, + "learning_rate": 1.6240000000000004e-05, + "loss": 0.3353, + "step": 21800 + }, + { + "epoch": 302.91, + "learning_rate": 1.622857142857143e-05, + "loss": 0.3333, + "step": 21810 + }, + { + "epoch": 303.0, + "eval_loss": 0.5319588780403137, + "eval_runtime": 127.5663, + "eval_samples_per_second": 4.17, + "eval_steps_per_second": 0.525, + "eval_wer": 0.2128302371922607, + "step": 21816 + }, + { + "epoch": 303.06, + "learning_rate": 1.6217142857142857e-05, + "loss": 0.3585, + "step": 21820 + }, + { + "epoch": 303.19, + "learning_rate": 1.6205714285714287e-05, + "loss": 0.3292, + "step": 21830 + }, + { + "epoch": 303.33, + "learning_rate": 1.6194285714285714e-05, + "loss": 0.3426, + "step": 21840 + }, + { + "epoch": 303.47, + "learning_rate": 1.6182857142857144e-05, + "loss": 0.3526, + "step": 21850 + }, + { + "epoch": 303.61, + "learning_rate": 1.6171428571428574e-05, + "loss": 0.3262, + "step": 21860 + }, + { + "epoch": 303.75, + "learning_rate": 1.616e-05, + "loss": 0.3374, + "step": 21870 + }, + { + "epoch": 303.89, + "learning_rate": 1.6148571428571428e-05, + "loss": 0.3349, + "step": 21880 + }, + { + "epoch": 304.0, + "eval_loss": 0.5287381410598755, + "eval_runtime": 127.182, + "eval_samples_per_second": 4.183, + "eval_steps_per_second": 0.527, + "eval_wer": 0.2112232435559555, + "step": 21888 + }, + { + "epoch": 304.03, + "learning_rate": 1.6137142857142858e-05, + "loss": 0.353, + "step": 21890 + }, + { + "epoch": 304.17, + "learning_rate": 1.6125714285714288e-05, + "loss": 0.3508, + "step": 21900 + }, + { + "epoch": 304.3, + "learning_rate": 1.6114285714285715e-05, + "loss": 0.3416, + "step": 21910 + }, + { + "epoch": 304.44, + "learning_rate": 1.6102857142857145e-05, + "loss": 0.3401, + "step": 21920 + }, + { + "epoch": 304.58, + "learning_rate": 1.6091428571428572e-05, + "loss": 0.347, + "step": 21930 + }, + { + "epoch": 304.72, + "learning_rate": 1.6080000000000002e-05, + "loss": 0.3494, + "step": 21940 + }, + { + "epoch": 304.86, + "learning_rate": 1.606857142857143e-05, + "loss": 0.3317, + "step": 21950 + }, + { + "epoch": 305.0, + "learning_rate": 1.605714285714286e-05, + "loss": 0.3458, + "step": 21960 + }, + { + "epoch": 305.0, + "eval_loss": 0.5396945476531982, + "eval_runtime": 127.3454, + "eval_samples_per_second": 4.178, + "eval_steps_per_second": 0.526, + "eval_wer": 0.20768785755608407, + "step": 21960 + }, + { + "epoch": 305.14, + "learning_rate": 1.6045714285714286e-05, + "loss": 0.3378, + "step": 21970 + }, + { + "epoch": 305.28, + "learning_rate": 1.6034285714285716e-05, + "loss": 0.3435, + "step": 21980 + }, + { + "epoch": 305.42, + "learning_rate": 1.6022857142857146e-05, + "loss": 0.3366, + "step": 21990 + }, + { + "epoch": 305.55, + "learning_rate": 1.6011428571428573e-05, + "loss": 0.3335, + "step": 22000 + }, + { + "epoch": 305.69, + "learning_rate": 1.6000000000000003e-05, + "loss": 0.3554, + "step": 22010 + }, + { + "epoch": 305.83, + "learning_rate": 1.598857142857143e-05, + "loss": 0.3311, + "step": 22020 + }, + { + "epoch": 305.97, + "learning_rate": 1.5977142857142856e-05, + "loss": 0.3514, + "step": 22030 + }, + { + "epoch": 306.0, + "eval_loss": 0.5414637327194214, + "eval_runtime": 127.525, + "eval_samples_per_second": 4.172, + "eval_steps_per_second": 0.525, + "eval_wer": 0.2101947676287202, + "step": 22032 + }, + { + "epoch": 306.11, + "learning_rate": 1.5965714285714286e-05, + "loss": 0.3492, + "step": 22040 + }, + { + "epoch": 306.25, + "learning_rate": 1.5954285714285716e-05, + "loss": 0.3464, + "step": 22050 + }, + { + "epoch": 306.39, + "learning_rate": 1.5942857142857143e-05, + "loss": 0.3442, + "step": 22060 + }, + { + "epoch": 306.53, + "learning_rate": 1.5931428571428573e-05, + "loss": 0.3481, + "step": 22070 + }, + { + "epoch": 306.66, + "learning_rate": 1.5920000000000003e-05, + "loss": 0.3354, + "step": 22080 + }, + { + "epoch": 306.8, + "learning_rate": 1.590857142857143e-05, + "loss": 0.3412, + "step": 22090 + }, + { + "epoch": 306.94, + "learning_rate": 1.5897142857142857e-05, + "loss": 0.3685, + "step": 22100 + }, + { + "epoch": 307.0, + "eval_loss": 0.5349737405776978, + "eval_runtime": 129.2084, + "eval_samples_per_second": 4.117, + "eval_steps_per_second": 0.519, + "eval_wer": 0.2110946840650511, + "step": 22104 + }, + { + "epoch": 307.08, + "learning_rate": 1.5885714285714287e-05, + "loss": 0.3528, + "step": 22110 + }, + { + "epoch": 307.22, + "learning_rate": 1.5874285714285714e-05, + "loss": 0.3511, + "step": 22120 + }, + { + "epoch": 307.36, + "learning_rate": 1.5862857142857144e-05, + "loss": 0.3378, + "step": 22130 + }, + { + "epoch": 307.5, + "learning_rate": 1.5851428571428574e-05, + "loss": 0.3421, + "step": 22140 + }, + { + "epoch": 307.64, + "learning_rate": 1.584e-05, + "loss": 0.3457, + "step": 22150 + }, + { + "epoch": 307.78, + "learning_rate": 1.582857142857143e-05, + "loss": 0.3429, + "step": 22160 + }, + { + "epoch": 307.91, + "learning_rate": 1.5817142857142858e-05, + "loss": 0.3487, + "step": 22170 + }, + { + "epoch": 308.0, + "eval_loss": 0.5534842610359192, + "eval_runtime": 128.2353, + "eval_samples_per_second": 4.149, + "eval_steps_per_second": 0.522, + "eval_wer": 0.2206723661374301, + "step": 22176 + }, + { + "epoch": 308.06, + "learning_rate": 1.5805714285714288e-05, + "loss": 0.3495, + "step": 22180 + }, + { + "epoch": 308.19, + "learning_rate": 1.5794285714285715e-05, + "loss": 0.3462, + "step": 22190 + }, + { + "epoch": 308.33, + "learning_rate": 1.5782857142857145e-05, + "loss": 0.3398, + "step": 22200 + }, + { + "epoch": 308.47, + "learning_rate": 1.577142857142857e-05, + "loss": 0.3476, + "step": 22210 + }, + { + "epoch": 308.61, + "learning_rate": 1.576e-05, + "loss": 0.3354, + "step": 22220 + }, + { + "epoch": 308.75, + "learning_rate": 1.5748571428571432e-05, + "loss": 0.3376, + "step": 22230 + }, + { + "epoch": 308.89, + "learning_rate": 1.573714285714286e-05, + "loss": 0.3304, + "step": 22240 + }, + { + "epoch": 309.0, + "eval_loss": 0.5668252110481262, + "eval_runtime": 127.9379, + "eval_samples_per_second": 4.158, + "eval_steps_per_second": 0.524, + "eval_wer": 0.21244455871954748, + "step": 22248 + }, + { + "epoch": 309.03, + "learning_rate": 1.5725714285714285e-05, + "loss": 0.3404, + "step": 22250 + }, + { + "epoch": 309.17, + "learning_rate": 1.5714285714285715e-05, + "loss": 0.3337, + "step": 22260 + }, + { + "epoch": 309.3, + "learning_rate": 1.5702857142857145e-05, + "loss": 0.3386, + "step": 22270 + }, + { + "epoch": 309.44, + "learning_rate": 1.5691428571428572e-05, + "loss": 0.3414, + "step": 22280 + }, + { + "epoch": 309.58, + "learning_rate": 1.5680000000000002e-05, + "loss": 0.3301, + "step": 22290 + }, + { + "epoch": 309.72, + "learning_rate": 1.566857142857143e-05, + "loss": 0.3412, + "step": 22300 + }, + { + "epoch": 309.86, + "learning_rate": 1.5657142857142856e-05, + "loss": 0.3362, + "step": 22310 + }, + { + "epoch": 310.0, + "learning_rate": 1.5645714285714286e-05, + "loss": 0.3368, + "step": 22320 + }, + { + "epoch": 310.0, + "eval_loss": 0.5579137802124023, + "eval_runtime": 127.5474, + "eval_samples_per_second": 4.171, + "eval_steps_per_second": 0.525, + "eval_wer": 0.2199010091920036, + "step": 22320 + }, + { + "epoch": 310.14, + "learning_rate": 1.5634285714285716e-05, + "loss": 0.3489, + "step": 22330 + }, + { + "epoch": 310.28, + "learning_rate": 1.5622857142857143e-05, + "loss": 0.3298, + "step": 22340 + }, + { + "epoch": 310.42, + "learning_rate": 1.5611428571428573e-05, + "loss": 0.3367, + "step": 22350 + }, + { + "epoch": 310.55, + "learning_rate": 1.5600000000000003e-05, + "loss": 0.3299, + "step": 22360 + }, + { + "epoch": 310.69, + "learning_rate": 1.558857142857143e-05, + "loss": 0.3393, + "step": 22370 + }, + { + "epoch": 310.83, + "learning_rate": 1.5577142857142857e-05, + "loss": 0.3461, + "step": 22380 + }, + { + "epoch": 310.97, + "learning_rate": 1.5565714285714287e-05, + "loss": 0.3308, + "step": 22390 + }, + { + "epoch": 311.0, + "eval_loss": 0.5471261739730835, + "eval_runtime": 128.4119, + "eval_samples_per_second": 4.143, + "eval_steps_per_second": 0.522, + "eval_wer": 0.21552998650125346, + "step": 22392 + }, + { + "epoch": 311.11, + "learning_rate": 1.5554285714285713e-05, + "loss": 0.3403, + "step": 22400 + }, + { + "epoch": 311.25, + "learning_rate": 1.5542857142857144e-05, + "loss": 0.3316, + "step": 22410 + }, + { + "epoch": 311.39, + "learning_rate": 1.5531428571428574e-05, + "loss": 0.3355, + "step": 22420 + }, + { + "epoch": 311.53, + "learning_rate": 1.552e-05, + "loss": 0.3388, + "step": 22430 + }, + { + "epoch": 311.66, + "learning_rate": 1.550857142857143e-05, + "loss": 0.3472, + "step": 22440 + }, + { + "epoch": 311.8, + "learning_rate": 1.549714285714286e-05, + "loss": 0.3426, + "step": 22450 + }, + { + "epoch": 311.94, + "learning_rate": 1.5485714285714287e-05, + "loss": 0.3321, + "step": 22460 + }, + { + "epoch": 312.0, + "eval_loss": 0.5645043253898621, + "eval_runtime": 126.8116, + "eval_samples_per_second": 4.195, + "eval_steps_per_second": 0.528, + "eval_wer": 0.2173940991193675, + "step": 22464 + }, + { + "epoch": 312.08, + "learning_rate": 1.5474285714285714e-05, + "loss": 0.3341, + "step": 22470 + }, + { + "epoch": 312.22, + "learning_rate": 1.5462857142857144e-05, + "loss": 0.3421, + "step": 22480 + }, + { + "epoch": 312.36, + "learning_rate": 1.545142857142857e-05, + "loss": 0.3323, + "step": 22490 + }, + { + "epoch": 312.5, + "learning_rate": 1.544e-05, + "loss": 0.3354, + "step": 22500 + }, + { + "epoch": 312.64, + "learning_rate": 1.542857142857143e-05, + "loss": 0.3355, + "step": 22510 + }, + { + "epoch": 312.78, + "learning_rate": 1.5417142857142858e-05, + "loss": 0.3401, + "step": 22520 + }, + { + "epoch": 312.91, + "learning_rate": 1.5405714285714285e-05, + "loss": 0.3364, + "step": 22530 + }, + { + "epoch": 313.0, + "eval_loss": 0.5560274720191956, + "eval_runtime": 127.7166, + "eval_samples_per_second": 4.165, + "eval_steps_per_second": 0.525, + "eval_wer": 0.2206723661374301, + "step": 22536 + }, + { + "epoch": 313.06, + "learning_rate": 1.5394285714285715e-05, + "loss": 0.3483, + "step": 22540 + }, + { + "epoch": 313.19, + "learning_rate": 1.5382857142857145e-05, + "loss": 0.333, + "step": 22550 + }, + { + "epoch": 313.33, + "learning_rate": 1.5371428571428572e-05, + "loss": 0.3303, + "step": 22560 + }, + { + "epoch": 313.47, + "learning_rate": 1.5360000000000002e-05, + "loss": 0.3386, + "step": 22570 + }, + { + "epoch": 313.61, + "learning_rate": 1.534857142857143e-05, + "loss": 0.3326, + "step": 22580 + }, + { + "epoch": 313.75, + "learning_rate": 1.533714285714286e-05, + "loss": 0.3197, + "step": 22590 + }, + { + "epoch": 313.89, + "learning_rate": 1.5325714285714286e-05, + "loss": 0.3356, + "step": 22600 + }, + { + "epoch": 314.0, + "eval_loss": 0.547174334526062, + "eval_runtime": 127.7736, + "eval_samples_per_second": 4.164, + "eval_steps_per_second": 0.524, + "eval_wer": 0.21874397377386384, + "step": 22608 + }, + { + "epoch": 314.03, + "learning_rate": 1.5314285714285716e-05, + "loss": 0.3533, + "step": 22610 + }, + { + "epoch": 314.17, + "learning_rate": 1.5302857142857143e-05, + "loss": 0.3253, + "step": 22620 + }, + { + "epoch": 314.3, + "learning_rate": 1.5291428571428573e-05, + "loss": 0.3524, + "step": 22630 + }, + { + "epoch": 314.44, + "learning_rate": 1.5280000000000003e-05, + "loss": 0.3413, + "step": 22640 + }, + { + "epoch": 314.58, + "learning_rate": 1.526857142857143e-05, + "loss": 0.334, + "step": 22650 + }, + { + "epoch": 314.72, + "learning_rate": 1.525714285714286e-05, + "loss": 0.3331, + "step": 22660 + }, + { + "epoch": 314.86, + "learning_rate": 1.5245714285714286e-05, + "loss": 0.3293, + "step": 22670 + }, + { + "epoch": 315.0, + "learning_rate": 1.5234285714285715e-05, + "loss": 0.3519, + "step": 22680 + }, + { + "epoch": 315.0, + "eval_loss": 0.5757595896720886, + "eval_runtime": 128.3615, + "eval_samples_per_second": 4.145, + "eval_steps_per_second": 0.522, + "eval_wer": 0.21822973581024618, + "step": 22680 + }, + { + "epoch": 315.14, + "learning_rate": 1.5222857142857143e-05, + "loss": 0.3325, + "step": 22690 + }, + { + "epoch": 315.28, + "learning_rate": 1.5211428571428572e-05, + "loss": 0.3337, + "step": 22700 + }, + { + "epoch": 315.42, + "learning_rate": 1.5200000000000002e-05, + "loss": 0.3361, + "step": 22710 + }, + { + "epoch": 315.55, + "learning_rate": 1.518857142857143e-05, + "loss": 0.3291, + "step": 22720 + }, + { + "epoch": 315.69, + "learning_rate": 1.5177142857142859e-05, + "loss": 0.3364, + "step": 22730 + }, + { + "epoch": 315.83, + "learning_rate": 1.5165714285714289e-05, + "loss": 0.3413, + "step": 22740 + }, + { + "epoch": 315.97, + "learning_rate": 1.5154285714285714e-05, + "loss": 0.3374, + "step": 22750 + }, + { + "epoch": 316.0, + "eval_loss": 0.5563779473304749, + "eval_runtime": 128.9511, + "eval_samples_per_second": 4.126, + "eval_steps_per_second": 0.52, + "eval_wer": 0.2239506331554927, + "step": 22752 + }, + { + "epoch": 316.11, + "learning_rate": 1.5142857142857144e-05, + "loss": 0.3334, + "step": 22760 + }, + { + "epoch": 316.25, + "learning_rate": 1.5131428571428572e-05, + "loss": 0.3346, + "step": 22770 + }, + { + "epoch": 316.39, + "learning_rate": 1.5120000000000001e-05, + "loss": 0.3397, + "step": 22780 + }, + { + "epoch": 316.53, + "learning_rate": 1.5108571428571431e-05, + "loss": 0.3403, + "step": 22790 + }, + { + "epoch": 316.66, + "learning_rate": 1.509714285714286e-05, + "loss": 0.3243, + "step": 22800 + }, + { + "epoch": 316.8, + "learning_rate": 1.5085714285714288e-05, + "loss": 0.3283, + "step": 22810 + }, + { + "epoch": 316.94, + "learning_rate": 1.5074285714285715e-05, + "loss": 0.3357, + "step": 22820 + }, + { + "epoch": 317.0, + "eval_loss": 0.5672248601913452, + "eval_runtime": 127.7293, + "eval_samples_per_second": 4.165, + "eval_steps_per_second": 0.525, + "eval_wer": 0.22189368130102205, + "step": 22824 + }, + { + "epoch": 317.08, + "learning_rate": 1.5062857142857143e-05, + "loss": 0.3297, + "step": 22830 + }, + { + "epoch": 317.22, + "learning_rate": 1.5051428571428572e-05, + "loss": 0.3389, + "step": 22840 + }, + { + "epoch": 317.36, + "learning_rate": 1.5040000000000002e-05, + "loss": 0.3312, + "step": 22850 + }, + { + "epoch": 317.5, + "learning_rate": 1.502857142857143e-05, + "loss": 0.3325, + "step": 22860 + }, + { + "epoch": 317.64, + "learning_rate": 1.5017142857142859e-05, + "loss": 0.3303, + "step": 22870 + }, + { + "epoch": 317.78, + "learning_rate": 1.5005714285714289e-05, + "loss": 0.3291, + "step": 22880 + }, + { + "epoch": 317.91, + "learning_rate": 1.4994285714285714e-05, + "loss": 0.3376, + "step": 22890 + }, + { + "epoch": 318.0, + "eval_loss": 0.5642737746238708, + "eval_runtime": 128.1248, + "eval_samples_per_second": 4.152, + "eval_steps_per_second": 0.523, + "eval_wer": 0.2240149129009449, + "step": 22896 + }, + { + "epoch": 318.06, + "learning_rate": 1.4982857142857144e-05, + "loss": 0.3536, + "step": 22900 + }, + { + "epoch": 318.19, + "learning_rate": 1.4971428571428572e-05, + "loss": 0.3318, + "step": 22910 + }, + { + "epoch": 318.33, + "learning_rate": 1.496e-05, + "loss": 0.3242, + "step": 22920 + }, + { + "epoch": 318.47, + "learning_rate": 1.4948571428571431e-05, + "loss": 0.3354, + "step": 22930 + }, + { + "epoch": 318.61, + "learning_rate": 1.493714285714286e-05, + "loss": 0.33, + "step": 22940 + }, + { + "epoch": 318.75, + "learning_rate": 1.4926857142857145e-05, + "loss": 0.3355, + "step": 22950 + }, + { + "epoch": 318.89, + "learning_rate": 1.4915428571428572e-05, + "loss": 0.3237, + "step": 22960 + }, + { + "epoch": 319.0, + "eval_loss": 0.5788535475730896, + "eval_runtime": 127.519, + "eval_samples_per_second": 4.172, + "eval_steps_per_second": 0.525, + "eval_wer": 0.22433631162820594, + "step": 22968 + }, + { + "epoch": 319.03, + "learning_rate": 1.4904e-05, + "loss": 0.3489, + "step": 22970 + }, + { + "epoch": 319.17, + "learning_rate": 1.489257142857143e-05, + "loss": 0.335, + "step": 22980 + }, + { + "epoch": 319.3, + "learning_rate": 1.4881142857142859e-05, + "loss": 0.3265, + "step": 22990 + }, + { + "epoch": 319.44, + "learning_rate": 1.4869714285714287e-05, + "loss": 0.327, + "step": 23000 + }, + { + "epoch": 319.58, + "learning_rate": 1.4858285714285715e-05, + "loss": 0.3293, + "step": 23010 + }, + { + "epoch": 319.72, + "learning_rate": 1.4846857142857146e-05, + "loss": 0.3396, + "step": 23020 + }, + { + "epoch": 319.86, + "learning_rate": 1.4835428571428572e-05, + "loss": 0.332, + "step": 23030 + }, + { + "epoch": 320.0, + "learning_rate": 1.4824e-05, + "loss": 0.3264, + "step": 23040 + }, + { + "epoch": 320.0, + "eval_loss": 0.5625404119491577, + "eval_runtime": 127.2436, + "eval_samples_per_second": 4.181, + "eval_steps_per_second": 0.527, + "eval_wer": 0.2166870219193932, + "step": 23040 + }, + { + "epoch": 320.14, + "learning_rate": 1.4812571428571429e-05, + "loss": 0.3202, + "step": 23050 + }, + { + "epoch": 320.28, + "learning_rate": 1.4801142857142858e-05, + "loss": 0.3211, + "step": 23060 + }, + { + "epoch": 320.42, + "learning_rate": 1.4789714285714288e-05, + "loss": 0.3381, + "step": 23070 + }, + { + "epoch": 320.55, + "learning_rate": 1.4778285714285716e-05, + "loss": 0.3412, + "step": 23080 + }, + { + "epoch": 320.69, + "learning_rate": 1.4766857142857145e-05, + "loss": 0.3416, + "step": 23090 + }, + { + "epoch": 320.83, + "learning_rate": 1.4755428571428571e-05, + "loss": 0.3181, + "step": 23100 + }, + { + "epoch": 320.97, + "learning_rate": 1.4744e-05, + "loss": 0.3363, + "step": 23110 + }, + { + "epoch": 321.0, + "eval_loss": 0.5380253791809082, + "eval_runtime": 128.2706, + "eval_samples_per_second": 4.147, + "eval_steps_per_second": 0.522, + "eval_wer": 0.22009384842836022, + "step": 23112 + }, + { + "epoch": 321.11, + "learning_rate": 1.473257142857143e-05, + "loss": 0.3297, + "step": 23120 + }, + { + "epoch": 321.25, + "learning_rate": 1.4721142857142858e-05, + "loss": 0.3491, + "step": 23130 + }, + { + "epoch": 321.39, + "learning_rate": 1.4709714285714287e-05, + "loss": 0.32, + "step": 23140 + }, + { + "epoch": 321.53, + "learning_rate": 1.4698285714285715e-05, + "loss": 0.3389, + "step": 23150 + }, + { + "epoch": 321.66, + "learning_rate": 1.4686857142857145e-05, + "loss": 0.3482, + "step": 23160 + }, + { + "epoch": 321.8, + "learning_rate": 1.4675428571428572e-05, + "loss": 0.33, + "step": 23170 + }, + { + "epoch": 321.94, + "learning_rate": 1.4664e-05, + "loss": 0.3372, + "step": 23180 + }, + { + "epoch": 322.0, + "eval_loss": 0.5647508502006531, + "eval_runtime": 127.6044, + "eval_samples_per_second": 4.169, + "eval_steps_per_second": 0.525, + "eval_wer": 0.22292215722825737, + "step": 23184 + }, + { + "epoch": 322.08, + "learning_rate": 1.4652571428571429e-05, + "loss": 0.3334, + "step": 23190 + }, + { + "epoch": 322.22, + "learning_rate": 1.4641142857142857e-05, + "loss": 0.3449, + "step": 23200 + }, + { + "epoch": 322.36, + "learning_rate": 1.4629714285714288e-05, + "loss": 0.3284, + "step": 23210 + }, + { + "epoch": 322.5, + "learning_rate": 1.4618285714285716e-05, + "loss": 0.3308, + "step": 23220 + }, + { + "epoch": 322.64, + "learning_rate": 1.4606857142857144e-05, + "loss": 0.3286, + "step": 23230 + }, + { + "epoch": 322.78, + "learning_rate": 1.4595428571428575e-05, + "loss": 0.3345, + "step": 23240 + }, + { + "epoch": 322.91, + "learning_rate": 1.4584e-05, + "loss": 0.3291, + "step": 23250 + }, + { + "epoch": 323.0, + "eval_loss": 0.555727481842041, + "eval_runtime": 127.552, + "eval_samples_per_second": 4.171, + "eval_steps_per_second": 0.525, + "eval_wer": 0.21385871311949606, + "step": 23256 + }, + { + "epoch": 323.06, + "learning_rate": 1.457257142857143e-05, + "loss": 0.3346, + "step": 23260 + }, + { + "epoch": 323.19, + "learning_rate": 1.4561142857142858e-05, + "loss": 0.3224, + "step": 23270 + }, + { + "epoch": 323.33, + "learning_rate": 1.4549714285714287e-05, + "loss": 0.3317, + "step": 23280 + }, + { + "epoch": 323.47, + "learning_rate": 1.4538285714285715e-05, + "loss": 0.3316, + "step": 23290 + }, + { + "epoch": 323.61, + "learning_rate": 1.4526857142857145e-05, + "loss": 0.3284, + "step": 23300 + }, + { + "epoch": 323.75, + "learning_rate": 1.4515428571428574e-05, + "loss": 0.3267, + "step": 23310 + }, + { + "epoch": 323.89, + "learning_rate": 1.4504e-05, + "loss": 0.3345, + "step": 23320 + }, + { + "epoch": 324.0, + "eval_loss": 0.5677399635314941, + "eval_runtime": 127.6647, + "eval_samples_per_second": 4.167, + "eval_steps_per_second": 0.525, + "eval_wer": 0.2223436395191875, + "step": 23328 + }, + { + "epoch": 324.03, + "learning_rate": 1.4492571428571429e-05, + "loss": 0.3446, + "step": 23330 + }, + { + "epoch": 324.17, + "learning_rate": 1.4481142857142857e-05, + "loss": 0.3338, + "step": 23340 + }, + { + "epoch": 324.3, + "learning_rate": 1.4469714285714287e-05, + "loss": 0.3203, + "step": 23350 + }, + { + "epoch": 324.44, + "learning_rate": 1.4458285714285716e-05, + "loss": 0.3417, + "step": 23360 + }, + { + "epoch": 324.58, + "learning_rate": 1.4446857142857144e-05, + "loss": 0.319, + "step": 23370 + }, + { + "epoch": 324.72, + "learning_rate": 1.4435428571428574e-05, + "loss": 0.3321, + "step": 23380 + }, + { + "epoch": 324.86, + "learning_rate": 1.4424e-05, + "loss": 0.3151, + "step": 23390 + }, + { + "epoch": 325.0, + "learning_rate": 1.441257142857143e-05, + "loss": 0.3303, + "step": 23400 + }, + { + "epoch": 325.0, + "eval_loss": 0.5585859417915344, + "eval_runtime": 127.7156, + "eval_samples_per_second": 4.166, + "eval_steps_per_second": 0.525, + "eval_wer": 0.2150157485376358, + "step": 23400 + }, + { + "epoch": 325.14, + "learning_rate": 1.4401142857142858e-05, + "loss": 0.341, + "step": 23410 + }, + { + "epoch": 325.28, + "learning_rate": 1.4389714285714286e-05, + "loss": 0.3334, + "step": 23420 + }, + { + "epoch": 325.42, + "learning_rate": 1.4378285714285715e-05, + "loss": 0.3287, + "step": 23430 + }, + { + "epoch": 325.55, + "learning_rate": 1.4366857142857145e-05, + "loss": 0.3258, + "step": 23440 + }, + { + "epoch": 325.69, + "learning_rate": 1.4355428571428573e-05, + "loss": 0.3344, + "step": 23450 + }, + { + "epoch": 325.83, + "learning_rate": 1.4344e-05, + "loss": 0.3318, + "step": 23460 + }, + { + "epoch": 325.97, + "learning_rate": 1.4332571428571429e-05, + "loss": 0.343, + "step": 23470 + }, + { + "epoch": 326.0, + "eval_loss": 0.5558550953865051, + "eval_runtime": 127.9938, + "eval_samples_per_second": 4.156, + "eval_steps_per_second": 0.523, + "eval_wer": 0.21822973581024618, + "step": 23472 + }, + { + "epoch": 326.11, + "learning_rate": 1.4321142857142857e-05, + "loss": 0.3335, + "step": 23480 + }, + { + "epoch": 326.25, + "learning_rate": 1.4309714285714287e-05, + "loss": 0.3411, + "step": 23490 + }, + { + "epoch": 326.39, + "learning_rate": 1.4298285714285716e-05, + "loss": 0.334, + "step": 23500 + }, + { + "epoch": 326.53, + "learning_rate": 1.4286857142857144e-05, + "loss": 0.3205, + "step": 23510 + }, + { + "epoch": 326.66, + "learning_rate": 1.4275428571428574e-05, + "loss": 0.3226, + "step": 23520 + }, + { + "epoch": 326.8, + "learning_rate": 1.4264e-05, + "loss": 0.3273, + "step": 23530 + }, + { + "epoch": 326.94, + "learning_rate": 1.425257142857143e-05, + "loss": 0.3436, + "step": 23540 + }, + { + "epoch": 327.0, + "eval_loss": 0.5748257040977478, + "eval_runtime": 127.5951, + "eval_samples_per_second": 4.169, + "eval_steps_per_second": 0.525, + "eval_wer": 0.2199010091920036, + "step": 23544 + }, + { + "epoch": 327.08, + "learning_rate": 1.4241142857142858e-05, + "loss": 0.3449, + "step": 23550 + }, + { + "epoch": 327.22, + "learning_rate": 1.4229714285714286e-05, + "loss": 0.3412, + "step": 23560 + }, + { + "epoch": 327.36, + "learning_rate": 1.4218285714285715e-05, + "loss": 0.3231, + "step": 23570 + }, + { + "epoch": 327.5, + "learning_rate": 1.4206857142857145e-05, + "loss": 0.3366, + "step": 23580 + }, + { + "epoch": 327.64, + "learning_rate": 1.4195428571428573e-05, + "loss": 0.3283, + "step": 23590 + }, + { + "epoch": 327.78, + "learning_rate": 1.4184000000000002e-05, + "loss": 0.3284, + "step": 23600 + }, + { + "epoch": 327.91, + "learning_rate": 1.4172571428571429e-05, + "loss": 0.324, + "step": 23610 + }, + { + "epoch": 328.0, + "eval_loss": 0.5584424138069153, + "eval_runtime": 127.1801, + "eval_samples_per_second": 4.183, + "eval_steps_per_second": 0.527, + "eval_wer": 0.2128302371922607, + "step": 23616 + }, + { + "epoch": 328.06, + "learning_rate": 1.4161142857142857e-05, + "loss": 0.338, + "step": 23620 + }, + { + "epoch": 328.19, + "learning_rate": 1.4149714285714287e-05, + "loss": 0.3203, + "step": 23630 + }, + { + "epoch": 328.33, + "learning_rate": 1.4138285714285716e-05, + "loss": 0.3182, + "step": 23640 + }, + { + "epoch": 328.47, + "learning_rate": 1.4126857142857144e-05, + "loss": 0.3251, + "step": 23650 + }, + { + "epoch": 328.61, + "learning_rate": 1.4115428571428574e-05, + "loss": 0.3325, + "step": 23660 + }, + { + "epoch": 328.75, + "learning_rate": 1.4104000000000003e-05, + "loss": 0.3329, + "step": 23670 + }, + { + "epoch": 328.89, + "learning_rate": 1.409257142857143e-05, + "loss": 0.3175, + "step": 23680 + }, + { + "epoch": 329.0, + "eval_loss": 0.5570225715637207, + "eval_runtime": 127.2058, + "eval_samples_per_second": 4.182, + "eval_steps_per_second": 0.527, + "eval_wer": 0.2157871054830623, + "step": 23688 + }, + { + "epoch": 329.03, + "learning_rate": 1.4081142857142858e-05, + "loss": 0.3433, + "step": 23690 + }, + { + "epoch": 329.17, + "learning_rate": 1.4069714285714286e-05, + "loss": 0.3385, + "step": 23700 + }, + { + "epoch": 329.3, + "learning_rate": 1.4058285714285715e-05, + "loss": 0.3192, + "step": 23710 + }, + { + "epoch": 329.44, + "learning_rate": 1.4046857142857145e-05, + "loss": 0.3262, + "step": 23720 + }, + { + "epoch": 329.58, + "learning_rate": 1.4035428571428573e-05, + "loss": 0.3379, + "step": 23730 + }, + { + "epoch": 329.72, + "learning_rate": 1.4024000000000002e-05, + "loss": 0.3397, + "step": 23740 + }, + { + "epoch": 329.86, + "learning_rate": 1.4012571428571428e-05, + "loss": 0.3311, + "step": 23750 + }, + { + "epoch": 330.0, + "learning_rate": 1.4001142857142857e-05, + "loss": 0.3305, + "step": 23760 + }, + { + "epoch": 330.0, + "eval_loss": 0.5594530701637268, + "eval_runtime": 127.7532, + "eval_samples_per_second": 4.164, + "eval_steps_per_second": 0.524, + "eval_wer": 0.21790833708298515, + "step": 23760 + }, + { + "epoch": 330.14, + "learning_rate": 1.3989714285714287e-05, + "loss": 0.3316, + "step": 23770 + }, + { + "epoch": 330.28, + "learning_rate": 1.3978285714285715e-05, + "loss": 0.3227, + "step": 23780 + }, + { + "epoch": 330.42, + "learning_rate": 1.3966857142857144e-05, + "loss": 0.3352, + "step": 23790 + }, + { + "epoch": 330.55, + "learning_rate": 1.3955428571428574e-05, + "loss": 0.324, + "step": 23800 + }, + { + "epoch": 330.69, + "learning_rate": 1.3944000000000002e-05, + "loss": 0.3255, + "step": 23810 + }, + { + "epoch": 330.83, + "learning_rate": 1.3932571428571429e-05, + "loss": 0.3217, + "step": 23820 + }, + { + "epoch": 330.97, + "learning_rate": 1.3921142857142858e-05, + "loss": 0.3316, + "step": 23830 + }, + { + "epoch": 331.0, + "eval_loss": 0.5309335589408875, + "eval_runtime": 127.3837, + "eval_samples_per_second": 4.176, + "eval_steps_per_second": 0.526, + "eval_wer": 0.21700842064665424, + "step": 23832 + }, + { + "epoch": 331.11, + "learning_rate": 1.3909714285714286e-05, + "loss": 0.3223, + "step": 23840 + }, + { + "epoch": 331.25, + "learning_rate": 1.3898285714285716e-05, + "loss": 0.3284, + "step": 23850 + }, + { + "epoch": 331.39, + "learning_rate": 1.3886857142857145e-05, + "loss": 0.3193, + "step": 23860 + }, + { + "epoch": 331.53, + "learning_rate": 1.3875428571428573e-05, + "loss": 0.3327, + "step": 23870 + }, + { + "epoch": 331.66, + "learning_rate": 1.3864000000000001e-05, + "loss": 0.3193, + "step": 23880 + }, + { + "epoch": 331.8, + "learning_rate": 1.3852571428571432e-05, + "loss": 0.3252, + "step": 23890 + }, + { + "epoch": 331.94, + "learning_rate": 1.3841142857142857e-05, + "loss": 0.3322, + "step": 23900 + }, + { + "epoch": 332.0, + "eval_loss": 0.5475938320159912, + "eval_runtime": 127.9497, + "eval_samples_per_second": 4.158, + "eval_steps_per_second": 0.524, + "eval_wer": 0.22009384842836022, + "step": 23904 + }, + { + "epoch": 332.08, + "learning_rate": 1.3829714285714287e-05, + "loss": 0.3417, + "step": 23910 + }, + { + "epoch": 332.22, + "learning_rate": 1.3818285714285715e-05, + "loss": 0.3227, + "step": 23920 + }, + { + "epoch": 332.36, + "learning_rate": 1.3806857142857144e-05, + "loss": 0.3176, + "step": 23930 + }, + { + "epoch": 332.5, + "learning_rate": 1.3795428571428574e-05, + "loss": 0.3267, + "step": 23940 + }, + { + "epoch": 332.64, + "learning_rate": 1.3784000000000002e-05, + "loss": 0.3202, + "step": 23950 + }, + { + "epoch": 332.78, + "learning_rate": 1.377257142857143e-05, + "loss": 0.3121, + "step": 23960 + }, + { + "epoch": 332.91, + "learning_rate": 1.3761142857142857e-05, + "loss": 0.3379, + "step": 23970 + }, + { + "epoch": 333.0, + "eval_loss": 0.5637117624282837, + "eval_runtime": 127.3877, + "eval_samples_per_second": 4.176, + "eval_steps_per_second": 0.526, + "eval_wer": 0.21604422446487112, + "step": 23976 + }, + { + "epoch": 333.06, + "learning_rate": 1.3749714285714286e-05, + "loss": 0.3446, + "step": 23980 + }, + { + "epoch": 333.19, + "learning_rate": 1.3738285714285716e-05, + "loss": 0.3324, + "step": 23990 + }, + { + "epoch": 333.33, + "learning_rate": 1.3726857142857144e-05, + "loss": 0.3264, + "step": 24000 + }, + { + "epoch": 333.47, + "learning_rate": 1.3715428571428573e-05, + "loss": 0.3208, + "step": 24010 + }, + { + "epoch": 333.61, + "learning_rate": 1.3704000000000001e-05, + "loss": 0.3104, + "step": 24020 + }, + { + "epoch": 333.75, + "learning_rate": 1.3692571428571431e-05, + "loss": 0.3336, + "step": 24030 + }, + { + "epoch": 333.89, + "learning_rate": 1.3681142857142856e-05, + "loss": 0.3282, + "step": 24040 + }, + { + "epoch": 334.0, + "eval_loss": 0.5670413970947266, + "eval_runtime": 127.062, + "eval_samples_per_second": 4.187, + "eval_steps_per_second": 0.527, + "eval_wer": 0.21822973581024618, + "step": 24048 + }, + { + "epoch": 334.03, + "learning_rate": 1.3669714285714287e-05, + "loss": 0.3274, + "step": 24050 + }, + { + "epoch": 334.17, + "learning_rate": 1.3658285714285715e-05, + "loss": 0.3227, + "step": 24060 + }, + { + "epoch": 334.3, + "learning_rate": 1.3646857142857143e-05, + "loss": 0.3264, + "step": 24070 + }, + { + "epoch": 334.44, + "learning_rate": 1.3635428571428574e-05, + "loss": 0.3308, + "step": 24080 + }, + { + "epoch": 334.58, + "learning_rate": 1.3624000000000002e-05, + "loss": 0.3272, + "step": 24090 + }, + { + "epoch": 334.72, + "learning_rate": 1.361257142857143e-05, + "loss": 0.3256, + "step": 24100 + }, + { + "epoch": 334.86, + "learning_rate": 1.3601142857142857e-05, + "loss": 0.3057, + "step": 24110 + }, + { + "epoch": 335.0, + "learning_rate": 1.3589714285714286e-05, + "loss": 0.3155, + "step": 24120 + }, + { + "epoch": 335.0, + "eval_loss": 0.5686081051826477, + "eval_runtime": 127.733, + "eval_samples_per_second": 4.165, + "eval_steps_per_second": 0.525, + "eval_wer": 0.22054380664652568, + "step": 24120 + }, + { + "epoch": 335.14, + "learning_rate": 1.3578285714285716e-05, + "loss": 0.3224, + "step": 24130 + }, + { + "epoch": 335.28, + "learning_rate": 1.3566857142857144e-05, + "loss": 0.3217, + "step": 24140 + }, + { + "epoch": 335.42, + "learning_rate": 1.3555428571428573e-05, + "loss": 0.3179, + "step": 24150 + }, + { + "epoch": 335.55, + "learning_rate": 1.3544000000000001e-05, + "loss": 0.3224, + "step": 24160 + }, + { + "epoch": 335.69, + "learning_rate": 1.3532571428571431e-05, + "loss": 0.3187, + "step": 24170 + }, + { + "epoch": 335.83, + "learning_rate": 1.352114285714286e-05, + "loss": 0.3175, + "step": 24180 + }, + { + "epoch": 335.97, + "learning_rate": 1.3509714285714286e-05, + "loss": 0.3426, + "step": 24190 + }, + { + "epoch": 336.0, + "eval_loss": 0.5574333071708679, + "eval_runtime": 127.5728, + "eval_samples_per_second": 4.17, + "eval_steps_per_second": 0.525, + "eval_wer": 0.21597994471941892, + "step": 24192 + }, + { + "epoch": 336.11, + "learning_rate": 1.3498285714285715e-05, + "loss": 0.3233, + "step": 24200 + }, + { + "epoch": 336.25, + "learning_rate": 1.3486857142857143e-05, + "loss": 0.3219, + "step": 24210 + }, + { + "epoch": 336.39, + "learning_rate": 1.3475428571428573e-05, + "loss": 0.3117, + "step": 24220 + }, + { + "epoch": 336.53, + "learning_rate": 1.3464000000000002e-05, + "loss": 0.3291, + "step": 24230 + }, + { + "epoch": 336.66, + "learning_rate": 1.345257142857143e-05, + "loss": 0.3261, + "step": 24240 + }, + { + "epoch": 336.8, + "learning_rate": 1.3441142857142859e-05, + "loss": 0.3171, + "step": 24250 + }, + { + "epoch": 336.94, + "learning_rate": 1.3429714285714285e-05, + "loss": 0.3138, + "step": 24260 + }, + { + "epoch": 337.0, + "eval_loss": 0.5815868973731995, + "eval_runtime": 127.1979, + "eval_samples_per_second": 4.182, + "eval_steps_per_second": 0.527, + "eval_wer": 0.2190010927556727, + "step": 24264 + }, + { + "epoch": 337.08, + "learning_rate": 1.3418285714285716e-05, + "loss": 0.3125, + "step": 24270 + }, + { + "epoch": 337.22, + "learning_rate": 1.3406857142857144e-05, + "loss": 0.3294, + "step": 24280 + }, + { + "epoch": 337.36, + "learning_rate": 1.3395428571428573e-05, + "loss": 0.3145, + "step": 24290 + }, + { + "epoch": 337.5, + "learning_rate": 1.3384000000000001e-05, + "loss": 0.3231, + "step": 24300 + }, + { + "epoch": 337.64, + "learning_rate": 1.3372571428571431e-05, + "loss": 0.3118, + "step": 24310 + }, + { + "epoch": 337.78, + "learning_rate": 1.336114285714286e-05, + "loss": 0.3183, + "step": 24320 + }, + { + "epoch": 337.91, + "learning_rate": 1.3349714285714286e-05, + "loss": 0.3218, + "step": 24330 + }, + { + "epoch": 338.0, + "eval_loss": 0.5863565802574158, + "eval_runtime": 128.2708, + "eval_samples_per_second": 4.147, + "eval_steps_per_second": 0.522, + "eval_wer": 0.22285787748280517, + "step": 24336 + }, + { + "epoch": 338.06, + "learning_rate": 1.3338285714285715e-05, + "loss": 0.3329, + "step": 24340 + }, + { + "epoch": 338.19, + "learning_rate": 1.3326857142857143e-05, + "loss": 0.3213, + "step": 24350 + }, + { + "epoch": 338.33, + "learning_rate": 1.3315428571428573e-05, + "loss": 0.3165, + "step": 24360 + }, + { + "epoch": 338.47, + "learning_rate": 1.3304000000000002e-05, + "loss": 0.3277, + "step": 24370 + }, + { + "epoch": 338.61, + "learning_rate": 1.329257142857143e-05, + "loss": 0.3105, + "step": 24380 + }, + { + "epoch": 338.75, + "learning_rate": 1.3281142857142859e-05, + "loss": 0.315, + "step": 24390 + }, + { + "epoch": 338.89, + "learning_rate": 1.3269714285714285e-05, + "loss": 0.3235, + "step": 24400 + }, + { + "epoch": 339.0, + "eval_loss": 0.5692674517631531, + "eval_runtime": 128.01, + "eval_samples_per_second": 4.156, + "eval_steps_per_second": 0.523, + "eval_wer": 0.22260075850099634, + "step": 24408 + }, + { + "epoch": 339.03, + "learning_rate": 1.3258285714285715e-05, + "loss": 0.3363, + "step": 24410 + }, + { + "epoch": 339.17, + "learning_rate": 1.3246857142857144e-05, + "loss": 0.3169, + "step": 24420 + }, + { + "epoch": 339.3, + "learning_rate": 1.3235428571428572e-05, + "loss": 0.3278, + "step": 24430 + }, + { + "epoch": 339.44, + "learning_rate": 1.3224e-05, + "loss": 0.3236, + "step": 24440 + }, + { + "epoch": 339.58, + "learning_rate": 1.3212571428571431e-05, + "loss": 0.3261, + "step": 24450 + }, + { + "epoch": 339.72, + "learning_rate": 1.320114285714286e-05, + "loss": 0.331, + "step": 24460 + }, + { + "epoch": 339.86, + "learning_rate": 1.3189714285714286e-05, + "loss": 0.321, + "step": 24470 + }, + { + "epoch": 340.0, + "learning_rate": 1.3178285714285715e-05, + "loss": 0.3247, + "step": 24480 + }, + { + "epoch": 340.0, + "eval_loss": 0.5936774015426636, + "eval_runtime": 127.2173, + "eval_samples_per_second": 4.182, + "eval_steps_per_second": 0.527, + "eval_wer": 0.2264575432281288, + "step": 24480 + }, + { + "epoch": 340.14, + "learning_rate": 1.3166857142857143e-05, + "loss": 0.3354, + "step": 24490 + }, + { + "epoch": 340.28, + "learning_rate": 1.3155428571428573e-05, + "loss": 0.3189, + "step": 24500 + }, + { + "epoch": 340.42, + "learning_rate": 1.3144000000000002e-05, + "loss": 0.3363, + "step": 24510 + }, + { + "epoch": 340.55, + "learning_rate": 1.313257142857143e-05, + "loss": 0.3227, + "step": 24520 + }, + { + "epoch": 340.69, + "learning_rate": 1.3121142857142858e-05, + "loss": 0.3187, + "step": 24530 + }, + { + "epoch": 340.83, + "learning_rate": 1.3109714285714289e-05, + "loss": 0.31, + "step": 24540 + }, + { + "epoch": 340.97, + "learning_rate": 1.3098285714285715e-05, + "loss": 0.3189, + "step": 24550 + }, + { + "epoch": 341.0, + "eval_loss": 0.5748247504234314, + "eval_runtime": 127.3037, + "eval_samples_per_second": 4.179, + "eval_steps_per_second": 0.526, + "eval_wer": 0.22440059137365817, + "step": 24552 + }, + { + "epoch": 341.11, + "learning_rate": 1.3086857142857144e-05, + "loss": 0.3359, + "step": 24560 + }, + { + "epoch": 341.25, + "learning_rate": 1.3075428571428572e-05, + "loss": 0.3151, + "step": 24570 + }, + { + "epoch": 341.39, + "learning_rate": 1.3064e-05, + "loss": 0.3155, + "step": 24580 + }, + { + "epoch": 341.53, + "learning_rate": 1.305257142857143e-05, + "loss": 0.3176, + "step": 24590 + }, + { + "epoch": 341.66, + "learning_rate": 1.304114285714286e-05, + "loss": 0.323, + "step": 24600 + }, + { + "epoch": 341.8, + "learning_rate": 1.3029714285714288e-05, + "loss": 0.3086, + "step": 24610 + }, + { + "epoch": 341.94, + "learning_rate": 1.3018285714285714e-05, + "loss": 0.3131, + "step": 24620 + }, + { + "epoch": 342.0, + "eval_loss": 0.5739911198616028, + "eval_runtime": 126.6906, + "eval_samples_per_second": 4.199, + "eval_steps_per_second": 0.529, + "eval_wer": 0.21887253326476827, + "step": 24624 + }, + { + "epoch": 342.08, + "learning_rate": 1.3006857142857143e-05, + "loss": 0.3277, + "step": 24630 + }, + { + "epoch": 342.22, + "learning_rate": 1.2995428571428573e-05, + "loss": 0.329, + "step": 24640 + }, + { + "epoch": 342.36, + "learning_rate": 1.2984000000000001e-05, + "loss": 0.314, + "step": 24650 + }, + { + "epoch": 342.5, + "learning_rate": 1.297257142857143e-05, + "loss": 0.3283, + "step": 24660 + }, + { + "epoch": 342.64, + "learning_rate": 1.2961142857142858e-05, + "loss": 0.305, + "step": 24670 + }, + { + "epoch": 342.78, + "learning_rate": 1.2949714285714288e-05, + "loss": 0.3073, + "step": 24680 + }, + { + "epoch": 342.91, + "learning_rate": 1.2938285714285715e-05, + "loss": 0.3059, + "step": 24690 + }, + { + "epoch": 343.0, + "eval_loss": 0.5659681558609009, + "eval_runtime": 127.8792, + "eval_samples_per_second": 4.16, + "eval_steps_per_second": 0.524, + "eval_wer": 0.22060808639197788, + "step": 24696 + }, + { + "epoch": 343.06, + "learning_rate": 1.2926857142857144e-05, + "loss": 0.3219, + "step": 24700 + }, + { + "epoch": 343.19, + "learning_rate": 1.2915428571428572e-05, + "loss": 0.3166, + "step": 24710 + }, + { + "epoch": 343.33, + "learning_rate": 1.2904e-05, + "loss": 0.2995, + "step": 24720 + }, + { + "epoch": 343.47, + "learning_rate": 1.289257142857143e-05, + "loss": 0.3258, + "step": 24730 + }, + { + "epoch": 343.61, + "learning_rate": 1.2881142857142859e-05, + "loss": 0.3164, + "step": 24740 + }, + { + "epoch": 343.75, + "learning_rate": 1.2869714285714287e-05, + "loss": 0.3244, + "step": 24750 + }, + { + "epoch": 343.89, + "learning_rate": 1.2858285714285714e-05, + "loss": 0.313, + "step": 24760 + }, + { + "epoch": 344.0, + "eval_loss": 0.5701687335968018, + "eval_runtime": 126.9933, + "eval_samples_per_second": 4.189, + "eval_steps_per_second": 0.528, + "eval_wer": 0.2184225750466028, + "step": 24768 + }, + { + "epoch": 344.03, + "learning_rate": 1.2846857142857143e-05, + "loss": 0.3382, + "step": 24770 + }, + { + "epoch": 344.17, + "learning_rate": 1.2835428571428573e-05, + "loss": 0.3139, + "step": 24780 + }, + { + "epoch": 344.3, + "learning_rate": 1.2824000000000001e-05, + "loss": 0.3105, + "step": 24790 + }, + { + "epoch": 344.44, + "learning_rate": 1.281257142857143e-05, + "loss": 0.3246, + "step": 24800 + }, + { + "epoch": 344.58, + "learning_rate": 1.2801142857142858e-05, + "loss": 0.319, + "step": 24810 + }, + { + "epoch": 344.72, + "learning_rate": 1.2789714285714288e-05, + "loss": 0.327, + "step": 24820 + }, + { + "epoch": 344.86, + "learning_rate": 1.2778285714285717e-05, + "loss": 0.309, + "step": 24830 + }, + { + "epoch": 345.0, + "learning_rate": 1.2766857142857143e-05, + "loss": 0.3225, + "step": 24840 + }, + { + "epoch": 345.0, + "eval_loss": 0.5535494685173035, + "eval_runtime": 127.2337, + "eval_samples_per_second": 4.181, + "eval_steps_per_second": 0.527, + "eval_wer": 0.2190010927556727, + "step": 24840 + }, + { + "epoch": 345.14, + "learning_rate": 1.2755428571428572e-05, + "loss": 0.315, + "step": 24850 + }, + { + "epoch": 345.28, + "learning_rate": 1.2744e-05, + "loss": 0.3211, + "step": 24860 + }, + { + "epoch": 345.42, + "learning_rate": 1.273257142857143e-05, + "loss": 0.3284, + "step": 24870 + }, + { + "epoch": 345.55, + "learning_rate": 1.2721142857142859e-05, + "loss": 0.3073, + "step": 24880 + }, + { + "epoch": 345.69, + "learning_rate": 1.2709714285714287e-05, + "loss": 0.3138, + "step": 24890 + }, + { + "epoch": 345.83, + "learning_rate": 1.2698285714285716e-05, + "loss": 0.3164, + "step": 24900 + }, + { + "epoch": 345.97, + "learning_rate": 1.2686857142857142e-05, + "loss": 0.3145, + "step": 24910 + }, + { + "epoch": 346.0, + "eval_loss": 0.557106077671051, + "eval_runtime": 126.8039, + "eval_samples_per_second": 4.195, + "eval_steps_per_second": 0.528, + "eval_wer": 0.21630134344667995, + "step": 24912 + }, + { + "epoch": 346.11, + "learning_rate": 1.2675428571428573e-05, + "loss": 0.3095, + "step": 24920 + }, + { + "epoch": 346.25, + "learning_rate": 1.2664000000000001e-05, + "loss": 0.3195, + "step": 24930 + }, + { + "epoch": 346.39, + "learning_rate": 1.265257142857143e-05, + "loss": 0.308, + "step": 24940 + }, + { + "epoch": 346.53, + "learning_rate": 1.2641142857142858e-05, + "loss": 0.3259, + "step": 24950 + }, + { + "epoch": 346.66, + "learning_rate": 1.2629714285714288e-05, + "loss": 0.31, + "step": 24960 + }, + { + "epoch": 346.8, + "learning_rate": 1.2618285714285717e-05, + "loss": 0.2986, + "step": 24970 + }, + { + "epoch": 346.94, + "learning_rate": 1.2606857142857143e-05, + "loss": 0.3176, + "step": 24980 + }, + { + "epoch": 347.0, + "eval_loss": 0.5592583417892456, + "eval_runtime": 127.1696, + "eval_samples_per_second": 4.183, + "eval_steps_per_second": 0.527, + "eval_wer": 0.2157228257376101, + "step": 24984 + }, + { + "epoch": 347.08, + "learning_rate": 1.2595428571428572e-05, + "loss": 0.3141, + "step": 24990 + }, + { + "epoch": 347.22, + "learning_rate": 1.2584e-05, + "loss": 0.3057, + "step": 25000 + }, + { + "epoch": 347.36, + "learning_rate": 1.257257142857143e-05, + "loss": 0.3009, + "step": 25010 + }, + { + "epoch": 347.5, + "learning_rate": 1.2561142857142859e-05, + "loss": 0.321, + "step": 25020 + }, + { + "epoch": 347.64, + "learning_rate": 1.2549714285714287e-05, + "loss": 0.3198, + "step": 25030 + }, + { + "epoch": 347.78, + "learning_rate": 1.2538285714285716e-05, + "loss": 0.3112, + "step": 25040 + }, + { + "epoch": 347.91, + "learning_rate": 1.2526857142857142e-05, + "loss": 0.3288, + "step": 25050 + }, + { + "epoch": 348.0, + "eval_loss": 0.5682421326637268, + "eval_runtime": 127.5142, + "eval_samples_per_second": 4.172, + "eval_steps_per_second": 0.525, + "eval_wer": 0.22035096741016905, + "step": 25056 + }, + { + "epoch": 348.06, + "learning_rate": 1.2515428571428572e-05, + "loss": 0.3296, + "step": 25060 + }, + { + "epoch": 348.19, + "learning_rate": 1.2504000000000001e-05, + "loss": 0.3205, + "step": 25070 + }, + { + "epoch": 348.33, + "learning_rate": 1.249257142857143e-05, + "loss": 0.3197, + "step": 25080 + }, + { + "epoch": 348.47, + "learning_rate": 1.2481142857142858e-05, + "loss": 0.3178, + "step": 25090 + }, + { + "epoch": 348.61, + "learning_rate": 1.2469714285714288e-05, + "loss": 0.3292, + "step": 25100 + }, + { + "epoch": 348.75, + "learning_rate": 1.2458285714285716e-05, + "loss": 0.3191, + "step": 25110 + }, + { + "epoch": 348.89, + "learning_rate": 1.2446857142857145e-05, + "loss": 0.3154, + "step": 25120 + }, + { + "epoch": 349.0, + "eval_loss": 0.5349848866462708, + "eval_runtime": 127.1745, + "eval_samples_per_second": 4.183, + "eval_steps_per_second": 0.527, + "eval_wer": 0.2159156649739667, + "step": 25128 + }, + { + "epoch": 349.03, + "learning_rate": 1.2435428571428572e-05, + "loss": 0.337, + "step": 25130 + }, + { + "epoch": 349.17, + "learning_rate": 1.2424e-05, + "loss": 0.3103, + "step": 25140 + }, + { + "epoch": 349.3, + "learning_rate": 1.241257142857143e-05, + "loss": 0.3042, + "step": 25150 + }, + { + "epoch": 349.44, + "learning_rate": 1.2401142857142859e-05, + "loss": 0.3256, + "step": 25160 + }, + { + "epoch": 349.58, + "learning_rate": 1.2389714285714287e-05, + "loss": 0.3106, + "step": 25170 + }, + { + "epoch": 349.72, + "learning_rate": 1.2378285714285715e-05, + "loss": 0.3204, + "step": 25180 + }, + { + "epoch": 349.86, + "learning_rate": 1.2366857142857146e-05, + "loss": 0.3139, + "step": 25190 + }, + { + "epoch": 350.0, + "learning_rate": 1.2355428571428572e-05, + "loss": 0.3159, + "step": 25200 + }, + { + "epoch": 350.0, + "eval_loss": 0.5652676224708557, + "eval_runtime": 127.4724, + "eval_samples_per_second": 4.173, + "eval_steps_per_second": 0.526, + "eval_wer": 0.22035096741016905, + "step": 25200 + }, + { + "epoch": 350.14, + "learning_rate": 1.2344e-05, + "loss": 0.327, + "step": 25210 + }, + { + "epoch": 350.28, + "learning_rate": 1.233257142857143e-05, + "loss": 0.322, + "step": 25220 + }, + { + "epoch": 350.42, + "learning_rate": 1.2321142857142858e-05, + "loss": 0.313, + "step": 25230 + }, + { + "epoch": 350.55, + "learning_rate": 1.2309714285714288e-05, + "loss": 0.3005, + "step": 25240 + }, + { + "epoch": 350.69, + "learning_rate": 1.2298285714285716e-05, + "loss": 0.3246, + "step": 25250 + }, + { + "epoch": 350.83, + "learning_rate": 1.2286857142857145e-05, + "loss": 0.3184, + "step": 25260 + }, + { + "epoch": 350.97, + "learning_rate": 1.2275428571428571e-05, + "loss": 0.3029, + "step": 25270 + }, + { + "epoch": 351.0, + "eval_loss": 0.5536702871322632, + "eval_runtime": 127.3844, + "eval_samples_per_second": 4.176, + "eval_steps_per_second": 0.526, + "eval_wer": 0.21328019541042617, + "step": 25272 + }, + { + "epoch": 351.11, + "learning_rate": 1.2264e-05, + "loss": 0.3155, + "step": 25280 + }, + { + "epoch": 351.25, + "learning_rate": 1.225257142857143e-05, + "loss": 0.3209, + "step": 25290 + }, + { + "epoch": 351.39, + "learning_rate": 1.2241142857142858e-05, + "loss": 0.3118, + "step": 25300 + }, + { + "epoch": 351.53, + "learning_rate": 1.2229714285714287e-05, + "loss": 0.3052, + "step": 25310 + }, + { + "epoch": 351.66, + "learning_rate": 1.2218285714285715e-05, + "loss": 0.3203, + "step": 25320 + }, + { + "epoch": 351.8, + "learning_rate": 1.2206857142857145e-05, + "loss": 0.3159, + "step": 25330 + }, + { + "epoch": 351.94, + "learning_rate": 1.2195428571428572e-05, + "loss": 0.3177, + "step": 25340 + }, + { + "epoch": 352.0, + "eval_loss": 0.5842908024787903, + "eval_runtime": 128.0953, + "eval_samples_per_second": 4.153, + "eval_steps_per_second": 0.523, + "eval_wer": 0.21867969402841164, + "step": 25344 + }, + { + "epoch": 352.08, + "learning_rate": 1.2184e-05, + "loss": 0.326, + "step": 25350 + }, + { + "epoch": 352.22, + "learning_rate": 1.2172571428571429e-05, + "loss": 0.3209, + "step": 25360 + }, + { + "epoch": 352.36, + "learning_rate": 1.2161142857142857e-05, + "loss": 0.3155, + "step": 25370 + }, + { + "epoch": 352.5, + "learning_rate": 1.2149714285714288e-05, + "loss": 0.3216, + "step": 25380 + }, + { + "epoch": 352.64, + "learning_rate": 1.2138285714285716e-05, + "loss": 0.3237, + "step": 25390 + }, + { + "epoch": 352.78, + "learning_rate": 1.2126857142857144e-05, + "loss": 0.3122, + "step": 25400 + }, + { + "epoch": 352.91, + "learning_rate": 1.2115428571428571e-05, + "loss": 0.31, + "step": 25410 + }, + { + "epoch": 353.0, + "eval_loss": 0.559213399887085, + "eval_runtime": 127.4985, + "eval_samples_per_second": 4.173, + "eval_steps_per_second": 0.525, + "eval_wer": 0.21758693835572412, + "step": 25416 + }, + { + "epoch": 353.06, + "learning_rate": 1.2104e-05, + "loss": 0.3156, + "step": 25420 + }, + { + "epoch": 353.19, + "learning_rate": 1.209257142857143e-05, + "loss": 0.3105, + "step": 25430 + }, + { + "epoch": 353.33, + "learning_rate": 1.2081142857142858e-05, + "loss": 0.3049, + "step": 25440 + }, + { + "epoch": 353.47, + "learning_rate": 1.2069714285714287e-05, + "loss": 0.32, + "step": 25450 + }, + { + "epoch": 353.61, + "learning_rate": 1.2058285714285715e-05, + "loss": 0.3125, + "step": 25460 + }, + { + "epoch": 353.75, + "learning_rate": 1.2046857142857145e-05, + "loss": 0.316, + "step": 25470 + }, + { + "epoch": 353.89, + "learning_rate": 1.2035428571428574e-05, + "loss": 0.3008, + "step": 25480 + }, + { + "epoch": 354.0, + "eval_loss": 0.5820884108543396, + "eval_runtime": 127.4376, + "eval_samples_per_second": 4.175, + "eval_steps_per_second": 0.526, + "eval_wer": 0.2157228257376101, + "step": 25488 + }, + { + "epoch": 354.03, + "learning_rate": 1.2024e-05, + "loss": 0.3235, + "step": 25490 + }, + { + "epoch": 354.17, + "learning_rate": 1.2012571428571429e-05, + "loss": 0.3112, + "step": 25500 + }, + { + "epoch": 354.3, + "learning_rate": 1.2001142857142857e-05, + "loss": 0.312, + "step": 25510 + }, + { + "epoch": 354.44, + "learning_rate": 1.1989714285714287e-05, + "loss": 0.3179, + "step": 25520 + }, + { + "epoch": 354.58, + "learning_rate": 1.1978285714285716e-05, + "loss": 0.3225, + "step": 25530 + }, + { + "epoch": 354.72, + "learning_rate": 1.1966857142857144e-05, + "loss": 0.3127, + "step": 25540 + }, + { + "epoch": 354.86, + "learning_rate": 1.1955428571428573e-05, + "loss": 0.3099, + "step": 25550 + }, + { + "epoch": 355.0, + "learning_rate": 1.1944e-05, + "loss": 0.31, + "step": 25560 + }, + { + "epoch": 355.0, + "eval_loss": 0.5679353475570679, + "eval_runtime": 127.2089, + "eval_samples_per_second": 4.182, + "eval_steps_per_second": 0.527, + "eval_wer": 0.21392299286494826, + "step": 25560 + }, + { + "epoch": 355.14, + "learning_rate": 1.193257142857143e-05, + "loss": 0.3156, + "step": 25570 + }, + { + "epoch": 355.28, + "learning_rate": 1.1921142857142858e-05, + "loss": 0.3201, + "step": 25580 + }, + { + "epoch": 355.42, + "learning_rate": 1.1909714285714286e-05, + "loss": 0.3217, + "step": 25590 + }, + { + "epoch": 355.55, + "learning_rate": 1.1898285714285715e-05, + "loss": 0.296, + "step": 25600 + }, + { + "epoch": 355.69, + "learning_rate": 1.1888000000000002e-05, + "loss": 0.3064, + "step": 25610 + }, + { + "epoch": 355.83, + "learning_rate": 1.187657142857143e-05, + "loss": 0.3019, + "step": 25620 + }, + { + "epoch": 355.97, + "learning_rate": 1.1865142857142857e-05, + "loss": 0.311, + "step": 25630 + }, + { + "epoch": 356.0, + "eval_loss": 0.5527079701423645, + "eval_runtime": 127.5178, + "eval_samples_per_second": 4.172, + "eval_steps_per_second": 0.525, + "eval_wer": 0.2152085877739924, + "step": 25632 + }, + { + "epoch": 356.11, + "learning_rate": 1.1853714285714286e-05, + "loss": 0.3193, + "step": 25640 + }, + { + "epoch": 356.25, + "learning_rate": 1.1842285714285716e-05, + "loss": 0.3121, + "step": 25650 + }, + { + "epoch": 356.39, + "learning_rate": 1.1830857142857144e-05, + "loss": 0.3043, + "step": 25660 + }, + { + "epoch": 356.53, + "learning_rate": 1.1819428571428573e-05, + "loss": 0.3139, + "step": 25670 + }, + { + "epoch": 356.66, + "learning_rate": 1.1808000000000001e-05, + "loss": 0.3104, + "step": 25680 + }, + { + "epoch": 356.8, + "learning_rate": 1.1796571428571431e-05, + "loss": 0.3069, + "step": 25690 + }, + { + "epoch": 356.94, + "learning_rate": 1.1785142857142858e-05, + "loss": 0.3107, + "step": 25700 + }, + { + "epoch": 357.0, + "eval_loss": 0.5629017949104309, + "eval_runtime": 127.5742, + "eval_samples_per_second": 4.17, + "eval_steps_per_second": 0.525, + "eval_wer": 0.21475862955582695, + "step": 25704 + }, + { + "epoch": 357.08, + "learning_rate": 1.1773714285714286e-05, + "loss": 0.3196, + "step": 25710 + }, + { + "epoch": 357.22, + "learning_rate": 1.1762285714285715e-05, + "loss": 0.3103, + "step": 25720 + }, + { + "epoch": 357.36, + "learning_rate": 1.1750857142857143e-05, + "loss": 0.2973, + "step": 25730 + }, + { + "epoch": 357.5, + "learning_rate": 1.1739428571428573e-05, + "loss": 0.315, + "step": 25740 + }, + { + "epoch": 357.64, + "learning_rate": 1.1728000000000002e-05, + "loss": 0.3181, + "step": 25750 + }, + { + "epoch": 357.78, + "learning_rate": 1.171657142857143e-05, + "loss": 0.311, + "step": 25760 + }, + { + "epoch": 357.91, + "learning_rate": 1.1705142857142857e-05, + "loss": 0.3245, + "step": 25770 + }, + { + "epoch": 358.0, + "eval_loss": 0.5606277585029602, + "eval_runtime": 127.3828, + "eval_samples_per_second": 4.176, + "eval_steps_per_second": 0.526, + "eval_wer": 0.2142443915922093, + "step": 25776 + }, + { + "epoch": 358.06, + "learning_rate": 1.1693714285714286e-05, + "loss": 0.3183, + "step": 25780 + }, + { + "epoch": 358.19, + "learning_rate": 1.1682285714285716e-05, + "loss": 0.3092, + "step": 25790 + }, + { + "epoch": 358.33, + "learning_rate": 1.1670857142857144e-05, + "loss": 0.308, + "step": 25800 + }, + { + "epoch": 358.47, + "learning_rate": 1.1659428571428573e-05, + "loss": 0.3201, + "step": 25810 + }, + { + "epoch": 358.61, + "learning_rate": 1.1648000000000001e-05, + "loss": 0.3107, + "step": 25820 + }, + { + "epoch": 358.75, + "learning_rate": 1.1636571428571431e-05, + "loss": 0.3064, + "step": 25830 + }, + { + "epoch": 358.89, + "learning_rate": 1.1625142857142858e-05, + "loss": 0.3049, + "step": 25840 + }, + { + "epoch": 359.0, + "eval_loss": 0.561586320400238, + "eval_runtime": 127.7151, + "eval_samples_per_second": 4.166, + "eval_steps_per_second": 0.525, + "eval_wer": 0.21662274217394098, + "step": 25848 + }, + { + "epoch": 359.03, + "learning_rate": 1.1613714285714286e-05, + "loss": 0.3173, + "step": 25850 + }, + { + "epoch": 359.17, + "learning_rate": 1.1602285714285715e-05, + "loss": 0.3135, + "step": 25860 + }, + { + "epoch": 359.3, + "learning_rate": 1.1590857142857143e-05, + "loss": 0.3112, + "step": 25870 + }, + { + "epoch": 359.44, + "learning_rate": 1.1579428571428573e-05, + "loss": 0.3201, + "step": 25880 + }, + { + "epoch": 359.58, + "learning_rate": 1.1568000000000002e-05, + "loss": 0.3095, + "step": 25890 + }, + { + "epoch": 359.72, + "learning_rate": 1.155657142857143e-05, + "loss": 0.3046, + "step": 25900 + }, + { + "epoch": 359.86, + "learning_rate": 1.1545142857142857e-05, + "loss": 0.2984, + "step": 25910 + }, + { + "epoch": 360.0, + "learning_rate": 1.1533714285714285e-05, + "loss": 0.3176, + "step": 25920 + }, + { + "epoch": 360.0, + "eval_loss": 0.5738566517829895, + "eval_runtime": 127.7406, + "eval_samples_per_second": 4.165, + "eval_steps_per_second": 0.525, + "eval_wer": 0.2183582953011506, + "step": 25920 + }, + { + "epoch": 360.14, + "learning_rate": 1.1522285714285715e-05, + "loss": 0.3069, + "step": 25930 + }, + { + "epoch": 360.28, + "learning_rate": 1.1510857142857144e-05, + "loss": 0.3033, + "step": 25940 + }, + { + "epoch": 360.42, + "learning_rate": 1.1499428571428572e-05, + "loss": 0.3029, + "step": 25950 + }, + { + "epoch": 360.55, + "learning_rate": 1.1488e-05, + "loss": 0.3044, + "step": 25960 + }, + { + "epoch": 360.69, + "learning_rate": 1.1476571428571431e-05, + "loss": 0.3164, + "step": 25970 + }, + { + "epoch": 360.83, + "learning_rate": 1.146514285714286e-05, + "loss": 0.3017, + "step": 25980 + }, + { + "epoch": 360.97, + "learning_rate": 1.1453714285714286e-05, + "loss": 0.3159, + "step": 25990 + }, + { + "epoch": 361.0, + "eval_loss": 0.5599928498268127, + "eval_runtime": 127.1562, + "eval_samples_per_second": 4.184, + "eval_steps_per_second": 0.527, + "eval_wer": 0.21700842064665424, + "step": 25992 + }, + { + "epoch": 361.11, + "learning_rate": 1.1442285714285715e-05, + "loss": 0.3171, + "step": 26000 + }, + { + "epoch": 361.25, + "learning_rate": 1.1430857142857143e-05, + "loss": 0.3139, + "step": 26010 + }, + { + "epoch": 361.39, + "learning_rate": 1.1419428571428573e-05, + "loss": 0.3055, + "step": 26020 + }, + { + "epoch": 361.53, + "learning_rate": 1.1408000000000002e-05, + "loss": 0.3156, + "step": 26030 + }, + { + "epoch": 361.66, + "learning_rate": 1.139657142857143e-05, + "loss": 0.3168, + "step": 26040 + }, + { + "epoch": 361.8, + "learning_rate": 1.1385142857142858e-05, + "loss": 0.308, + "step": 26050 + }, + { + "epoch": 361.94, + "learning_rate": 1.1373714285714285e-05, + "loss": 0.3151, + "step": 26060 + }, + { + "epoch": 362.0, + "eval_loss": 0.5731268525123596, + "eval_runtime": 127.5452, + "eval_samples_per_second": 4.171, + "eval_steps_per_second": 0.525, + "eval_wer": 0.21732981937391527, + "step": 26064 + }, + { + "epoch": 362.08, + "learning_rate": 1.1362285714285715e-05, + "loss": 0.3227, + "step": 26070 + }, + { + "epoch": 362.22, + "learning_rate": 1.1350857142857144e-05, + "loss": 0.3123, + "step": 26080 + }, + { + "epoch": 362.36, + "learning_rate": 1.1339428571428572e-05, + "loss": 0.3087, + "step": 26090 + }, + { + "epoch": 362.5, + "learning_rate": 1.1328e-05, + "loss": 0.3093, + "step": 26100 + }, + { + "epoch": 362.64, + "learning_rate": 1.131657142857143e-05, + "loss": 0.2948, + "step": 26110 + }, + { + "epoch": 362.78, + "learning_rate": 1.130514285714286e-05, + "loss": 0.3202, + "step": 26120 + }, + { + "epoch": 362.91, + "learning_rate": 1.1293714285714286e-05, + "loss": 0.3087, + "step": 26130 + }, + { + "epoch": 363.0, + "eval_loss": 0.561343789100647, + "eval_runtime": 127.1289, + "eval_samples_per_second": 4.185, + "eval_steps_per_second": 0.527, + "eval_wer": 0.2168155814102976, + "step": 26136 + }, + { + "epoch": 363.06, + "learning_rate": 1.1282285714285714e-05, + "loss": 0.3233, + "step": 26140 + }, + { + "epoch": 363.19, + "learning_rate": 1.1270857142857143e-05, + "loss": 0.3135, + "step": 26150 + }, + { + "epoch": 363.33, + "learning_rate": 1.1259428571428573e-05, + "loss": 0.3076, + "step": 26160 + }, + { + "epoch": 363.47, + "learning_rate": 1.1248000000000001e-05, + "loss": 0.3142, + "step": 26170 + }, + { + "epoch": 363.61, + "learning_rate": 1.123657142857143e-05, + "loss": 0.2967, + "step": 26180 + }, + { + "epoch": 363.75, + "learning_rate": 1.1225142857142858e-05, + "loss": 0.3211, + "step": 26190 + }, + { + "epoch": 363.89, + "learning_rate": 1.1213714285714285e-05, + "loss": 0.3096, + "step": 26200 + }, + { + "epoch": 364.0, + "eval_loss": 0.5749143362045288, + "eval_runtime": 127.1039, + "eval_samples_per_second": 4.186, + "eval_steps_per_second": 0.527, + "eval_wer": 0.22215080028283088, + "step": 26208 + }, + { + "epoch": 364.03, + "learning_rate": 1.1202285714285715e-05, + "loss": 0.3153, + "step": 26210 + }, + { + "epoch": 364.17, + "learning_rate": 1.1190857142857144e-05, + "loss": 0.3128, + "step": 26220 + }, + { + "epoch": 364.3, + "learning_rate": 1.1179428571428572e-05, + "loss": 0.3177, + "step": 26230 + }, + { + "epoch": 364.44, + "learning_rate": 1.1168e-05, + "loss": 0.3111, + "step": 26240 + }, + { + "epoch": 364.58, + "learning_rate": 1.115657142857143e-05, + "loss": 0.3035, + "step": 26250 + }, + { + "epoch": 364.72, + "learning_rate": 1.1145142857142859e-05, + "loss": 0.3091, + "step": 26260 + }, + { + "epoch": 364.86, + "learning_rate": 1.1133714285714287e-05, + "loss": 0.2928, + "step": 26270 + }, + { + "epoch": 365.0, + "learning_rate": 1.1122285714285714e-05, + "loss": 0.3036, + "step": 26280 + }, + { + "epoch": 365.0, + "eval_loss": 0.5757818222045898, + "eval_runtime": 127.8972, + "eval_samples_per_second": 4.16, + "eval_steps_per_second": 0.524, + "eval_wer": 0.21315163591952177, + "step": 26280 + }, + { + "epoch": 365.14, + "learning_rate": 1.1110857142857143e-05, + "loss": 0.3134, + "step": 26290 + }, + { + "epoch": 365.28, + "learning_rate": 1.1099428571428573e-05, + "loss": 0.3114, + "step": 26300 + }, + { + "epoch": 365.42, + "learning_rate": 1.1088000000000001e-05, + "loss": 0.3012, + "step": 26310 + }, + { + "epoch": 365.55, + "learning_rate": 1.107657142857143e-05, + "loss": 0.3032, + "step": 26320 + }, + { + "epoch": 365.69, + "learning_rate": 1.1065142857142858e-05, + "loss": 0.31, + "step": 26330 + }, + { + "epoch": 365.83, + "learning_rate": 1.1053714285714288e-05, + "loss": 0.302, + "step": 26340 + }, + { + "epoch": 365.97, + "learning_rate": 1.1042285714285715e-05, + "loss": 0.3119, + "step": 26350 + }, + { + "epoch": 366.0, + "eval_loss": 0.5846285820007324, + "eval_runtime": 127.2101, + "eval_samples_per_second": 4.182, + "eval_steps_per_second": 0.527, + "eval_wer": 0.2190010927556727, + "step": 26352 + }, + { + "epoch": 366.11, + "learning_rate": 1.1030857142857143e-05, + "loss": 0.3134, + "step": 26360 + }, + { + "epoch": 366.25, + "learning_rate": 1.1019428571428572e-05, + "loss": 0.3165, + "step": 26370 + }, + { + "epoch": 366.39, + "learning_rate": 1.1008e-05, + "loss": 0.2971, + "step": 26380 + }, + { + "epoch": 366.53, + "learning_rate": 1.099657142857143e-05, + "loss": 0.3045, + "step": 26390 + }, + { + "epoch": 366.66, + "learning_rate": 1.0985142857142859e-05, + "loss": 0.3027, + "step": 26400 + }, + { + "epoch": 366.8, + "learning_rate": 1.0973714285714287e-05, + "loss": 0.3028, + "step": 26410 + }, + { + "epoch": 366.94, + "learning_rate": 1.0962285714285714e-05, + "loss": 0.3114, + "step": 26420 + }, + { + "epoch": 367.0, + "eval_loss": 0.5844096541404724, + "eval_runtime": 127.3965, + "eval_samples_per_second": 4.176, + "eval_steps_per_second": 0.526, + "eval_wer": 0.2118017612650254, + "step": 26424 + }, + { + "epoch": 367.08, + "learning_rate": 1.0950857142857143e-05, + "loss": 0.3128, + "step": 26430 + }, + { + "epoch": 367.22, + "learning_rate": 1.0939428571428573e-05, + "loss": 0.3174, + "step": 26440 + }, + { + "epoch": 367.36, + "learning_rate": 1.0928000000000001e-05, + "loss": 0.2992, + "step": 26450 + }, + { + "epoch": 367.5, + "learning_rate": 1.091657142857143e-05, + "loss": 0.3083, + "step": 26460 + }, + { + "epoch": 367.64, + "learning_rate": 1.0905142857142858e-05, + "loss": 0.3001, + "step": 26470 + }, + { + "epoch": 367.78, + "learning_rate": 1.0893714285714288e-05, + "loss": 0.2972, + "step": 26480 + }, + { + "epoch": 367.91, + "learning_rate": 1.0882285714285715e-05, + "loss": 0.2967, + "step": 26490 + }, + { + "epoch": 368.0, + "eval_loss": 0.5493323802947998, + "eval_runtime": 127.7103, + "eval_samples_per_second": 4.166, + "eval_steps_per_second": 0.525, + "eval_wer": 0.21488718904673137, + "step": 26496 + }, + { + "epoch": 368.06, + "learning_rate": 1.0870857142857143e-05, + "loss": 0.3151, + "step": 26500 + }, + { + "epoch": 368.19, + "learning_rate": 1.0859428571428572e-05, + "loss": 0.3126, + "step": 26510 + }, + { + "epoch": 368.33, + "learning_rate": 1.0848e-05, + "loss": 0.2982, + "step": 26520 + }, + { + "epoch": 368.47, + "learning_rate": 1.083657142857143e-05, + "loss": 0.3047, + "step": 26530 + }, + { + "epoch": 368.61, + "learning_rate": 1.0825142857142859e-05, + "loss": 0.3113, + "step": 26540 + }, + { + "epoch": 368.75, + "learning_rate": 1.0813714285714287e-05, + "loss": 0.3079, + "step": 26550 + }, + { + "epoch": 368.89, + "learning_rate": 1.0802285714285716e-05, + "loss": 0.2968, + "step": 26560 + }, + { + "epoch": 369.0, + "eval_loss": 0.5780913829803467, + "eval_runtime": 127.2345, + "eval_samples_per_second": 4.181, + "eval_steps_per_second": 0.527, + "eval_wer": 0.21392299286494826, + "step": 26568 + }, + { + "epoch": 369.03, + "learning_rate": 1.0790857142857142e-05, + "loss": 0.3115, + "step": 26570 + }, + { + "epoch": 369.17, + "learning_rate": 1.0779428571428572e-05, + "loss": 0.3035, + "step": 26580 + }, + { + "epoch": 369.3, + "learning_rate": 1.0768000000000001e-05, + "loss": 0.3111, + "step": 26590 + }, + { + "epoch": 369.44, + "learning_rate": 1.075657142857143e-05, + "loss": 0.3215, + "step": 26600 + }, + { + "epoch": 369.58, + "learning_rate": 1.0745142857142858e-05, + "loss": 0.3022, + "step": 26610 + }, + { + "epoch": 369.72, + "learning_rate": 1.0733714285714288e-05, + "loss": 0.3108, + "step": 26620 + }, + { + "epoch": 369.86, + "learning_rate": 1.0722285714285716e-05, + "loss": 0.3085, + "step": 26630 + }, + { + "epoch": 370.0, + "learning_rate": 1.0710857142857143e-05, + "loss": 0.3074, + "step": 26640 + }, + { + "epoch": 370.0, + "eval_loss": 0.5902389287948608, + "eval_runtime": 127.1766, + "eval_samples_per_second": 4.183, + "eval_steps_per_second": 0.527, + "eval_wer": 0.21925821173748153, + "step": 26640 + }, + { + "epoch": 370.14, + "learning_rate": 1.0699428571428572e-05, + "loss": 0.3239, + "step": 26650 + }, + { + "epoch": 370.28, + "learning_rate": 1.0688e-05, + "loss": 0.3109, + "step": 26660 + }, + { + "epoch": 370.42, + "learning_rate": 1.067657142857143e-05, + "loss": 0.3017, + "step": 26670 + }, + { + "epoch": 370.55, + "learning_rate": 1.0665142857142859e-05, + "loss": 0.3058, + "step": 26680 + }, + { + "epoch": 370.69, + "learning_rate": 1.0653714285714287e-05, + "loss": 0.3129, + "step": 26690 + }, + { + "epoch": 370.83, + "learning_rate": 1.0642285714285715e-05, + "loss": 0.3124, + "step": 26700 + }, + { + "epoch": 370.97, + "learning_rate": 1.0630857142857142e-05, + "loss": 0.3282, + "step": 26710 + }, + { + "epoch": 371.0, + "eval_loss": 0.5664863586425781, + "eval_runtime": 127.595, + "eval_samples_per_second": 4.169, + "eval_steps_per_second": 0.525, + "eval_wer": 0.2198367294465514, + "step": 26712 + }, + { + "epoch": 371.11, + "learning_rate": 1.0619428571428572e-05, + "loss": 0.2997, + "step": 26720 + }, + { + "epoch": 371.25, + "learning_rate": 1.0608e-05, + "loss": 0.3231, + "step": 26730 + }, + { + "epoch": 371.39, + "learning_rate": 1.059657142857143e-05, + "loss": 0.305, + "step": 26740 + }, + { + "epoch": 371.53, + "learning_rate": 1.0585142857142858e-05, + "loss": 0.3049, + "step": 26750 + }, + { + "epoch": 371.66, + "learning_rate": 1.0573714285714288e-05, + "loss": 0.3148, + "step": 26760 + }, + { + "epoch": 371.8, + "learning_rate": 1.0562285714285716e-05, + "loss": 0.3171, + "step": 26770 + }, + { + "epoch": 371.94, + "learning_rate": 1.0550857142857143e-05, + "loss": 0.3073, + "step": 26780 + }, + { + "epoch": 372.0, + "eval_loss": 0.5752547383308411, + "eval_runtime": 127.7559, + "eval_samples_per_second": 4.164, + "eval_steps_per_second": 0.524, + "eval_wer": 0.21797261682843735, + "step": 26784 + }, + { + "epoch": 372.08, + "learning_rate": 1.0539428571428571e-05, + "loss": 0.3085, + "step": 26790 + }, + { + "epoch": 372.22, + "learning_rate": 1.0528e-05, + "loss": 0.3147, + "step": 26800 + }, + { + "epoch": 372.36, + "learning_rate": 1.051657142857143e-05, + "loss": 0.2957, + "step": 26810 + }, + { + "epoch": 372.5, + "learning_rate": 1.0505142857142858e-05, + "loss": 0.3089, + "step": 26820 + }, + { + "epoch": 372.64, + "learning_rate": 1.0493714285714287e-05, + "loss": 0.3013, + "step": 26830 + }, + { + "epoch": 372.78, + "learning_rate": 1.0482285714285715e-05, + "loss": 0.3019, + "step": 26840 + }, + { + "epoch": 372.91, + "learning_rate": 1.0470857142857142e-05, + "loss": 0.3032, + "step": 26850 + }, + { + "epoch": 373.0, + "eval_loss": 0.5805571675300598, + "eval_runtime": 127.696, + "eval_samples_per_second": 4.166, + "eval_steps_per_second": 0.525, + "eval_wer": 0.21238027897409525, + "step": 26856 + }, + { + "epoch": 373.06, + "learning_rate": 1.0459428571428572e-05, + "loss": 0.3093, + "step": 26860 + }, + { + "epoch": 373.19, + "learning_rate": 1.0448e-05, + "loss": 0.301, + "step": 26870 + }, + { + "epoch": 373.33, + "learning_rate": 1.0436571428571429e-05, + "loss": 0.3029, + "step": 26880 + }, + { + "epoch": 373.47, + "learning_rate": 1.0425142857142857e-05, + "loss": 0.3054, + "step": 26890 + }, + { + "epoch": 373.61, + "learning_rate": 1.0413714285714288e-05, + "loss": 0.2979, + "step": 26900 + }, + { + "epoch": 373.75, + "learning_rate": 1.0402285714285716e-05, + "loss": 0.304, + "step": 26910 + }, + { + "epoch": 373.89, + "learning_rate": 1.0390857142857144e-05, + "loss": 0.3115, + "step": 26920 + }, + { + "epoch": 374.0, + "eval_loss": 0.5527946352958679, + "eval_runtime": 127.7117, + "eval_samples_per_second": 4.166, + "eval_steps_per_second": 0.525, + "eval_wer": 0.2141801118467571, + "step": 26928 + }, + { + "epoch": 374.03, + "learning_rate": 1.0379428571428571e-05, + "loss": 0.309, + "step": 26930 + }, + { + "epoch": 374.17, + "learning_rate": 1.0368e-05, + "loss": 0.3109, + "step": 26940 + }, + { + "epoch": 374.3, + "learning_rate": 1.035657142857143e-05, + "loss": 0.3045, + "step": 26950 + }, + { + "epoch": 374.44, + "learning_rate": 1.0345142857142858e-05, + "loss": 0.296, + "step": 26960 + }, + { + "epoch": 374.58, + "learning_rate": 1.0333714285714287e-05, + "loss": 0.3002, + "step": 26970 + }, + { + "epoch": 374.72, + "learning_rate": 1.0322285714285715e-05, + "loss": 0.3086, + "step": 26980 + }, + { + "epoch": 374.86, + "learning_rate": 1.0310857142857145e-05, + "loss": 0.3019, + "step": 26990 + }, + { + "epoch": 375.0, + "learning_rate": 1.0299428571428572e-05, + "loss": 0.3176, + "step": 27000 + }, + { + "epoch": 375.0, + "eval_loss": 0.5563069581985474, + "eval_runtime": 127.1087, + "eval_samples_per_second": 4.185, + "eval_steps_per_second": 0.527, + "eval_wer": 0.21443723082856592, + "step": 27000 + }, + { + "epoch": 375.14, + "learning_rate": 1.0288e-05, + "loss": 0.3046, + "step": 27010 + }, + { + "epoch": 375.28, + "learning_rate": 1.0276571428571429e-05, + "loss": 0.298, + "step": 27020 + }, + { + "epoch": 375.42, + "learning_rate": 1.0265142857142857e-05, + "loss": 0.3131, + "step": 27030 + }, + { + "epoch": 375.55, + "learning_rate": 1.0253714285714287e-05, + "loss": 0.3012, + "step": 27040 + }, + { + "epoch": 375.69, + "learning_rate": 1.0242285714285716e-05, + "loss": 0.3021, + "step": 27050 + }, + { + "epoch": 375.83, + "learning_rate": 1.0230857142857144e-05, + "loss": 0.2958, + "step": 27060 + }, + { + "epoch": 375.97, + "learning_rate": 1.0219428571428571e-05, + "loss": 0.299, + "step": 27070 + }, + { + "epoch": 376.0, + "eval_loss": 0.5808618068695068, + "eval_runtime": 127.2602, + "eval_samples_per_second": 4.18, + "eval_steps_per_second": 0.526, + "eval_wer": 0.2150157485376358, + "step": 27072 + }, + { + "epoch": 376.11, + "learning_rate": 1.0208e-05, + "loss": 0.3075, + "step": 27080 + }, + { + "epoch": 376.25, + "learning_rate": 1.019657142857143e-05, + "loss": 0.3029, + "step": 27090 + }, + { + "epoch": 376.39, + "learning_rate": 1.0185142857142858e-05, + "loss": 0.2944, + "step": 27100 + }, + { + "epoch": 376.53, + "learning_rate": 1.0173714285714287e-05, + "loss": 0.2871, + "step": 27110 + }, + { + "epoch": 376.66, + "learning_rate": 1.0162285714285715e-05, + "loss": 0.2995, + "step": 27120 + }, + { + "epoch": 376.8, + "learning_rate": 1.0150857142857145e-05, + "loss": 0.301, + "step": 27130 + }, + { + "epoch": 376.94, + "learning_rate": 1.0139428571428572e-05, + "loss": 0.3116, + "step": 27140 + }, + { + "epoch": 377.0, + "eval_loss": 0.5838585495948792, + "eval_runtime": 127.4329, + "eval_samples_per_second": 4.175, + "eval_steps_per_second": 0.526, + "eval_wer": 0.21540142701034903, + "step": 27144 + }, + { + "epoch": 377.08, + "learning_rate": 1.0128e-05, + "loss": 0.3094, + "step": 27150 + }, + { + "epoch": 377.22, + "learning_rate": 1.0116571428571429e-05, + "loss": 0.3051, + "step": 27160 + }, + { + "epoch": 377.36, + "learning_rate": 1.0105142857142857e-05, + "loss": 0.2927, + "step": 27170 + }, + { + "epoch": 377.5, + "learning_rate": 1.0093714285714287e-05, + "loss": 0.299, + "step": 27180 + }, + { + "epoch": 377.64, + "learning_rate": 1.0082285714285716e-05, + "loss": 0.2988, + "step": 27190 + }, + { + "epoch": 377.78, + "learning_rate": 1.0070857142857144e-05, + "loss": 0.3071, + "step": 27200 + }, + { + "epoch": 377.91, + "learning_rate": 1.0059428571428573e-05, + "loss": 0.3033, + "step": 27210 + }, + { + "epoch": 378.0, + "eval_loss": 0.5670997500419617, + "eval_runtime": 126.8069, + "eval_samples_per_second": 4.195, + "eval_steps_per_second": 0.528, + "eval_wer": 0.2157871054830623, + "step": 27216 + }, + { + "epoch": 378.06, + "learning_rate": 1.0048e-05, + "loss": 0.312, + "step": 27220 + }, + { + "epoch": 378.19, + "learning_rate": 1.003657142857143e-05, + "loss": 0.3041, + "step": 27230 + }, + { + "epoch": 378.33, + "learning_rate": 1.0025142857142858e-05, + "loss": 0.2955, + "step": 27240 + }, + { + "epoch": 378.47, + "learning_rate": 1.0013714285714286e-05, + "loss": 0.309, + "step": 27250 + }, + { + "epoch": 378.61, + "learning_rate": 1.0002285714285715e-05, + "loss": 0.2993, + "step": 27260 + }, + { + "epoch": 378.75, + "learning_rate": 9.990857142857143e-06, + "loss": 0.2972, + "step": 27270 + }, + { + "epoch": 378.89, + "learning_rate": 9.979428571428572e-06, + "loss": 0.2973, + "step": 27280 + }, + { + "epoch": 379.0, + "eval_loss": 0.5771830677986145, + "eval_runtime": 129.2111, + "eval_samples_per_second": 4.117, + "eval_steps_per_second": 0.519, + "eval_wer": 0.21816545606479398, + "step": 27288 + }, + { + "epoch": 379.03, + "learning_rate": 9.968000000000002e-06, + "loss": 0.3161, + "step": 27290 + }, + { + "epoch": 379.17, + "learning_rate": 9.95657142857143e-06, + "loss": 0.302, + "step": 27300 + }, + { + "epoch": 379.3, + "learning_rate": 9.945142857142857e-06, + "loss": 0.2982, + "step": 27310 + }, + { + "epoch": 379.44, + "learning_rate": 9.933714285714287e-06, + "loss": 0.3061, + "step": 27320 + }, + { + "epoch": 379.58, + "learning_rate": 9.922285714285716e-06, + "loss": 0.2974, + "step": 27330 + }, + { + "epoch": 379.72, + "learning_rate": 9.910857142857144e-06, + "loss": 0.3046, + "step": 27340 + }, + { + "epoch": 379.86, + "learning_rate": 9.899428571428572e-06, + "loss": 0.3036, + "step": 27350 + }, + { + "epoch": 380.0, + "learning_rate": 9.888000000000001e-06, + "loss": 0.2995, + "step": 27360 + }, + { + "epoch": 380.0, + "eval_loss": 0.556514322757721, + "eval_runtime": 127.9999, + "eval_samples_per_second": 4.156, + "eval_steps_per_second": 0.523, + "eval_wer": 0.21732981937391527, + "step": 27360 + }, + { + "epoch": 380.14, + "learning_rate": 9.87657142857143e-06, + "loss": 0.2934, + "step": 27370 + }, + { + "epoch": 380.28, + "learning_rate": 9.865142857142858e-06, + "loss": 0.3023, + "step": 27380 + }, + { + "epoch": 380.42, + "learning_rate": 9.853714285714286e-06, + "loss": 0.3107, + "step": 27390 + }, + { + "epoch": 380.55, + "learning_rate": 9.842285714285715e-06, + "loss": 0.2996, + "step": 27400 + }, + { + "epoch": 380.69, + "learning_rate": 9.830857142857145e-06, + "loss": 0.2994, + "step": 27410 + }, + { + "epoch": 380.83, + "learning_rate": 9.819428571428572e-06, + "loss": 0.2977, + "step": 27420 + }, + { + "epoch": 380.97, + "learning_rate": 9.808000000000002e-06, + "loss": 0.31, + "step": 27430 + }, + { + "epoch": 381.0, + "eval_loss": 0.5602931976318359, + "eval_runtime": 127.2803, + "eval_samples_per_second": 4.18, + "eval_steps_per_second": 0.526, + "eval_wer": 0.2174583788648197, + "step": 27432 + }, + { + "epoch": 381.11, + "learning_rate": 9.79657142857143e-06, + "loss": 0.2976, + "step": 27440 + }, + { + "epoch": 381.25, + "learning_rate": 9.785142857142857e-06, + "loss": 0.312, + "step": 27450 + }, + { + "epoch": 381.39, + "learning_rate": 9.773714285714287e-06, + "loss": 0.3043, + "step": 27460 + }, + { + "epoch": 381.53, + "learning_rate": 9.762285714285715e-06, + "loss": 0.2948, + "step": 27470 + }, + { + "epoch": 381.66, + "learning_rate": 9.750857142857144e-06, + "loss": 0.305, + "step": 27480 + }, + { + "epoch": 381.8, + "learning_rate": 9.739428571428572e-06, + "loss": 0.2911, + "step": 27490 + }, + { + "epoch": 381.94, + "learning_rate": 9.728e-06, + "loss": 0.3032, + "step": 27500 + }, + { + "epoch": 382.0, + "eval_loss": 0.564012885093689, + "eval_runtime": 127.2664, + "eval_samples_per_second": 4.18, + "eval_steps_per_second": 0.526, + "eval_wer": 0.21559426624670566, + "step": 27504 + }, + { + "epoch": 382.08, + "learning_rate": 9.716571428571429e-06, + "loss": 0.3042, + "step": 27510 + }, + { + "epoch": 382.22, + "learning_rate": 9.705142857142858e-06, + "loss": 0.2982, + "step": 27520 + }, + { + "epoch": 382.36, + "learning_rate": 9.693714285714286e-06, + "loss": 0.2954, + "step": 27530 + }, + { + "epoch": 382.5, + "learning_rate": 9.682285714285714e-06, + "loss": 0.2983, + "step": 27540 + }, + { + "epoch": 382.64, + "learning_rate": 9.670857142857145e-06, + "loss": 0.3075, + "step": 27550 + }, + { + "epoch": 382.78, + "learning_rate": 9.659428571428571e-06, + "loss": 0.3007, + "step": 27560 + }, + { + "epoch": 382.91, + "learning_rate": 9.648000000000001e-06, + "loss": 0.3072, + "step": 27570 + }, + { + "epoch": 383.0, + "eval_loss": 0.5639933943748474, + "eval_runtime": 127.2296, + "eval_samples_per_second": 4.181, + "eval_steps_per_second": 0.527, + "eval_wer": 0.2158513852285145, + "step": 27576 + }, + { + "epoch": 383.06, + "learning_rate": 9.63657142857143e-06, + "loss": 0.3122, + "step": 27580 + }, + { + "epoch": 383.19, + "learning_rate": 9.625142857142858e-06, + "loss": 0.3043, + "step": 27590 + }, + { + "epoch": 383.33, + "learning_rate": 9.613714285714287e-06, + "loss": 0.3036, + "step": 27600 + }, + { + "epoch": 383.47, + "learning_rate": 9.602285714285715e-06, + "loss": 0.3053, + "step": 27610 + }, + { + "epoch": 383.61, + "learning_rate": 9.590857142857144e-06, + "loss": 0.296, + "step": 27620 + }, + { + "epoch": 383.75, + "learning_rate": 9.579428571428572e-06, + "loss": 0.3031, + "step": 27630 + }, + { + "epoch": 383.89, + "learning_rate": 9.568e-06, + "loss": 0.2927, + "step": 27640 + }, + { + "epoch": 384.0, + "eval_loss": 0.5589981079101562, + "eval_runtime": 127.3544, + "eval_samples_per_second": 4.177, + "eval_steps_per_second": 0.526, + "eval_wer": 0.2150157485376358, + "step": 27648 + }, + { + "epoch": 384.03, + "learning_rate": 9.556571428571429e-06, + "loss": 0.3078, + "step": 27650 + }, + { + "epoch": 384.17, + "learning_rate": 9.545142857142859e-06, + "loss": 0.3122, + "step": 27660 + }, + { + "epoch": 384.3, + "learning_rate": 9.533714285714286e-06, + "loss": 0.2892, + "step": 27670 + }, + { + "epoch": 384.44, + "learning_rate": 9.522285714285714e-06, + "loss": 0.2977, + "step": 27680 + }, + { + "epoch": 384.58, + "learning_rate": 9.510857142857144e-06, + "loss": 0.288, + "step": 27690 + }, + { + "epoch": 384.72, + "learning_rate": 9.499428571428571e-06, + "loss": 0.301, + "step": 27700 + }, + { + "epoch": 384.86, + "learning_rate": 9.488000000000001e-06, + "loss": 0.3021, + "step": 27710 + }, + { + "epoch": 385.0, + "learning_rate": 9.47657142857143e-06, + "loss": 0.2952, + "step": 27720 + }, + { + "epoch": 385.0, + "eval_loss": 0.5467908978462219, + "eval_runtime": 127.421, + "eval_samples_per_second": 4.175, + "eval_steps_per_second": 0.526, + "eval_wer": 0.21238027897409525, + "step": 27720 + }, + { + "epoch": 385.14, + "learning_rate": 9.465142857142858e-06, + "loss": 0.3072, + "step": 27730 + }, + { + "epoch": 385.28, + "learning_rate": 9.453714285714287e-06, + "loss": 0.2963, + "step": 27740 + }, + { + "epoch": 385.42, + "learning_rate": 9.442285714285715e-06, + "loss": 0.303, + "step": 27750 + }, + { + "epoch": 385.55, + "learning_rate": 9.430857142857144e-06, + "loss": 0.2958, + "step": 27760 + }, + { + "epoch": 385.69, + "learning_rate": 9.419428571428572e-06, + "loss": 0.292, + "step": 27770 + }, + { + "epoch": 385.83, + "learning_rate": 9.408e-06, + "loss": 0.2982, + "step": 27780 + }, + { + "epoch": 385.97, + "learning_rate": 9.396571428571429e-06, + "loss": 0.2989, + "step": 27790 + }, + { + "epoch": 386.0, + "eval_loss": 0.5719983577728271, + "eval_runtime": 127.6754, + "eval_samples_per_second": 4.167, + "eval_steps_per_second": 0.525, + "eval_wer": 0.21392299286494826, + "step": 27792 + }, + { + "epoch": 386.11, + "learning_rate": 9.385142857142859e-06, + "loss": 0.3006, + "step": 27800 + }, + { + "epoch": 386.25, + "learning_rate": 9.373714285714286e-06, + "loss": 0.2907, + "step": 27810 + }, + { + "epoch": 386.39, + "learning_rate": 9.362285714285714e-06, + "loss": 0.2897, + "step": 27820 + }, + { + "epoch": 386.53, + "learning_rate": 9.350857142857144e-06, + "loss": 0.2985, + "step": 27830 + }, + { + "epoch": 386.66, + "learning_rate": 9.339428571428573e-06, + "loss": 0.3031, + "step": 27840 + }, + { + "epoch": 386.8, + "learning_rate": 9.328000000000001e-06, + "loss": 0.2963, + "step": 27850 + }, + { + "epoch": 386.94, + "learning_rate": 9.31657142857143e-06, + "loss": 0.3011, + "step": 27860 + }, + { + "epoch": 387.0, + "eval_loss": 0.566278338432312, + "eval_runtime": 127.666, + "eval_samples_per_second": 4.167, + "eval_steps_per_second": 0.525, + "eval_wer": 0.21225171948319085, + "step": 27864 + }, + { + "epoch": 387.08, + "learning_rate": 9.305142857142858e-06, + "loss": 0.3074, + "step": 27870 + }, + { + "epoch": 387.22, + "learning_rate": 9.293714285714286e-06, + "loss": 0.3026, + "step": 27880 + }, + { + "epoch": 387.36, + "learning_rate": 9.282285714285715e-06, + "loss": 0.2886, + "step": 27890 + }, + { + "epoch": 387.5, + "learning_rate": 9.270857142857143e-06, + "loss": 0.3046, + "step": 27900 + }, + { + "epoch": 387.64, + "learning_rate": 9.259428571428572e-06, + "loss": 0.2967, + "step": 27910 + }, + { + "epoch": 387.78, + "learning_rate": 9.248e-06, + "loss": 0.297, + "step": 27920 + }, + { + "epoch": 387.91, + "learning_rate": 9.236571428571429e-06, + "loss": 0.303, + "step": 27930 + }, + { + "epoch": 388.0, + "eval_loss": 0.5730054378509521, + "eval_runtime": 127.1382, + "eval_samples_per_second": 4.184, + "eval_steps_per_second": 0.527, + "eval_wer": 0.21437295108311372, + "step": 27936 + }, + { + "epoch": 388.06, + "learning_rate": 9.225142857142859e-06, + "loss": 0.3036, + "step": 27940 + }, + { + "epoch": 388.19, + "learning_rate": 9.213714285714287e-06, + "loss": 0.2958, + "step": 27950 + }, + { + "epoch": 388.33, + "learning_rate": 9.202285714285714e-06, + "loss": 0.3009, + "step": 27960 + }, + { + "epoch": 388.47, + "learning_rate": 9.190857142857144e-06, + "loss": 0.3122, + "step": 27970 + }, + { + "epoch": 388.61, + "learning_rate": 9.179428571428573e-06, + "loss": 0.2893, + "step": 27980 + }, + { + "epoch": 388.75, + "learning_rate": 9.168000000000001e-06, + "loss": 0.292, + "step": 27990 + }, + { + "epoch": 388.89, + "learning_rate": 9.15657142857143e-06, + "loss": 0.2961, + "step": 28000 + }, + { + "epoch": 389.0, + "eval_loss": 0.5954252481460571, + "eval_runtime": 127.419, + "eval_samples_per_second": 4.175, + "eval_steps_per_second": 0.526, + "eval_wer": 0.2119303207559298, + "step": 28008 + }, + { + "epoch": 389.03, + "learning_rate": 9.145142857142858e-06, + "loss": 0.3136, + "step": 28010 + }, + { + "epoch": 389.17, + "learning_rate": 9.133714285714286e-06, + "loss": 0.3014, + "step": 28020 + }, + { + "epoch": 389.3, + "learning_rate": 9.122285714285715e-06, + "loss": 0.295, + "step": 28030 + }, + { + "epoch": 389.44, + "learning_rate": 9.110857142857143e-06, + "loss": 0.3022, + "step": 28040 + }, + { + "epoch": 389.58, + "learning_rate": 9.099428571428572e-06, + "loss": 0.2818, + "step": 28050 + }, + { + "epoch": 389.72, + "learning_rate": 9.088000000000002e-06, + "loss": 0.3084, + "step": 28060 + }, + { + "epoch": 389.86, + "learning_rate": 9.076571428571429e-06, + "loss": 0.3002, + "step": 28070 + }, + { + "epoch": 390.0, + "learning_rate": 9.065142857142859e-06, + "loss": 0.2913, + "step": 28080 + }, + { + "epoch": 390.0, + "eval_loss": 0.582231342792511, + "eval_runtime": 127.688, + "eval_samples_per_second": 4.166, + "eval_steps_per_second": 0.525, + "eval_wer": 0.21045188661052902, + "step": 28080 + }, + { + "epoch": 390.14, + "learning_rate": 9.053714285714287e-06, + "loss": 0.2997, + "step": 28090 + }, + { + "epoch": 390.28, + "learning_rate": 9.042285714285714e-06, + "loss": 0.3097, + "step": 28100 + }, + { + "epoch": 390.42, + "learning_rate": 9.030857142857144e-06, + "loss": 0.298, + "step": 28110 + }, + { + "epoch": 390.55, + "learning_rate": 9.019428571428572e-06, + "loss": 0.2966, + "step": 28120 + }, + { + "epoch": 390.69, + "learning_rate": 9.008e-06, + "loss": 0.2918, + "step": 28130 + }, + { + "epoch": 390.83, + "learning_rate": 8.99657142857143e-06, + "loss": 0.2912, + "step": 28140 + }, + { + "epoch": 390.97, + "learning_rate": 8.985142857142858e-06, + "loss": 0.3051, + "step": 28150 + }, + { + "epoch": 391.0, + "eval_loss": 0.5716819763183594, + "eval_runtime": 126.9654, + "eval_samples_per_second": 4.19, + "eval_steps_per_second": 0.528, + "eval_wer": 0.2096162499196503, + "step": 28152 + }, + { + "epoch": 391.11, + "learning_rate": 8.973714285714286e-06, + "loss": 0.2957, + "step": 28160 + }, + { + "epoch": 391.25, + "learning_rate": 8.962285714285715e-06, + "loss": 0.3064, + "step": 28170 + }, + { + "epoch": 391.39, + "learning_rate": 8.950857142857143e-06, + "loss": 0.2947, + "step": 28180 + }, + { + "epoch": 391.53, + "learning_rate": 8.939428571428571e-06, + "loss": 0.297, + "step": 28190 + }, + { + "epoch": 391.66, + "learning_rate": 8.928000000000002e-06, + "loss": 0.2996, + "step": 28200 + }, + { + "epoch": 391.8, + "learning_rate": 8.916571428571428e-06, + "loss": 0.285, + "step": 28210 + }, + { + "epoch": 391.94, + "learning_rate": 8.905142857142858e-06, + "loss": 0.2977, + "step": 28220 + }, + { + "epoch": 392.0, + "eval_loss": 0.5687692761421204, + "eval_runtime": 127.6383, + "eval_samples_per_second": 4.168, + "eval_steps_per_second": 0.525, + "eval_wer": 0.21263739795590408, + "step": 28224 + }, + { + "epoch": 392.08, + "learning_rate": 8.893714285714287e-06, + "loss": 0.2909, + "step": 28230 + }, + { + "epoch": 392.22, + "learning_rate": 8.882285714285715e-06, + "loss": 0.2987, + "step": 28240 + }, + { + "epoch": 392.36, + "learning_rate": 8.870857142857144e-06, + "loss": 0.2926, + "step": 28250 + }, + { + "epoch": 392.5, + "learning_rate": 8.859428571428572e-06, + "loss": 0.294, + "step": 28260 + }, + { + "epoch": 392.64, + "learning_rate": 8.848e-06, + "loss": 0.2923, + "step": 28270 + }, + { + "epoch": 392.78, + "learning_rate": 8.836571428571429e-06, + "loss": 0.2898, + "step": 28280 + }, + { + "epoch": 392.91, + "learning_rate": 8.825142857142858e-06, + "loss": 0.2927, + "step": 28290 + }, + { + "epoch": 393.0, + "eval_loss": 0.5599448680877686, + "eval_runtime": 127.291, + "eval_samples_per_second": 4.179, + "eval_steps_per_second": 0.526, + "eval_wer": 0.21090184482869448, + "step": 28296 + }, + { + "epoch": 393.06, + "learning_rate": 8.813714285714286e-06, + "loss": 0.2989, + "step": 28300 + }, + { + "epoch": 393.19, + "learning_rate": 8.802285714285716e-06, + "loss": 0.3125, + "step": 28310 + }, + { + "epoch": 393.33, + "learning_rate": 8.790857142857143e-06, + "loss": 0.2907, + "step": 28320 + }, + { + "epoch": 393.47, + "learning_rate": 8.779428571428571e-06, + "loss": 0.2978, + "step": 28330 + }, + { + "epoch": 393.61, + "learning_rate": 8.768000000000001e-06, + "loss": 0.2925, + "step": 28340 + }, + { + "epoch": 393.75, + "learning_rate": 8.75657142857143e-06, + "loss": 0.2909, + "step": 28350 + }, + { + "epoch": 393.89, + "learning_rate": 8.745142857142858e-06, + "loss": 0.2913, + "step": 28360 + }, + { + "epoch": 394.0, + "eval_loss": 0.5809375047683716, + "eval_runtime": 127.3235, + "eval_samples_per_second": 4.178, + "eval_steps_per_second": 0.526, + "eval_wer": 0.21244455871954748, + "step": 28368 + }, + { + "epoch": 394.03, + "learning_rate": 8.733714285714287e-06, + "loss": 0.3167, + "step": 28370 + }, + { + "epoch": 394.17, + "learning_rate": 8.722285714285715e-06, + "loss": 0.3044, + "step": 28380 + }, + { + "epoch": 394.3, + "learning_rate": 8.710857142857144e-06, + "loss": 0.2927, + "step": 28390 + }, + { + "epoch": 394.44, + "learning_rate": 8.699428571428572e-06, + "loss": 0.2808, + "step": 28400 + }, + { + "epoch": 394.58, + "learning_rate": 8.688e-06, + "loss": 0.2957, + "step": 28410 + }, + { + "epoch": 394.72, + "learning_rate": 8.676571428571429e-06, + "loss": 0.3006, + "step": 28420 + }, + { + "epoch": 394.86, + "learning_rate": 8.665142857142857e-06, + "loss": 0.2908, + "step": 28430 + }, + { + "epoch": 395.0, + "learning_rate": 8.653714285714286e-06, + "loss": 0.2988, + "step": 28440 + }, + { + "epoch": 395.0, + "eval_loss": 0.5650379061698914, + "eval_runtime": 127.6228, + "eval_samples_per_second": 4.169, + "eval_steps_per_second": 0.525, + "eval_wer": 0.20974480941055473, + "step": 28440 + }, + { + "epoch": 395.14, + "learning_rate": 8.642285714285716e-06, + "loss": 0.3058, + "step": 28450 + }, + { + "epoch": 395.28, + "learning_rate": 8.630857142857143e-06, + "loss": 0.2991, + "step": 28460 + }, + { + "epoch": 395.42, + "learning_rate": 8.619428571428571e-06, + "loss": 0.2985, + "step": 28470 + }, + { + "epoch": 395.55, + "learning_rate": 8.608000000000001e-06, + "loss": 0.2944, + "step": 28480 + }, + { + "epoch": 395.69, + "learning_rate": 8.59657142857143e-06, + "loss": 0.295, + "step": 28490 + }, + { + "epoch": 395.83, + "learning_rate": 8.585142857142858e-06, + "loss": 0.2831, + "step": 28500 + }, + { + "epoch": 395.97, + "learning_rate": 8.573714285714287e-06, + "loss": 0.2895, + "step": 28510 + }, + { + "epoch": 396.0, + "eval_loss": 0.5691484808921814, + "eval_runtime": 127.4349, + "eval_samples_per_second": 4.175, + "eval_steps_per_second": 0.526, + "eval_wer": 0.2117374815195732, + "step": 28512 + }, + { + "epoch": 396.11, + "learning_rate": 8.562285714285715e-06, + "loss": 0.2976, + "step": 28520 + }, + { + "epoch": 396.25, + "learning_rate": 8.550857142857143e-06, + "loss": 0.2958, + "step": 28530 + }, + { + "epoch": 396.39, + "learning_rate": 8.539428571428572e-06, + "loss": 0.2907, + "step": 28540 + }, + { + "epoch": 396.53, + "learning_rate": 8.528e-06, + "loss": 0.2852, + "step": 28550 + }, + { + "epoch": 396.66, + "learning_rate": 8.516571428571429e-06, + "loss": 0.3017, + "step": 28560 + }, + { + "epoch": 396.8, + "learning_rate": 8.505142857142857e-06, + "loss": 0.2922, + "step": 28570 + }, + { + "epoch": 396.94, + "learning_rate": 8.493714285714286e-06, + "loss": 0.2887, + "step": 28580 + }, + { + "epoch": 397.0, + "eval_loss": 0.565529465675354, + "eval_runtime": 127.6106, + "eval_samples_per_second": 4.169, + "eval_steps_per_second": 0.525, + "eval_wer": 0.2118017612650254, + "step": 28584 + }, + { + "epoch": 397.08, + "learning_rate": 8.482285714285716e-06, + "loss": 0.3018, + "step": 28590 + }, + { + "epoch": 397.22, + "learning_rate": 8.470857142857144e-06, + "loss": 0.2992, + "step": 28600 + }, + { + "epoch": 397.36, + "learning_rate": 8.459428571428571e-06, + "loss": 0.2831, + "step": 28610 + }, + { + "epoch": 397.5, + "learning_rate": 8.448000000000001e-06, + "loss": 0.2996, + "step": 28620 + }, + { + "epoch": 397.64, + "learning_rate": 8.43657142857143e-06, + "loss": 0.2818, + "step": 28630 + }, + { + "epoch": 397.78, + "learning_rate": 8.425142857142858e-06, + "loss": 0.2996, + "step": 28640 + }, + { + "epoch": 397.91, + "learning_rate": 8.413714285714286e-06, + "loss": 0.2987, + "step": 28650 + }, + { + "epoch": 398.0, + "eval_loss": 0.5748226046562195, + "eval_runtime": 127.0685, + "eval_samples_per_second": 4.187, + "eval_steps_per_second": 0.527, + "eval_wer": 0.21328019541042617, + "step": 28656 + }, + { + "epoch": 398.06, + "learning_rate": 8.402285714285715e-06, + "loss": 0.2979, + "step": 28660 + }, + { + "epoch": 398.19, + "learning_rate": 8.390857142857143e-06, + "loss": 0.2949, + "step": 28670 + }, + { + "epoch": 398.33, + "learning_rate": 8.379428571428572e-06, + "loss": 0.2903, + "step": 28680 + }, + { + "epoch": 398.47, + "learning_rate": 8.368e-06, + "loss": 0.2969, + "step": 28690 + }, + { + "epoch": 398.61, + "learning_rate": 8.356571428571429e-06, + "loss": 0.2931, + "step": 28700 + }, + { + "epoch": 398.75, + "learning_rate": 8.345142857142859e-06, + "loss": 0.2973, + "step": 28710 + }, + { + "epoch": 398.89, + "learning_rate": 8.333714285714285e-06, + "loss": 0.2945, + "step": 28720 + }, + { + "epoch": 399.0, + "eval_loss": 0.5620297193527222, + "eval_runtime": 127.5242, + "eval_samples_per_second": 4.172, + "eval_steps_per_second": 0.525, + "eval_wer": 0.21527286751944463, + "step": 28728 + }, + { + "epoch": 399.03, + "learning_rate": 8.322285714285716e-06, + "loss": 0.3023, + "step": 28730 + }, + { + "epoch": 399.17, + "learning_rate": 8.310857142857144e-06, + "loss": 0.2967, + "step": 28740 + }, + { + "epoch": 399.3, + "learning_rate": 8.29942857142857e-06, + "loss": 0.2885, + "step": 28750 + }, + { + "epoch": 399.44, + "learning_rate": 8.288000000000001e-06, + "loss": 0.294, + "step": 28760 + }, + { + "epoch": 399.58, + "learning_rate": 8.27657142857143e-06, + "loss": 0.2845, + "step": 28770 + }, + { + "epoch": 399.72, + "learning_rate": 8.265142857142858e-06, + "loss": 0.2984, + "step": 28780 + }, + { + "epoch": 399.86, + "learning_rate": 8.253714285714286e-06, + "loss": 0.2946, + "step": 28790 + }, + { + "epoch": 400.0, + "learning_rate": 8.242285714285715e-06, + "loss": 0.2869, + "step": 28800 + }, + { + "epoch": 400.0, + "eval_loss": 0.5762408375740051, + "eval_runtime": 127.1188, + "eval_samples_per_second": 4.185, + "eval_steps_per_second": 0.527, + "eval_wer": 0.21315163591952177, + "step": 28800 + }, + { + "epoch": 400.14, + "learning_rate": 8.230857142857143e-06, + "loss": 0.2976, + "step": 28810 + }, + { + "epoch": 400.28, + "learning_rate": 8.219428571428573e-06, + "loss": 0.2864, + "step": 28820 + }, + { + "epoch": 400.42, + "learning_rate": 8.208e-06, + "loss": 0.285, + "step": 28830 + }, + { + "epoch": 400.55, + "learning_rate": 8.196571428571428e-06, + "loss": 0.2996, + "step": 28840 + }, + { + "epoch": 400.69, + "learning_rate": 8.185142857142859e-06, + "loss": 0.2968, + "step": 28850 + }, + { + "epoch": 400.83, + "learning_rate": 8.173714285714285e-06, + "loss": 0.286, + "step": 28860 + }, + { + "epoch": 400.97, + "learning_rate": 8.162285714285715e-06, + "loss": 0.3009, + "step": 28870 + }, + { + "epoch": 401.0, + "eval_loss": 0.5554483532905579, + "eval_runtime": 127.1755, + "eval_samples_per_second": 4.183, + "eval_steps_per_second": 0.527, + "eval_wer": 0.20743073857427524, + "step": 28872 + }, + { + "epoch": 401.11, + "learning_rate": 8.150857142857144e-06, + "loss": 0.2928, + "step": 28880 + }, + { + "epoch": 401.25, + "learning_rate": 8.139428571428572e-06, + "loss": 0.2892, + "step": 28890 + }, + { + "epoch": 401.39, + "learning_rate": 8.128e-06, + "loss": 0.2943, + "step": 28900 + }, + { + "epoch": 401.53, + "learning_rate": 8.11657142857143e-06, + "loss": 0.2995, + "step": 28910 + }, + { + "epoch": 401.66, + "learning_rate": 8.105142857142858e-06, + "loss": 0.2982, + "step": 28920 + }, + { + "epoch": 401.8, + "learning_rate": 8.093714285714286e-06, + "loss": 0.2953, + "step": 28930 + }, + { + "epoch": 401.94, + "learning_rate": 8.082285714285715e-06, + "loss": 0.2973, + "step": 28940 + }, + { + "epoch": 402.0, + "eval_loss": 0.5747002959251404, + "eval_runtime": 127.5137, + "eval_samples_per_second": 4.172, + "eval_steps_per_second": 0.525, + "eval_wer": 0.20968052966510253, + "step": 28944 + }, + { + "epoch": 402.08, + "learning_rate": 8.070857142857143e-06, + "loss": 0.2904, + "step": 28950 + }, + { + "epoch": 402.22, + "learning_rate": 8.059428571428573e-06, + "loss": 0.2941, + "step": 28960 + }, + { + "epoch": 402.36, + "learning_rate": 8.048e-06, + "loss": 0.2836, + "step": 28970 + }, + { + "epoch": 402.5, + "learning_rate": 8.036571428571428e-06, + "loss": 0.2992, + "step": 28980 + }, + { + "epoch": 402.64, + "learning_rate": 8.025142857142858e-06, + "loss": 0.2825, + "step": 28990 + }, + { + "epoch": 402.78, + "learning_rate": 8.013714285714287e-06, + "loss": 0.2867, + "step": 29000 + }, + { + "epoch": 402.91, + "learning_rate": 8.002285714285715e-06, + "loss": 0.303, + "step": 29010 + }, + { + "epoch": 403.0, + "eval_loss": 0.5816003680229187, + "eval_runtime": 127.9487, + "eval_samples_per_second": 4.158, + "eval_steps_per_second": 0.524, + "eval_wer": 0.21212315999228643, + "step": 29016 + }, + { + "epoch": 403.06, + "learning_rate": 7.990857142857144e-06, + "loss": 0.2901, + "step": 29020 + }, + { + "epoch": 403.19, + "learning_rate": 7.979428571428572e-06, + "loss": 0.2997, + "step": 29030 + }, + { + "epoch": 403.33, + "learning_rate": 7.968e-06, + "loss": 0.2876, + "step": 29040 + }, + { + "epoch": 403.47, + "learning_rate": 7.956571428571429e-06, + "loss": 0.286, + "step": 29050 + }, + { + "epoch": 403.61, + "learning_rate": 7.945142857142857e-06, + "loss": 0.286, + "step": 29060 + }, + { + "epoch": 403.75, + "learning_rate": 7.933714285714288e-06, + "loss": 0.2922, + "step": 29070 + }, + { + "epoch": 403.89, + "learning_rate": 7.922285714285714e-06, + "loss": 0.2858, + "step": 29080 + }, + { + "epoch": 404.0, + "eval_loss": 0.5642435550689697, + "eval_runtime": 127.5199, + "eval_samples_per_second": 4.172, + "eval_steps_per_second": 0.525, + "eval_wer": 0.21302307642861734, + "step": 29088 + }, + { + "epoch": 404.03, + "learning_rate": 7.910857142857143e-06, + "loss": 0.2908, + "step": 29090 + }, + { + "epoch": 404.17, + "learning_rate": 7.899428571428573e-06, + "loss": 0.2818, + "step": 29100 + }, + { + "epoch": 404.3, + "learning_rate": 7.888e-06, + "loss": 0.2865, + "step": 29110 + }, + { + "epoch": 404.44, + "learning_rate": 7.876571428571428e-06, + "loss": 0.2985, + "step": 29120 + }, + { + "epoch": 404.58, + "learning_rate": 7.865142857142858e-06, + "loss": 0.2853, + "step": 29130 + }, + { + "epoch": 404.72, + "learning_rate": 7.853714285714287e-06, + "loss": 0.2899, + "step": 29140 + }, + { + "epoch": 404.86, + "learning_rate": 7.842285714285715e-06, + "loss": 0.2831, + "step": 29150 + }, + { + "epoch": 405.0, + "learning_rate": 7.830857142857144e-06, + "loss": 0.2905, + "step": 29160 + }, + { + "epoch": 405.0, + "eval_loss": 0.5668894052505493, + "eval_runtime": 129.076, + "eval_samples_per_second": 4.122, + "eval_steps_per_second": 0.519, + "eval_wer": 0.2134730346467828, + "step": 29160 + }, + { + "epoch": 405.14, + "learning_rate": 7.819428571428572e-06, + "loss": 0.305, + "step": 29170 + }, + { + "epoch": 405.28, + "learning_rate": 7.808e-06, + "loss": 0.2946, + "step": 29180 + }, + { + "epoch": 405.42, + "learning_rate": 7.796571428571429e-06, + "loss": 0.2851, + "step": 29190 + }, + { + "epoch": 405.55, + "learning_rate": 7.785142857142857e-06, + "loss": 0.2896, + "step": 29200 + }, + { + "epoch": 405.69, + "learning_rate": 7.773714285714287e-06, + "loss": 0.2866, + "step": 29210 + }, + { + "epoch": 405.83, + "learning_rate": 7.762285714285714e-06, + "loss": 0.2915, + "step": 29220 + }, + { + "epoch": 405.97, + "learning_rate": 7.750857142857143e-06, + "loss": 0.2911, + "step": 29230 + }, + { + "epoch": 406.0, + "eval_loss": 0.5488747954368591, + "eval_runtime": 127.5196, + "eval_samples_per_second": 4.172, + "eval_steps_per_second": 0.525, + "eval_wer": 0.21167320177412097, + "step": 29232 + }, + { + "epoch": 406.11, + "learning_rate": 7.739428571428573e-06, + "loss": 0.2901, + "step": 29240 + }, + { + "epoch": 406.25, + "learning_rate": 7.728000000000001e-06, + "loss": 0.2897, + "step": 29250 + }, + { + "epoch": 406.39, + "learning_rate": 7.71657142857143e-06, + "loss": 0.2845, + "step": 29260 + }, + { + "epoch": 406.53, + "learning_rate": 7.705142857142858e-06, + "loss": 0.2978, + "step": 29270 + }, + { + "epoch": 406.66, + "learning_rate": 7.693714285714287e-06, + "loss": 0.2926, + "step": 29280 + }, + { + "epoch": 406.8, + "learning_rate": 7.682285714285715e-06, + "loss": 0.2895, + "step": 29290 + }, + { + "epoch": 406.94, + "learning_rate": 7.670857142857143e-06, + "loss": 0.294, + "step": 29300 + }, + { + "epoch": 407.0, + "eval_loss": 0.5599918961524963, + "eval_runtime": 127.6376, + "eval_samples_per_second": 4.168, + "eval_steps_per_second": 0.525, + "eval_wer": 0.21032332711962462, + "step": 29304 + }, + { + "epoch": 407.08, + "learning_rate": 7.659428571428572e-06, + "loss": 0.3001, + "step": 29310 + }, + { + "epoch": 407.22, + "learning_rate": 7.648e-06, + "loss": 0.2864, + "step": 29320 + }, + { + "epoch": 407.36, + "learning_rate": 7.636571428571429e-06, + "loss": 0.2935, + "step": 29330 + }, + { + "epoch": 407.5, + "learning_rate": 7.625142857142858e-06, + "loss": 0.2847, + "step": 29340 + }, + { + "epoch": 407.64, + "learning_rate": 7.6137142857142865e-06, + "loss": 0.2812, + "step": 29350 + }, + { + "epoch": 407.78, + "learning_rate": 7.602285714285716e-06, + "loss": 0.2907, + "step": 29360 + }, + { + "epoch": 407.91, + "learning_rate": 7.590857142857143e-06, + "loss": 0.2928, + "step": 29370 + }, + { + "epoch": 408.0, + "eval_loss": 0.5522825717926025, + "eval_runtime": 127.6251, + "eval_samples_per_second": 4.168, + "eval_steps_per_second": 0.525, + "eval_wer": 0.2118017612650254, + "step": 29376 + }, + { + "epoch": 408.06, + "learning_rate": 7.579428571428572e-06, + "loss": 0.2929, + "step": 29380 + }, + { + "epoch": 408.19, + "learning_rate": 7.568000000000001e-06, + "loss": 0.2913, + "step": 29390 + }, + { + "epoch": 408.33, + "learning_rate": 7.556571428571429e-06, + "loss": 0.2909, + "step": 29400 + }, + { + "epoch": 408.47, + "learning_rate": 7.545142857142858e-06, + "loss": 0.2913, + "step": 29410 + }, + { + "epoch": 408.61, + "learning_rate": 7.533714285714286e-06, + "loss": 0.2781, + "step": 29420 + }, + { + "epoch": 408.75, + "learning_rate": 7.522285714285716e-06, + "loss": 0.2842, + "step": 29430 + }, + { + "epoch": 408.89, + "learning_rate": 7.510857142857143e-06, + "loss": 0.282, + "step": 29440 + }, + { + "epoch": 409.0, + "eval_loss": 0.5602902770042419, + "eval_runtime": 127.3543, + "eval_samples_per_second": 4.177, + "eval_steps_per_second": 0.526, + "eval_wer": 0.2127659574468085, + "step": 29448 + }, + { + "epoch": 409.03, + "learning_rate": 7.499428571428572e-06, + "loss": 0.2886, + "step": 29450 + }, + { + "epoch": 409.17, + "learning_rate": 7.488000000000001e-06, + "loss": 0.2887, + "step": 29460 + }, + { + "epoch": 409.3, + "learning_rate": 7.476571428571429e-06, + "loss": 0.2882, + "step": 29470 + }, + { + "epoch": 409.44, + "learning_rate": 7.465142857142858e-06, + "loss": 0.2924, + "step": 29480 + }, + { + "epoch": 409.58, + "learning_rate": 7.453714285714286e-06, + "loss": 0.2878, + "step": 29490 + }, + { + "epoch": 409.72, + "learning_rate": 7.442285714285716e-06, + "loss": 0.2834, + "step": 29500 + }, + { + "epoch": 409.86, + "learning_rate": 7.430857142857143e-06, + "loss": 0.2748, + "step": 29510 + }, + { + "epoch": 410.0, + "learning_rate": 7.419428571428572e-06, + "loss": 0.2919, + "step": 29520 + }, + { + "epoch": 410.0, + "eval_loss": 0.5701452493667603, + "eval_runtime": 127.0581, + "eval_samples_per_second": 4.187, + "eval_steps_per_second": 0.527, + "eval_wer": 0.2127016777013563, + "step": 29520 + }, + { + "epoch": 410.14, + "learning_rate": 7.408000000000001e-06, + "loss": 0.285, + "step": 29530 + }, + { + "epoch": 410.28, + "learning_rate": 7.396571428571429e-06, + "loss": 0.2931, + "step": 29540 + }, + { + "epoch": 410.42, + "learning_rate": 7.385142857142858e-06, + "loss": 0.2906, + "step": 29550 + }, + { + "epoch": 410.55, + "learning_rate": 7.373714285714286e-06, + "loss": 0.2818, + "step": 29560 + }, + { + "epoch": 410.69, + "learning_rate": 7.3622857142857155e-06, + "loss": 0.2913, + "step": 29570 + }, + { + "epoch": 410.83, + "learning_rate": 7.350857142857143e-06, + "loss": 0.2865, + "step": 29580 + }, + { + "epoch": 410.97, + "learning_rate": 7.3394285714285715e-06, + "loss": 0.3006, + "step": 29590 + }, + { + "epoch": 411.0, + "eval_loss": 0.5681251883506775, + "eval_runtime": 127.0015, + "eval_samples_per_second": 4.189, + "eval_steps_per_second": 0.528, + "eval_wer": 0.21360159413768723, + "step": 29592 + }, + { + "epoch": 411.11, + "learning_rate": 7.328000000000001e-06, + "loss": 0.2836, + "step": 29600 + }, + { + "epoch": 411.25, + "learning_rate": 7.316571428571429e-06, + "loss": 0.2802, + "step": 29610 + }, + { + "epoch": 411.39, + "learning_rate": 7.305142857142858e-06, + "loss": 0.2819, + "step": 29620 + }, + { + "epoch": 411.53, + "learning_rate": 7.293714285714286e-06, + "loss": 0.2981, + "step": 29630 + }, + { + "epoch": 411.66, + "learning_rate": 7.282285714285715e-06, + "loss": 0.2876, + "step": 29640 + }, + { + "epoch": 411.8, + "learning_rate": 7.270857142857144e-06, + "loss": 0.2962, + "step": 29650 + }, + { + "epoch": 411.94, + "learning_rate": 7.2594285714285715e-06, + "loss": 0.2882, + "step": 29660 + }, + { + "epoch": 412.0, + "eval_loss": 0.5607542991638184, + "eval_runtime": 127.9973, + "eval_samples_per_second": 4.156, + "eval_steps_per_second": 0.523, + "eval_wer": 0.21238027897409525, + "step": 29664 + }, + { + "epoch": 412.08, + "learning_rate": 7.248000000000001e-06, + "loss": 0.2931, + "step": 29670 + }, + { + "epoch": 412.22, + "learning_rate": 7.236571428571429e-06, + "loss": 0.2819, + "step": 29680 + }, + { + "epoch": 412.36, + "learning_rate": 7.225142857142858e-06, + "loss": 0.2784, + "step": 29690 + }, + { + "epoch": 412.5, + "learning_rate": 7.213714285714286e-06, + "loss": 0.2925, + "step": 29700 + }, + { + "epoch": 412.64, + "learning_rate": 7.202285714285715e-06, + "loss": 0.2838, + "step": 29710 + }, + { + "epoch": 412.78, + "learning_rate": 7.190857142857144e-06, + "loss": 0.2837, + "step": 29720 + }, + { + "epoch": 412.91, + "learning_rate": 7.179428571428571e-06, + "loss": 0.283, + "step": 29730 + }, + { + "epoch": 413.0, + "eval_loss": 0.5694901347160339, + "eval_runtime": 126.9317, + "eval_samples_per_second": 4.191, + "eval_steps_per_second": 0.528, + "eval_wer": 0.21385871311949606, + "step": 29736 + }, + { + "epoch": 413.06, + "learning_rate": 7.168000000000001e-06, + "loss": 0.2882, + "step": 29740 + }, + { + "epoch": 413.19, + "learning_rate": 7.156571428571429e-06, + "loss": 0.2871, + "step": 29750 + }, + { + "epoch": 413.33, + "learning_rate": 7.145142857142858e-06, + "loss": 0.2783, + "step": 29760 + }, + { + "epoch": 413.47, + "learning_rate": 7.133714285714286e-06, + "loss": 0.2893, + "step": 29770 + }, + { + "epoch": 413.61, + "learning_rate": 7.122285714285715e-06, + "loss": 0.2834, + "step": 29780 + }, + { + "epoch": 413.75, + "learning_rate": 7.110857142857144e-06, + "loss": 0.2914, + "step": 29790 + }, + { + "epoch": 413.89, + "learning_rate": 7.099428571428571e-06, + "loss": 0.2888, + "step": 29800 + }, + { + "epoch": 414.0, + "eval_loss": 0.5572978854179382, + "eval_runtime": 127.6614, + "eval_samples_per_second": 4.167, + "eval_steps_per_second": 0.525, + "eval_wer": 0.2111589638105033, + "step": 29808 + }, + { + "epoch": 414.03, + "learning_rate": 7.088000000000001e-06, + "loss": 0.2914, + "step": 29810 + }, + { + "epoch": 414.17, + "learning_rate": 7.077714285714287e-06, + "loss": 0.2898, + "step": 29820 + }, + { + "epoch": 414.3, + "learning_rate": 7.0662857142857144e-06, + "loss": 0.2889, + "step": 29830 + }, + { + "epoch": 414.44, + "learning_rate": 7.054857142857143e-06, + "loss": 0.2899, + "step": 29840 + }, + { + "epoch": 414.58, + "learning_rate": 7.043428571428572e-06, + "loss": 0.2805, + "step": 29850 + }, + { + "epoch": 414.72, + "learning_rate": 7.0320000000000015e-06, + "loss": 0.2932, + "step": 29860 + }, + { + "epoch": 414.86, + "learning_rate": 7.020571428571429e-06, + "loss": 0.29, + "step": 29870 + }, + { + "epoch": 415.0, + "learning_rate": 7.0091428571428575e-06, + "loss": 0.2774, + "step": 29880 + }, + { + "epoch": 415.0, + "eval_loss": 0.5686434507369995, + "eval_runtime": 126.7639, + "eval_samples_per_second": 4.197, + "eval_steps_per_second": 0.529, + "eval_wer": 0.21167320177412097, + "step": 29880 + }, + { + "epoch": 415.14, + "learning_rate": 6.997714285714287e-06, + "loss": 0.2902, + "step": 29890 + }, + { + "epoch": 415.28, + "learning_rate": 6.986285714285714e-06, + "loss": 0.2876, + "step": 29900 + }, + { + "epoch": 415.42, + "learning_rate": 6.974857142857143e-06, + "loss": 0.2951, + "step": 29910 + }, + { + "epoch": 415.55, + "learning_rate": 6.963428571428572e-06, + "loss": 0.2855, + "step": 29920 + }, + { + "epoch": 415.69, + "learning_rate": 6.952000000000001e-06, + "loss": 0.2918, + "step": 29930 + }, + { + "epoch": 415.83, + "learning_rate": 6.940571428571429e-06, + "loss": 0.2842, + "step": 29940 + }, + { + "epoch": 415.97, + "learning_rate": 6.929142857142857e-06, + "loss": 0.2854, + "step": 29950 + }, + { + "epoch": 416.0, + "eval_loss": 0.5725164413452148, + "eval_runtime": 127.6196, + "eval_samples_per_second": 4.169, + "eval_steps_per_second": 0.525, + "eval_wer": 0.2071736195924664, + "step": 29952 + }, + { + "epoch": 416.11, + "learning_rate": 6.917714285714287e-06, + "loss": 0.2872, + "step": 29960 + }, + { + "epoch": 416.25, + "learning_rate": 6.906285714285715e-06, + "loss": 0.2972, + "step": 29970 + }, + { + "epoch": 416.39, + "learning_rate": 6.894857142857143e-06, + "loss": 0.2829, + "step": 29980 + }, + { + "epoch": 416.53, + "learning_rate": 6.883428571428572e-06, + "loss": 0.2844, + "step": 29990 + }, + { + "epoch": 416.66, + "learning_rate": 6.872000000000001e-06, + "loss": 0.2939, + "step": 30000 + }, + { + "epoch": 416.8, + "learning_rate": 6.860571428571429e-06, + "loss": 0.278, + "step": 30010 + }, + { + "epoch": 416.94, + "learning_rate": 6.849142857142857e-06, + "loss": 0.2842, + "step": 30020 + }, + { + "epoch": 417.0, + "eval_loss": 0.5745316743850708, + "eval_runtime": 127.3966, + "eval_samples_per_second": 4.176, + "eval_steps_per_second": 0.526, + "eval_wer": 0.20839493475605836, + "step": 30024 + }, + { + "epoch": 417.08, + "learning_rate": 6.837714285714287e-06, + "loss": 0.2867, + "step": 30030 + }, + { + "epoch": 417.22, + "learning_rate": 6.826285714285715e-06, + "loss": 0.2901, + "step": 30040 + }, + { + "epoch": 417.36, + "learning_rate": 6.814857142857143e-06, + "loss": 0.2698, + "step": 30050 + }, + { + "epoch": 417.5, + "learning_rate": 6.803428571428572e-06, + "loss": 0.2814, + "step": 30060 + }, + { + "epoch": 417.64, + "learning_rate": 6.792000000000001e-06, + "loss": 0.2816, + "step": 30070 + }, + { + "epoch": 417.78, + "learning_rate": 6.780571428571429e-06, + "loss": 0.2825, + "step": 30080 + }, + { + "epoch": 417.91, + "learning_rate": 6.769142857142857e-06, + "loss": 0.2905, + "step": 30090 + }, + { + "epoch": 418.0, + "eval_loss": 0.574224591255188, + "eval_runtime": 127.3796, + "eval_samples_per_second": 4.176, + "eval_steps_per_second": 0.526, + "eval_wer": 0.2101947676287202, + "step": 30096 + }, + { + "epoch": 418.06, + "learning_rate": 6.7577142857142865e-06, + "loss": 0.2902, + "step": 30100 + }, + { + "epoch": 418.19, + "learning_rate": 6.746285714285715e-06, + "loss": 0.2914, + "step": 30110 + }, + { + "epoch": 418.33, + "learning_rate": 6.734857142857143e-06, + "loss": 0.2746, + "step": 30120 + }, + { + "epoch": 418.47, + "learning_rate": 6.723428571428572e-06, + "loss": 0.2867, + "step": 30130 + }, + { + "epoch": 418.61, + "learning_rate": 6.712000000000001e-06, + "loss": 0.275, + "step": 30140 + }, + { + "epoch": 418.75, + "learning_rate": 6.7005714285714296e-06, + "loss": 0.2858, + "step": 30150 + }, + { + "epoch": 418.89, + "learning_rate": 6.689142857142857e-06, + "loss": 0.2841, + "step": 30160 + }, + { + "epoch": 419.0, + "eval_loss": 0.5666540861129761, + "eval_runtime": 129.0517, + "eval_samples_per_second": 4.122, + "eval_steps_per_second": 0.519, + "eval_wer": 0.20974480941055473, + "step": 30168 + }, + { + "epoch": 419.03, + "learning_rate": 6.6777142857142864e-06, + "loss": 0.2806, + "step": 30170 + }, + { + "epoch": 419.17, + "learning_rate": 6.666285714285715e-06, + "loss": 0.2808, + "step": 30180 + }, + { + "epoch": 419.3, + "learning_rate": 6.654857142857143e-06, + "loss": 0.2766, + "step": 30190 + }, + { + "epoch": 419.44, + "learning_rate": 6.643428571428572e-06, + "loss": 0.2928, + "step": 30200 + }, + { + "epoch": 419.58, + "learning_rate": 6.632000000000001e-06, + "loss": 0.2744, + "step": 30210 + }, + { + "epoch": 419.72, + "learning_rate": 6.6205714285714295e-06, + "loss": 0.2852, + "step": 30220 + }, + { + "epoch": 419.86, + "learning_rate": 6.609142857142857e-06, + "loss": 0.2809, + "step": 30230 + }, + { + "epoch": 420.0, + "learning_rate": 6.597714285714286e-06, + "loss": 0.2804, + "step": 30240 + }, + { + "epoch": 420.0, + "eval_loss": 0.5721257328987122, + "eval_runtime": 127.2515, + "eval_samples_per_second": 4.181, + "eval_steps_per_second": 0.527, + "eval_wer": 0.21199460050138202, + "step": 30240 + }, + { + "epoch": 420.14, + "learning_rate": 6.586285714285715e-06, + "loss": 0.2886, + "step": 30250 + }, + { + "epoch": 420.28, + "learning_rate": 6.574857142857144e-06, + "loss": 0.2829, + "step": 30260 + }, + { + "epoch": 420.42, + "learning_rate": 6.563428571428572e-06, + "loss": 0.2786, + "step": 30270 + }, + { + "epoch": 420.55, + "learning_rate": 6.552000000000001e-06, + "loss": 0.287, + "step": 30280 + }, + { + "epoch": 420.69, + "learning_rate": 6.540571428571429e-06, + "loss": 0.2851, + "step": 30290 + }, + { + "epoch": 420.83, + "learning_rate": 6.529142857142857e-06, + "loss": 0.2803, + "step": 30300 + }, + { + "epoch": 420.97, + "learning_rate": 6.517714285714286e-06, + "loss": 0.2854, + "step": 30310 + }, + { + "epoch": 421.0, + "eval_loss": 0.5770949721336365, + "eval_runtime": 127.7285, + "eval_samples_per_second": 4.165, + "eval_steps_per_second": 0.525, + "eval_wer": 0.20993764864691136, + "step": 30312 + }, + { + "epoch": 421.11, + "learning_rate": 6.506285714285715e-06, + "loss": 0.2858, + "step": 30320 + }, + { + "epoch": 421.25, + "learning_rate": 6.494857142857144e-06, + "loss": 0.2953, + "step": 30330 + }, + { + "epoch": 421.39, + "learning_rate": 6.483428571428572e-06, + "loss": 0.2842, + "step": 30340 + }, + { + "epoch": 421.53, + "learning_rate": 6.472000000000001e-06, + "loss": 0.2883, + "step": 30350 + }, + { + "epoch": 421.66, + "learning_rate": 6.460571428571429e-06, + "loss": 0.287, + "step": 30360 + }, + { + "epoch": 421.8, + "learning_rate": 6.449142857142857e-06, + "loss": 0.2789, + "step": 30370 + }, + { + "epoch": 421.94, + "learning_rate": 6.437714285714286e-06, + "loss": 0.2834, + "step": 30380 + }, + { + "epoch": 422.0, + "eval_loss": 0.5773890614509583, + "eval_runtime": 127.4995, + "eval_samples_per_second": 4.173, + "eval_steps_per_second": 0.525, + "eval_wer": 0.21212315999228643, + "step": 30384 + }, + { + "epoch": 422.08, + "learning_rate": 6.426285714285715e-06, + "loss": 0.2801, + "step": 30390 + }, + { + "epoch": 422.22, + "learning_rate": 6.414857142857144e-06, + "loss": 0.2833, + "step": 30400 + }, + { + "epoch": 422.36, + "learning_rate": 6.4034285714285715e-06, + "loss": 0.2891, + "step": 30410 + }, + { + "epoch": 422.5, + "learning_rate": 6.392000000000001e-06, + "loss": 0.2793, + "step": 30420 + }, + { + "epoch": 422.64, + "learning_rate": 6.380571428571429e-06, + "loss": 0.2815, + "step": 30430 + }, + { + "epoch": 422.78, + "learning_rate": 6.3691428571428585e-06, + "loss": 0.282, + "step": 30440 + }, + { + "epoch": 422.91, + "learning_rate": 6.357714285714286e-06, + "loss": 0.292, + "step": 30450 + }, + { + "epoch": 423.0, + "eval_loss": 0.5824567675590515, + "eval_runtime": 127.285, + "eval_samples_per_second": 4.18, + "eval_steps_per_second": 0.526, + "eval_wer": 0.2127659574468085, + "step": 30456 + }, + { + "epoch": 423.06, + "learning_rate": 6.3462857142857146e-06, + "loss": 0.2861, + "step": 30460 + }, + { + "epoch": 423.19, + "learning_rate": 6.334857142857144e-06, + "loss": 0.2908, + "step": 30470 + }, + { + "epoch": 423.33, + "learning_rate": 6.3234285714285714e-06, + "loss": 0.2816, + "step": 30480 + }, + { + "epoch": 423.47, + "learning_rate": 6.312000000000001e-06, + "loss": 0.289, + "step": 30490 + }, + { + "epoch": 423.61, + "learning_rate": 6.300571428571429e-06, + "loss": 0.2757, + "step": 30500 + }, + { + "epoch": 423.75, + "learning_rate": 6.2891428571428584e-06, + "loss": 0.2936, + "step": 30510 + }, + { + "epoch": 423.89, + "learning_rate": 6.277714285714286e-06, + "loss": 0.2762, + "step": 30520 + }, + { + "epoch": 424.0, + "eval_loss": 0.5828635096549988, + "eval_runtime": 127.2503, + "eval_samples_per_second": 4.181, + "eval_steps_per_second": 0.527, + "eval_wer": 0.21263739795590408, + "step": 30528 + }, + { + "epoch": 424.03, + "learning_rate": 6.2662857142857145e-06, + "loss": 0.2902, + "step": 30530 + }, + { + "epoch": 424.17, + "learning_rate": 6.254857142857144e-06, + "loss": 0.2841, + "step": 30540 + }, + { + "epoch": 424.3, + "learning_rate": 6.243428571428571e-06, + "loss": 0.2744, + "step": 30550 + }, + { + "epoch": 424.44, + "learning_rate": 6.232000000000001e-06, + "loss": 0.2871, + "step": 30560 + }, + { + "epoch": 424.58, + "learning_rate": 6.220571428571429e-06, + "loss": 0.2799, + "step": 30570 + }, + { + "epoch": 424.72, + "learning_rate": 6.209142857142858e-06, + "loss": 0.29, + "step": 30580 + }, + { + "epoch": 424.86, + "learning_rate": 6.197714285714286e-06, + "loss": 0.2827, + "step": 30590 + }, + { + "epoch": 425.0, + "learning_rate": 6.186285714285714e-06, + "loss": 0.2755, + "step": 30600 + }, + { + "epoch": 425.0, + "eval_loss": 0.5959154963493347, + "eval_runtime": 127.4997, + "eval_samples_per_second": 4.173, + "eval_steps_per_second": 0.525, + "eval_wer": 0.21559426624670566, + "step": 30600 + }, + { + "epoch": 425.14, + "learning_rate": 6.174857142857144e-06, + "loss": 0.2829, + "step": 30610 + }, + { + "epoch": 425.28, + "learning_rate": 6.163428571428572e-06, + "loss": 0.2809, + "step": 30620 + }, + { + "epoch": 425.42, + "learning_rate": 6.1520000000000006e-06, + "loss": 0.2794, + "step": 30630 + }, + { + "epoch": 425.55, + "learning_rate": 6.140571428571429e-06, + "loss": 0.277, + "step": 30640 + }, + { + "epoch": 425.69, + "learning_rate": 6.129142857142858e-06, + "loss": 0.2961, + "step": 30650 + }, + { + "epoch": 425.83, + "learning_rate": 6.117714285714286e-06, + "loss": 0.2838, + "step": 30660 + }, + { + "epoch": 425.97, + "learning_rate": 6.106285714285714e-06, + "loss": 0.2866, + "step": 30670 + }, + { + "epoch": 426.0, + "eval_loss": 0.5843947529792786, + "eval_runtime": 127.0123, + "eval_samples_per_second": 4.189, + "eval_steps_per_second": 0.528, + "eval_wer": 0.21405155235585266, + "step": 30672 + }, + { + "epoch": 426.11, + "learning_rate": 6.094857142857144e-06, + "loss": 0.2997, + "step": 30680 + }, + { + "epoch": 426.25, + "learning_rate": 6.083428571428572e-06, + "loss": 0.2813, + "step": 30690 + }, + { + "epoch": 426.39, + "learning_rate": 6.0720000000000005e-06, + "loss": 0.2788, + "step": 30700 + }, + { + "epoch": 426.53, + "learning_rate": 6.060571428571429e-06, + "loss": 0.2844, + "step": 30710 + }, + { + "epoch": 426.66, + "learning_rate": 6.049142857142858e-06, + "loss": 0.2849, + "step": 30720 + }, + { + "epoch": 426.8, + "learning_rate": 6.037714285714287e-06, + "loss": 0.2934, + "step": 30730 + }, + { + "epoch": 426.94, + "learning_rate": 6.026285714285714e-06, + "loss": 0.2801, + "step": 30740 + }, + { + "epoch": 427.0, + "eval_loss": 0.588335394859314, + "eval_runtime": 128.3752, + "eval_samples_per_second": 4.144, + "eval_steps_per_second": 0.522, + "eval_wer": 0.2157871054830623, + "step": 30744 + }, + { + "epoch": 427.08, + "learning_rate": 6.0148571428571435e-06, + "loss": 0.2915, + "step": 30750 + }, + { + "epoch": 427.22, + "learning_rate": 6.003428571428572e-06, + "loss": 0.2973, + "step": 30760 + }, + { + "epoch": 427.36, + "learning_rate": 5.993142857142857e-06, + "loss": 0.2652, + "step": 30770 + }, + { + "epoch": 427.5, + "learning_rate": 5.981714285714287e-06, + "loss": 0.2874, + "step": 30780 + }, + { + "epoch": 427.64, + "learning_rate": 5.970285714285715e-06, + "loss": 0.2759, + "step": 30790 + }, + { + "epoch": 427.78, + "learning_rate": 5.958857142857143e-06, + "loss": 0.2743, + "step": 30800 + }, + { + "epoch": 427.91, + "learning_rate": 5.947428571428572e-06, + "loss": 0.2882, + "step": 30810 + }, + { + "epoch": 428.0, + "eval_loss": 0.5844987034797668, + "eval_runtime": 128.1032, + "eval_samples_per_second": 4.153, + "eval_steps_per_second": 0.523, + "eval_wer": 0.21475862955582695, + "step": 30816 + }, + { + "epoch": 428.06, + "learning_rate": 5.9360000000000004e-06, + "loss": 0.2898, + "step": 30820 + }, + { + "epoch": 428.19, + "learning_rate": 5.92457142857143e-06, + "loss": 0.2908, + "step": 30830 + }, + { + "epoch": 428.33, + "learning_rate": 5.913142857142857e-06, + "loss": 0.2785, + "step": 30840 + }, + { + "epoch": 428.47, + "learning_rate": 5.901714285714287e-06, + "loss": 0.2899, + "step": 30850 + }, + { + "epoch": 428.61, + "learning_rate": 5.890285714285715e-06, + "loss": 0.2729, + "step": 30860 + }, + { + "epoch": 428.75, + "learning_rate": 5.878857142857143e-06, + "loss": 0.278, + "step": 30870 + }, + { + "epoch": 428.89, + "learning_rate": 5.867428571428572e-06, + "loss": 0.2718, + "step": 30880 + }, + { + "epoch": 429.0, + "eval_loss": 0.5864471197128296, + "eval_runtime": 127.6992, + "eval_samples_per_second": 4.166, + "eval_steps_per_second": 0.525, + "eval_wer": 0.21160892202866877, + "step": 30888 + }, + { + "epoch": 429.03, + "learning_rate": 5.856e-06, + "loss": 0.2766, + "step": 30890 + }, + { + "epoch": 429.17, + "learning_rate": 5.84457142857143e-06, + "loss": 0.2944, + "step": 30900 + }, + { + "epoch": 429.3, + "learning_rate": 5.833142857142857e-06, + "loss": 0.2846, + "step": 30910 + }, + { + "epoch": 429.44, + "learning_rate": 5.8217142857142865e-06, + "loss": 0.2823, + "step": 30920 + }, + { + "epoch": 429.58, + "learning_rate": 5.810285714285715e-06, + "loss": 0.282, + "step": 30930 + }, + { + "epoch": 429.72, + "learning_rate": 5.798857142857144e-06, + "loss": 0.2785, + "step": 30940 + }, + { + "epoch": 429.86, + "learning_rate": 5.787428571428572e-06, + "loss": 0.2763, + "step": 30950 + }, + { + "epoch": 430.0, + "learning_rate": 5.776e-06, + "loss": 0.2687, + "step": 30960 + }, + { + "epoch": 430.0, + "eval_loss": 0.5664164423942566, + "eval_runtime": 127.2406, + "eval_samples_per_second": 4.181, + "eval_steps_per_second": 0.527, + "eval_wer": 0.20929485119238928, + "step": 30960 + }, + { + "epoch": 430.14, + "learning_rate": 5.7645714285714295e-06, + "loss": 0.2835, + "step": 30970 + }, + { + "epoch": 430.28, + "learning_rate": 5.753142857142857e-06, + "loss": 0.2899, + "step": 30980 + }, + { + "epoch": 430.42, + "learning_rate": 5.7417142857142864e-06, + "loss": 0.2882, + "step": 30990 + }, + { + "epoch": 430.55, + "learning_rate": 5.730285714285715e-06, + "loss": 0.2767, + "step": 31000 + }, + { + "epoch": 430.69, + "learning_rate": 5.718857142857144e-06, + "loss": 0.2889, + "step": 31010 + }, + { + "epoch": 430.83, + "learning_rate": 5.707428571428572e-06, + "loss": 0.2763, + "step": 31020 + }, + { + "epoch": 430.97, + "learning_rate": 5.696e-06, + "loss": 0.2896, + "step": 31030 + }, + { + "epoch": 431.0, + "eval_loss": 0.5712748765945435, + "eval_runtime": 128.5319, + "eval_samples_per_second": 4.139, + "eval_steps_per_second": 0.521, + "eval_wer": 0.21148036253776434, + "step": 31032 + }, + { + "epoch": 431.11, + "learning_rate": 5.6845714285714295e-06, + "loss": 0.2808, + "step": 31040 + }, + { + "epoch": 431.25, + "learning_rate": 5.673142857142857e-06, + "loss": 0.2708, + "step": 31050 + }, + { + "epoch": 431.39, + "learning_rate": 5.661714285714286e-06, + "loss": 0.2823, + "step": 31060 + }, + { + "epoch": 431.53, + "learning_rate": 5.650285714285715e-06, + "loss": 0.2814, + "step": 31070 + }, + { + "epoch": 431.66, + "learning_rate": 5.638857142857144e-06, + "loss": 0.281, + "step": 31080 + }, + { + "epoch": 431.8, + "learning_rate": 5.627428571428572e-06, + "loss": 0.2813, + "step": 31090 + }, + { + "epoch": 431.94, + "learning_rate": 5.616e-06, + "loss": 0.2816, + "step": 31100 + }, + { + "epoch": 432.0, + "eval_loss": 0.5756629705429077, + "eval_runtime": 127.581, + "eval_samples_per_second": 4.17, + "eval_steps_per_second": 0.525, + "eval_wer": 0.21315163591952177, + "step": 31104 + }, + { + "epoch": 432.08, + "learning_rate": 5.604571428571429e-06, + "loss": 0.2748, + "step": 31110 + }, + { + "epoch": 432.22, + "learning_rate": 5.593142857142858e-06, + "loss": 0.2829, + "step": 31120 + }, + { + "epoch": 432.36, + "learning_rate": 5.581714285714286e-06, + "loss": 0.2756, + "step": 31130 + }, + { + "epoch": 432.5, + "learning_rate": 5.570285714285715e-06, + "loss": 0.2836, + "step": 31140 + }, + { + "epoch": 432.64, + "learning_rate": 5.558857142857144e-06, + "loss": 0.2741, + "step": 31150 + }, + { + "epoch": 432.78, + "learning_rate": 5.547428571428572e-06, + "loss": 0.2877, + "step": 31160 + }, + { + "epoch": 432.91, + "learning_rate": 5.536e-06, + "loss": 0.2817, + "step": 31170 + }, + { + "epoch": 433.0, + "eval_loss": 0.5831404328346252, + "eval_runtime": 127.3022, + "eval_samples_per_second": 4.179, + "eval_steps_per_second": 0.526, + "eval_wer": 0.21315163591952177, + "step": 31176 + }, + { + "epoch": 433.06, + "learning_rate": 5.524571428571429e-06, + "loss": 0.288, + "step": 31180 + }, + { + "epoch": 433.19, + "learning_rate": 5.513142857142858e-06, + "loss": 0.2891, + "step": 31190 + }, + { + "epoch": 433.33, + "learning_rate": 5.501714285714286e-06, + "loss": 0.2764, + "step": 31200 + }, + { + "epoch": 433.47, + "learning_rate": 5.490285714285715e-06, + "loss": 0.2772, + "step": 31210 + }, + { + "epoch": 433.61, + "learning_rate": 5.478857142857144e-06, + "loss": 0.2648, + "step": 31220 + }, + { + "epoch": 433.75, + "learning_rate": 5.467428571428572e-06, + "loss": 0.2798, + "step": 31230 + }, + { + "epoch": 433.89, + "learning_rate": 5.456e-06, + "loss": 0.2816, + "step": 31240 + }, + { + "epoch": 434.0, + "eval_loss": 0.5841153860092163, + "eval_runtime": 128.1155, + "eval_samples_per_second": 4.153, + "eval_steps_per_second": 0.523, + "eval_wer": 0.21212315999228643, + "step": 31248 + }, + { + "epoch": 434.03, + "learning_rate": 5.444571428571429e-06, + "loss": 0.2846, + "step": 31250 + }, + { + "epoch": 434.17, + "learning_rate": 5.433142857142858e-06, + "loss": 0.2801, + "step": 31260 + }, + { + "epoch": 434.3, + "learning_rate": 5.421714285714286e-06, + "loss": 0.2775, + "step": 31270 + }, + { + "epoch": 434.44, + "learning_rate": 5.4102857142857145e-06, + "loss": 0.283, + "step": 31280 + }, + { + "epoch": 434.58, + "learning_rate": 5.398857142857144e-06, + "loss": 0.2762, + "step": 31290 + }, + { + "epoch": 434.72, + "learning_rate": 5.387428571428572e-06, + "loss": 0.2873, + "step": 31300 + }, + { + "epoch": 434.86, + "learning_rate": 5.376e-06, + "loss": 0.2821, + "step": 31310 + }, + { + "epoch": 435.0, + "learning_rate": 5.364571428571429e-06, + "loss": 0.2757, + "step": 31320 + }, + { + "epoch": 435.0, + "eval_loss": 0.5849021077156067, + "eval_runtime": 127.5651, + "eval_samples_per_second": 4.17, + "eval_steps_per_second": 0.525, + "eval_wer": 0.21552998650125346, + "step": 31320 + }, + { + "epoch": 435.14, + "learning_rate": 5.353142857142858e-06, + "loss": 0.2881, + "step": 31330 + }, + { + "epoch": 435.28, + "learning_rate": 5.341714285714286e-06, + "loss": 0.2822, + "step": 31340 + }, + { + "epoch": 435.42, + "learning_rate": 5.3302857142857145e-06, + "loss": 0.2782, + "step": 31350 + }, + { + "epoch": 435.55, + "learning_rate": 5.318857142857144e-06, + "loss": 0.2706, + "step": 31360 + }, + { + "epoch": 435.69, + "learning_rate": 5.307428571428572e-06, + "loss": 0.2766, + "step": 31370 + }, + { + "epoch": 435.83, + "learning_rate": 5.296e-06, + "loss": 0.2648, + "step": 31380 + }, + { + "epoch": 435.97, + "learning_rate": 5.284571428571429e-06, + "loss": 0.2871, + "step": 31390 + }, + { + "epoch": 436.0, + "eval_loss": 0.591614305973053, + "eval_runtime": 127.5888, + "eval_samples_per_second": 4.17, + "eval_steps_per_second": 0.525, + "eval_wer": 0.21450151057401812, + "step": 31392 + }, + { + "epoch": 436.11, + "learning_rate": 5.2731428571428575e-06, + "loss": 0.2912, + "step": 31400 + }, + { + "epoch": 436.25, + "learning_rate": 5.261714285714287e-06, + "loss": 0.2698, + "step": 31410 + }, + { + "epoch": 436.39, + "learning_rate": 5.250285714285714e-06, + "loss": 0.2755, + "step": 31420 + }, + { + "epoch": 436.53, + "learning_rate": 5.238857142857144e-06, + "loss": 0.2779, + "step": 31430 + }, + { + "epoch": 436.66, + "learning_rate": 5.227428571428572e-06, + "loss": 0.2857, + "step": 31440 + }, + { + "epoch": 436.8, + "learning_rate": 5.216e-06, + "loss": 0.2803, + "step": 31450 + }, + { + "epoch": 436.94, + "learning_rate": 5.204571428571429e-06, + "loss": 0.2741, + "step": 31460 + }, + { + "epoch": 437.0, + "eval_loss": 0.5873463153839111, + "eval_runtime": 127.5515, + "eval_samples_per_second": 4.171, + "eval_steps_per_second": 0.525, + "eval_wer": 0.21360159413768723, + "step": 31464 + }, + { + "epoch": 437.08, + "learning_rate": 5.193142857142857e-06, + "loss": 0.2649, + "step": 31470 + }, + { + "epoch": 437.22, + "learning_rate": 5.181714285714287e-06, + "loss": 0.2744, + "step": 31480 + }, + { + "epoch": 437.36, + "learning_rate": 5.170285714285714e-06, + "loss": 0.2757, + "step": 31490 + }, + { + "epoch": 437.5, + "learning_rate": 5.158857142857144e-06, + "loss": 0.2799, + "step": 31500 + }, + { + "epoch": 437.64, + "learning_rate": 5.147428571428572e-06, + "loss": 0.2849, + "step": 31510 + }, + { + "epoch": 437.78, + "learning_rate": 5.136e-06, + "loss": 0.2913, + "step": 31520 + }, + { + "epoch": 437.91, + "learning_rate": 5.124571428571429e-06, + "loss": 0.2911, + "step": 31530 + }, + { + "epoch": 438.0, + "eval_loss": 0.5922967791557312, + "eval_runtime": 127.7496, + "eval_samples_per_second": 4.164, + "eval_steps_per_second": 0.524, + "eval_wer": 0.21205888024683422, + "step": 31536 + }, + { + "epoch": 438.06, + "learning_rate": 5.113142857142857e-06, + "loss": 0.2831, + "step": 31540 + }, + { + "epoch": 438.19, + "learning_rate": 5.101714285714287e-06, + "loss": 0.2936, + "step": 31550 + }, + { + "epoch": 438.33, + "learning_rate": 5.090285714285714e-06, + "loss": 0.2732, + "step": 31560 + }, + { + "epoch": 438.47, + "learning_rate": 5.0788571428571435e-06, + "loss": 0.2919, + "step": 31570 + }, + { + "epoch": 438.61, + "learning_rate": 5.067428571428572e-06, + "loss": 0.2678, + "step": 31580 + }, + { + "epoch": 438.75, + "learning_rate": 5.056000000000001e-06, + "loss": 0.2789, + "step": 31590 + }, + { + "epoch": 438.89, + "learning_rate": 5.044571428571429e-06, + "loss": 0.275, + "step": 31600 + }, + { + "epoch": 439.0, + "eval_loss": 0.5811768770217896, + "eval_runtime": 127.309, + "eval_samples_per_second": 4.179, + "eval_steps_per_second": 0.526, + "eval_wer": 0.21662274217394098, + "step": 31608 + }, + { + "epoch": 439.03, + "learning_rate": 5.033142857142857e-06, + "loss": 0.286, + "step": 31610 + }, + { + "epoch": 439.17, + "learning_rate": 5.0217142857142865e-06, + "loss": 0.2836, + "step": 31620 + }, + { + "epoch": 439.3, + "learning_rate": 5.010285714285714e-06, + "loss": 0.2761, + "step": 31630 + }, + { + "epoch": 439.44, + "learning_rate": 4.998857142857143e-06, + "loss": 0.284, + "step": 31640 + }, + { + "epoch": 439.58, + "learning_rate": 4.987428571428572e-06, + "loss": 0.2783, + "step": 31650 + }, + { + "epoch": 439.72, + "learning_rate": 4.976e-06, + "loss": 0.2859, + "step": 31660 + }, + { + "epoch": 439.86, + "learning_rate": 4.964571428571429e-06, + "loss": 0.2748, + "step": 31670 + }, + { + "epoch": 440.0, + "learning_rate": 4.953142857142857e-06, + "loss": 0.2686, + "step": 31680 + }, + { + "epoch": 440.0, + "eval_loss": 0.5934348106384277, + "eval_runtime": 127.7535, + "eval_samples_per_second": 4.164, + "eval_steps_per_second": 0.524, + "eval_wer": 0.21540142701034903, + "step": 31680 + }, + { + "epoch": 440.14, + "learning_rate": 4.9417142857142865e-06, + "loss": 0.287, + "step": 31690 + }, + { + "epoch": 440.28, + "learning_rate": 4.930285714285715e-06, + "loss": 0.2734, + "step": 31700 + }, + { + "epoch": 440.42, + "learning_rate": 4.918857142857143e-06, + "loss": 0.2772, + "step": 31710 + }, + { + "epoch": 440.55, + "learning_rate": 4.907428571428572e-06, + "loss": 0.2775, + "step": 31720 + }, + { + "epoch": 440.69, + "learning_rate": 4.896e-06, + "loss": 0.2806, + "step": 31730 + }, + { + "epoch": 440.83, + "learning_rate": 4.884571428571429e-06, + "loss": 0.2831, + "step": 31740 + }, + { + "epoch": 440.97, + "learning_rate": 4.873142857142857e-06, + "loss": 0.285, + "step": 31750 + }, + { + "epoch": 441.0, + "eval_loss": 0.5915161371231079, + "eval_runtime": 127.8523, + "eval_samples_per_second": 4.161, + "eval_steps_per_second": 0.524, + "eval_wer": 0.21559426624670566, + "step": 31752 + }, + { + "epoch": 441.11, + "learning_rate": 4.861714285714286e-06, + "loss": 0.281, + "step": 31760 + }, + { + "epoch": 441.25, + "learning_rate": 4.850285714285715e-06, + "loss": 0.2771, + "step": 31770 + }, + { + "epoch": 441.39, + "learning_rate": 4.838857142857143e-06, + "loss": 0.2748, + "step": 31780 + }, + { + "epoch": 441.53, + "learning_rate": 4.827428571428572e-06, + "loss": 0.2846, + "step": 31790 + }, + { + "epoch": 441.66, + "learning_rate": 4.816e-06, + "loss": 0.2743, + "step": 31800 + }, + { + "epoch": 441.8, + "learning_rate": 4.804571428571429e-06, + "loss": 0.2868, + "step": 31810 + }, + { + "epoch": 441.94, + "learning_rate": 4.793142857142857e-06, + "loss": 0.2896, + "step": 31820 + }, + { + "epoch": 442.0, + "eval_loss": 0.6024762988090515, + "eval_runtime": 127.5652, + "eval_samples_per_second": 4.17, + "eval_steps_per_second": 0.525, + "eval_wer": 0.2134087549013306, + "step": 31824 + }, + { + "epoch": 442.08, + "learning_rate": 4.781714285714286e-06, + "loss": 0.2797, + "step": 31830 + }, + { + "epoch": 442.22, + "learning_rate": 4.770285714285715e-06, + "loss": 0.278, + "step": 31840 + }, + { + "epoch": 442.36, + "learning_rate": 4.758857142857143e-06, + "loss": 0.2717, + "step": 31850 + }, + { + "epoch": 442.5, + "learning_rate": 4.747428571428572e-06, + "loss": 0.2767, + "step": 31860 + }, + { + "epoch": 442.64, + "learning_rate": 4.736000000000001e-06, + "loss": 0.2741, + "step": 31870 + }, + { + "epoch": 442.78, + "learning_rate": 4.724571428571429e-06, + "loss": 0.2909, + "step": 31880 + }, + { + "epoch": 442.91, + "learning_rate": 4.713142857142858e-06, + "loss": 0.2857, + "step": 31890 + }, + { + "epoch": 443.0, + "eval_loss": 0.5970373153686523, + "eval_runtime": 127.4091, + "eval_samples_per_second": 4.176, + "eval_steps_per_second": 0.526, + "eval_wer": 0.21559426624670566, + "step": 31896 + }, + { + "epoch": 443.06, + "learning_rate": 4.701714285714286e-06, + "loss": 0.2898, + "step": 31900 + }, + { + "epoch": 443.19, + "learning_rate": 4.690285714285715e-06, + "loss": 0.2843, + "step": 31910 + }, + { + "epoch": 443.33, + "learning_rate": 4.678857142857143e-06, + "loss": 0.2593, + "step": 31920 + }, + { + "epoch": 443.47, + "learning_rate": 4.6674285714285715e-06, + "loss": 0.2925, + "step": 31930 + }, + { + "epoch": 443.61, + "learning_rate": 4.656000000000001e-06, + "loss": 0.2711, + "step": 31940 + }, + { + "epoch": 443.75, + "learning_rate": 4.644571428571429e-06, + "loss": 0.2765, + "step": 31950 + }, + { + "epoch": 443.89, + "learning_rate": 4.633142857142858e-06, + "loss": 0.2757, + "step": 31960 + }, + { + "epoch": 444.0, + "eval_loss": 0.5788788795471191, + "eval_runtime": 127.6085, + "eval_samples_per_second": 4.169, + "eval_steps_per_second": 0.525, + "eval_wer": 0.2168155814102976, + "step": 31968 + }, + { + "epoch": 444.03, + "learning_rate": 4.621714285714286e-06, + "loss": 0.2976, + "step": 31970 + }, + { + "epoch": 444.17, + "learning_rate": 4.610285714285715e-06, + "loss": 0.2841, + "step": 31980 + }, + { + "epoch": 444.3, + "learning_rate": 4.598857142857143e-06, + "loss": 0.2852, + "step": 31990 + }, + { + "epoch": 444.44, + "learning_rate": 4.5874285714285715e-06, + "loss": 0.2753, + "step": 32000 + }, + { + "epoch": 444.58, + "learning_rate": 4.576000000000001e-06, + "loss": 0.2684, + "step": 32010 + }, + { + "epoch": 444.72, + "learning_rate": 4.564571428571429e-06, + "loss": 0.2854, + "step": 32020 + }, + { + "epoch": 444.86, + "learning_rate": 4.553142857142858e-06, + "loss": 0.2631, + "step": 32030 + }, + { + "epoch": 445.0, + "learning_rate": 4.541714285714286e-06, + "loss": 0.2878, + "step": 32040 + }, + { + "epoch": 445.0, + "eval_loss": 0.5882827639579773, + "eval_runtime": 128.1737, + "eval_samples_per_second": 4.151, + "eval_steps_per_second": 0.523, + "eval_wer": 0.21366587388313943, + "step": 32040 + }, + { + "epoch": 445.14, + "learning_rate": 4.5302857142857145e-06, + "loss": 0.2897, + "step": 32050 + }, + { + "epoch": 445.28, + "learning_rate": 4.518857142857143e-06, + "loss": 0.2793, + "step": 32060 + }, + { + "epoch": 445.42, + "learning_rate": 4.507428571428572e-06, + "loss": 0.2729, + "step": 32070 + }, + { + "epoch": 445.55, + "learning_rate": 4.496000000000001e-06, + "loss": 0.2756, + "step": 32080 + }, + { + "epoch": 445.69, + "learning_rate": 4.484571428571429e-06, + "loss": 0.286, + "step": 32090 + }, + { + "epoch": 445.83, + "learning_rate": 4.4731428571428575e-06, + "loss": 0.2734, + "step": 32100 + }, + { + "epoch": 445.97, + "learning_rate": 4.461714285714286e-06, + "loss": 0.2824, + "step": 32110 + }, + { + "epoch": 446.0, + "eval_loss": 0.597919225692749, + "eval_runtime": 127.6282, + "eval_samples_per_second": 4.168, + "eval_steps_per_second": 0.525, + "eval_wer": 0.21707270039210644, + "step": 32112 + }, + { + "epoch": 446.11, + "learning_rate": 4.450285714285714e-06, + "loss": 0.2805, + "step": 32120 + }, + { + "epoch": 446.25, + "learning_rate": 4.438857142857143e-06, + "loss": 0.2807, + "step": 32130 + }, + { + "epoch": 446.39, + "learning_rate": 4.427428571428572e-06, + "loss": 0.2866, + "step": 32140 + }, + { + "epoch": 446.53, + "learning_rate": 4.416000000000001e-06, + "loss": 0.2855, + "step": 32150 + }, + { + "epoch": 446.66, + "learning_rate": 4.404571428571429e-06, + "loss": 0.2777, + "step": 32160 + }, + { + "epoch": 446.8, + "learning_rate": 4.3931428571428575e-06, + "loss": 0.2763, + "step": 32170 + }, + { + "epoch": 446.94, + "learning_rate": 4.381714285714286e-06, + "loss": 0.2809, + "step": 32180 + }, + { + "epoch": 447.0, + "eval_loss": 0.59099942445755, + "eval_runtime": 127.9864, + "eval_samples_per_second": 4.157, + "eval_steps_per_second": 0.523, + "eval_wer": 0.2142443915922093, + "step": 32184 + }, + { + "epoch": 447.08, + "learning_rate": 4.370285714285714e-06, + "loss": 0.287, + "step": 32190 + }, + { + "epoch": 447.22, + "learning_rate": 4.358857142857143e-06, + "loss": 0.2724, + "step": 32200 + }, + { + "epoch": 447.36, + "learning_rate": 4.347428571428572e-06, + "loss": 0.2697, + "step": 32210 + }, + { + "epoch": 447.5, + "learning_rate": 4.3360000000000005e-06, + "loss": 0.2775, + "step": 32220 + }, + { + "epoch": 447.64, + "learning_rate": 4.324571428571429e-06, + "loss": 0.2714, + "step": 32230 + }, + { + "epoch": 447.78, + "learning_rate": 4.313142857142857e-06, + "loss": 0.279, + "step": 32240 + }, + { + "epoch": 447.91, + "learning_rate": 4.301714285714287e-06, + "loss": 0.2899, + "step": 32250 + }, + { + "epoch": 448.0, + "eval_loss": 0.5900712609291077, + "eval_runtime": 128.1271, + "eval_samples_per_second": 4.152, + "eval_steps_per_second": 0.523, + "eval_wer": 0.2157228257376101, + "step": 32256 + }, + { + "epoch": 448.06, + "learning_rate": 4.290285714285714e-06, + "loss": 0.2854, + "step": 32260 + }, + { + "epoch": 448.19, + "learning_rate": 4.278857142857143e-06, + "loss": 0.2857, + "step": 32270 + }, + { + "epoch": 448.33, + "learning_rate": 4.267428571428572e-06, + "loss": 0.2784, + "step": 32280 + }, + { + "epoch": 448.47, + "learning_rate": 4.256e-06, + "loss": 0.2825, + "step": 32290 + }, + { + "epoch": 448.61, + "learning_rate": 4.244571428571429e-06, + "loss": 0.272, + "step": 32300 + }, + { + "epoch": 448.75, + "learning_rate": 4.233142857142857e-06, + "loss": 0.2714, + "step": 32310 + }, + { + "epoch": 448.89, + "learning_rate": 4.221714285714287e-06, + "loss": 0.2688, + "step": 32320 + }, + { + "epoch": 449.0, + "eval_loss": 0.5914981961250305, + "eval_runtime": 127.6663, + "eval_samples_per_second": 4.167, + "eval_steps_per_second": 0.525, + "eval_wer": 0.21334447515587837, + "step": 32328 + }, + { + "epoch": 449.03, + "learning_rate": 4.210285714285714e-06, + "loss": 0.288, + "step": 32330 + }, + { + "epoch": 449.17, + "learning_rate": 4.1988571428571435e-06, + "loss": 0.2779, + "step": 32340 + }, + { + "epoch": 449.3, + "learning_rate": 4.187428571428572e-06, + "loss": 0.2768, + "step": 32350 + }, + { + "epoch": 449.44, + "learning_rate": 4.176e-06, + "loss": 0.2711, + "step": 32360 + }, + { + "epoch": 449.58, + "learning_rate": 4.164571428571429e-06, + "loss": 0.2753, + "step": 32370 + }, + { + "epoch": 449.72, + "learning_rate": 4.153142857142857e-06, + "loss": 0.2821, + "step": 32380 + }, + { + "epoch": 449.86, + "learning_rate": 4.1417142857142865e-06, + "loss": 0.2704, + "step": 32390 + }, + { + "epoch": 450.0, + "learning_rate": 4.130285714285714e-06, + "loss": 0.2785, + "step": 32400 + }, + { + "epoch": 450.0, + "eval_loss": 0.5902188420295715, + "eval_runtime": 128.624, + "eval_samples_per_second": 4.136, + "eval_steps_per_second": 0.521, + "eval_wer": 0.21456579031947035, + "step": 32400 + }, + { + "epoch": 450.14, + "learning_rate": 4.118857142857143e-06, + "loss": 0.2786, + "step": 32410 + }, + { + "epoch": 450.28, + "learning_rate": 4.107428571428572e-06, + "loss": 0.2771, + "step": 32420 + }, + { + "epoch": 450.42, + "learning_rate": 4.096e-06, + "loss": 0.28, + "step": 32430 + }, + { + "epoch": 450.55, + "learning_rate": 4.084571428571429e-06, + "loss": 0.279, + "step": 32440 + }, + { + "epoch": 450.69, + "learning_rate": 4.073142857142858e-06, + "loss": 0.2777, + "step": 32450 + }, + { + "epoch": 450.83, + "learning_rate": 4.061714285714286e-06, + "loss": 0.2828, + "step": 32460 + }, + { + "epoch": 450.97, + "learning_rate": 4.050285714285714e-06, + "loss": 0.2807, + "step": 32470 + }, + { + "epoch": 451.0, + "eval_loss": 0.5859866142272949, + "eval_runtime": 127.8086, + "eval_samples_per_second": 4.162, + "eval_steps_per_second": 0.524, + "eval_wer": 0.21597994471941892, + "step": 32472 + }, + { + "epoch": 451.11, + "learning_rate": 4.038857142857143e-06, + "loss": 0.2865, + "step": 32480 + }, + { + "epoch": 451.25, + "learning_rate": 4.027428571428572e-06, + "loss": 0.2745, + "step": 32490 + }, + { + "epoch": 451.39, + "learning_rate": 4.016e-06, + "loss": 0.2683, + "step": 32500 + }, + { + "epoch": 451.53, + "learning_rate": 4.004571428571429e-06, + "loss": 0.2737, + "step": 32510 + }, + { + "epoch": 451.66, + "learning_rate": 3.993142857142858e-06, + "loss": 0.2687, + "step": 32520 + }, + { + "epoch": 451.8, + "learning_rate": 3.981714285714286e-06, + "loss": 0.2717, + "step": 32530 + }, + { + "epoch": 451.94, + "learning_rate": 3.970285714285715e-06, + "loss": 0.2936, + "step": 32540 + }, + { + "epoch": 452.0, + "eval_loss": 0.5842635035514832, + "eval_runtime": 127.8192, + "eval_samples_per_second": 4.162, + "eval_steps_per_second": 0.524, + "eval_wer": 0.21379443337404383, + "step": 32544 + }, + { + "epoch": 452.08, + "learning_rate": 3.958857142857143e-06, + "loss": 0.2862, + "step": 32550 + }, + { + "epoch": 452.22, + "learning_rate": 3.947428571428572e-06, + "loss": 0.2834, + "step": 32560 + }, + { + "epoch": 452.36, + "learning_rate": 3.936e-06, + "loss": 0.267, + "step": 32570 + }, + { + "epoch": 452.5, + "learning_rate": 3.9245714285714285e-06, + "loss": 0.281, + "step": 32580 + }, + { + "epoch": 452.64, + "learning_rate": 3.913142857142858e-06, + "loss": 0.2804, + "step": 32590 + }, + { + "epoch": 452.78, + "learning_rate": 3.901714285714286e-06, + "loss": 0.2661, + "step": 32600 + }, + { + "epoch": 452.91, + "learning_rate": 3.890285714285715e-06, + "loss": 0.2842, + "step": 32610 + }, + { + "epoch": 453.0, + "eval_loss": 0.5815262198448181, + "eval_runtime": 128.2955, + "eval_samples_per_second": 4.147, + "eval_steps_per_second": 0.522, + "eval_wer": 0.21463007006492255, + "step": 32616 + }, + { + "epoch": 453.06, + "learning_rate": 3.878857142857143e-06, + "loss": 0.2769, + "step": 32620 + }, + { + "epoch": 453.19, + "learning_rate": 3.8674285714285716e-06, + "loss": 0.2857, + "step": 32630 + }, + { + "epoch": 453.33, + "learning_rate": 3.856e-06, + "loss": 0.2789, + "step": 32640 + }, + { + "epoch": 453.47, + "learning_rate": 3.8445714285714285e-06, + "loss": 0.2759, + "step": 32650 + }, + { + "epoch": 453.61, + "learning_rate": 3.833142857142858e-06, + "loss": 0.258, + "step": 32660 + }, + { + "epoch": 453.75, + "learning_rate": 3.821714285714286e-06, + "loss": 0.278, + "step": 32670 + }, + { + "epoch": 453.89, + "learning_rate": 3.8102857142857146e-06, + "loss": 0.2825, + "step": 32680 + }, + { + "epoch": 454.0, + "eval_loss": 0.5888230204582214, + "eval_runtime": 128.0171, + "eval_samples_per_second": 4.156, + "eval_steps_per_second": 0.523, + "eval_wer": 0.21713698013755867, + "step": 32688 + }, + { + "epoch": 454.03, + "learning_rate": 3.798857142857143e-06, + "loss": 0.282, + "step": 32690 + }, + { + "epoch": 454.17, + "learning_rate": 3.787428571428572e-06, + "loss": 0.2672, + "step": 32700 + }, + { + "epoch": 454.3, + "learning_rate": 3.7760000000000004e-06, + "loss": 0.2732, + "step": 32710 + }, + { + "epoch": 454.44, + "learning_rate": 3.7645714285714292e-06, + "loss": 0.2728, + "step": 32720 + }, + { + "epoch": 454.58, + "learning_rate": 3.7531428571428572e-06, + "loss": 0.2779, + "step": 32730 + }, + { + "epoch": 454.72, + "learning_rate": 3.7417142857142857e-06, + "loss": 0.2853, + "step": 32740 + }, + { + "epoch": 454.86, + "learning_rate": 3.7302857142857145e-06, + "loss": 0.2803, + "step": 32750 + }, + { + "epoch": 455.0, + "learning_rate": 3.718857142857143e-06, + "loss": 0.2906, + "step": 32760 + }, + { + "epoch": 455.0, + "eval_loss": 0.5870276093482971, + "eval_runtime": 127.7797, + "eval_samples_per_second": 4.163, + "eval_steps_per_second": 0.524, + "eval_wer": 0.2134730346467828, + "step": 32760 + }, + { + "epoch": 455.14, + "learning_rate": 3.707428571428572e-06, + "loss": 0.2718, + "step": 32770 + }, + { + "epoch": 455.28, + "learning_rate": 3.6960000000000003e-06, + "loss": 0.2692, + "step": 32780 + }, + { + "epoch": 455.42, + "learning_rate": 3.684571428571429e-06, + "loss": 0.2755, + "step": 32790 + }, + { + "epoch": 455.55, + "learning_rate": 3.673142857142857e-06, + "loss": 0.274, + "step": 32800 + }, + { + "epoch": 455.69, + "learning_rate": 3.661714285714286e-06, + "loss": 0.2737, + "step": 32810 + }, + { + "epoch": 455.83, + "learning_rate": 3.6502857142857145e-06, + "loss": 0.2802, + "step": 32820 + }, + { + "epoch": 455.97, + "learning_rate": 3.6388571428571433e-06, + "loss": 0.2809, + "step": 32830 + }, + { + "epoch": 456.0, + "eval_loss": 0.5915881991386414, + "eval_runtime": 127.5703, + "eval_samples_per_second": 4.17, + "eval_steps_per_second": 0.525, + "eval_wer": 0.21533714726489683, + "step": 32832 + }, + { + "epoch": 456.11, + "learning_rate": 3.6274285714285718e-06, + "loss": 0.2743, + "step": 32840 + }, + { + "epoch": 456.25, + "learning_rate": 3.616e-06, + "loss": 0.2742, + "step": 32850 + }, + { + "epoch": 456.39, + "learning_rate": 3.604571428571429e-06, + "loss": 0.2777, + "step": 32860 + }, + { + "epoch": 456.53, + "learning_rate": 3.593142857142857e-06, + "loss": 0.2793, + "step": 32870 + }, + { + "epoch": 456.66, + "learning_rate": 3.581714285714286e-06, + "loss": 0.2755, + "step": 32880 + }, + { + "epoch": 456.8, + "learning_rate": 3.5702857142857144e-06, + "loss": 0.2694, + "step": 32890 + }, + { + "epoch": 456.94, + "learning_rate": 3.5588571428571432e-06, + "loss": 0.2786, + "step": 32900 + }, + { + "epoch": 457.0, + "eval_loss": 0.5958760380744934, + "eval_runtime": 127.4502, + "eval_samples_per_second": 4.174, + "eval_steps_per_second": 0.526, + "eval_wer": 0.21308735617406954, + "step": 32904 + }, + { + "epoch": 457.08, + "learning_rate": 3.5474285714285717e-06, + "loss": 0.273, + "step": 32910 + }, + { + "epoch": 457.22, + "learning_rate": 3.5360000000000005e-06, + "loss": 0.2697, + "step": 32920 + }, + { + "epoch": 457.36, + "learning_rate": 3.524571428571429e-06, + "loss": 0.2642, + "step": 32930 + }, + { + "epoch": 457.5, + "learning_rate": 3.513142857142857e-06, + "loss": 0.2706, + "step": 32940 + }, + { + "epoch": 457.64, + "learning_rate": 3.5017142857142863e-06, + "loss": 0.2747, + "step": 32950 + }, + { + "epoch": 457.78, + "learning_rate": 3.4902857142857143e-06, + "loss": 0.2846, + "step": 32960 + }, + { + "epoch": 457.91, + "learning_rate": 3.478857142857143e-06, + "loss": 0.2818, + "step": 32970 + }, + { + "epoch": 458.0, + "eval_loss": 0.5847172737121582, + "eval_runtime": 128.4309, + "eval_samples_per_second": 4.142, + "eval_steps_per_second": 0.522, + "eval_wer": 0.213537314392235, + "step": 32976 + }, + { + "epoch": 458.06, + "learning_rate": 3.4674285714285716e-06, + "loss": 0.2805, + "step": 32980 + }, + { + "epoch": 458.19, + "learning_rate": 3.4560000000000005e-06, + "loss": 0.2806, + "step": 32990 + }, + { + "epoch": 458.33, + "learning_rate": 3.444571428571429e-06, + "loss": 0.2739, + "step": 33000 + }, + { + "epoch": 458.47, + "learning_rate": 3.4331428571428578e-06, + "loss": 0.279, + "step": 33010 + }, + { + "epoch": 458.61, + "learning_rate": 3.421714285714286e-06, + "loss": 0.2751, + "step": 33020 + }, + { + "epoch": 458.75, + "learning_rate": 3.410285714285714e-06, + "loss": 0.2749, + "step": 33030 + }, + { + "epoch": 458.89, + "learning_rate": 3.398857142857143e-06, + "loss": 0.2696, + "step": 33040 + }, + { + "epoch": 459.0, + "eval_loss": 0.5830007195472717, + "eval_runtime": 127.8599, + "eval_samples_per_second": 4.161, + "eval_steps_per_second": 0.524, + "eval_wer": 0.21257311821045188, + "step": 33048 + }, + { + "epoch": 459.03, + "learning_rate": 3.3874285714285715e-06, + "loss": 0.2805, + "step": 33050 + }, + { + "epoch": 459.17, + "learning_rate": 3.3760000000000004e-06, + "loss": 0.2829, + "step": 33060 + }, + { + "epoch": 459.3, + "learning_rate": 3.364571428571429e-06, + "loss": 0.2712, + "step": 33070 + }, + { + "epoch": 459.44, + "learning_rate": 3.3531428571428577e-06, + "loss": 0.2776, + "step": 33080 + }, + { + "epoch": 459.58, + "learning_rate": 3.341714285714286e-06, + "loss": 0.2755, + "step": 33090 + }, + { + "epoch": 459.72, + "learning_rate": 3.330285714285715e-06, + "loss": 0.28, + "step": 33100 + }, + { + "epoch": 459.86, + "learning_rate": 3.318857142857143e-06, + "loss": 0.2723, + "step": 33110 + }, + { + "epoch": 460.0, + "learning_rate": 3.3074285714285714e-06, + "loss": 0.2761, + "step": 33120 + }, + { + "epoch": 460.0, + "eval_loss": 0.5934568643569946, + "eval_runtime": 127.82, + "eval_samples_per_second": 4.162, + "eval_steps_per_second": 0.524, + "eval_wer": 0.2134087549013306, + "step": 33120 + }, + { + "epoch": 460.14, + "learning_rate": 3.2960000000000003e-06, + "loss": 0.2722, + "step": 33130 + }, + { + "epoch": 460.28, + "learning_rate": 3.2845714285714287e-06, + "loss": 0.2772, + "step": 33140 + }, + { + "epoch": 460.42, + "learning_rate": 3.2731428571428576e-06, + "loss": 0.2874, + "step": 33150 + }, + { + "epoch": 460.55, + "learning_rate": 3.261714285714286e-06, + "loss": 0.2729, + "step": 33160 + }, + { + "epoch": 460.69, + "learning_rate": 3.250285714285715e-06, + "loss": 0.2658, + "step": 33170 + }, + { + "epoch": 460.83, + "learning_rate": 3.238857142857143e-06, + "loss": 0.2754, + "step": 33180 + }, + { + "epoch": 460.97, + "learning_rate": 3.2274285714285718e-06, + "loss": 0.2762, + "step": 33190 + }, + { + "epoch": 461.0, + "eval_loss": 0.5872820019721985, + "eval_runtime": 127.6195, + "eval_samples_per_second": 4.169, + "eval_steps_per_second": 0.525, + "eval_wer": 0.21295879668316514, + "step": 33192 + }, + { + "epoch": 461.11, + "learning_rate": 3.216e-06, + "loss": 0.2745, + "step": 33200 + }, + { + "epoch": 461.25, + "learning_rate": 3.204571428571429e-06, + "loss": 0.2694, + "step": 33210 + }, + { + "epoch": 461.39, + "learning_rate": 3.1931428571428575e-06, + "loss": 0.2747, + "step": 33220 + }, + { + "epoch": 461.53, + "learning_rate": 3.181714285714286e-06, + "loss": 0.2726, + "step": 33230 + }, + { + "epoch": 461.66, + "learning_rate": 3.170285714285715e-06, + "loss": 0.2867, + "step": 33240 + }, + { + "epoch": 461.8, + "learning_rate": 3.158857142857143e-06, + "loss": 0.2747, + "step": 33250 + }, + { + "epoch": 461.94, + "learning_rate": 3.1474285714285717e-06, + "loss": 0.2795, + "step": 33260 + }, + { + "epoch": 462.0, + "eval_loss": 0.5932377576828003, + "eval_runtime": 128.0223, + "eval_samples_per_second": 4.156, + "eval_steps_per_second": 0.523, + "eval_wer": 0.21360159413768723, + "step": 33264 + }, + { + "epoch": 462.08, + "learning_rate": 3.136e-06, + "loss": 0.2783, + "step": 33270 + }, + { + "epoch": 462.22, + "learning_rate": 3.124571428571429e-06, + "loss": 0.2697, + "step": 33280 + }, + { + "epoch": 462.36, + "learning_rate": 3.1131428571428574e-06, + "loss": 0.2714, + "step": 33290 + }, + { + "epoch": 462.5, + "learning_rate": 3.1017142857142863e-06, + "loss": 0.2765, + "step": 33300 + }, + { + "epoch": 462.64, + "learning_rate": 3.0902857142857147e-06, + "loss": 0.2726, + "step": 33310 + }, + { + "epoch": 462.78, + "learning_rate": 3.0788571428571427e-06, + "loss": 0.2863, + "step": 33320 + }, + { + "epoch": 462.91, + "learning_rate": 3.0674285714285716e-06, + "loss": 0.276, + "step": 33330 + }, + { + "epoch": 463.0, + "eval_loss": 0.5970369577407837, + "eval_runtime": 127.1347, + "eval_samples_per_second": 4.185, + "eval_steps_per_second": 0.527, + "eval_wer": 0.21366587388313943, + "step": 33336 + }, + { + "epoch": 463.06, + "learning_rate": 3.056e-06, + "loss": 0.2766, + "step": 33340 + }, + { + "epoch": 463.19, + "learning_rate": 3.044571428571429e-06, + "loss": 0.2787, + "step": 33350 + }, + { + "epoch": 463.33, + "learning_rate": 3.0331428571428573e-06, + "loss": 0.2672, + "step": 33360 + }, + { + "epoch": 463.47, + "learning_rate": 3.021714285714286e-06, + "loss": 0.2658, + "step": 33370 + }, + { + "epoch": 463.61, + "learning_rate": 3.0102857142857147e-06, + "loss": 0.2647, + "step": 33380 + }, + { + "epoch": 463.75, + "learning_rate": 2.9988571428571435e-06, + "loss": 0.2789, + "step": 33390 + }, + { + "epoch": 463.89, + "learning_rate": 2.9874285714285715e-06, + "loss": 0.2788, + "step": 33400 + }, + { + "epoch": 464.0, + "eval_loss": 0.5909742116928101, + "eval_runtime": 127.8539, + "eval_samples_per_second": 4.161, + "eval_steps_per_second": 0.524, + "eval_wer": 0.2141801118467571, + "step": 33408 + }, + { + "epoch": 464.03, + "learning_rate": 2.976e-06, + "loss": 0.2732, + "step": 33410 + }, + { + "epoch": 464.17, + "learning_rate": 2.964571428571429e-06, + "loss": 0.2766, + "step": 33420 + }, + { + "epoch": 464.3, + "learning_rate": 2.9531428571428573e-06, + "loss": 0.2854, + "step": 33430 + }, + { + "epoch": 464.44, + "learning_rate": 2.941714285714286e-06, + "loss": 0.2694, + "step": 33440 + }, + { + "epoch": 464.58, + "learning_rate": 2.9302857142857146e-06, + "loss": 0.27, + "step": 33450 + }, + { + "epoch": 464.72, + "learning_rate": 2.9188571428571434e-06, + "loss": 0.2768, + "step": 33460 + }, + { + "epoch": 464.86, + "learning_rate": 2.9074285714285714e-06, + "loss": 0.272, + "step": 33470 + }, + { + "epoch": 465.0, + "learning_rate": 2.8960000000000003e-06, + "loss": 0.2624, + "step": 33480 + }, + { + "epoch": 465.0, + "eval_loss": 0.5864557027816772, + "eval_runtime": 128.2027, + "eval_samples_per_second": 4.15, + "eval_steps_per_second": 0.523, + "eval_wer": 0.21212315999228643, + "step": 33480 + }, + { + "epoch": 465.14, + "learning_rate": 2.8845714285714287e-06, + "loss": 0.2683, + "step": 33490 + }, + { + "epoch": 465.28, + "learning_rate": 2.873142857142857e-06, + "loss": 0.2683, + "step": 33500 + }, + { + "epoch": 465.42, + "learning_rate": 2.861714285714286e-06, + "loss": 0.2722, + "step": 33510 + }, + { + "epoch": 465.55, + "learning_rate": 2.8502857142857145e-06, + "loss": 0.2701, + "step": 33520 + }, + { + "epoch": 465.69, + "learning_rate": 2.8388571428571434e-06, + "loss": 0.2791, + "step": 33530 + }, + { + "epoch": 465.83, + "learning_rate": 2.8274285714285714e-06, + "loss": 0.2781, + "step": 33540 + }, + { + "epoch": 465.97, + "learning_rate": 2.8160000000000002e-06, + "loss": 0.2878, + "step": 33550 + }, + { + "epoch": 466.0, + "eval_loss": 0.5836173892021179, + "eval_runtime": 127.8337, + "eval_samples_per_second": 4.162, + "eval_steps_per_second": 0.524, + "eval_wer": 0.21167320177412097, + "step": 33552 + }, + { + "epoch": 466.11, + "learning_rate": 2.8045714285714287e-06, + "loss": 0.283, + "step": 33560 + }, + { + "epoch": 466.25, + "learning_rate": 2.7931428571428575e-06, + "loss": 0.2846, + "step": 33570 + }, + { + "epoch": 466.39, + "learning_rate": 2.781714285714286e-06, + "loss": 0.2654, + "step": 33580 + }, + { + "epoch": 466.53, + "learning_rate": 2.7702857142857144e-06, + "loss": 0.2769, + "step": 33590 + }, + { + "epoch": 466.66, + "learning_rate": 2.7588571428571433e-06, + "loss": 0.2748, + "step": 33600 + }, + { + "epoch": 466.8, + "learning_rate": 2.7474285714285713e-06, + "loss": 0.258, + "step": 33610 + }, + { + "epoch": 466.94, + "learning_rate": 2.736e-06, + "loss": 0.2691, + "step": 33620 + }, + { + "epoch": 467.0, + "eval_loss": 0.5880076885223389, + "eval_runtime": 127.6716, + "eval_samples_per_second": 4.167, + "eval_steps_per_second": 0.525, + "eval_wer": 0.2127016777013563, + "step": 33624 + }, + { + "epoch": 467.08, + "learning_rate": 2.7245714285714286e-06, + "loss": 0.2788, + "step": 33630 + }, + { + "epoch": 467.22, + "learning_rate": 2.7131428571428574e-06, + "loss": 0.2752, + "step": 33640 + }, + { + "epoch": 467.36, + "learning_rate": 2.701714285714286e-06, + "loss": 0.2586, + "step": 33650 + }, + { + "epoch": 467.5, + "learning_rate": 2.6902857142857147e-06, + "loss": 0.2727, + "step": 33660 + }, + { + "epoch": 467.64, + "learning_rate": 2.678857142857143e-06, + "loss": 0.2619, + "step": 33670 + }, + { + "epoch": 467.78, + "learning_rate": 2.667428571428572e-06, + "loss": 0.2773, + "step": 33680 + }, + { + "epoch": 467.91, + "learning_rate": 2.656e-06, + "loss": 0.2796, + "step": 33690 + }, + { + "epoch": 468.0, + "eval_loss": 0.5910577774047852, + "eval_runtime": 127.1938, + "eval_samples_per_second": 4.183, + "eval_steps_per_second": 0.527, + "eval_wer": 0.2142443915922093, + "step": 33696 + }, + { + "epoch": 468.06, + "learning_rate": 2.6445714285714285e-06, + "loss": 0.2783, + "step": 33700 + }, + { + "epoch": 468.19, + "learning_rate": 2.6331428571428574e-06, + "loss": 0.2734, + "step": 33710 + }, + { + "epoch": 468.33, + "learning_rate": 2.621714285714286e-06, + "loss": 0.2727, + "step": 33720 + }, + { + "epoch": 468.47, + "learning_rate": 2.6102857142857147e-06, + "loss": 0.281, + "step": 33730 + }, + { + "epoch": 468.61, + "learning_rate": 2.598857142857143e-06, + "loss": 0.2689, + "step": 33740 + }, + { + "epoch": 468.75, + "learning_rate": 2.587428571428572e-06, + "loss": 0.2615, + "step": 33750 + }, + { + "epoch": 468.89, + "learning_rate": 2.576e-06, + "loss": 0.2663, + "step": 33760 + }, + { + "epoch": 469.0, + "eval_loss": 0.6015689373016357, + "eval_runtime": 127.6708, + "eval_samples_per_second": 4.167, + "eval_steps_per_second": 0.525, + "eval_wer": 0.21398727261040046, + "step": 33768 + }, + { + "epoch": 469.03, + "learning_rate": 2.564571428571429e-06, + "loss": 0.2718, + "step": 33770 + }, + { + "epoch": 469.17, + "learning_rate": 2.5531428571428573e-06, + "loss": 0.2753, + "step": 33780 + }, + { + "epoch": 469.3, + "learning_rate": 2.5417142857142857e-06, + "loss": 0.2688, + "step": 33790 + }, + { + "epoch": 469.44, + "learning_rate": 2.5302857142857146e-06, + "loss": 0.2714, + "step": 33800 + }, + { + "epoch": 469.58, + "learning_rate": 2.518857142857143e-06, + "loss": 0.2662, + "step": 33810 + }, + { + "epoch": 469.72, + "learning_rate": 2.507428571428572e-06, + "loss": 0.286, + "step": 33820 + }, + { + "epoch": 469.86, + "learning_rate": 2.496e-06, + "loss": 0.2661, + "step": 33830 + }, + { + "epoch": 470.0, + "learning_rate": 2.4845714285714288e-06, + "loss": 0.2743, + "step": 33840 + }, + { + "epoch": 470.0, + "eval_loss": 0.5917323231697083, + "eval_runtime": 127.961, + "eval_samples_per_second": 4.158, + "eval_steps_per_second": 0.524, + "eval_wer": 0.21199460050138202, + "step": 33840 + }, + { + "epoch": 470.14, + "learning_rate": 2.473142857142857e-06, + "loss": 0.2817, + "step": 33850 + }, + { + "epoch": 470.28, + "learning_rate": 2.461714285714286e-06, + "loss": 0.2689, + "step": 33860 + }, + { + "epoch": 470.42, + "learning_rate": 2.4502857142857145e-06, + "loss": 0.2787, + "step": 33870 + }, + { + "epoch": 470.55, + "learning_rate": 2.438857142857143e-06, + "loss": 0.2728, + "step": 33880 + }, + { + "epoch": 470.69, + "learning_rate": 2.427428571428572e-06, + "loss": 0.2694, + "step": 33890 + }, + { + "epoch": 470.83, + "learning_rate": 2.4160000000000002e-06, + "loss": 0.2726, + "step": 33900 + }, + { + "epoch": 470.97, + "learning_rate": 2.4045714285714287e-06, + "loss": 0.2735, + "step": 33910 + }, + { + "epoch": 471.0, + "eval_loss": 0.5953284502029419, + "eval_runtime": 127.3858, + "eval_samples_per_second": 4.176, + "eval_steps_per_second": 0.526, + "eval_wer": 0.2141158321013049, + "step": 33912 + }, + { + "epoch": 471.11, + "learning_rate": 2.393142857142857e-06, + "loss": 0.2659, + "step": 33920 + }, + { + "epoch": 471.25, + "learning_rate": 2.381714285714286e-06, + "loss": 0.2702, + "step": 33930 + }, + { + "epoch": 471.39, + "learning_rate": 2.3702857142857144e-06, + "loss": 0.2738, + "step": 33940 + }, + { + "epoch": 471.53, + "learning_rate": 2.358857142857143e-06, + "loss": 0.2803, + "step": 33950 + }, + { + "epoch": 471.66, + "learning_rate": 2.3474285714285717e-06, + "loss": 0.2697, + "step": 33960 + }, + { + "epoch": 471.8, + "learning_rate": 2.336e-06, + "loss": 0.2704, + "step": 33970 + }, + { + "epoch": 471.94, + "learning_rate": 2.3245714285714286e-06, + "loss": 0.2959, + "step": 33980 + }, + { + "epoch": 472.0, + "eval_loss": 0.5901468396186829, + "eval_runtime": 128.1861, + "eval_samples_per_second": 4.15, + "eval_steps_per_second": 0.523, + "eval_wer": 0.21315163591952177, + "step": 33984 + }, + { + "epoch": 472.08, + "learning_rate": 2.3131428571428575e-06, + "loss": 0.2836, + "step": 33990 + }, + { + "epoch": 472.22, + "learning_rate": 2.301714285714286e-06, + "loss": 0.2839, + "step": 34000 + }, + { + "epoch": 472.36, + "learning_rate": 2.2902857142857143e-06, + "loss": 0.2703, + "step": 34010 + }, + { + "epoch": 472.5, + "learning_rate": 2.2788571428571428e-06, + "loss": 0.2686, + "step": 34020 + }, + { + "epoch": 472.64, + "learning_rate": 2.2674285714285716e-06, + "loss": 0.2725, + "step": 34030 + }, + { + "epoch": 472.78, + "learning_rate": 2.256e-06, + "loss": 0.2844, + "step": 34040 + }, + { + "epoch": 472.91, + "learning_rate": 2.2445714285714285e-06, + "loss": 0.2732, + "step": 34050 + }, + { + "epoch": 473.0, + "eval_loss": 0.5878883600234985, + "eval_runtime": 127.1328, + "eval_samples_per_second": 4.185, + "eval_steps_per_second": 0.527, + "eval_wer": 0.21077328533779005, + "step": 34056 + }, + { + "epoch": 473.06, + "learning_rate": 2.2331428571428574e-06, + "loss": 0.2793, + "step": 34060 + }, + { + "epoch": 473.19, + "learning_rate": 2.221714285714286e-06, + "loss": 0.2803, + "step": 34070 + }, + { + "epoch": 473.33, + "learning_rate": 2.2102857142857147e-06, + "loss": 0.2633, + "step": 34080 + }, + { + "epoch": 473.47, + "learning_rate": 2.198857142857143e-06, + "loss": 0.2789, + "step": 34090 + }, + { + "epoch": 473.61, + "learning_rate": 2.1874285714285716e-06, + "loss": 0.2803, + "step": 34100 + }, + { + "epoch": 473.75, + "learning_rate": 2.176e-06, + "loss": 0.2699, + "step": 34110 + }, + { + "epoch": 473.89, + "learning_rate": 2.164571428571429e-06, + "loss": 0.2659, + "step": 34120 + }, + { + "epoch": 474.0, + "eval_loss": 0.5865457057952881, + "eval_runtime": 127.9363, + "eval_samples_per_second": 4.158, + "eval_steps_per_second": 0.524, + "eval_wer": 0.21083756508324228, + "step": 34128 + }, + { + "epoch": 474.03, + "learning_rate": 2.1531428571428573e-06, + "loss": 0.2768, + "step": 34130 + }, + { + "epoch": 474.17, + "learning_rate": 2.1417142857142857e-06, + "loss": 0.2788, + "step": 34140 + }, + { + "epoch": 474.3, + "learning_rate": 2.1302857142857146e-06, + "loss": 0.2684, + "step": 34150 + }, + { + "epoch": 474.44, + "learning_rate": 2.118857142857143e-06, + "loss": 0.2714, + "step": 34160 + }, + { + "epoch": 474.58, + "learning_rate": 2.1074285714285715e-06, + "loss": 0.2574, + "step": 34170 + }, + { + "epoch": 474.72, + "learning_rate": 2.0960000000000003e-06, + "loss": 0.2774, + "step": 34180 + }, + { + "epoch": 474.86, + "learning_rate": 2.0845714285714288e-06, + "loss": 0.2712, + "step": 34190 + }, + { + "epoch": 475.0, + "learning_rate": 2.0731428571428572e-06, + "loss": 0.2706, + "step": 34200 + }, + { + "epoch": 475.0, + "eval_loss": 0.5861235857009888, + "eval_runtime": 127.3009, + "eval_samples_per_second": 4.179, + "eval_steps_per_second": 0.526, + "eval_wer": 0.20910201195603265, + "step": 34200 + }, + { + "epoch": 475.14, + "learning_rate": 2.0617142857142857e-06, + "loss": 0.2754, + "step": 34210 + }, + { + "epoch": 475.28, + "learning_rate": 2.0502857142857145e-06, + "loss": 0.2669, + "step": 34220 + }, + { + "epoch": 475.42, + "learning_rate": 2.038857142857143e-06, + "loss": 0.2626, + "step": 34230 + }, + { + "epoch": 475.55, + "learning_rate": 2.0274285714285714e-06, + "loss": 0.2681, + "step": 34240 + }, + { + "epoch": 475.69, + "learning_rate": 2.0160000000000003e-06, + "loss": 0.2801, + "step": 34250 + }, + { + "epoch": 475.83, + "learning_rate": 2.0045714285714287e-06, + "loss": 0.2623, + "step": 34260 + }, + { + "epoch": 475.97, + "learning_rate": 1.9931428571428576e-06, + "loss": 0.2766, + "step": 34270 + }, + { + "epoch": 476.0, + "eval_loss": 0.5886086821556091, + "eval_runtime": 127.7453, + "eval_samples_per_second": 4.165, + "eval_steps_per_second": 0.524, + "eval_wer": 0.2112232435559555, + "step": 34272 + }, + { + "epoch": 476.11, + "learning_rate": 1.981714285714286e-06, + "loss": 0.2814, + "step": 34280 + }, + { + "epoch": 476.25, + "learning_rate": 1.9702857142857144e-06, + "loss": 0.2625, + "step": 34290 + }, + { + "epoch": 476.39, + "learning_rate": 1.958857142857143e-06, + "loss": 0.267, + "step": 34300 + }, + { + "epoch": 476.53, + "learning_rate": 1.9474285714285713e-06, + "loss": 0.2735, + "step": 34310 + }, + { + "epoch": 476.66, + "learning_rate": 1.936e-06, + "loss": 0.2692, + "step": 34320 + }, + { + "epoch": 476.8, + "learning_rate": 1.9245714285714286e-06, + "loss": 0.2734, + "step": 34330 + }, + { + "epoch": 476.94, + "learning_rate": 1.9131428571428575e-06, + "loss": 0.2727, + "step": 34340 + }, + { + "epoch": 477.0, + "eval_loss": 0.5934135913848877, + "eval_runtime": 128.0867, + "eval_samples_per_second": 4.153, + "eval_steps_per_second": 0.523, + "eval_wer": 0.2128945169377129, + "step": 34344 + }, + { + "epoch": 477.08, + "learning_rate": 1.901714285714286e-06, + "loss": 0.2782, + "step": 34350 + }, + { + "epoch": 477.22, + "learning_rate": 1.8902857142857146e-06, + "loss": 0.2765, + "step": 34360 + }, + { + "epoch": 477.36, + "learning_rate": 1.878857142857143e-06, + "loss": 0.253, + "step": 34370 + }, + { + "epoch": 477.5, + "learning_rate": 1.8674285714285717e-06, + "loss": 0.2734, + "step": 34380 + }, + { + "epoch": 477.64, + "learning_rate": 1.856e-06, + "loss": 0.2825, + "step": 34390 + }, + { + "epoch": 477.78, + "learning_rate": 1.8445714285714285e-06, + "loss": 0.2689, + "step": 34400 + }, + { + "epoch": 477.91, + "learning_rate": 1.8331428571428572e-06, + "loss": 0.2616, + "step": 34410 + }, + { + "epoch": 478.0, + "eval_loss": 0.5943305492401123, + "eval_runtime": 127.0489, + "eval_samples_per_second": 4.187, + "eval_steps_per_second": 0.527, + "eval_wer": 0.21218743973773863, + "step": 34416 + }, + { + "epoch": 478.06, + "learning_rate": 1.8217142857142858e-06, + "loss": 0.2709, + "step": 34420 + }, + { + "epoch": 478.19, + "learning_rate": 1.8102857142857145e-06, + "loss": 0.2804, + "step": 34430 + }, + { + "epoch": 478.33, + "learning_rate": 1.798857142857143e-06, + "loss": 0.2705, + "step": 34440 + }, + { + "epoch": 478.47, + "learning_rate": 1.7874285714285716e-06, + "loss": 0.2795, + "step": 34450 + }, + { + "epoch": 478.61, + "learning_rate": 1.7760000000000002e-06, + "loss": 0.2697, + "step": 34460 + }, + { + "epoch": 478.75, + "learning_rate": 1.7645714285714289e-06, + "loss": 0.2608, + "step": 34470 + }, + { + "epoch": 478.89, + "learning_rate": 1.7531428571428573e-06, + "loss": 0.259, + "step": 34480 + }, + { + "epoch": 479.0, + "eval_loss": 0.5931774973869324, + "eval_runtime": 128.3165, + "eval_samples_per_second": 4.146, + "eval_steps_per_second": 0.522, + "eval_wer": 0.21257311821045188, + "step": 34488 + }, + { + "epoch": 479.03, + "learning_rate": 1.7417142857142858e-06, + "loss": 0.2811, + "step": 34490 + }, + { + "epoch": 479.17, + "learning_rate": 1.7302857142857144e-06, + "loss": 0.2832, + "step": 34500 + }, + { + "epoch": 479.3, + "learning_rate": 1.7188571428571429e-06, + "loss": 0.2661, + "step": 34510 + }, + { + "epoch": 479.44, + "learning_rate": 1.7074285714285715e-06, + "loss": 0.2738, + "step": 34520 + }, + { + "epoch": 479.58, + "learning_rate": 1.6960000000000002e-06, + "loss": 0.261, + "step": 34530 + }, + { + "epoch": 479.72, + "learning_rate": 1.6845714285714288e-06, + "loss": 0.2762, + "step": 34540 + }, + { + "epoch": 479.86, + "learning_rate": 1.6731428571428572e-06, + "loss": 0.2634, + "step": 34550 + }, + { + "epoch": 480.0, + "learning_rate": 1.6617142857142859e-06, + "loss": 0.2745, + "step": 34560 + }, + { + "epoch": 480.0, + "eval_loss": 0.595533013343811, + "eval_runtime": 127.4383, + "eval_samples_per_second": 4.175, + "eval_steps_per_second": 0.526, + "eval_wer": 0.2111589638105033, + "step": 34560 + }, + { + "epoch": 480.14, + "learning_rate": 1.6502857142857145e-06, + "loss": 0.2791, + "step": 34570 + }, + { + "epoch": 480.28, + "learning_rate": 1.6388571428571428e-06, + "loss": 0.268, + "step": 34580 + }, + { + "epoch": 480.42, + "learning_rate": 1.6274285714285714e-06, + "loss": 0.2816, + "step": 34590 + }, + { + "epoch": 480.55, + "learning_rate": 1.616e-06, + "loss": 0.2621, + "step": 34600 + }, + { + "epoch": 480.69, + "learning_rate": 1.6045714285714287e-06, + "loss": 0.2798, + "step": 34610 + }, + { + "epoch": 480.83, + "learning_rate": 1.5931428571428574e-06, + "loss": 0.2632, + "step": 34620 + }, + { + "epoch": 480.97, + "learning_rate": 1.5817142857142858e-06, + "loss": 0.2738, + "step": 34630 + }, + { + "epoch": 481.0, + "eval_loss": 0.5909281373023987, + "eval_runtime": 127.5993, + "eval_samples_per_second": 4.169, + "eval_steps_per_second": 0.525, + "eval_wer": 0.21051616635598122, + "step": 34632 + }, + { + "epoch": 481.11, + "learning_rate": 1.5702857142857145e-06, + "loss": 0.2777, + "step": 34640 + }, + { + "epoch": 481.25, + "learning_rate": 1.5588571428571431e-06, + "loss": 0.2666, + "step": 34650 + }, + { + "epoch": 481.39, + "learning_rate": 1.5474285714285718e-06, + "loss": 0.2732, + "step": 34660 + }, + { + "epoch": 481.53, + "learning_rate": 1.536e-06, + "loss": 0.2781, + "step": 34670 + }, + { + "epoch": 481.66, + "learning_rate": 1.5245714285714286e-06, + "loss": 0.2792, + "step": 34680 + }, + { + "epoch": 481.8, + "learning_rate": 1.5131428571428573e-06, + "loss": 0.2746, + "step": 34690 + }, + { + "epoch": 481.94, + "learning_rate": 1.5017142857142857e-06, + "loss": 0.2659, + "step": 34700 + }, + { + "epoch": 482.0, + "eval_loss": 0.589744508266449, + "eval_runtime": 126.9751, + "eval_samples_per_second": 4.19, + "eval_steps_per_second": 0.528, + "eval_wer": 0.21148036253776434, + "step": 34704 + }, + { + "epoch": 482.08, + "learning_rate": 1.4902857142857144e-06, + "loss": 0.2633, + "step": 34710 + }, + { + "epoch": 482.22, + "learning_rate": 1.478857142857143e-06, + "loss": 0.2768, + "step": 34720 + }, + { + "epoch": 482.36, + "learning_rate": 1.4674285714285717e-06, + "loss": 0.2615, + "step": 34730 + }, + { + "epoch": 482.5, + "learning_rate": 1.4560000000000001e-06, + "loss": 0.2669, + "step": 34740 + }, + { + "epoch": 482.64, + "learning_rate": 1.4445714285714288e-06, + "loss": 0.2664, + "step": 34750 + }, + { + "epoch": 482.78, + "learning_rate": 1.4331428571428574e-06, + "loss": 0.2638, + "step": 34760 + }, + { + "epoch": 482.91, + "learning_rate": 1.4217142857142856e-06, + "loss": 0.2666, + "step": 34770 + }, + { + "epoch": 483.0, + "eval_loss": 0.5927045941352844, + "eval_runtime": 127.4513, + "eval_samples_per_second": 4.174, + "eval_steps_per_second": 0.526, + "eval_wer": 0.2102590473741724, + "step": 34776 + }, + { + "epoch": 483.06, + "learning_rate": 1.4102857142857143e-06, + "loss": 0.2798, + "step": 34780 + }, + { + "epoch": 483.19, + "learning_rate": 1.398857142857143e-06, + "loss": 0.2664, + "step": 34790 + }, + { + "epoch": 483.33, + "learning_rate": 1.3874285714285716e-06, + "loss": 0.276, + "step": 34800 + }, + { + "epoch": 483.47, + "learning_rate": 1.376e-06, + "loss": 0.2765, + "step": 34810 + }, + { + "epoch": 483.61, + "learning_rate": 1.3645714285714287e-06, + "loss": 0.2728, + "step": 34820 + }, + { + "epoch": 483.75, + "learning_rate": 1.3531428571428573e-06, + "loss": 0.2675, + "step": 34830 + }, + { + "epoch": 483.89, + "learning_rate": 1.341714285714286e-06, + "loss": 0.2779, + "step": 34840 + }, + { + "epoch": 484.0, + "eval_loss": 0.587812602519989, + "eval_runtime": 127.6167, + "eval_samples_per_second": 4.169, + "eval_steps_per_second": 0.525, + "eval_wer": 0.2111589638105033, + "step": 34848 + }, + { + "epoch": 484.03, + "learning_rate": 1.3302857142857144e-06, + "loss": 0.2649, + "step": 34850 + }, + { + "epoch": 484.17, + "learning_rate": 1.3188571428571429e-06, + "loss": 0.2646, + "step": 34860 + }, + { + "epoch": 484.3, + "learning_rate": 1.3074285714285715e-06, + "loss": 0.2619, + "step": 34870 + }, + { + "epoch": 484.44, + "learning_rate": 1.296e-06, + "loss": 0.2801, + "step": 34880 + }, + { + "epoch": 484.58, + "learning_rate": 1.2845714285714286e-06, + "loss": 0.2722, + "step": 34890 + }, + { + "epoch": 484.72, + "learning_rate": 1.2731428571428573e-06, + "loss": 0.2783, + "step": 34900 + }, + { + "epoch": 484.86, + "learning_rate": 1.261714285714286e-06, + "loss": 0.2773, + "step": 34910 + }, + { + "epoch": 485.0, + "learning_rate": 1.2502857142857143e-06, + "loss": 0.2697, + "step": 34920 + }, + { + "epoch": 485.0, + "eval_loss": 0.5891386270523071, + "eval_runtime": 127.6378, + "eval_samples_per_second": 4.168, + "eval_steps_per_second": 0.525, + "eval_wer": 0.21231599922864305, + "step": 34920 + }, + { + "epoch": 485.14, + "learning_rate": 1.238857142857143e-06, + "loss": 0.2824, + "step": 34930 + }, + { + "epoch": 485.28, + "learning_rate": 1.2274285714285714e-06, + "loss": 0.2622, + "step": 34940 + }, + { + "epoch": 485.42, + "learning_rate": 1.216e-06, + "loss": 0.2841, + "step": 34950 + }, + { + "epoch": 485.55, + "learning_rate": 1.2045714285714287e-06, + "loss": 0.2598, + "step": 34960 + }, + { + "epoch": 485.69, + "learning_rate": 1.1931428571428574e-06, + "loss": 0.2723, + "step": 34970 + }, + { + "epoch": 485.83, + "learning_rate": 1.1817142857142858e-06, + "loss": 0.2683, + "step": 34980 + }, + { + "epoch": 485.97, + "learning_rate": 1.1702857142857143e-06, + "loss": 0.2693, + "step": 34990 + }, + { + "epoch": 486.0, + "eval_loss": 0.5904868245124817, + "eval_runtime": 127.8657, + "eval_samples_per_second": 4.161, + "eval_steps_per_second": 0.524, + "eval_wer": 0.21360159413768723, + "step": 34992 + }, + { + "epoch": 486.11, + "learning_rate": 1.158857142857143e-06, + "loss": 0.2765, + "step": 35000 + }, + { + "epoch": 486.25, + "learning_rate": 1.1474285714285716e-06, + "loss": 0.2726, + "step": 35010 + }, + { + "epoch": 486.39, + "learning_rate": 1.1371428571428572e-06, + "loss": 0.2675, + "step": 35020 + }, + { + "epoch": 486.53, + "learning_rate": 1.1257142857142859e-06, + "loss": 0.2669, + "step": 35030 + }, + { + "epoch": 486.66, + "learning_rate": 1.1142857142857145e-06, + "loss": 0.2735, + "step": 35040 + }, + { + "epoch": 486.8, + "learning_rate": 1.102857142857143e-06, + "loss": 0.2585, + "step": 35050 + }, + { + "epoch": 486.94, + "learning_rate": 1.0914285714285714e-06, + "loss": 0.279, + "step": 35060 + }, + { + "epoch": 487.0, + "eval_loss": 0.589709997177124, + "eval_runtime": 127.7721, + "eval_samples_per_second": 4.164, + "eval_steps_per_second": 0.524, + "eval_wer": 0.21250883846499968, + "step": 35064 + }, + { + "epoch": 487.08, + "learning_rate": 1.08e-06, + "loss": 0.278, + "step": 35070 + }, + { + "epoch": 487.22, + "learning_rate": 1.0685714285714287e-06, + "loss": 0.2704, + "step": 35080 + }, + { + "epoch": 487.36, + "learning_rate": 1.0571428571428573e-06, + "loss": 0.2714, + "step": 35090 + }, + { + "epoch": 487.5, + "learning_rate": 1.0457142857142858e-06, + "loss": 0.2682, + "step": 35100 + }, + { + "epoch": 487.64, + "learning_rate": 1.0342857142857144e-06, + "loss": 0.2755, + "step": 35110 + }, + { + "epoch": 487.78, + "learning_rate": 1.0228571428571429e-06, + "loss": 0.2702, + "step": 35120 + }, + { + "epoch": 487.91, + "learning_rate": 1.0114285714285715e-06, + "loss": 0.2738, + "step": 35130 + }, + { + "epoch": 488.0, + "eval_loss": 0.5914762020111084, + "eval_runtime": 128.1415, + "eval_samples_per_second": 4.152, + "eval_steps_per_second": 0.523, + "eval_wer": 0.21128752330140774, + "step": 35136 + }, + { + "epoch": 488.06, + "learning_rate": 1.0000000000000002e-06, + "loss": 0.2666, + "step": 35140 + }, + { + "epoch": 488.19, + "learning_rate": 9.885714285714286e-07, + "loss": 0.2728, + "step": 35150 + }, + { + "epoch": 488.33, + "learning_rate": 9.771428571428573e-07, + "loss": 0.2681, + "step": 35160 + }, + { + "epoch": 488.47, + "learning_rate": 9.657142857142857e-07, + "loss": 0.2743, + "step": 35170 + }, + { + "epoch": 488.61, + "learning_rate": 9.542857142857143e-07, + "loss": 0.2571, + "step": 35180 + }, + { + "epoch": 488.75, + "learning_rate": 9.42857142857143e-07, + "loss": 0.2706, + "step": 35190 + }, + { + "epoch": 488.89, + "learning_rate": 9.314285714285714e-07, + "loss": 0.2784, + "step": 35200 + }, + { + "epoch": 489.0, + "eval_loss": 0.5955053567886353, + "eval_runtime": 127.7624, + "eval_samples_per_second": 4.164, + "eval_steps_per_second": 0.524, + "eval_wer": 0.2111589638105033, + "step": 35208 + }, + { + "epoch": 489.03, + "learning_rate": 9.200000000000001e-07, + "loss": 0.269, + "step": 35210 + }, + { + "epoch": 489.17, + "learning_rate": 9.085714285714286e-07, + "loss": 0.2674, + "step": 35220 + }, + { + "epoch": 489.3, + "learning_rate": 8.971428571428573e-07, + "loss": 0.259, + "step": 35230 + }, + { + "epoch": 489.44, + "learning_rate": 8.857142857142857e-07, + "loss": 0.274, + "step": 35240 + }, + { + "epoch": 489.58, + "learning_rate": 8.742857142857144e-07, + "loss": 0.2749, + "step": 35250 + }, + { + "epoch": 489.72, + "learning_rate": 8.628571428571429e-07, + "loss": 0.2754, + "step": 35260 + }, + { + "epoch": 489.86, + "learning_rate": 8.514285714285716e-07, + "loss": 0.2597, + "step": 35270 + }, + { + "epoch": 490.0, + "learning_rate": 8.400000000000001e-07, + "loss": 0.2777, + "step": 35280 + }, + { + "epoch": 490.0, + "eval_loss": 0.5983956456184387, + "eval_runtime": 127.2531, + "eval_samples_per_second": 4.181, + "eval_steps_per_second": 0.527, + "eval_wer": 0.2119303207559298, + "step": 35280 + }, + { + "epoch": 490.14, + "learning_rate": 8.285714285714285e-07, + "loss": 0.2798, + "step": 35290 + }, + { + "epoch": 490.28, + "learning_rate": 8.171428571428572e-07, + "loss": 0.2654, + "step": 35300 + }, + { + "epoch": 490.42, + "learning_rate": 8.057142857142857e-07, + "loss": 0.272, + "step": 35310 + }, + { + "epoch": 490.55, + "learning_rate": 7.942857142857144e-07, + "loss": 0.2754, + "step": 35320 + }, + { + "epoch": 490.69, + "learning_rate": 7.828571428571429e-07, + "loss": 0.2744, + "step": 35330 + }, + { + "epoch": 490.83, + "learning_rate": 7.714285714285715e-07, + "loss": 0.2674, + "step": 35340 + }, + { + "epoch": 490.97, + "learning_rate": 7.6e-07, + "loss": 0.2654, + "step": 35350 + }, + { + "epoch": 491.0, + "eval_loss": 0.598686695098877, + "eval_runtime": 127.2673, + "eval_samples_per_second": 4.18, + "eval_steps_per_second": 0.526, + "eval_wer": 0.2134730346467828, + "step": 35352 + }, + { + "epoch": 491.11, + "learning_rate": 7.485714285714287e-07, + "loss": 0.2719, + "step": 35360 + }, + { + "epoch": 491.25, + "learning_rate": 7.371428571428572e-07, + "loss": 0.2709, + "step": 35370 + }, + { + "epoch": 491.39, + "learning_rate": 7.257142857142857e-07, + "loss": 0.2715, + "step": 35380 + }, + { + "epoch": 491.53, + "learning_rate": 7.142857142857143e-07, + "loss": 0.2661, + "step": 35390 + }, + { + "epoch": 491.66, + "learning_rate": 7.028571428571429e-07, + "loss": 0.2742, + "step": 35400 + }, + { + "epoch": 491.8, + "learning_rate": 6.914285714285715e-07, + "loss": 0.2616, + "step": 35410 + }, + { + "epoch": 491.94, + "learning_rate": 6.800000000000001e-07, + "loss": 0.2739, + "step": 35420 + }, + { + "epoch": 492.0, + "eval_loss": 0.5963639616966248, + "eval_runtime": 126.8471, + "eval_samples_per_second": 4.194, + "eval_steps_per_second": 0.528, + "eval_wer": 0.21321591566497397, + "step": 35424 + }, + { + "epoch": 492.08, + "learning_rate": 6.685714285714286e-07, + "loss": 0.2699, + "step": 35430 + }, + { + "epoch": 492.22, + "learning_rate": 6.571428571428571e-07, + "loss": 0.2768, + "step": 35440 + }, + { + "epoch": 492.36, + "learning_rate": 6.457142857142858e-07, + "loss": 0.2653, + "step": 35450 + }, + { + "epoch": 492.5, + "learning_rate": 6.342857142857143e-07, + "loss": 0.2687, + "step": 35460 + }, + { + "epoch": 492.64, + "learning_rate": 6.228571428571429e-07, + "loss": 0.261, + "step": 35470 + }, + { + "epoch": 492.78, + "learning_rate": 6.114285714285715e-07, + "loss": 0.2657, + "step": 35480 + }, + { + "epoch": 492.91, + "learning_rate": 6.000000000000001e-07, + "loss": 0.2655, + "step": 35490 + }, + { + "epoch": 493.0, + "eval_loss": 0.5973246693611145, + "eval_runtime": 127.0779, + "eval_samples_per_second": 4.186, + "eval_steps_per_second": 0.527, + "eval_wer": 0.2127016777013563, + "step": 35496 + }, + { + "epoch": 493.06, + "learning_rate": 5.885714285714286e-07, + "loss": 0.2826, + "step": 35500 + }, + { + "epoch": 493.19, + "learning_rate": 5.771428571428572e-07, + "loss": 0.2693, + "step": 35510 + }, + { + "epoch": 493.33, + "learning_rate": 5.657142857142857e-07, + "loss": 0.2564, + "step": 35520 + }, + { + "epoch": 493.47, + "learning_rate": 5.542857142857144e-07, + "loss": 0.2563, + "step": 35530 + }, + { + "epoch": 493.61, + "learning_rate": 5.428571428571429e-07, + "loss": 0.2611, + "step": 35540 + }, + { + "epoch": 493.75, + "learning_rate": 5.314285714285715e-07, + "loss": 0.2769, + "step": 35550 + }, + { + "epoch": 493.89, + "learning_rate": 5.2e-07, + "loss": 0.271, + "step": 35560 + }, + { + "epoch": 494.0, + "eval_loss": 0.5960769653320312, + "eval_runtime": 127.1897, + "eval_samples_per_second": 4.183, + "eval_steps_per_second": 0.527, + "eval_wer": 0.21032332711962462, + "step": 35568 + }, + { + "epoch": 494.03, + "learning_rate": 5.085714285714286e-07, + "loss": 0.2687, + "step": 35570 + }, + { + "epoch": 494.17, + "learning_rate": 4.971428571428572e-07, + "loss": 0.2702, + "step": 35580 + }, + { + "epoch": 494.3, + "learning_rate": 4.857142857142857e-07, + "loss": 0.2705, + "step": 35590 + }, + { + "epoch": 494.44, + "learning_rate": 4.7428571428571434e-07, + "loss": 0.2752, + "step": 35600 + }, + { + "epoch": 494.58, + "learning_rate": 4.628571428571429e-07, + "loss": 0.2665, + "step": 35610 + }, + { + "epoch": 494.72, + "learning_rate": 4.514285714285715e-07, + "loss": 0.2726, + "step": 35620 + }, + { + "epoch": 494.86, + "learning_rate": 4.4e-07, + "loss": 0.2655, + "step": 35630 + }, + { + "epoch": 495.0, + "learning_rate": 4.285714285714286e-07, + "loss": 0.2594, + "step": 35640 + }, + { + "epoch": 495.0, + "eval_loss": 0.5962747931480408, + "eval_runtime": 127.4835, + "eval_samples_per_second": 4.173, + "eval_steps_per_second": 0.526, + "eval_wer": 0.21308735617406954, + "step": 35640 + }, + { + "epoch": 495.14, + "learning_rate": 4.171428571428572e-07, + "loss": 0.2767, + "step": 35650 + }, + { + "epoch": 495.28, + "learning_rate": 4.0571428571428576e-07, + "loss": 0.257, + "step": 35660 + }, + { + "epoch": 495.42, + "learning_rate": 3.9428571428571436e-07, + "loss": 0.269, + "step": 35670 + }, + { + "epoch": 495.55, + "learning_rate": 3.8285714285714285e-07, + "loss": 0.2589, + "step": 35680 + }, + { + "epoch": 495.69, + "learning_rate": 3.7142857142857145e-07, + "loss": 0.268, + "step": 35690 + }, + { + "epoch": 495.83, + "learning_rate": 3.6e-07, + "loss": 0.2707, + "step": 35700 + }, + { + "epoch": 495.97, + "learning_rate": 3.485714285714286e-07, + "loss": 0.2783, + "step": 35710 + }, + { + "epoch": 496.0, + "eval_loss": 0.5968417525291443, + "eval_runtime": 127.469, + "eval_samples_per_second": 4.174, + "eval_steps_per_second": 0.526, + "eval_wer": 0.21218743973773863, + "step": 35712 + }, + { + "epoch": 496.11, + "learning_rate": 3.371428571428572e-07, + "loss": 0.2679, + "step": 35720 + }, + { + "epoch": 496.25, + "learning_rate": 3.2571428571428573e-07, + "loss": 0.2656, + "step": 35730 + }, + { + "epoch": 496.39, + "learning_rate": 3.1428571428571433e-07, + "loss": 0.2589, + "step": 35740 + }, + { + "epoch": 496.53, + "learning_rate": 3.028571428571429e-07, + "loss": 0.2721, + "step": 35750 + }, + { + "epoch": 496.66, + "learning_rate": 2.914285714285715e-07, + "loss": 0.2773, + "step": 35760 + }, + { + "epoch": 496.8, + "learning_rate": 2.8e-07, + "loss": 0.2703, + "step": 35770 + }, + { + "epoch": 496.94, + "learning_rate": 2.685714285714286e-07, + "loss": 0.2748, + "step": 35780 + }, + { + "epoch": 497.0, + "eval_loss": 0.5944899916648865, + "eval_runtime": 127.1656, + "eval_samples_per_second": 4.184, + "eval_steps_per_second": 0.527, + "eval_wer": 0.2128302371922607, + "step": 35784 + }, + { + "epoch": 497.08, + "learning_rate": 2.5714285714285716e-07, + "loss": 0.2625, + "step": 35790 + }, + { + "epoch": 497.22, + "learning_rate": 2.457142857142857e-07, + "loss": 0.2683, + "step": 35800 + }, + { + "epoch": 497.36, + "learning_rate": 2.3428571428571428e-07, + "loss": 0.2696, + "step": 35810 + }, + { + "epoch": 497.5, + "learning_rate": 2.228571428571429e-07, + "loss": 0.282, + "step": 35820 + }, + { + "epoch": 497.64, + "learning_rate": 2.1142857142857145e-07, + "loss": 0.2632, + "step": 35830 + }, + { + "epoch": 497.78, + "learning_rate": 2.0000000000000002e-07, + "loss": 0.2693, + "step": 35840 + }, + { + "epoch": 497.91, + "learning_rate": 1.885714285714286e-07, + "loss": 0.2707, + "step": 35850 + }, + { + "epoch": 498.0, + "eval_loss": 0.5948219299316406, + "eval_runtime": 127.2162, + "eval_samples_per_second": 4.182, + "eval_steps_per_second": 0.527, + "eval_wer": 0.21218743973773863, + "step": 35856 + }, + { + "epoch": 498.06, + "learning_rate": 1.7714285714285716e-07, + "loss": 0.2682, + "step": 35860 + }, + { + "epoch": 498.19, + "learning_rate": 1.657142857142857e-07, + "loss": 0.2708, + "step": 35870 + }, + { + "epoch": 498.33, + "learning_rate": 1.542857142857143e-07, + "loss": 0.2673, + "step": 35880 + }, + { + "epoch": 498.47, + "learning_rate": 1.4285714285714287e-07, + "loss": 0.2703, + "step": 35890 + }, + { + "epoch": 498.61, + "learning_rate": 1.3142857142857144e-07, + "loss": 0.2654, + "step": 35900 + }, + { + "epoch": 498.75, + "learning_rate": 1.2000000000000002e-07, + "loss": 0.2631, + "step": 35910 + }, + { + "epoch": 498.89, + "learning_rate": 1.0857142857142857e-07, + "loss": 0.2686, + "step": 35920 + }, + { + "epoch": 499.0, + "eval_loss": 0.5948572754859924, + "eval_runtime": 128.1208, + "eval_samples_per_second": 4.152, + "eval_steps_per_second": 0.523, + "eval_wer": 0.21199460050138202, + "step": 35928 + }, + { + "epoch": 499.03, + "learning_rate": 9.714285714285714e-08, + "loss": 0.2782, + "step": 35930 + }, + { + "epoch": 499.17, + "learning_rate": 8.571428571428573e-08, + "loss": 0.2721, + "step": 35940 + }, + { + "epoch": 499.3, + "learning_rate": 7.428571428571429e-08, + "loss": 0.2622, + "step": 35950 + }, + { + "epoch": 499.44, + "learning_rate": 6.285714285714286e-08, + "loss": 0.2637, + "step": 35960 + }, + { + "epoch": 499.58, + "learning_rate": 5.142857142857143e-08, + "loss": 0.2625, + "step": 35970 + }, + { + "epoch": 499.72, + "learning_rate": 4e-08, + "loss": 0.2736, + "step": 35980 + }, + { + "epoch": 499.86, + "learning_rate": 2.8571428571428575e-08, + "loss": 0.27, + "step": 35990 + }, + { + "epoch": 500.0, + "learning_rate": 1.7142857142857143e-08, + "loss": 0.2699, + "step": 36000 + }, + { + "epoch": 500.0, + "eval_loss": 0.5942903161048889, + "eval_runtime": 127.0427, + "eval_samples_per_second": 4.188, + "eval_steps_per_second": 0.527, + "eval_wer": 0.21263739795590408, + "step": 36000 + }, + { + "epoch": 500.0, + "step": 36000, + "total_flos": 1.360166857740454e+21, + "train_loss": 0.3826021006438467, + "train_runtime": 953283.2249, + "train_samples_per_second": 2.422, "train_steps_per_second": 0.038 } ], - "max_steps": 3600, - "num_train_epochs": 50, - "total_flos": 1.3601359172236221e+20, + "max_steps": 36000, + "num_train_epochs": 500, + "total_flos": 1.360166857740454e+21, "trial_name": null, "trial_params": null }